Implementation notes: amd64, gpu, crypto_kem/saber2

Computer: gpu
Architecture: amd64
CPU ID: GenuineIntel-000206d7-bfebfbff
SUPERCOP version: 20190816
Operation: crypto_kem
Primitive: saber2
TimeObject sizeTest sizeImplementationCompilerBenchmark dateSUPERCOP version
814011103080 0 0122988 776 1968refclang_-O3_-fwrapv_-march=native_-fomit-frame-pointer_-Qunused-arguments2019101220190816
83234796177 0 0118772 776 1616refclang_-mcpu=cortex-a8_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019101220190816
861609103080 0 0122988 776 1968refclang_-march=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019101220190816
86664996097 0 0117364 776 1616refclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019101220190816
87513992146 0 0111388 776 1968refclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019101220190816
89081496177 0 0118772 776 1616refclang_-mcpu=cortex-a9_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019101220190816
90215492146 0 0111388 776 1968refclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019101220190816
91127196177 0 0118772 776 1616refclang_-mcpu=native_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019101220190816
1582266? ? ?? ? ?refgcc_-m64_-march=native_-mtune=native_-O3_-fomit-frame-pointer2019101220190816
1593996? ? ?? ? ?refgcc_-m64_-march=corei7-avx_-O3_-fomit-frame-pointer2019101220190816
1607904? ? ?? ? ?refgcc_-m64_-march=core-avx-i_-O3_-fomit-frame-pointer2019101220190816
1620525? ? ?? ? ?refgcc_-funroll-loops_-march=barcelona_-O3_-fomit-frame-pointer2019101220190816
1628787? ? ?? ? ?refgcc_-m64_-march=core2_-msse4.1_-O3_-fomit-frame-pointer2019101220190816
1632114? ? ?? ? ?refgcc_-m64_-O3_-fomit-frame-pointer2019101220190816
1634691? ? ?? ? ?refgcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019101220190816
1642143? ? ?? ? ?refgcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019101220190816
1645761? ? ?? ? ?refgcc_-m64_-march=k8_-O3_-fomit-frame-pointer2019101220190816
1647552? ? ?? ? ?refgcc_-O3_-fomit-frame-pointer2019101220190816
1648044? ? ?? ? ?refgcc_-funroll-loops_-m64_-O3_-fomit-frame-pointer2019101220190816
1652682? ? ?? ? ?refgcc_-march=nocona_-O3_-fomit-frame-pointer2019101220190816
1658703? ? ?? ? ?refgcc_-m64_-march=barcelona_-O3_-fomit-frame-pointer2019101220190816
1661160? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=nocona_-O3_-fomit-frame-pointer2019101220190816
1663044? ? ?? ? ?refgcc_-funroll-loops_-O3_-fomit-frame-pointer2019101220190816
1665921? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=k8_-O3_-fomit-frame-pointer2019101220190816
1669239? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=barcelona_-O3_-fomit-frame-pointer2019101220190816
1670859? ? ?? ? ?refgcc_-m64_-march=core2_-O3_-fomit-frame-pointer2019101220190816
1671360? ? ?? ? ?refgcc_-m64_-march=nocona_-O3_-fomit-frame-pointer2019101220190816
1681671? ? ?? ? ?refgcc_-march=barcelona_-O3_-fomit-frame-pointer2019101220190816
1683099? ? ?? ? ?refgcc_-funroll-loops_-march=k8_-O3_-fomit-frame-pointer2019101220190816
1688751? ? ?? ? ?refgcc_-march=k8_-O3_-fomit-frame-pointer2019101220190816
1708986? ? ?? ? ?refgcc_-m64_-march=core2_-msse4_-O3_-fomit-frame-pointer2019101220190816
1714455? ? ?? ? ?refgcc_-funroll-loops_-march=nocona_-O3_-fomit-frame-pointer2019101220190816
1727532? ? ?? ? ?refgcc_-m64_-march=corei7_-O3_-fomit-frame-pointer2019101220190816
1858269? ? ?? ? ?refgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019101220190816
2479335? ? ?? ? ?refgcc_-m64_-march=core2_-msse4.1_-O_-fomit-frame-pointer2019101220190816
2503089? ? ?? ? ?refgcc_-m64_-march=corei7_-O2_-fomit-frame-pointer2019101220190816
2631228? ? ?? ? ?refgcc_-m64_-march=core-avx-i_-O2_-fomit-frame-pointer2019101220190816
2638941? ? ?? ? ?refgcc_-funroll-loops_-march=k8_-O2_-fomit-frame-pointer2019101220190816
2643843? ? ?? ? ?refgcc_-funroll-loops_-m64_-O2_-fomit-frame-pointer2019101220190816
2655618? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=barcelona_-O2_-fomit-frame-pointer2019101220190816
2662650? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=barcelona_-O_-fomit-frame-pointer2019101220190816
2662890? ? ?? ? ?refgcc_-funroll-loops_-march=nocona_-O_-fomit-frame-pointer2019101220190816
2668368? ? ?? ? ?refgcc_-funroll-loops_-O2_-fomit-frame-pointer2019101220190816
2669385? ? ?? ? ?refgcc_-m64_-march=core2_-msse4_-O2_-fomit-frame-pointer2019101220190816
2673966? ? ?? ? ?refgcc_-m64_-march=corei7_-O_-fomit-frame-pointer2019101220190816
2675649? ? ?? ? ?refgcc_-funroll-loops_-march=barcelona_-O2_-fomit-frame-pointer2019101220190816
2676555? ? ?? ? ?refgcc_-m64_-O2_-fomit-frame-pointer2019101220190816
2689713? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=k8_-O2_-fomit-frame-pointer2019101220190816
2693358? ? ?? ? ?refgcc_-m64_-march=core-avx-i_-O_-fomit-frame-pointer2019101220190816
2695986? ? ?? ? ?refgcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019101220190816
2696769? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=k8_-O_-fomit-frame-pointer2019101220190816
2698068? ? ?? ? ?refgcc_-funroll-loops_-m64_-O_-fomit-frame-pointer2019101220190816
2700114? ? ?? ? ?refgcc_-m64_-O_-fomit-frame-pointer2019101220190816
2708808? ? ?? ? ?refgcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019101220190816
2716812? ? ?? ? ?refgcc_-funroll-loops_-march=barcelona_-O_-fomit-frame-pointer2019101220190816
2718240? ? ?? ? ?refgcc_-m64_-march=k8_-O2_-fomit-frame-pointer2019101220190816
2726163? ? ?? ? ?refgcc_-march=k8_-O2_-fomit-frame-pointer2019101220190816
2729232? ? ?? ? ?refgcc_-m64_-march=k8_-O_-fomit-frame-pointer2019101220190816
2730438? ? ?? ? ?refgcc_-m64_-march=barcelona_-O_-fomit-frame-pointer2019101220190816
2731008? ? ?? ? ?refgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019101220190816
2733072? ? ?? ? ?refgcc_-funroll-loops_-march=k8_-O_-fomit-frame-pointer2019101220190816
2740074? ? ?? ? ?refgcc_-m64_-march=core2_-O_-fomit-frame-pointer2019101220190816
2758155? ? ?? ? ?refgcc_-m64_-march=native_-mtune=native_-O_-fomit-frame-pointer2019101220190816
2771427? ? ?? ? ?refgcc_-m64_-march=barcelona_-O2_-fomit-frame-pointer2019101220190816
2772054? ? ?? ? ?refgcc_-O2_-fomit-frame-pointer2019101220190816
2775450? ? ?? ? ?refgcc_-m64_-march=nocona_-O_-fomit-frame-pointer2019101220190816
2782959? ? ?? ? ?refgcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019101220190816
2785839? ? ?? ? ?refgcc_-march=barcelona_-O_-fomit-frame-pointer2019101220190816
2786244? ? ?? ? ?refgcc_-m64_-march=corei7-avx_-O2_-fomit-frame-pointer2019101220190816
2790924? ? ?? ? ?refgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019101220190816
2796642? ? ?? ? ?refgcc_-march=barcelona_-O2_-fomit-frame-pointer2019101220190816
2806335? ? ?? ? ?refgcc_-O_-fomit-frame-pointer2019101220190816
2807592? ? ?? ? ?refgcc_-m64_-march=native_-mtune=native_-O2_-fomit-frame-pointer2019101220190816
2807745? ? ?? ? ?refgcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019101220190816
2810382? ? ?? ? ?refgcc_-m64_-march=core2_-msse4_-O_-fomit-frame-pointer2019101220190816
2835852? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=nocona_-O2_-fomit-frame-pointer2019101220190816
2837181? ? ?? ? ?refgcc_-m64_-march=core2_-O2_-fomit-frame-pointer2019101220190816
2838924? ? ?? ? ?refgcc_-march=nocona_-O2_-fomit-frame-pointer2019101220190816
2849391? ? ?? ? ?refgcc_-march=nocona_-O_-fomit-frame-pointer2019101220190816
2859624? ? ?? ? ?refgcc_-funroll-loops_-march=nocona_-O2_-fomit-frame-pointer2019101220190816
2868666? ? ?? ? ?refgcc_-m64_-march=core2_-msse4.1_-O2_-fomit-frame-pointer2019101220190816
2913009? ? ?? ? ?refgcc_-funroll-loops_-O_-fomit-frame-pointer2019101220190816
2917389? ? ?? ? ?refgcc_-funroll-loops_-m64_-Os_-fomit-frame-pointer2019101220190816
2921652? ? ?? ? ?refgcc_-m64_-march=nocona_-O2_-fomit-frame-pointer2019101220190816
2934000? ? ?? ? ?refgcc_-m64_-Os_-fomit-frame-pointer2019101220190816
2935731? ? ?? ? ?refgcc_-funroll-loops_-march=nocona_-Os_-fomit-frame-pointer2019101220190816
2940873? ? ?? ? ?refgcc_-m64_-march=core2_-Os_-fomit-frame-pointer2019101220190816
2954415? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=nocona_-Os_-fomit-frame-pointer2019101220190816
2965128? ? ?? ? ?refgcc_-march=barcelona_-Os_-fomit-frame-pointer2019101220190816
2967606? ? ?? ? ?refgcc_-Os_-fomit-frame-pointer2019101220190816
2968953? ? ?? ? ?refgcc_-m64_-march=nocona_-Os_-fomit-frame-pointer2019101220190816
2991537? ? ?? ? ?refgcc_-march=nocona_-Os_-fomit-frame-pointer2019101220190816
3005988? ? ?? ? ?refgcc_-m64_-march=corei7-avx_-O_-fomit-frame-pointer2019101220190816
3021414? ? ?? ? ?refgcc_-march=k8_-O_-fomit-frame-pointer2019101220190816
3025035? ? ?? ? ?refgcc_-m64_-march=core-avx-i_-Os_-fomit-frame-pointer2019101220190816
3025338? ? ?? ? ?refgcc_-m64_-march=barcelona_-Os_-fomit-frame-pointer2019101220190816
3033009? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=nocona_-O_-fomit-frame-pointer2019101220190816
3037896? ? ?? ? ?refgcc_-march=k8_-Os_-fomit-frame-pointer2019101220190816
3044574? ? ?? ? ?refgcc_-m64_-march=core2_-msse4_-Os_-fomit-frame-pointer2019101220190816
3045714? ? ?? ? ?refgcc_-m64_-march=corei7-avx_-Os_-fomit-frame-pointer2019101220190816
3048633? ? ?? ? ?refgcc_-funroll-loops_-march=barcelona_-Os_-fomit-frame-pointer2019101220190816
3058014? ? ?? ? ?refgcc_-funroll-loops_-Os_-fomit-frame-pointer2019101220190816
3061656? ? ?? ? ?refgcc_-funroll-loops_-march=k8_-Os_-fomit-frame-pointer2019101220190816
3069360? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=k8_-Os_-fomit-frame-pointer2019101220190816
3071829? ? ?? ? ?refgcc_-m64_-march=corei7_-Os_-fomit-frame-pointer2019101220190816
3077799? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=barcelona_-Os_-fomit-frame-pointer2019101220190816
3079398? ? ?? ? ?refgcc_-m64_-march=native_-mtune=native_-Os_-fomit-frame-pointer2019101220190816
3079989? ? ?? ? ?refgcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019101220190816
3085716? ? ?? ? ?refgcc_-m64_-march=core2_-msse4.1_-Os_-fomit-frame-pointer2019101220190816
3097077? ? ?? ? ?refgcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019101220190816
3161652? ? ?? ? ?refgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019101220190816
3343350? ? ?? ? ?refgcc_-m64_-march=k8_-Os_-fomit-frame-pointer2019101220190816
12731496? ? ?? ? ?refcc2019101220190816
12866145? ? ?? ? ?refgcc2019101220190816
13094745? ? ?? ? ?refgcc_-funroll-loops2019101220190816

Test failure

Implementation: avx2
Security model: unknown
Compiler: gcc -m64 -march=core-avx2 -O2 -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 6, namely:
CompilerImplementations
gcc -m64 -march=core-avx2 -O2 -fomit-frame-pointer avx2
gcc -m64 -march=core-avx2 -O -fomit-frame-pointer avx2
gcc -m64 -march=core-avx2 -Os -fomit-frame-pointer avx2
gcc -m64 -march=core-avx2 -O2 -fomit-frame-pointer ref
gcc -m64 -march=core-avx2 -O -fomit-frame-pointer ref
gcc -m64 -march=core-avx2 -Os -fomit-frame-pointer ref

Compiler output

Implementation: avx2
Security model: unknown
Compiler: cc
SABER_indcpa.c: In file included from ./polymul/toom_cook_4/toom-cook_4way.c:1:0,
SABER_indcpa.c: from SABER_indcpa.c:8:
SABER_indcpa.c: ./polymul/toom_cook_4/scm_avx.c: In function 'schoolbook_avx_new1':
SABER_indcpa.c: ./polymul/toom_cook_4/scm_avx.c:50:11: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
SABER_indcpa.c: c_avx[0] = _mm256_mullo_epi16 (a[0], b[0]);
SABER_indcpa.c: ~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:41:0,
SABER_indcpa.c: from SABER_indcpa.h:4,
SABER_indcpa.c: from SABER_indcpa.c:4:
SABER_indcpa.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avxintrin.h:1295:1: error: inlining failed in call to always_inline '_mm256_set_epi64x': target specific option mismatch
SABER_indcpa.c: _mm256_set_epi64x (long long __A, long long __B, long long __C,
SABER_indcpa.c: ^~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from ./polymul/toom_cook_4/toom-cook_4way.c:1:0,
SABER_indcpa.c: from SABER_indcpa.c:8:
SABER_indcpa.c: ./polymul/toom_cook_4/scm_avx.c:535:24: note: called from here
SABER_indcpa.c: c_avx[2*SCM_SIZE-1] = _mm256_set_epi64x(0, 0, 0, 0);
SABER_indcpa.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
SABER_indcpa.c: from SABER_indcpa.h:4,
SABER_indcpa.c: from SABER_indcpa.c:4:
SABER_indcpa.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:553:1: error: inlining failed in call to always_inline '_mm256_mullo_epi16': target specific option mismatch
SABER_indcpa.c: _mm256_mullo_epi16 (__m256i __A, __m256i __B)
SABER_indcpa.c: ^~~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from ./polymul/toom_cook_4/toom-cook_4way.c:1:0,
SABER_indcpa.c: from SABER_indcpa.c:8:
SABER_indcpa.c: ...

Number of similar (compiler,implementation) pairs: 87, namely:
CompilerImplementations
cc avx2
gcc avx2
gcc -O2 -fomit-frame-pointer avx2
gcc -O3 -fomit-frame-pointer avx2
gcc -O -fomit-frame-pointer avx2
gcc -Os -fomit-frame-pointer avx2
gcc -fno-schedule-insns -O2 -fomit-frame-pointer avx2
gcc -fno-schedule-insns -O3 -fomit-frame-pointer avx2
gcc -fno-schedule-insns -O -fomit-frame-pointer avx2
gcc -fno-schedule-insns -Os -fomit-frame-pointer avx2
gcc -funroll-loops avx2
gcc -funroll-loops -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -O -fomit-frame-pointer avx2
gcc -funroll-loops -Os -fomit-frame-pointer avx2
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer avx2
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -march=barcelona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -march=barcelona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -march=k8 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -march=k8 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -march=nocona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m64 -march=nocona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -march=barcelona -O -fomit-frame-pointer avx2
gcc -funroll-loops -march=barcelona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -march=k8 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -march=k8 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -march=k8 -O -fomit-frame-pointer avx2
gcc -funroll-loops -march=k8 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -march=nocona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -march=nocona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -march=nocona -O -fomit-frame-pointer avx2
gcc -funroll-loops -march=nocona -Os -fomit-frame-pointer avx2
gcc -m64 -O2 -fomit-frame-pointer avx2
gcc -m64 -O3 -fomit-frame-pointer avx2
gcc -m64 -O -fomit-frame-pointer avx2
gcc -m64 -Os -fomit-frame-pointer avx2
gcc -m64 -march=core2 -O2 -fomit-frame-pointer avx2
gcc -m64 -march=core2 -O3 -fomit-frame-pointer avx2
gcc -m64 -march=core2 -O -fomit-frame-pointer avx2
gcc -m64 -march=core2 -Os -fomit-frame-pointer avx2
gcc -m64 -march=core2 -msse4.1 -O2 -fomit-frame-pointer avx2
gcc -m64 -march=core2 -msse4.1 -O3 -fomit-frame-pointer avx2
gcc -m64 -march=core2 -msse4.1 -O -fomit-frame-pointer avx2
gcc -m64 -march=core2 -msse4.1 -Os -fomit-frame-pointer avx2
gcc -m64 -march=core2 -msse4 -O2 -fomit-frame-pointer avx2
gcc -m64 -march=core2 -msse4 -O3 -fomit-frame-pointer avx2
gcc -m64 -march=core2 -msse4 -O -fomit-frame-pointer avx2
gcc -m64 -march=core2 -msse4 -Os -fomit-frame-pointer avx2
gcc -m64 -march=corei7 -O2 -fomit-frame-pointer avx2
gcc -m64 -march=corei7 -O3 -fomit-frame-pointer avx2
gcc -m64 -march=corei7 -O -fomit-frame-pointer avx2
gcc -m64 -march=corei7 -Os -fomit-frame-pointer avx2
gcc -m64 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -m64 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -m64 -march=k8 -O -fomit-frame-pointer avx2
gcc -m64 -march=k8 -Os -fomit-frame-pointer avx2
gcc -m64 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -m64 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -m64 -march=nocona -O -fomit-frame-pointer avx2
gcc -m64 -march=nocona -Os -fomit-frame-pointer avx2
gcc -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -march=barcelona -O -fomit-frame-pointer avx2
gcc -march=barcelona -Os -fomit-frame-pointer avx2
gcc -march=k8 -O2 -fomit-frame-pointer avx2
gcc -march=k8 -O3 -fomit-frame-pointer avx2
gcc -march=k8 -O -fomit-frame-pointer avx2
gcc -march=k8 -Os -fomit-frame-pointer avx2
gcc -march=nocona -O2 -fomit-frame-pointer avx2
gcc -march=nocona -O3 -fomit-frame-pointer avx2
gcc -march=nocona -O -fomit-frame-pointer avx2
gcc -march=nocona -Os -fomit-frame-pointer avx2

Compiler output

Implementation: avx2
Security model: unknown
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
SABER_indcpa.c: In file included from SABER_indcpa.c:8:
SABER_indcpa.c: In file included from ././polymul/toom_cook_4/toom-cook_4way.c:1:
SABER_indcpa.c: ././polymul/toom_cook_4/scm_avx.c:50:13: error: always_inline function '_mm256_mullo_epi16' requires target feature 'avx2', but would be inlined into function 'schoolbook_avx_new1' that is compiled without support for 'avx2'
SABER_indcpa.c: c_avx[0] = _mm256_mullo_epi16 (a[0], b[0]);
SABER_indcpa.c: ^
SABER_indcpa.c: ././polymul/toom_cook_4/scm_avx.c:51:13: error: always_inline function '_mm256_mullo_epi16' requires target feature 'avx2', but would be inlined into function 'schoolbook_avx_new1' that is compiled without support for 'avx2'
SABER_indcpa.c: c_avx[1] = _mm256_mullo_epi16 (a[0], b[1]);
SABER_indcpa.c: ^
SABER_indcpa.c: ././polymul/toom_cook_4/scm_avx.c:52:9: error: always_inline function '_mm256_mullo_epi16' requires target feature 'avx2', but would be inlined into function 'schoolbook_avx_new1' that is compiled without support for 'avx2'
SABER_indcpa.c: temp = _mm256_mullo_epi16 (a[1], b[0]);
SABER_indcpa.c: ^
SABER_indcpa.c: ././polymul/toom_cook_4/scm_avx.c:53:13: error: always_inline function '_mm256_add_epi16' requires target feature 'avx2', but would be inlined into function 'schoolbook_avx_new1' that is compiled without support for 'avx2'
SABER_indcpa.c: c_avx[1] = _mm256_add_epi16(c_avx[1], temp);
SABER_indcpa.c: ^
SABER_indcpa.c: ././polymul/toom_cook_4/scm_avx.c:54:13: error: always_inline function '_mm256_mullo_epi16' requires target feature 'avx2', but would be inlined into function 'schoolbook_avx_new1' that is compiled without support for 'avx2'
SABER_indcpa.c: c_avx[2] = _mm256_mullo_epi16 (a[0], b[2]);
SABER_indcpa.c: ^
SABER_indcpa.c: ././polymul/toom_cook_4/scm_avx.c:55:9: error: always_inline function '_mm256_mullo_epi16' requires target feature 'avx2', but would be inlined into function 'schoolbook_avx_new1' that is compiled without support for 'avx2'
SABER_indcpa.c: temp = _mm256_mullo_epi16 (a[1], b[1]);
SABER_indcpa.c: ^
SABER_indcpa.c: ././polymul/toom_cook_4/scm_avx.c:56:13: error: always_inline function '_mm256_add_epi16' requires target feature 'avx2', but would be inlined into function 'schoolbook_avx_new1' that is compiled without support for 'avx2'
SABER_indcpa.c: c_avx[2] = _mm256_add_epi16(c_avx[2], temp);
SABER_indcpa.c: ^
SABER_indcpa.c: ././polymul/toom_cook_4/scm_avx.c:57:9: error: always_inline function '_mm256_mullo_epi16' requires target feature 'avx2', but would be inlined into function 'schoolbook_avx_new1' that is compiled without support for 'avx2'
SABER_indcpa.c: temp = _mm256_mullo_epi16 (a[2], b[0]);
SABER_indcpa.c: ...

Number of similar (compiler,implementation) pairs: 8, namely:
CompilerImplementations
clang -O3 -fomit-frame-pointer -Qunused-arguments avx2
clang -O3 -fwrapv -march=native -fomit-frame-pointer -Qunused-arguments avx2
clang -O3 -fwrapv -mavx -fomit-frame-pointer -Qunused-arguments avx2
clang -O3 -fwrapv -mavx -maes -mpclmul -fomit-frame-pointer -Qunused-arguments avx2
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments avx2
clang -mcpu=cortex-a8 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments avx2
clang -mcpu=cortex-a9 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments avx2
clang -mcpu=native -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments avx2

Compiler output

Implementation: avx2
Security model: unknown
Compiler: gcc -m64 -march=barcelona -O2 -fomit-frame-pointer
SABER_indcpa.c: In file included from ./polymul/toom_cook_4/toom-cook_4way.c:1:0,
SABER_indcpa.c: from SABER_indcpa.c:8:
SABER_indcpa.c: ./polymul/toom_cook_4/scm_avx.c: In function 'schoolbook_avx_new1':
SABER_indcpa.c: ./polymul/toom_cook_4/scm_avx.c:50:11: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
SABER_indcpa.c: c_avx[0] = _mm256_mullo_epi16 (a[0], b[0]);
SABER_indcpa.c: ~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:41:0,
SABER_indcpa.c: from SABER_indcpa.h:4,
SABER_indcpa.c: from SABER_indcpa.c:4:
SABER_indcpa.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avxintrin.h:1295:1: error: inlining failed in call to always_inline '_mm256_set_epi64x': target specific option mismatch
SABER_indcpa.c: _mm256_set_epi64x (long long __A, long long __B, long long __C,
SABER_indcpa.c: ^~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from ./polymul/toom_cook_4/toom-cook_4way.c:1:0,
SABER_indcpa.c: from SABER_indcpa.c:8:
SABER_indcpa.c: ./polymul/toom_cook_4/scm_avx.c:535:24: note: called from here
SABER_indcpa.c: c_avx[2*SCM_SIZE-1] = _mm256_set_epi64x(0, 0, 0, 0);
SABER_indcpa.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
SABER_indcpa.c: from SABER_indcpa.h:4,
SABER_indcpa.c: from SABER_indcpa.c:4:
SABER_indcpa.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:553:1: error: inlining failed in call to always_inline '_mm256_mullo_epi16': target specific option mismatch
SABER_indcpa.c: _mm256_mullo_epi16 (__m256i __A, __m256i __B)
SABER_indcpa.c: ^~~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from ./polymul/toom_cook_4/toom-cook_4way.c:1:0,
SABER_indcpa.c: from SABER_indcpa.c:8:
SABER_indcpa.c: ...
SABER_indcpa.c: In file included from ./polymul/toom_cook_4/toom-cook_4way.c:1:0,
SABER_indcpa.c: from SABER_indcpa.c:8:
SABER_indcpa.c: ./polymul/toom_cook_4/scm_avx.c: In function 'schoolbook_avx_new1':
SABER_indcpa.c: ./polymul/toom_cook_4/scm_avx.c:50:11: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
SABER_indcpa.c: c_avx[0] = _mm256_mullo_epi16 (a[0], b[0]);
SABER_indcpa.c: ~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:41:0,
SABER_indcpa.c: from SABER_indcpa.h:4,
SABER_indcpa.c: from SABER_indcpa.c:4:
SABER_indcpa.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avxintrin.h:1295:1: error: inlining failed in call to always_inline '_mm256_set_epi64x': target specific option mismatch
SABER_indcpa.c: _mm256_set_epi64x (long long __A, long long __B, long long __C,
SABER_indcpa.c: ^~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from ./polymul/toom_cook_4/toom-cook_4way.c:1:0,
SABER_indcpa.c: from SABER_indcpa.c:8:
SABER_indcpa.c: ./polymul/toom_cook_4/scm_avx.c:535:24: note: called from here
SABER_indcpa.c: c_avx[2*SCM_SIZE-1] = _mm256_set_epi64x(0, 0, 0, 0);
SABER_indcpa.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
SABER_indcpa.c: from SABER_indcpa.h:4,
SABER_indcpa.c: from SABER_indcpa.c:4:
SABER_indcpa.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:553:1: error: inlining failed in call to always_inline '_mm256_mullo_epi16': target specific option mismatch
SABER_indcpa.c: _mm256_mullo_epi16 (__m256i __A, __m256i __B)
SABER_indcpa.c: ^~~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from ./polymul/toom_cook_4/toom-cook_4way.c:1:0,
SABER_indcpa.c: from SABER_indcpa.c:8:
SABER_indcpa.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
gcc -m64 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -m64 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -m64 -march=barcelona -O -fomit-frame-pointer avx2
gcc -m64 -march=barcelona -Os -fomit-frame-pointer avx2

Compiler output

Implementation: avx2
Security model: unknown
Compiler: gcc -m64 -march=core-avx-i -O2 -fomit-frame-pointer
SABER_indcpa.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
SABER_indcpa.c: from SABER_indcpa.h:4,
SABER_indcpa.c: from SABER_indcpa.c:4:
SABER_indcpa.c: ./polymul/toom_cook_4/scm_avx.c: In function 'schoolbook_avx_new1':
SABER_indcpa.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:553:1: error: inlining failed in call to always_inline '_mm256_mullo_epi16': target specific option mismatch
SABER_indcpa.c: _mm256_mullo_epi16 (__m256i __A, __m256i __B)
SABER_indcpa.c: ^~~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from ./polymul/toom_cook_4/toom-cook_4way.c:1:0,
SABER_indcpa.c: from SABER_indcpa.c:8:
SABER_indcpa.c: ./polymul/toom_cook_4/scm_avx.c:532:14: note: called from here
SABER_indcpa.c: c_avx[30] = _mm256_mullo_epi16 (a[15], b[15]);
SABER_indcpa.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
SABER_indcpa.c: from SABER_indcpa.h:4,
SABER_indcpa.c: from SABER_indcpa.c:4:
SABER_indcpa.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:112:1: error: inlining failed in call to always_inline '_mm256_add_epi16': target specific option mismatch
SABER_indcpa.c: _mm256_add_epi16 (__m256i __A, __m256i __B)
SABER_indcpa.c: ^~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from ./polymul/toom_cook_4/toom-cook_4way.c:1:0,
SABER_indcpa.c: from SABER_indcpa.c:8:
SABER_indcpa.c: ./polymul/toom_cook_4/scm_avx.c:531:14: note: called from here
SABER_indcpa.c: c_avx[29] = _mm256_add_epi16(c_avx[29], temp);
SABER_indcpa.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
SABER_indcpa.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
SABER_indcpa.c: from SABER_indcpa.h:4,
SABER_indcpa.c: ...

Number of similar (compiler,implementation) pairs: 16, namely:
CompilerImplementations
gcc -m64 -march=core-avx-i -O2 -fomit-frame-pointer avx2
gcc -m64 -march=core-avx-i -O3 -fomit-frame-pointer avx2
gcc -m64 -march=core-avx-i -O -fomit-frame-pointer avx2
gcc -m64 -march=core-avx-i -Os -fomit-frame-pointer avx2
gcc -m64 -march=corei7-avx -O2 -fomit-frame-pointer avx2
gcc -m64 -march=corei7-avx -O3 -fomit-frame-pointer avx2
gcc -m64 -march=corei7-avx -O -fomit-frame-pointer avx2
gcc -m64 -march=corei7-avx -Os -fomit-frame-pointer avx2
gcc -m64 -march=native -mtune=native -O2 -fomit-frame-pointer avx2
gcc -m64 -march=native -mtune=native -O3 -fomit-frame-pointer avx2
gcc -m64 -march=native -mtune=native -O -fomit-frame-pointer avx2
gcc -m64 -march=native -mtune=native -Os -fomit-frame-pointer avx2
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv avx2
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv avx2
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv avx2
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv avx2

Compiler output

Implementation: ref
Security model: unknown
Compiler: cc
measure.c: /usr/bin/ld: /home/z/supercop/supercop-20190816/supercop-data/gpu/amd64/lib/fastrandombytes.o: relocation R_X86_64_32 against `.bss' can not be used when making a PIE object; recompile with -fPIC
measure.c: /usr/bin/ld: final link failed: Nonrepresentable section on output
measure.c: collect2: error: ld returned 1 exit status

Number of similar (compiler,implementation) pairs: 103, namely:
CompilerImplementations
cc ref
gcc ref
gcc -O2 -fomit-frame-pointer ref
gcc -O3 -fomit-frame-pointer ref
gcc -O -fomit-frame-pointer ref
gcc -Os -fomit-frame-pointer ref
gcc -fno-schedule-insns -O2 -fomit-frame-pointer ref
gcc -fno-schedule-insns -O3 -fomit-frame-pointer ref
gcc -fno-schedule-insns -O -fomit-frame-pointer ref
gcc -fno-schedule-insns -Os -fomit-frame-pointer ref
gcc -funroll-loops ref
gcc -funroll-loops -O2 -fomit-frame-pointer ref
gcc -funroll-loops -O3 -fomit-frame-pointer ref
gcc -funroll-loops -O -fomit-frame-pointer ref
gcc -funroll-loops -Os -fomit-frame-pointer ref
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer ref
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer ref
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer ref
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer ref
gcc -funroll-loops -m64 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m64 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m64 -O -fomit-frame-pointer ref
gcc -funroll-loops -m64 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m64 -march=barcelona -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m64 -march=barcelona -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m64 -march=barcelona -O -fomit-frame-pointer ref
gcc -funroll-loops -m64 -march=barcelona -Os -fomit-frame-pointer ref
gcc -funroll-loops -m64 -march=k8 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m64 -march=k8 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m64 -march=k8 -O -fomit-frame-pointer ref
gcc -funroll-loops -m64 -march=k8 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m64 -march=nocona -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m64 -march=nocona -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m64 -march=nocona -O -fomit-frame-pointer ref
gcc -funroll-loops -m64 -march=nocona -Os -fomit-frame-pointer ref
gcc -funroll-loops -march=barcelona -O2 -fomit-frame-pointer ref
gcc -funroll-loops -march=barcelona -O3 -fomit-frame-pointer ref
gcc -funroll-loops -march=barcelona -O -fomit-frame-pointer ref
gcc -funroll-loops -march=barcelona -Os -fomit-frame-pointer ref
gcc -funroll-loops -march=k8 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -march=k8 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -march=k8 -O -fomit-frame-pointer ref
gcc -funroll-loops -march=k8 -Os -fomit-frame-pointer ref
gcc -funroll-loops -march=nocona -O2 -fomit-frame-pointer ref
gcc -funroll-loops -march=nocona -O3 -fomit-frame-pointer ref
gcc -funroll-loops -march=nocona -O -fomit-frame-pointer ref
gcc -funroll-loops -march=nocona -Os -fomit-frame-pointer ref
gcc -m64 -O2 -fomit-frame-pointer ref
gcc -m64 -O3 -fomit-frame-pointer ref
gcc -m64 -O -fomit-frame-pointer ref
gcc -m64 -Os -fomit-frame-pointer ref
gcc -m64 -march=core-avx-i -O2 -fomit-frame-pointer ref
gcc -m64 -march=core-avx-i -O3 -fomit-frame-pointer ref
gcc -m64 -march=core-avx-i -O -fomit-frame-pointer ref
gcc -m64 -march=core-avx-i -Os -fomit-frame-pointer ref
gcc -m64 -march=core2 -O2 -fomit-frame-pointer ref
gcc -m64 -march=core2 -O3 -fomit-frame-pointer ref
gcc -m64 -march=core2 -O -fomit-frame-pointer ref
gcc -m64 -march=core2 -Os -fomit-frame-pointer ref
gcc -m64 -march=core2 -msse4.1 -O2 -fomit-frame-pointer ref
gcc -m64 -march=core2 -msse4.1 -O3 -fomit-frame-pointer ref
gcc -m64 -march=core2 -msse4.1 -O -fomit-frame-pointer ref
gcc -m64 -march=core2 -msse4.1 -Os -fomit-frame-pointer ref
gcc -m64 -march=core2 -msse4 -O2 -fomit-frame-pointer ref
gcc -m64 -march=core2 -msse4 -O3 -fomit-frame-pointer ref
gcc -m64 -march=core2 -msse4 -O -fomit-frame-pointer ref
gcc -m64 -march=core2 -msse4 -Os -fomit-frame-pointer ref
gcc -m64 -march=corei7-avx -O2 -fomit-frame-pointer ref
gcc -m64 -march=corei7-avx -O3 -fomit-frame-pointer ref
gcc -m64 -march=corei7-avx -O -fomit-frame-pointer ref
gcc -m64 -march=corei7-avx -Os -fomit-frame-pointer ref
gcc -m64 -march=corei7 -O2 -fomit-frame-pointer ref
gcc -m64 -march=corei7 -O3 -fomit-frame-pointer ref
gcc -m64 -march=corei7 -O -fomit-frame-pointer ref
gcc -m64 -march=corei7 -Os -fomit-frame-pointer ref
gcc -m64 -march=k8 -O2 -fomit-frame-pointer ref
gcc -m64 -march=k8 -O3 -fomit-frame-pointer ref
gcc -m64 -march=k8 -O -fomit-frame-pointer ref
gcc -m64 -march=k8 -Os -fomit-frame-pointer ref
gcc -m64 -march=native -mtune=native -O2 -fomit-frame-pointer ref
gcc -m64 -march=native -mtune=native -O3 -fomit-frame-pointer ref
gcc -m64 -march=native -mtune=native -O -fomit-frame-pointer ref
gcc -m64 -march=native -mtune=native -Os -fomit-frame-pointer ref
gcc -m64 -march=nocona -O2 -fomit-frame-pointer ref
gcc -m64 -march=nocona -O3 -fomit-frame-pointer ref
gcc -m64 -march=nocona -O -fomit-frame-pointer ref
gcc -m64 -march=nocona -Os -fomit-frame-pointer ref
gcc -march=barcelona -O2 -fomit-frame-pointer ref
gcc -march=barcelona -O3 -fomit-frame-pointer ref
gcc -march=barcelona -O -fomit-frame-pointer ref
gcc -march=barcelona -Os -fomit-frame-pointer ref
gcc -march=k8 -O2 -fomit-frame-pointer ref
gcc -march=k8 -O3 -fomit-frame-pointer ref
gcc -march=k8 -O -fomit-frame-pointer ref
gcc -march=k8 -Os -fomit-frame-pointer ref
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv ref
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv ref
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv ref
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv ref
gcc -march=nocona -O2 -fomit-frame-pointer ref
gcc -march=nocona -O3 -fomit-frame-pointer ref
gcc -march=nocona -O -fomit-frame-pointer ref
gcc -march=nocona -Os -fomit-frame-pointer ref

Compiler output

Implementation: ref
Security model: unknown
Compiler: gcc -m64 -march=barcelona -O2 -fomit-frame-pointer
measure.c: /usr/bin/ld: /home/z/supercop/supercop-20190816/supercop-data/gpu/amd64/lib/fastrandombytes.o: relocation R_X86_64_32 against `.bss' can not be used when making a PIE object; recompile with -fPIC
measure.c: /usr/bin/ld: final link failed: Nonrepresentable section on output
measure.c: collect2: error: ld returned 1 exit status
measure.c: /usr/bin/ld: /home/z/supercop/supercop-20190816/supercop-data/gpu/amd64/lib/fastrandombytes.o: relocation R_X86_64_32 against `.bss' can not be used when making a PIE object; recompile with -fPIC
measure.c: /usr/bin/ld: final link failed: Nonrepresentable section on output
measure.c: collect2: error: ld returned 1 exit status

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
gcc -m64 -march=barcelona -O2 -fomit-frame-pointer ref
gcc -m64 -march=barcelona -O3 -fomit-frame-pointer ref
gcc -m64 -march=barcelona -O -fomit-frame-pointer ref
gcc -m64 -march=barcelona -Os -fomit-frame-pointer ref