Implementation notes: amd64, gpu, crypto_core/inv3sntrup653

Computer: gpu
Architecture: amd64
CPU ID: GenuineIntel-000206d7-bfebfbff
SUPERCOP version: 20190816
Operation: crypto_core
Primitive: inv3sntrup653
TimeObject sizeTest sizeImplementationCompilerBenchmark dateSUPERCOP version
61227395224 0 018440 784 832refgcc_-m64_-march=core-avx-i_-O3_-fomit-frame-pointer2019082120190816
61626185224 0 018440 784 832refgcc_-m64_-march=corei7-avx_-O3_-fomit-frame-pointer2019082120190816
64925775224 0 018440 784 832refgcc_-m64_-march=native_-mtune=native_-O3_-fomit-frame-pointer2019082120190816
65620085381 0 018504 784 832refgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019082120190816
68900975538 0 018544 784 832refgcc_-m64_-march=corei7_-O3_-fomit-frame-pointer2019082120190816
69057515538 0 018632 784 832refgcc_-m64_-march=core2_-msse4.1_-O3_-fomit-frame-pointer2019082120190816
70795025538 0 018696 784 832refgcc_-m64_-march=core2_-msse4_-O3_-fomit-frame-pointer2019082120190816
73450845753 0 018904 784 832refgcc_-m64_-march=core2_-O3_-fomit-frame-pointer2019082120190816
826785915000 0 021176 784 832refgcc_-m64_-march=barcelona_-O3_-fomit-frame-pointer2019082120190816
82937515689 0 021248 784 832refgcc_-funroll-loops_-O3_-fomit-frame-pointer2019082120190816
83850337500 0 021176 784 832refgcc_-march=barcelona_-O3_-fomit-frame-pointer2019082120190816
84391245689 0 021248 784 832refgcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019082120190816
84763415346 0 018344 784 832refgcc_-m64_-march=nocona_-O3_-fomit-frame-pointer2019082120190816
84788678440 0 024592 784 832refgcc_-funroll-loops_-m64_-march=k8_-O3_-fomit-frame-pointer2019082120190816
84791805024 0 018256 784 832refgcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019082120190816
85062367420 0 020928 784 832refgcc_-m64_-march=k8_-O3_-fomit-frame-pointer2019082120190816
85732645024 0 018256 784 832refgcc_-m64_-O3_-fomit-frame-pointer2019082120190816
85749907420 0 020928 784 832refgcc_-march=k8_-O3_-fomit-frame-pointer2019082120190816
86199205346 0 018344 784 832refgcc_-march=nocona_-O3_-fomit-frame-pointer2019082120190816
86459008440 0 024592 784 832refgcc_-funroll-loops_-march=k8_-O3_-fomit-frame-pointer2019082120190816
86736455689 0 021248 784 832refgcc_-funroll-loops_-m64_-O3_-fomit-frame-pointer2019082120190816
87107718640 0 024904 784 832refgcc_-funroll-loops_-m64_-march=barcelona_-O3_-fomit-frame-pointer2019082120190816
87446418640 0 024904 784 832refgcc_-funroll-loops_-march=barcelona_-O3_-fomit-frame-pointer2019082120190816
87530815024 0 018256 784 832refgcc_-O3_-fomit-frame-pointer2019082120190816
88421926055 0 021368 784 832refgcc_-funroll-loops_-m64_-march=nocona_-O3_-fomit-frame-pointer2019082120190816
89327046055 0 021368 784 832refgcc_-funroll-loops_-march=nocona_-O3_-fomit-frame-pointer2019082120190816
183891285881 0 021565 760 1128refclang_-O3_-fwrapv_-march=native_-fomit-frame-pointer_-Qunused-arguments2019082120190816
187480395500 0 020541 760 1128refclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019082120190816
189674765500 0 020541 760 1128refclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019082120190816
189704485881 0 021565 760 1128refclang_-march=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019082120190816
227871965198 0 021933 760 776refclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019082120190816
228562205198 0 023261 760 776refclang_-mcpu=native_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019082120190816
231213765198 0 023261 760 776refclang_-mcpu=cortex-a9_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019082120190816
232499165198 0 023261 760 776refclang_-mcpu=cortex-a8_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019082120190816
322438322762 0 016845 768 832refgcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019082120190816
323430662693 0 016861 768 832refgcc_-funroll-loops_-march=k8_-O_-fomit-frame-pointer2019082120190816
327321852708 0 016693 768 832refgcc_-funroll-loops_-march=k8_-O2_-fomit-frame-pointer2019082120190816
332832852708 0 016693 768 832refgcc_-funroll-loops_-m64_-march=k8_-O2_-fomit-frame-pointer2019082120190816
335156082762 0 016845 768 832refgcc_-funroll-loops_-m64_-O2_-fomit-frame-pointer2019082120190816
338775722762 0 016845 768 832refgcc_-funroll-loops_-O2_-fomit-frame-pointer2019082120190816
340146772732 0 016861 768 832refgcc_-funroll-loops_-m64_-march=barcelona_-O2_-fomit-frame-pointer2019082120190816
344001332732 0 016861 768 832refgcc_-funroll-loops_-march=barcelona_-O2_-fomit-frame-pointer2019082120190816
357675182727 0 016917 768 832refgcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019082120190816
358005672693 0 016861 768 832refgcc_-funroll-loops_-m64_-march=k8_-O_-fomit-frame-pointer2019082120190816
362879522693 0 016677 768 832refgcc_-funroll-loops_-m64_-march=barcelona_-O_-fomit-frame-pointer2019082120190816
363792412693 0 016677 768 832refgcc_-funroll-loops_-march=barcelona_-O_-fomit-frame-pointer2019082120190816
369082132727 0 016917 768 832refgcc_-funroll-loops_-O_-fomit-frame-pointer2019082120190816
371254992727 0 016917 768 832refgcc_-funroll-loops_-m64_-O_-fomit-frame-pointer2019082120190816
40464972836 0 011645 768 832refgcc_-march=k8_-O2_-fomit-frame-pointer2019082120190816
40795644862 0 011661 768 832refgcc_-O2_-fomit-frame-pointer2019082120190816
41262623860 0 011941 768 832refgcc_-march=barcelona_-O2_-fomit-frame-pointer2019082120190816
41780955862 0 011613 768 832refgcc_-m64_-march=corei7-avx_-O2_-fomit-frame-pointer2019082120190816
41795337862 0 011621 768 832refgcc_-m64_-march=core2_-msse4.1_-O2_-fomit-frame-pointer2019082120190816
419415761720 0 011941 768 832refgcc_-m64_-march=barcelona_-O2_-fomit-frame-pointer2019082120190816
42062391862 0 011613 768 832refgcc_-m64_-march=corei7_-O2_-fomit-frame-pointer2019082120190816
42106761862 0 011621 768 832refgcc_-m64_-march=core2_-O2_-fomit-frame-pointer2019082120190816
42209556862 0 011661 768 832refgcc_-m64_-O2_-fomit-frame-pointer2019082120190816
42239264862 0 011613 768 832refgcc_-m64_-march=native_-mtune=native_-O2_-fomit-frame-pointer2019082120190816
42244380862 0 011621 768 832refgcc_-m64_-march=core2_-msse4_-O2_-fomit-frame-pointer2019082120190816
42416808862 0 011613 768 832refgcc_-m64_-march=core-avx-i_-O2_-fomit-frame-pointer2019082120190816
42617637862 0 011613 768 832refgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019082120190816
42762224836 0 011645 768 832refgcc_-m64_-march=k8_-O2_-fomit-frame-pointer2019082120190816
43089866862 0 011661 768 832refgcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019082120190816
43332354845 0 011565 768 832refgcc_-march=barcelona_-O_-fomit-frame-pointer2019082120190816
43494600860 0 011597 768 832refgcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019082120190816
43841274845 0 011637 768 832refgcc_-m64_-march=k8_-O_-fomit-frame-pointer2019082120190816
43981092860 0 011597 768 832refgcc_-O_-fomit-frame-pointer2019082120190816
44123833860 0 011549 768 832refgcc_-m64_-march=core2_-msse4.1_-O_-fomit-frame-pointer2019082120190816
44166290860 0 011597 768 832refgcc_-m64_-O_-fomit-frame-pointer2019082120190816
44180441860 0 011549 768 832refgcc_-m64_-march=core2_-O_-fomit-frame-pointer2019082120190816
44211148860 0 011549 768 832refgcc_-m64_-march=core-avx-i_-O_-fomit-frame-pointer2019082120190816
44333850860 0 011549 768 832refgcc_-m64_-march=core2_-msse4_-O_-fomit-frame-pointer2019082120190816
44430216860 0 011549 768 832refgcc_-m64_-march=corei7_-O_-fomit-frame-pointer2019082120190816
44430416860 0 011549 768 832refgcc_-m64_-march=corei7-avx_-O_-fomit-frame-pointer2019082120190816
44467605860 0 011549 768 832refgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019082120190816
44544640860 0 011549 768 832refgcc_-m64_-march=native_-mtune=native_-O_-fomit-frame-pointer2019082120190816
446713581690 0 011565 768 832refgcc_-m64_-march=barcelona_-O_-fomit-frame-pointer2019082120190816
44921055845 0 011637 768 832refgcc_-march=k8_-O_-fomit-frame-pointer2019082120190816
46119600742 0 010505 752 800refgcc_-m64_-march=nocona_-Os_-fomit-frame-pointer2019082120190816
46375050742 0 010505 752 800refgcc_-m64_-march=core2_-Os_-fomit-frame-pointer2019082120190816
46522749766 0 010561 752 800refgcc_-funroll-loops_-Os_-fomit-frame-pointer2019082120190816
46630805766 0 010561 752 800refgcc_-funroll-loops_-march=barcelona_-Os_-fomit-frame-pointer2019082120190816
468136651484 0 010505 752 800refgcc_-m64_-march=barcelona_-Os_-fomit-frame-pointer2019082120190816
46834136742 0 010505 752 800refgcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019082120190816
47199100742 0 010505 752 800refgcc_-m64_-march=core2_-msse4_-Os_-fomit-frame-pointer2019082120190816
47209656742 0 010505 752 800refgcc_-m64_-march=corei7_-Os_-fomit-frame-pointer2019082120190816
47309419742 0 010505 752 800refgcc_-m64_-march=core2_-msse4.1_-Os_-fomit-frame-pointer2019082120190816
47325876766 0 010561 752 800refgcc_-funroll-loops_-m64_-Os_-fomit-frame-pointer2019082120190816
47382764742 0 010505 752 800refgcc_-m64_-Os_-fomit-frame-pointer2019082120190816
47444915742 0 010505 752 800refgcc_-march=barcelona_-Os_-fomit-frame-pointer2019082120190816
47448204742 0 010521 752 800refgcc_-m64_-march=core-avx-i_-Os_-fomit-frame-pointer2019082120190816
47451969742 0 010505 752 800refgcc_-m64_-march=k8_-Os_-fomit-frame-pointer2019082120190816
47505351766 0 010561 752 800refgcc_-funroll-loops_-march=k8_-Os_-fomit-frame-pointer2019082120190816
47548413742 0 010505 752 800refgcc_-march=nocona_-Os_-fomit-frame-pointer2019082120190816
47616357742 0 010521 752 800refgcc_-m64_-march=corei7-avx_-Os_-fomit-frame-pointer2019082120190816
47639745742 0 010521 752 800refgcc_-m64_-march=native_-mtune=native_-Os_-fomit-frame-pointer2019082120190816
47649041742 0 010505 752 800refgcc_-march=k8_-Os_-fomit-frame-pointer2019082120190816
47744187766 0 010561 752 800refgcc_-funroll-loops_-m64_-march=barcelona_-Os_-fomit-frame-pointer2019082120190816
47770431742 0 010505 752 800refgcc_-Os_-fomit-frame-pointer2019082120190816
47778824766 0 010561 752 800refgcc_-funroll-loops_-march=nocona_-Os_-fomit-frame-pointer2019082120190816
47833233766 0 010561 752 800refgcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019082120190816
47995736740 0 010505 752 800refgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019082120190816
48046888766 0 010561 752 800refgcc_-funroll-loops_-m64_-march=nocona_-Os_-fomit-frame-pointer2019082120190816
494025002494 0 016709 768 832refgcc_-funroll-loops_-m64_-march=nocona_-O_-fomit-frame-pointer2019082120190816
495511132494 0 016709 768 832refgcc_-funroll-loops_-march=nocona_-O_-fomit-frame-pointer2019082120190816
49917591766 0 010561 752 800refgcc_-funroll-loops_-m64_-march=k8_-Os_-fomit-frame-pointer2019082120190816
51077560817 0 011365 768 832refgcc_-march=nocona_-O2_-fomit-frame-pointer2019082120190816
51177258817 0 011365 768 832refgcc_-m64_-march=nocona_-O2_-fomit-frame-pointer2019082120190816
525426242516 0 016301 768 832refgcc_-funroll-loops_-march=nocona_-O2_-fomit-frame-pointer2019082120190816
52818759888 0 011741 768 832refgcc_-m64_-march=nocona_-O_-fomit-frame-pointer2019082120190816
535898402516 0 016301 768 832refgcc_-funroll-loops_-m64_-march=nocona_-O2_-fomit-frame-pointer2019082120190816
53744740888 0 011741 768 832refgcc_-march=nocona_-O_-fomit-frame-pointer2019082120190816
979538551640 0 013718 760 792refgcc_-funroll-loops2019082120190816
1091697361640 0 013718 760 792refcc2019082120190816
1105495761640 0 013718 760 792refgcc2019082120190816

Test failure

Implementation: avx
Security model: unknown
Compiler: gcc -m64 -march=core-avx2 -O2 -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 6, namely:
CompilerImplementations
gcc -m64 -march=core-avx2 -O2 -fomit-frame-pointer avx
gcc -m64 -march=core-avx2 -O -fomit-frame-pointer avx
gcc -m64 -march=core-avx2 -Os -fomit-frame-pointer avx
gcc -m64 -march=core-avx2 -O2 -fomit-frame-pointer ref
gcc -m64 -march=core-avx2 -O -fomit-frame-pointer ref
gcc -m64 -march=core-avx2 -Os -fomit-frame-pointer ref

Compiler output

Implementation: avx
Security model: unknown
Compiler: cc
r3_recip.c: r3_recip.c: In function 'vec256_frombits':
r3_recip.c: r3_recip.c:30:12: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
r3_recip.c: vec256 b0 = _mm256_loadu_si256((vec256 *) b); b += 32; /* 0,1,...,31 */
r3_recip.c: ^~
r3_recip.c: r3_recip.c: In function 'vec256_swap':
r3_recip.c: r3_recip.c:178:20: note: The ABI for passing parameters with 32-byte alignment has changed in GCC 4.6
r3_recip.c: static inline void vec256_swap(vec256 *f,vec256 *g,int len,vec256 mask)
r3_recip.c: ^~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:41:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: r3_recip.c: In function 'vec256_bit0mask':
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avxintrin.h:1459:1: error: inlining failed in call to always_inline '_mm256_castsi256_si128': target specific option mismatch
r3_recip.c: _mm256_castsi256_si128 (__m256i __A)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:230:12: note: called from here
r3_recip.c: return -(_mm_cvtsi128_si32(_mm256_castsi256_si128(f[0])) & 1);
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~

Number of similar (compiler,implementation) pairs: 3, namely:
CompilerImplementations
cc avx
gcc avx
gcc -funroll-loops avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
r3_recip.c: r3_recip.c:362:11: error: always_inline function '_mm256_set_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup653_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F0[0] = _mm256_set_epi32(0,0,0,0,0,0,0,1);
r3_recip.c: ^
r3_recip.c: r3_recip.c:363:11: error: always_inline function '_mm256_set1_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup653_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F0[1] = _mm256_set1_epi32(0);
r3_recip.c: ^
r3_recip.c: r3_recip.c:364:11: error: always_inline function '_mm256_set_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup653_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F0[2] = _mm256_set_epi32(0,0,0,0,8,0,8,0);
r3_recip.c: ^
r3_recip.c: r3_recip.c:365:11: error: always_inline function '_mm256_set1_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup653_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F1[0] = _mm256_set1_epi32(0);
r3_recip.c: ^
r3_recip.c: r3_recip.c:366:11: error: always_inline function '_mm256_set1_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup653_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F1[1] = _mm256_set1_epi32(0);
r3_recip.c: ^
r3_recip.c: r3_recip.c:367:11: error: always_inline function '_mm256_set_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup653_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F1[2] = _mm256_set_epi32(0,0,0,0,8,0,8,0);
r3_recip.c: ^
r3_recip.c: r3_recip.c:369:11: error: always_inline function '_mm256_set1_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup653_avx' that is compiled without support for 'sse4.2'
r3_recip.c: V0[0] = _mm256_set1_epi32(0);
r3_recip.c: ^
r3_recip.c: r3_recip.c:370:11: error: always_inline function '_mm256_set1_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup653_avx' that is compiled without support for 'sse4.2'
r3_recip.c: V1[0] = _mm256_set1_epi32(0);
r3_recip.c: ^
r3_recip.c: r3_recip.c:371:11: error: always_inline function '_mm256_set1_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup653_avx' that is compiled without support for 'sse4.2'
r3_recip.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
clang -O3 -fomit-frame-pointer -Qunused-arguments avx
clang -mcpu=cortex-a8 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments avx
clang -mcpu=cortex-a9 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments avx
clang -mcpu=native -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: clang -O3 -fwrapv -march=native -fomit-frame-pointer -Qunused-arguments
r3_recip.c: r3_recip.c:39:17: error: always_inline function '_mm256_unpacklo_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c0 = _mm256_unpacklo_epi32(b0,b1); /* 0 1 2 3 32 33 34 35 4 5 6 7 36 37 38 39 ... 55 */
r3_recip.c: ^
r3_recip.c: r3_recip.c:40:17: error: always_inline function '_mm256_unpackhi_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c1 = _mm256_unpackhi_epi32(b0,b1); /* 8 9 10 11 40 41 42 43 ... 63 */
r3_recip.c: ^
r3_recip.c: r3_recip.c:41:17: error: always_inline function '_mm256_unpacklo_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c2 = _mm256_unpacklo_epi32(b2,b3);
r3_recip.c: ^
r3_recip.c: r3_recip.c:42:17: error: always_inline function '_mm256_unpackhi_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c3 = _mm256_unpackhi_epi32(b2,b3);
r3_recip.c: ^
r3_recip.c: r3_recip.c:43:17: error: always_inline function '_mm256_unpacklo_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c4 = _mm256_unpacklo_epi32(b4,b5);
r3_recip.c: ^
r3_recip.c: r3_recip.c:44:17: error: always_inline function '_mm256_unpackhi_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c5 = _mm256_unpackhi_epi32(b4,b5);
r3_recip.c: ^
r3_recip.c: r3_recip.c:45:17: error: always_inline function '_mm256_unpacklo_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c6 = _mm256_unpacklo_epi32(b6,b7);
r3_recip.c: ^
r3_recip.c: r3_recip.c:46:17: error: always_inline function '_mm256_unpackhi_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c7 = _mm256_unpackhi_epi32(b6,b7);
r3_recip.c: ^
r3_recip.c: r3_recip.c:48:22: error: always_inline function '_mm256_slli_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
clang -O3 -fwrapv -march=native -fomit-frame-pointer -Qunused-arguments avx
clang -O3 -fwrapv -mavx -fomit-frame-pointer -Qunused-arguments avx
clang -O3 -fwrapv -mavx -maes -mpclmul -fomit-frame-pointer -Qunused-arguments avx
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: gcc -O2 -fomit-frame-pointer
r3_recip.c: r3_recip.c: In function 'crypto_core_inv3sntrup653_avx':
r3_recip.c: r3_recip.c:362:9: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
r3_recip.c: F0[0] = _mm256_set_epi32(0,0,0,0,0,0,0,1);
r3_recip.c: ~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c: In function 'vec256_swap':
r3_recip.c: r3_recip.c:178:20: note: The ABI for passing parameters with 32-byte alignment has changed in GCC 4.6
r3_recip.c: static inline void vec256_swap(vec256 *f,vec256 *g,int len,vec256 mask)
r3_recip.c: ^~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: r3_recip.c: In function 'vec256_frombits':
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:597:1: error: inlining failed in call to always_inline '_mm256_shuffle_epi32': target specific option mismatch
r3_recip.c: _mm256_shuffle_epi32 (__m256i __A, const int __mask)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:69:7: note: called from here
r3_recip.c: h = _mm256_shuffle_epi32(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:1068:1: error: inlining failed in call to always_inline '_mm256_permute4x64_epi64': target specific option mismatch
r3_recip.c: _mm256_permute4x64_epi64 (__m256i __X, const int __M)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:68:7: note: called from here
r3_recip.c: h = _mm256_permute4x64_epi64(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: ...

Number of similar (compiler,implementation) pairs: 84, namely:
CompilerImplementations
gcc -O2 -fomit-frame-pointer avx
gcc -O3 -fomit-frame-pointer avx
gcc -O -fomit-frame-pointer avx
gcc -Os -fomit-frame-pointer avx
gcc -fno-schedule-insns -O2 -fomit-frame-pointer avx
gcc -fno-schedule-insns -O3 -fomit-frame-pointer avx
gcc -fno-schedule-insns -O -fomit-frame-pointer avx
gcc -fno-schedule-insns -Os -fomit-frame-pointer avx
gcc -funroll-loops -O2 -fomit-frame-pointer avx
gcc -funroll-loops -O3 -fomit-frame-pointer avx
gcc -funroll-loops -O -fomit-frame-pointer avx
gcc -funroll-loops -Os -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer avx
gcc -funroll-loops -m64 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -O -fomit-frame-pointer avx
gcc -funroll-loops -m64 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=barcelona -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=barcelona -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=barcelona -O -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=barcelona -Os -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=k8 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=k8 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=k8 -O -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=k8 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=nocona -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=nocona -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=nocona -O -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=nocona -Os -fomit-frame-pointer avx
gcc -funroll-loops -march=barcelona -O2 -fomit-frame-pointer avx
gcc -funroll-loops -march=barcelona -O3 -fomit-frame-pointer avx
gcc -funroll-loops -march=barcelona -O -fomit-frame-pointer avx
gcc -funroll-loops -march=barcelona -Os -fomit-frame-pointer avx
gcc -funroll-loops -march=k8 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -march=k8 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -march=k8 -O -fomit-frame-pointer avx
gcc -funroll-loops -march=k8 -Os -fomit-frame-pointer avx
gcc -funroll-loops -march=nocona -O2 -fomit-frame-pointer avx
gcc -funroll-loops -march=nocona -O3 -fomit-frame-pointer avx
gcc -funroll-loops -march=nocona -O -fomit-frame-pointer avx
gcc -funroll-loops -march=nocona -Os -fomit-frame-pointer avx
gcc -m64 -O2 -fomit-frame-pointer avx
gcc -m64 -O3 -fomit-frame-pointer avx
gcc -m64 -O -fomit-frame-pointer avx
gcc -m64 -Os -fomit-frame-pointer avx
gcc -m64 -march=core2 -O2 -fomit-frame-pointer avx
gcc -m64 -march=core2 -O3 -fomit-frame-pointer avx
gcc -m64 -march=core2 -O -fomit-frame-pointer avx
gcc -m64 -march=core2 -Os -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4.1 -O2 -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4.1 -O3 -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4.1 -O -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4.1 -Os -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4 -O2 -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4 -O3 -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4 -O -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4 -Os -fomit-frame-pointer avx
gcc -m64 -march=corei7 -O2 -fomit-frame-pointer avx
gcc -m64 -march=corei7 -O3 -fomit-frame-pointer avx
gcc -m64 -march=corei7 -O -fomit-frame-pointer avx
gcc -m64 -march=corei7 -Os -fomit-frame-pointer avx
gcc -m64 -march=k8 -O2 -fomit-frame-pointer avx
gcc -m64 -march=k8 -O3 -fomit-frame-pointer avx
gcc -m64 -march=k8 -O -fomit-frame-pointer avx
gcc -m64 -march=k8 -Os -fomit-frame-pointer avx
gcc -m64 -march=nocona -O2 -fomit-frame-pointer avx
gcc -m64 -march=nocona -O3 -fomit-frame-pointer avx
gcc -m64 -march=nocona -O -fomit-frame-pointer avx
gcc -m64 -march=nocona -Os -fomit-frame-pointer avx
gcc -march=barcelona -O2 -fomit-frame-pointer avx
gcc -march=barcelona -O3 -fomit-frame-pointer avx
gcc -march=barcelona -O -fomit-frame-pointer avx
gcc -march=barcelona -Os -fomit-frame-pointer avx
gcc -march=k8 -O2 -fomit-frame-pointer avx
gcc -march=k8 -O3 -fomit-frame-pointer avx
gcc -march=k8 -O -fomit-frame-pointer avx
gcc -march=k8 -Os -fomit-frame-pointer avx
gcc -march=nocona -O2 -fomit-frame-pointer avx
gcc -march=nocona -O3 -fomit-frame-pointer avx
gcc -march=nocona -O -fomit-frame-pointer avx
gcc -march=nocona -Os -fomit-frame-pointer avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: gcc -m64 -march=barcelona -O2 -fomit-frame-pointer
r3_recip.c: r3_recip.c: In function 'crypto_core_inv3sntrup653_avx':
r3_recip.c: r3_recip.c:362:9: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
r3_recip.c: F0[0] = _mm256_set_epi32(0,0,0,0,0,0,0,1);
r3_recip.c: ~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c: In function 'vec256_swap':
r3_recip.c: r3_recip.c:178:20: note: The ABI for passing parameters with 32-byte alignment has changed in GCC 4.6
r3_recip.c: static inline void vec256_swap(vec256 *f,vec256 *g,int len,vec256 mask)
r3_recip.c: ^~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: r3_recip.c: In function 'vec256_frombits':
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:597:1: error: inlining failed in call to always_inline '_mm256_shuffle_epi32': target specific option mismatch
r3_recip.c: _mm256_shuffle_epi32 (__m256i __A, const int __mask)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:69:7: note: called from here
r3_recip.c: h = _mm256_shuffle_epi32(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:1068:1: error: inlining failed in call to always_inline '_mm256_permute4x64_epi64': target specific option mismatch
r3_recip.c: _mm256_permute4x64_epi64 (__m256i __X, const int __M)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:68:7: note: called from here
r3_recip.c: h = _mm256_permute4x64_epi64(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: ...
r3_recip.c: r3_recip.c: In function 'crypto_core_inv3sntrup653_avx':
r3_recip.c: r3_recip.c:362:9: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
r3_recip.c: F0[0] = _mm256_set_epi32(0,0,0,0,0,0,0,1);
r3_recip.c: ~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c: In function 'vec256_swap':
r3_recip.c: r3_recip.c:178:20: note: The ABI for passing parameters with 32-byte alignment has changed in GCC 4.6
r3_recip.c: static inline void vec256_swap(vec256 *f,vec256 *g,int len,vec256 mask)
r3_recip.c: ^~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: r3_recip.c: In function 'vec256_frombits':
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:597:1: error: inlining failed in call to always_inline '_mm256_shuffle_epi32': target specific option mismatch
r3_recip.c: _mm256_shuffle_epi32 (__m256i __A, const int __mask)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:69:7: note: called from here
r3_recip.c: h = _mm256_shuffle_epi32(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:1068:1: error: inlining failed in call to always_inline '_mm256_permute4x64_epi64': target specific option mismatch
r3_recip.c: _mm256_permute4x64_epi64 (__m256i __X, const int __M)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:68:7: note: called from here
r3_recip.c: h = _mm256_permute4x64_epi64(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
gcc -m64 -march=barcelona -O2 -fomit-frame-pointer avx
gcc -m64 -march=barcelona -O3 -fomit-frame-pointer avx
gcc -m64 -march=barcelona -O -fomit-frame-pointer avx
gcc -m64 -march=barcelona -Os -fomit-frame-pointer avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: gcc -m64 -march=core-avx-i -O2 -fomit-frame-pointer
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: r3_recip.c: In function 'vec256_frombits':
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:597:1: error: inlining failed in call to always_inline '_mm256_shuffle_epi32': target specific option mismatch
r3_recip.c: _mm256_shuffle_epi32 (__m256i __A, const int __mask)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:69:7: note: called from here
r3_recip.c: h = _mm256_shuffle_epi32(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:1068:1: error: inlining failed in call to always_inline '_mm256_permute4x64_epi64': target specific option mismatch
r3_recip.c: _mm256_permute4x64_epi64 (__m256i __X, const int __M)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:68:7: note: called from here
r3_recip.c: h = _mm256_permute4x64_epi64(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:588:1: error: inlining failed in call to always_inline '_mm256_shuffle_epi8': target specific option mismatch
r3_recip.c: _mm256_shuffle_epi8 (__m256i __X, __m256i __Y)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:67:7: note: called from here
r3_recip.c: h = _mm256_shuffle_epi8(h,TRANSPOSE);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: ...

Number of similar (compiler,implementation) pairs: 16, namely:
CompilerImplementations
gcc -m64 -march=core-avx-i -O2 -fomit-frame-pointer avx
gcc -m64 -march=core-avx-i -O3 -fomit-frame-pointer avx
gcc -m64 -march=core-avx-i -O -fomit-frame-pointer avx
gcc -m64 -march=core-avx-i -Os -fomit-frame-pointer avx
gcc -m64 -march=corei7-avx -O2 -fomit-frame-pointer avx
gcc -m64 -march=corei7-avx -O3 -fomit-frame-pointer avx
gcc -m64 -march=corei7-avx -O -fomit-frame-pointer avx
gcc -m64 -march=corei7-avx -Os -fomit-frame-pointer avx
gcc -m64 -march=native -mtune=native -O2 -fomit-frame-pointer avx
gcc -m64 -march=native -mtune=native -O3 -fomit-frame-pointer avx
gcc -m64 -march=native -mtune=native -O -fomit-frame-pointer avx
gcc -m64 -march=native -mtune=native -Os -fomit-frame-pointer avx
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv avx
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv avx
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv avx
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv avx