Implementation notes: amd64, gpu, crypto_core/inv3sntrup857

Computer: gpu
Architecture: amd64
CPU ID: GenuineIntel-000206d7-bfebfbff
SUPERCOP version: 20190816
Operation: crypto_core
Primitive: inv3sntrup857
TimeObject sizeTest sizeImplementationCompilerBenchmark dateSUPERCOP version
100395904341 0 017560 784 832refgcc_-m64_-march=corei7-avx_-O3_-fomit-frame-pointer2019082120190816
101116714341 0 017560 784 832refgcc_-m64_-march=core-avx-i_-O3_-fomit-frame-pointer2019082120190816
101458354410 0 017544 784 832refgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019082120190816
102781624341 0 017560 784 832refgcc_-m64_-march=native_-mtune=native_-O3_-fomit-frame-pointer2019082120190816
111824794548 0 017640 784 832refgcc_-m64_-march=core2_-msse4.1_-O3_-fomit-frame-pointer2019082120190816
113898964548 0 017704 784 832refgcc_-m64_-march=core2_-msse4_-O3_-fomit-frame-pointer2019082120190816
114882874548 0 017552 784 832refgcc_-m64_-march=corei7_-O3_-fomit-frame-pointer2019082120190816
118917994745 0 017896 784 832refgcc_-m64_-march=core2_-O3_-fomit-frame-pointer2019082120190816
137127607501 0 023768 784 832refgcc_-funroll-loops_-m64_-march=barcelona_-O3_-fomit-frame-pointer2019082120190816
137934304120 0 017344 784 832refgcc_-O3_-fomit-frame-pointer2019082120190816
138652744120 0 017344 784 832refgcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019082120190816
1387939213208 0 020280 784 832refgcc_-m64_-march=barcelona_-O3_-fomit-frame-pointer2019082120190816
138819757341 0 023504 784 832refgcc_-funroll-loops_-m64_-march=k8_-O3_-fomit-frame-pointer2019082120190816
138873484342 0 017352 784 832refgcc_-m64_-march=nocona_-O3_-fomit-frame-pointer2019082120190816
139449014120 0 017344 784 832refgcc_-m64_-O3_-fomit-frame-pointer2019082120190816
140535814342 0 017352 784 832refgcc_-march=nocona_-O3_-fomit-frame-pointer2019082120190816
140700756564 0 020064 784 832refgcc_-march=k8_-O3_-fomit-frame-pointer2019082120190816
141181834658 0 020208 784 832refgcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019082120190816
141315874658 0 020208 784 832refgcc_-funroll-loops_-m64_-O3_-fomit-frame-pointer2019082120190816
141719826564 0 020064 784 832refgcc_-m64_-march=k8_-O3_-fomit-frame-pointer2019082120190816
141861697501 0 023768 784 832refgcc_-funroll-loops_-march=barcelona_-O3_-fomit-frame-pointer2019082120190816
142073106604 0 020280 784 832refgcc_-march=barcelona_-O3_-fomit-frame-pointer2019082120190816
142210137341 0 023504 784 832refgcc_-funroll-loops_-march=k8_-O3_-fomit-frame-pointer2019082120190816
142769404916 0 020232 784 832refgcc_-funroll-loops_-m64_-march=nocona_-O3_-fomit-frame-pointer2019082120190816
144158134658 0 020208 784 832refgcc_-funroll-loops_-O3_-fomit-frame-pointer2019082120190816
144598774916 0 020232 784 832refgcc_-funroll-loops_-march=nocona_-O3_-fomit-frame-pointer2019082120190816
310468294694 0 020365 760 1128refclang_-O3_-fwrapv_-march=native_-fomit-frame-pointer_-Qunused-arguments2019082120190816
320097095996 0 021037 760 1128refclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019082120190816
320184294694 0 020365 760 1128refclang_-march=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019082120190816
321638535996 0 021037 760 1128refclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019082120190816
385737155393 0 022125 760 776refclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019082120190816
388969295393 0 023453 760 776refclang_-mcpu=cortex-a9_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019082120190816
392457275393 0 023453 760 776refclang_-mcpu=native_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019082120190816
399353045393 0 023453 760 776refclang_-mcpu=cortex-a8_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019082120190816
528164852652 0 016645 768 832refgcc_-funroll-loops_-m64_-march=k8_-O2_-fomit-frame-pointer2019082120190816
545063602714 0 016797 768 832refgcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019082120190816
560971922668 0 016797 768 832refgcc_-funroll-loops_-m64_-march=barcelona_-O2_-fomit-frame-pointer2019082120190816
571557362714 0 016797 768 832refgcc_-funroll-loops_-O2_-fomit-frame-pointer2019082120190816
573261842668 0 016797 768 832refgcc_-funroll-loops_-march=barcelona_-O2_-fomit-frame-pointer2019082120190816
587593412652 0 016645 768 832refgcc_-funroll-loops_-march=k8_-O2_-fomit-frame-pointer2019082120190816
591618002634 0 016613 768 832refgcc_-funroll-loops_-march=barcelona_-O_-fomit-frame-pointer2019082120190816
593150232714 0 016797 768 832refgcc_-funroll-loops_-m64_-O2_-fomit-frame-pointer2019082120190816
593156762634 0 016813 768 832refgcc_-funroll-loops_-march=k8_-O_-fomit-frame-pointer2019082120190816
596798762634 0 016613 768 832refgcc_-funroll-loops_-m64_-march=barcelona_-O_-fomit-frame-pointer2019082120190816
611525562670 0 016853 768 832refgcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019082120190816
624059642670 0 016853 768 832refgcc_-funroll-loops_-O_-fomit-frame-pointer2019082120190816
630824492670 0 016853 768 832refgcc_-funroll-loops_-m64_-O_-fomit-frame-pointer2019082120190816
631949852634 0 016813 768 832refgcc_-funroll-loops_-m64_-march=k8_-O_-fomit-frame-pointer2019082120190816
68979417862 0 011613 768 832refgcc_-m64_-march=corei7-avx_-O2_-fomit-frame-pointer2019082120190816
69342042862 0 011661 768 832refgcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019082120190816
71254083836 0 011645 768 832refgcc_-m64_-march=k8_-O2_-fomit-frame-pointer2019082120190816
71336985862 0 011661 768 832refgcc_-m64_-O2_-fomit-frame-pointer2019082120190816
71346636836 0 011645 768 832refgcc_-march=k8_-O2_-fomit-frame-pointer2019082120190816
71542401862 0 011621 768 832refgcc_-m64_-march=core2_-msse4.1_-O2_-fomit-frame-pointer2019082120190816
71903949862 0 011621 768 832refgcc_-m64_-march=core2_-O2_-fomit-frame-pointer2019082120190816
72040737860 0 011941 768 832refgcc_-march=barcelona_-O2_-fomit-frame-pointer2019082120190816
72082160860 0 011549 768 832refgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019082120190816
720845131720 0 011941 768 832refgcc_-m64_-march=barcelona_-O2_-fomit-frame-pointer2019082120190816
72124815862 0 011613 768 832refgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019082120190816
72169911862 0 011621 768 832refgcc_-m64_-march=core2_-msse4_-O2_-fomit-frame-pointer2019082120190816
72172137862 0 011613 768 832refgcc_-m64_-march=core-avx-i_-O2_-fomit-frame-pointer2019082120190816
72232164862 0 011613 768 832refgcc_-m64_-march=native_-mtune=native_-O2_-fomit-frame-pointer2019082120190816
72246840862 0 011613 768 832refgcc_-m64_-march=corei7_-O2_-fomit-frame-pointer2019082120190816
72483198862 0 011661 768 832refgcc_-O2_-fomit-frame-pointer2019082120190816
72767547860 0 011549 768 832refgcc_-m64_-march=core-avx-i_-O_-fomit-frame-pointer2019082120190816
73224240845 0 011565 768 832refgcc_-march=barcelona_-O_-fomit-frame-pointer2019082120190816
74778471860 0 011549 768 832refgcc_-m64_-march=native_-mtune=native_-O_-fomit-frame-pointer2019082120190816
74823732860 0 011549 768 832refgcc_-m64_-march=corei7_-O_-fomit-frame-pointer2019082120190816
75289659860 0 011549 768 832refgcc_-m64_-march=core2_-msse4_-O_-fomit-frame-pointer2019082120190816
75293994845 0 011637 768 832refgcc_-march=k8_-O_-fomit-frame-pointer2019082120190816
753094141690 0 011565 768 832refgcc_-m64_-march=barcelona_-O_-fomit-frame-pointer2019082120190816
75460893860 0 011549 768 832refgcc_-m64_-march=corei7-avx_-O_-fomit-frame-pointer2019082120190816
75523206860 0 011549 768 832refgcc_-m64_-march=core2_-O_-fomit-frame-pointer2019082120190816
75646956860 0 011549 768 832refgcc_-m64_-march=core2_-msse4.1_-O_-fomit-frame-pointer2019082120190816
75839151845 0 011637 768 832refgcc_-m64_-march=k8_-O_-fomit-frame-pointer2019082120190816
76236201860 0 011597 768 832refgcc_-O_-fomit-frame-pointer2019082120190816
76516258860 0 011597 768 832refgcc_-m64_-O_-fomit-frame-pointer2019082120190816
76953568860 0 011597 768 832refgcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019082120190816
79204625766 0 010561 752 800refgcc_-funroll-loops_-march=barcelona_-Os_-fomit-frame-pointer2019082120190816
79635111766 0 010561 752 800refgcc_-funroll-loops_-m64_-Os_-fomit-frame-pointer2019082120190816
79694829742 0 010521 752 800refgcc_-m64_-march=core-avx-i_-Os_-fomit-frame-pointer2019082120190816
79766136742 0 010505 752 800refgcc_-m64_-march=core2_-msse4.1_-Os_-fomit-frame-pointer2019082120190816
79794627742 0 010521 752 800refgcc_-m64_-march=corei7-avx_-Os_-fomit-frame-pointer2019082120190816
79885014742 0 010521 752 800refgcc_-m64_-march=native_-mtune=native_-Os_-fomit-frame-pointer2019082120190816
79962759766 0 010561 752 800refgcc_-funroll-loops_-Os_-fomit-frame-pointer2019082120190816
80095662740 0 010505 752 800refgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019082120190816
80104248742 0 010505 752 800refgcc_-m64_-Os_-fomit-frame-pointer2019082120190816
801587761484 0 010505 752 800refgcc_-m64_-march=barcelona_-Os_-fomit-frame-pointer2019082120190816
80225865742 0 010505 752 800refgcc_-march=barcelona_-Os_-fomit-frame-pointer2019082120190816
80498205766 0 010561 752 800refgcc_-funroll-loops_-m64_-march=barcelona_-Os_-fomit-frame-pointer2019082120190816
80677401742 0 010505 752 800refgcc_-m64_-march=core2_-msse4_-Os_-fomit-frame-pointer2019082120190816
80794767742 0 010505 752 800refgcc_-m64_-march=corei7_-Os_-fomit-frame-pointer2019082120190816
81011193766 0 010561 752 800refgcc_-funroll-loops_-m64_-march=nocona_-Os_-fomit-frame-pointer2019082120190816
81036309766 0 010561 752 800refgcc_-funroll-loops_-m64_-march=k8_-Os_-fomit-frame-pointer2019082120190816
81269289742 0 010505 752 800refgcc_-m64_-march=k8_-Os_-fomit-frame-pointer2019082120190816
81413867766 0 010561 752 800refgcc_-funroll-loops_-march=k8_-Os_-fomit-frame-pointer2019082120190816
81549897742 0 010505 752 800refgcc_-m64_-march=core2_-Os_-fomit-frame-pointer2019082120190816
81554145766 0 010561 752 800refgcc_-funroll-loops_-march=nocona_-Os_-fomit-frame-pointer2019082120190816
81669260742 0 010505 752 800refgcc_-Os_-fomit-frame-pointer2019082120190816
81844443742 0 010505 752 800refgcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019082120190816
82041231742 0 010505 752 800refgcc_-march=k8_-Os_-fomit-frame-pointer2019082120190816
82065126742 0 010505 752 800refgcc_-m64_-march=nocona_-Os_-fomit-frame-pointer2019082120190816
82087342766 0 010561 752 800refgcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019082120190816
82137195742 0 010505 752 800refgcc_-march=nocona_-Os_-fomit-frame-pointer2019082120190816
85631178817 0 011365 768 832refgcc_-march=nocona_-O2_-fomit-frame-pointer2019082120190816
87687348888 0 011741 768 832refgcc_-m64_-march=nocona_-O_-fomit-frame-pointer2019082120190816
88234020817 0 011365 768 832refgcc_-m64_-march=nocona_-O2_-fomit-frame-pointer2019082120190816
882395132437 0 016645 768 832refgcc_-funroll-loops_-march=nocona_-O_-fomit-frame-pointer2019082120190816
892963502437 0 016645 768 832refgcc_-funroll-loops_-m64_-march=nocona_-O_-fomit-frame-pointer2019082120190816
89610999888 0 011741 768 832refgcc_-march=nocona_-O_-fomit-frame-pointer2019082120190816
908293442458 0 016237 768 832refgcc_-funroll-loops_-m64_-march=nocona_-O2_-fomit-frame-pointer2019082120190816
927966092458 0 016237 768 832refgcc_-funroll-loops_-march=nocona_-O2_-fomit-frame-pointer2019082120190816
1878025841640 0 013718 760 792refgcc_-funroll-loops2019082120190816
1890614101640 0 013718 760 792refcc2019082120190816
1929087771640 0 013718 760 792refgcc2019082120190816

Test failure

Implementation: avx
Security model: unknown
Compiler: gcc -m64 -march=core-avx2 -O2 -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 6, namely:
CompilerImplementations
gcc -m64 -march=core-avx2 -O2 -fomit-frame-pointer avx
gcc -m64 -march=core-avx2 -O -fomit-frame-pointer avx
gcc -m64 -march=core-avx2 -Os -fomit-frame-pointer avx
gcc -m64 -march=core-avx2 -O2 -fomit-frame-pointer ref
gcc -m64 -march=core-avx2 -O -fomit-frame-pointer ref
gcc -m64 -march=core-avx2 -Os -fomit-frame-pointer ref

Compiler output

Implementation: avx
Security model: unknown
Compiler: cc
r3_recip.c: r3_recip.c: In function 'vec256_frombits':
r3_recip.c: r3_recip.c:30:12: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
r3_recip.c: vec256 b0 = _mm256_loadu_si256((vec256 *) b); b += 32; /* 0,1,...,31 */
r3_recip.c: ^~
r3_recip.c: r3_recip.c: In function 'vec256_swap':
r3_recip.c: r3_recip.c:178:20: note: The ABI for passing parameters with 32-byte alignment has changed in GCC 4.6
r3_recip.c: static inline void vec256_swap(vec256 *f,vec256 *g,int len,vec256 mask)
r3_recip.c: ^~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:41:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: r3_recip.c: In function 'vec256_bit0mask':
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avxintrin.h:1459:1: error: inlining failed in call to always_inline '_mm256_castsi256_si128': target specific option mismatch
r3_recip.c: _mm256_castsi256_si128 (__m256i __A)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:230:12: note: called from here
r3_recip.c: return -(_mm_cvtsi128_si32(_mm256_castsi256_si128(f[0])) & 1);
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~

Number of similar (compiler,implementation) pairs: 3, namely:
CompilerImplementations
cc avx
gcc avx
gcc -funroll-loops avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
r3_recip.c: r3_recip.c:418:11: error: always_inline function '_mm256_set_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup857_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F0[0] = _mm256_set_epi32(0,0,0,0,0,0,0,1);
r3_recip.c: ^
r3_recip.c: r3_recip.c:419:11: error: always_inline function '_mm256_set1_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup857_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F0[1] = _mm256_set1_epi32(0);
r3_recip.c: ^
r3_recip.c: r3_recip.c:420:11: error: always_inline function '_mm256_set1_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup857_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F0[2] = _mm256_set1_epi32(0);
r3_recip.c: ^
r3_recip.c: r3_recip.c:421:11: error: always_inline function '_mm256_set_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup857_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F0[3] = _mm256_set_epi32(0,0,0,0,0,4194304,0,4194304);
r3_recip.c: ^
r3_recip.c: r3_recip.c:422:11: error: always_inline function '_mm256_set1_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup857_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F1[0] = _mm256_set1_epi32(0);
r3_recip.c: ^
r3_recip.c: r3_recip.c:423:11: error: always_inline function '_mm256_set1_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup857_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F1[1] = _mm256_set1_epi32(0);
r3_recip.c: ^
r3_recip.c: r3_recip.c:424:11: error: always_inline function '_mm256_set1_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup857_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F1[2] = _mm256_set1_epi32(0);
r3_recip.c: ^
r3_recip.c: r3_recip.c:425:11: error: always_inline function '_mm256_set_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup857_avx' that is compiled without support for 'sse4.2'
r3_recip.c: F1[3] = _mm256_set_epi32(0,0,0,0,0,4194304,0,4194304);
r3_recip.c: ^
r3_recip.c: r3_recip.c:427:11: error: always_inline function '_mm256_set1_epi32' requires target feature 'sse4.2', but would be inlined into function 'crypto_core_inv3sntrup857_avx' that is compiled without support for 'sse4.2'
r3_recip.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
clang -O3 -fomit-frame-pointer -Qunused-arguments avx
clang -mcpu=cortex-a8 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments avx
clang -mcpu=cortex-a9 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments avx
clang -mcpu=native -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: clang -O3 -fwrapv -march=native -fomit-frame-pointer -Qunused-arguments
r3_recip.c: r3_recip.c:39:17: error: always_inline function '_mm256_unpacklo_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c0 = _mm256_unpacklo_epi32(b0,b1); /* 0 1 2 3 32 33 34 35 4 5 6 7 36 37 38 39 ... 55 */
r3_recip.c: ^
r3_recip.c: r3_recip.c:40:17: error: always_inline function '_mm256_unpackhi_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c1 = _mm256_unpackhi_epi32(b0,b1); /* 8 9 10 11 40 41 42 43 ... 63 */
r3_recip.c: ^
r3_recip.c: r3_recip.c:41:17: error: always_inline function '_mm256_unpacklo_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c2 = _mm256_unpacklo_epi32(b2,b3);
r3_recip.c: ^
r3_recip.c: r3_recip.c:42:17: error: always_inline function '_mm256_unpackhi_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c3 = _mm256_unpackhi_epi32(b2,b3);
r3_recip.c: ^
r3_recip.c: r3_recip.c:43:17: error: always_inline function '_mm256_unpacklo_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c4 = _mm256_unpacklo_epi32(b4,b5);
r3_recip.c: ^
r3_recip.c: r3_recip.c:44:17: error: always_inline function '_mm256_unpackhi_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c5 = _mm256_unpackhi_epi32(b4,b5);
r3_recip.c: ^
r3_recip.c: r3_recip.c:45:17: error: always_inline function '_mm256_unpacklo_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c6 = _mm256_unpacklo_epi32(b6,b7);
r3_recip.c: ^
r3_recip.c: r3_recip.c:46:17: error: always_inline function '_mm256_unpackhi_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: vec256 c7 = _mm256_unpackhi_epi32(b6,b7);
r3_recip.c: ^
r3_recip.c: r3_recip.c:48:22: error: always_inline function '_mm256_slli_epi32' requires target feature 'avx2', but would be inlined into function 'vec256_frombits' that is compiled without support for 'avx2'
r3_recip.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
clang -O3 -fwrapv -march=native -fomit-frame-pointer -Qunused-arguments avx
clang -O3 -fwrapv -mavx -fomit-frame-pointer -Qunused-arguments avx
clang -O3 -fwrapv -mavx -maes -mpclmul -fomit-frame-pointer -Qunused-arguments avx
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: gcc -O2 -fomit-frame-pointer
r3_recip.c: r3_recip.c: In function 'crypto_core_inv3sntrup857_avx':
r3_recip.c: r3_recip.c:418:9: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
r3_recip.c: F0[0] = _mm256_set_epi32(0,0,0,0,0,0,0,1);
r3_recip.c: ~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c: In function 'vec256_swap':
r3_recip.c: r3_recip.c:178:20: note: The ABI for passing parameters with 32-byte alignment has changed in GCC 4.6
r3_recip.c: static inline void vec256_swap(vec256 *f,vec256 *g,int len,vec256 mask)
r3_recip.c: ^~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: r3_recip.c: In function 'vec256_frombits':
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:597:1: error: inlining failed in call to always_inline '_mm256_shuffle_epi32': target specific option mismatch
r3_recip.c: _mm256_shuffle_epi32 (__m256i __A, const int __mask)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:69:7: note: called from here
r3_recip.c: h = _mm256_shuffle_epi32(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:1068:1: error: inlining failed in call to always_inline '_mm256_permute4x64_epi64': target specific option mismatch
r3_recip.c: _mm256_permute4x64_epi64 (__m256i __X, const int __M)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:68:7: note: called from here
r3_recip.c: h = _mm256_permute4x64_epi64(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: ...

Number of similar (compiler,implementation) pairs: 84, namely:
CompilerImplementations
gcc -O2 -fomit-frame-pointer avx
gcc -O3 -fomit-frame-pointer avx
gcc -O -fomit-frame-pointer avx
gcc -Os -fomit-frame-pointer avx
gcc -fno-schedule-insns -O2 -fomit-frame-pointer avx
gcc -fno-schedule-insns -O3 -fomit-frame-pointer avx
gcc -fno-schedule-insns -O -fomit-frame-pointer avx
gcc -fno-schedule-insns -Os -fomit-frame-pointer avx
gcc -funroll-loops -O2 -fomit-frame-pointer avx
gcc -funroll-loops -O3 -fomit-frame-pointer avx
gcc -funroll-loops -O -fomit-frame-pointer avx
gcc -funroll-loops -Os -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer avx
gcc -funroll-loops -m64 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -O -fomit-frame-pointer avx
gcc -funroll-loops -m64 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=barcelona -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=barcelona -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=barcelona -O -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=barcelona -Os -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=k8 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=k8 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=k8 -O -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=k8 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=nocona -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=nocona -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=nocona -O -fomit-frame-pointer avx
gcc -funroll-loops -m64 -march=nocona -Os -fomit-frame-pointer avx
gcc -funroll-loops -march=barcelona -O2 -fomit-frame-pointer avx
gcc -funroll-loops -march=barcelona -O3 -fomit-frame-pointer avx
gcc -funroll-loops -march=barcelona -O -fomit-frame-pointer avx
gcc -funroll-loops -march=barcelona -Os -fomit-frame-pointer avx
gcc -funroll-loops -march=k8 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -march=k8 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -march=k8 -O -fomit-frame-pointer avx
gcc -funroll-loops -march=k8 -Os -fomit-frame-pointer avx
gcc -funroll-loops -march=nocona -O2 -fomit-frame-pointer avx
gcc -funroll-loops -march=nocona -O3 -fomit-frame-pointer avx
gcc -funroll-loops -march=nocona -O -fomit-frame-pointer avx
gcc -funroll-loops -march=nocona -Os -fomit-frame-pointer avx
gcc -m64 -O2 -fomit-frame-pointer avx
gcc -m64 -O3 -fomit-frame-pointer avx
gcc -m64 -O -fomit-frame-pointer avx
gcc -m64 -Os -fomit-frame-pointer avx
gcc -m64 -march=core2 -O2 -fomit-frame-pointer avx
gcc -m64 -march=core2 -O3 -fomit-frame-pointer avx
gcc -m64 -march=core2 -O -fomit-frame-pointer avx
gcc -m64 -march=core2 -Os -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4.1 -O2 -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4.1 -O3 -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4.1 -O -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4.1 -Os -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4 -O2 -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4 -O3 -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4 -O -fomit-frame-pointer avx
gcc -m64 -march=core2 -msse4 -Os -fomit-frame-pointer avx
gcc -m64 -march=corei7 -O2 -fomit-frame-pointer avx
gcc -m64 -march=corei7 -O3 -fomit-frame-pointer avx
gcc -m64 -march=corei7 -O -fomit-frame-pointer avx
gcc -m64 -march=corei7 -Os -fomit-frame-pointer avx
gcc -m64 -march=k8 -O2 -fomit-frame-pointer avx
gcc -m64 -march=k8 -O3 -fomit-frame-pointer avx
gcc -m64 -march=k8 -O -fomit-frame-pointer avx
gcc -m64 -march=k8 -Os -fomit-frame-pointer avx
gcc -m64 -march=nocona -O2 -fomit-frame-pointer avx
gcc -m64 -march=nocona -O3 -fomit-frame-pointer avx
gcc -m64 -march=nocona -O -fomit-frame-pointer avx
gcc -m64 -march=nocona -Os -fomit-frame-pointer avx
gcc -march=barcelona -O2 -fomit-frame-pointer avx
gcc -march=barcelona -O3 -fomit-frame-pointer avx
gcc -march=barcelona -O -fomit-frame-pointer avx
gcc -march=barcelona -Os -fomit-frame-pointer avx
gcc -march=k8 -O2 -fomit-frame-pointer avx
gcc -march=k8 -O3 -fomit-frame-pointer avx
gcc -march=k8 -O -fomit-frame-pointer avx
gcc -march=k8 -Os -fomit-frame-pointer avx
gcc -march=nocona -O2 -fomit-frame-pointer avx
gcc -march=nocona -O3 -fomit-frame-pointer avx
gcc -march=nocona -O -fomit-frame-pointer avx
gcc -march=nocona -Os -fomit-frame-pointer avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: gcc -m64 -march=barcelona -O2 -fomit-frame-pointer
r3_recip.c: r3_recip.c: In function 'crypto_core_inv3sntrup857_avx':
r3_recip.c: r3_recip.c:418:9: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
r3_recip.c: F0[0] = _mm256_set_epi32(0,0,0,0,0,0,0,1);
r3_recip.c: ~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c: In function 'vec256_swap':
r3_recip.c: r3_recip.c:178:20: note: The ABI for passing parameters with 32-byte alignment has changed in GCC 4.6
r3_recip.c: static inline void vec256_swap(vec256 *f,vec256 *g,int len,vec256 mask)
r3_recip.c: ^~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: r3_recip.c: In function 'vec256_frombits':
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:597:1: error: inlining failed in call to always_inline '_mm256_shuffle_epi32': target specific option mismatch
r3_recip.c: _mm256_shuffle_epi32 (__m256i __A, const int __mask)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:69:7: note: called from here
r3_recip.c: h = _mm256_shuffle_epi32(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:1068:1: error: inlining failed in call to always_inline '_mm256_permute4x64_epi64': target specific option mismatch
r3_recip.c: _mm256_permute4x64_epi64 (__m256i __X, const int __M)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:68:7: note: called from here
r3_recip.c: h = _mm256_permute4x64_epi64(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: ...
r3_recip.c: r3_recip.c: In function 'crypto_core_inv3sntrup857_avx':
r3_recip.c: r3_recip.c:418:9: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
r3_recip.c: F0[0] = _mm256_set_epi32(0,0,0,0,0,0,0,1);
r3_recip.c: ~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c: In function 'vec256_swap':
r3_recip.c: r3_recip.c:178:20: note: The ABI for passing parameters with 32-byte alignment has changed in GCC 4.6
r3_recip.c: static inline void vec256_swap(vec256 *f,vec256 *g,int len,vec256 mask)
r3_recip.c: ^~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: r3_recip.c: In function 'vec256_frombits':
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:597:1: error: inlining failed in call to always_inline '_mm256_shuffle_epi32': target specific option mismatch
r3_recip.c: _mm256_shuffle_epi32 (__m256i __A, const int __mask)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:69:7: note: called from here
r3_recip.c: h = _mm256_shuffle_epi32(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:1068:1: error: inlining failed in call to always_inline '_mm256_permute4x64_epi64': target specific option mismatch
r3_recip.c: _mm256_permute4x64_epi64 (__m256i __X, const int __M)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:68:7: note: called from here
r3_recip.c: h = _mm256_permute4x64_epi64(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
gcc -m64 -march=barcelona -O2 -fomit-frame-pointer avx
gcc -m64 -march=barcelona -O3 -fomit-frame-pointer avx
gcc -m64 -march=barcelona -O -fomit-frame-pointer avx
gcc -m64 -march=barcelona -Os -fomit-frame-pointer avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: gcc -m64 -march=core-avx-i -O2 -fomit-frame-pointer
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: r3_recip.c: In function 'vec256_frombits':
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:597:1: error: inlining failed in call to always_inline '_mm256_shuffle_epi32': target specific option mismatch
r3_recip.c: _mm256_shuffle_epi32 (__m256i __A, const int __mask)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:69:7: note: called from here
r3_recip.c: h = _mm256_shuffle_epi32(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:1068:1: error: inlining failed in call to always_inline '_mm256_permute4x64_epi64': target specific option mismatch
r3_recip.c: _mm256_permute4x64_epi64 (__m256i __X, const int __M)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:68:7: note: called from here
r3_recip.c: h = _mm256_permute4x64_epi64(h,0xd8);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
r3_recip.c: from r3_recip.c:3:
r3_recip.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:588:1: error: inlining failed in call to always_inline '_mm256_shuffle_epi8': target specific option mismatch
r3_recip.c: _mm256_shuffle_epi8 (__m256i __X, __m256i __Y)
r3_recip.c: ^~~~~~~~~~~~~~~~~~~
r3_recip.c: r3_recip.c:67:7: note: called from here
r3_recip.c: h = _mm256_shuffle_epi8(h,TRANSPOSE);
r3_recip.c: ~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
r3_recip.c: ...

Number of similar (compiler,implementation) pairs: 16, namely:
CompilerImplementations
gcc -m64 -march=core-avx-i -O2 -fomit-frame-pointer avx
gcc -m64 -march=core-avx-i -O3 -fomit-frame-pointer avx
gcc -m64 -march=core-avx-i -O -fomit-frame-pointer avx
gcc -m64 -march=core-avx-i -Os -fomit-frame-pointer avx
gcc -m64 -march=corei7-avx -O2 -fomit-frame-pointer avx
gcc -m64 -march=corei7-avx -O3 -fomit-frame-pointer avx
gcc -m64 -march=corei7-avx -O -fomit-frame-pointer avx
gcc -m64 -march=corei7-avx -Os -fomit-frame-pointer avx
gcc -m64 -march=native -mtune=native -O2 -fomit-frame-pointer avx
gcc -m64 -march=native -mtune=native -O3 -fomit-frame-pointer avx
gcc -m64 -march=native -mtune=native -O -fomit-frame-pointer avx
gcc -m64 -march=native -mtune=native -Os -fomit-frame-pointer avx
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv avx
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv avx
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv avx
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv avx