Test results for amd64, speed2supercop, crypto_core/multsntrup761

[Page version: 20250424 01:42:31]

Measurements for amd64, speed2supercop, crypto_core | Test results for amd64, speed2supercop, crypto_core | Test results for crypto_core/multsntrup761

Computer: speed2supercop
Microarchitecture: amd64; Haswell+AES (306c3)
Architecture: amd64
CPU ID: GenuineIntel-000306c3-1fc9cbf5
SUPERCOP version: 20250415
Operation: crypto_core
Primitive: multsntrup761

Time	Object size	Test size	Implementation	Compiler	Benchmark date	SUPERCOP version
18088	20428 0 0	37358 792 856	`avx`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
18200	19775 0 0	31902 792 760	`avx`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
18260	20164 0 0	37094 792 856	`avx800`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
18288	19887 0 0	32014 792 760	`avx800`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
18476	19532 0 0	36302 792 856	`avx`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
18580	19300 0 0	36070 792 856	`avx800`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
18968	17565 0 0	30655 784 856	`avx`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
19040	17468 0 0	30551 784 856	`avx800`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
19496	18103 0 0	30556 744 832	`avx800`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
19624	17628 0 0	34526 792 856	`round2`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
19756	16343 0 0	28438 792 760	`round2`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
19764	16724 0 0	33462 792 856	`round2`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
19884	18605 0 0	31052 744 832	`avx`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
20352	17140 0 0	31541 752 832	`round2`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
20372	17635 0 0	28868 736 800	`avx800`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
20440	14780 0 0	27365 752 832	`round2`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
20512	13737 0 0	26799 784 856	`round2`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
20796	14830 0 0	27300 744 832	`round2`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
20852	18045 0 0	29276 736 800	`avx`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
20896	18077 0 0	30677 752 832	`avx800`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
20904	19485 0 0	33901 752 832	`avx800`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
21140	13759 0 0	25004 736 800	`round2`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
21384	19901 0 0	34317 752 832	`avx`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
21516	18493 0 0	31093 752 832	`avx`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
30428	13058 0 0	29894 792 856	`round1`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
30916	11000 0 0	27894 792 856	`round1`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
31076	13517 0 0	27917 752 832	`round1`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
33700	9757 0 0	22357 752 832	`round1`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
34064	8487 0 0	21631 784 856	`round1`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
34324	9704 0 0	21798 792 760	`round1`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
35620	8285 0 0	19484 736 800	`round1`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
38960	9245 0 0	21773 752 832	`round1`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
187800	4040 0 0	18397 752 832	`ref`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
211772	2913 0 0	19750 792 856	`compact`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
216660	1434 0 0	15829 752 832	`compact`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
228368	2379 0 0	19262 792 856	`ref`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
232196	2914 0 0	19718 792 856	`ref`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
248912	1846 0 0	18718 792 856	`compact`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
609796	1180 0 0	19742 792 760	`compact`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
755852	2321 0 0	20878 792 760	`ref`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
968972	1214 0 0	14311 784 856	`compact`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
1081436	1000 0 0	13541 752 832	`ref`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
1098352	643 0 0	12710 792 760	`ref`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
1186444	463 0 0	12534 792 760	`compact`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
1211452	641 0 0	13783 784 856	`ref`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
1263920	463 0 0	11628 736 800	`ref`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
1370612	545 0 0	12948 744 832	`ref`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
1407028	408 0 0	11572 736 800	`compact`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
1469128	473 0 0	13029 752 832	`compact`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415
1474892	453 0 0	12868 744 832	`compact`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20250417	20250415

Compiler output

mult768.c: mult768.c:267:7: error: always_inline function '_mm256_set1_epi16' requires target feature 'avx', but would be inlined into function 'crypto_core_multsntrup761_avx_constbranchindex' that is compiled without support for 'avx'
mult768.c:   267 |   x = const_x16(0);
mult768.c:       |       ^
mult768.c: mult768.c:12:19: note: expanded from macro 'const_x16'
mult768.c:    12 | #define const_x16 _mm256_set1_epi16
mult768.c:       |                   ^
mult768.c: mult768.c:267:7: error: AVX vector return of type '__m256i' (vector of 4 'long long' values) without 'avx' enabled changes the ABI
mult768.c: mult768.c:12:19: note: expanded from macro 'const_x16'
mult768.c:    12 | #define const_x16 _mm256_set1_epi16
mult768.c:       |                   ^
mult768.c: mult768.c:268:35: error: always_inline function '_mm256_storeu_si256' requires target feature 'avx', but would be inlined into function 'crypto_core_multsntrup761_avx_constbranchindex' that is compiled without support for 'avx'
mult768.c:   268 |   for (i = p&~15;i < 768;i += 16) store_x16(&f[i],x);
mult768.c:       |                                   ^
mult768.c: mult768.c:11:24: note: expanded from macro 'store_x16'
mult768.c:    11 | #define store_x16(p,v) _mm256_storeu_si256((int16x16 *) (p),(v))
mult768.c:       |                        ^
mult768.c: mult768.c:268:35: error: AVX vector argument of type '__m256i' (vector of 4 'long long' values) without 'avx' enabled changes the ABI
mult768.c: mult768.c:11:24: note: expanded from macro 'store_x16'
mult768.c:    11 | #define store_x16(p,v) _mm256_storeu_si256((int16x16 *) (p),(v))
mult768.c:       |                        ^
mult768.c: mult768.c:269:35: error: always_inline function '_mm256_storeu_si256' requires target feature 'avx', but would be inlined into function 'crypto_core_multsntrup761_avx_constbranchindex' that is compiled without support for 'avx'
mult768.c:   269 |   for (i = p&~15;i < 768;i += 16) store_x16(&g[i],x);
mult768.c:       |                                   ^
mult768.c: mult768.c:11:24: note: expanded from macro 'store_x16'
mult768.c:    11 | #define store_x16(p,v) _mm256_storeu_si256((int16x16 *) (p),(v))
mult768.c: ...

Number of similar (implementation,compiler) pairs: 1, namely:

Implementation	Compiler
`avx`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`

Compiler output

mult768.c: mult768.c:267:7: error: always_inline function '_mm256_set1_epi16' requires target feature 'avx', but would be inlined into function 'crypto_core_multsntrup761_avx800_constbranchindex' that is compiled without support for 'avx'
mult768.c:   267 |   x = const_x16(0);
mult768.c:       |       ^
mult768.c: mult768.c:12:19: note: expanded from macro 'const_x16'
mult768.c:    12 | #define const_x16 _mm256_set1_epi16
mult768.c:       |                   ^
mult768.c: mult768.c:267:7: error: AVX vector return of type '__m256i' (vector of 4 'long long' values) without 'avx' enabled changes the ABI
mult768.c: mult768.c:12:19: note: expanded from macro 'const_x16'
mult768.c:    12 | #define const_x16 _mm256_set1_epi16
mult768.c:       |                   ^
mult768.c: mult768.c:268:35: error: always_inline function '_mm256_storeu_si256' requires target feature 'avx', but would be inlined into function 'crypto_core_multsntrup761_avx800_constbranchindex' that is compiled without support for 'avx'
mult768.c:   268 |   for (i = p&~15;i < 768;i += 16) store_x16(&f[i],x);
mult768.c:       |                                   ^
mult768.c: mult768.c:11:24: note: expanded from macro 'store_x16'
mult768.c:    11 | #define store_x16(p,v) _mm256_storeu_si256((int16x16 *) (p),(v))
mult768.c:       |                        ^
mult768.c: mult768.c:268:35: error: AVX vector argument of type '__m256i' (vector of 4 'long long' values) without 'avx' enabled changes the ABI
mult768.c: mult768.c:11:24: note: expanded from macro 'store_x16'
mult768.c:    11 | #define store_x16(p,v) _mm256_storeu_si256((int16x16 *) (p),(v))
mult768.c:       |                        ^
mult768.c: mult768.c:269:35: error: always_inline function '_mm256_storeu_si256' requires target feature 'avx', but would be inlined into function 'crypto_core_multsntrup761_avx800_constbranchindex' that is compiled without support for 'avx'
mult768.c:   269 |   for (i = p&~15;i < 768;i += 16) store_x16(&g[i],x);
mult768.c:       |                                   ^
mult768.c: mult768.c:11:24: note: expanded from macro 'store_x16'
mult768.c:    11 | #define store_x16(p,v) _mm256_storeu_si256((int16x16 *) (p),(v))
mult768.c: ...

Number of similar (implementation,compiler) pairs: 1, namely:

Implementation	Compiler
`avx800`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`

Compiler output

mult.c: mult.c:147:22: error: invalid output size for constraint '=&x'
mult.c:   147 |   MULSTEP_fromzero(0,h0,h1,h2,h3,h4)
mult.c:       |                      ^
mult.c: mult.c:149:26: error: invalid output size for constraint '+x'
mult.c:   149 |     MULSTEP_noload(j + 1,h1,h2,h3,h4,h0)
mult.c:       |                          ^
mult.c: mult.c:150:26: error: invalid output size for constraint '+x'
mult.c:   150 |     MULSTEP_noload(j + 2,h2,h3,h4,h0,h1)
mult.c:       |                          ^
mult.c: mult.c:151:26: error: invalid output size for constraint '+x'
mult.c:   151 |     MULSTEP_noload(j + 3,h3,h4,h0,h1,h2)
mult.c:       |                          ^
mult.c: mult.c:152:26: error: invalid output size for constraint '+x'
mult.c:   152 |     MULSTEP_noload(j + 4,h4,h0,h1,h2,h3)
mult.c:       |                          ^
mult.c: mult.c:153:26: error: invalid output size for constraint '+x'
mult.c:   153 |     MULSTEP_noload(j + 5,h0,h1,h2,h3,h4)
mult.c:       |                          ^
mult.c: mult.c:155:24: error: invalid output size for constraint '+x'
mult.c:   155 |   MULSTEP_noload(j + 1,h1,h2,h3,h4,h0)
mult.c:       |                        ^
mult.c: mult.c:156:24: error: invalid output size for constraint '+x'
mult.c:   156 |   MULSTEP_noload(j + 2,h2,h3,h4,h0,h1)
mult.c:       |                        ^
mult.c: mult.c:157:24: error: invalid output size for constraint '+x'
mult.c: ...

Number of similar (implementation,compiler) pairs: 1, namely:

Implementation	Compiler
`round1`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`

Compiler output

mult.c: mult.c: In function 'mult768_mix2_m256i':
mult.c: mult.c:568:3: warning: 'mult96x16' accessing 6144 bytes in a region of size 512 [-Wstringop-overflow=]
mult.c:   568 |   mult96x16(hkara[12],fkara[6],(__m256i *) (1 + (__m128i *) gkara));
mult.c:       |   ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
mult.c: mult.c:568:3: note: referencing argument 1 of type '__m256i[192]'
mult.c: mult.c:568:3: warning: 'mult96x16' reading 3072 bytes from a region of size 512 [-Wstringop-overread]
mult.c: mult.c:568:3: note: referencing argument 2 of type 'const __m256i[96]'
mult.c: mult.c:568:3: warning: 'mult96x16' reading 3072 bytes from a region of size 3056 [-Wstringop-overread]
mult.c: mult.c:568:3: note: referencing argument 3 of type 'const __m256i[96]'
mult.c: mult.c:279:13: note: in a call to function 'mult96x16'
mult.c:   279 | static void mult96x16(__m256i h[192],const __m256i f[96],const __m256i g[96])
mult.c:       |             ^~~~~~~~~
mult.c: mult.c:569:3: warning: 'mult96x16' accessing 6144 bytes in a region of size 512 [-Wstringop-overflow=]
mult.c:   569 |   mult96x16(hkara[0],fkara[0],gkara[0]);
mult.c:       |   ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
mult.c: mult.c:569:3: note: referencing argument 1 of type '__m256i[192]'
mult.c: mult.c:569:3: warning: 'mult96x16' reading 3072 bytes from a region of size 512 [-Wstringop-overread]
mult.c: mult.c:569:3: note: referencing argument 2 of type 'const __m256i[96]'
mult.c: mult.c:569:3: warning: 'mult96x16' reading 3072 bytes from a region of size 1024 [-Wstringop-overread]
mult.c: mult.c:569:3: note: referencing argument 3 of type 'const __m256i[96]'
mult.c: mult.c:279:13: note: in a call to function 'mult96x16'
mult.c:   279 | static void mult96x16(__m256i h[192],const __m256i f[96],const __m256i g[96])
mult.c:       |             ^~~~~~~~~

Number of similar (implementation,compiler) pairs: 4, namely:

Implementation	Compiler
`round1`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round1`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round1`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round1`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`

Compiler output

ntt.c: ntt.c:562:35: warning: unused variable 'h0' [-Wunused-variable]
ntt.c:   562 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                   ^~
ntt.c: ntt.c:562:38: warning: unused variable 'h1' [-Wunused-variable]
ntt.c:   562 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                      ^~
ntt.c: ntt.c:562:41: warning: unused variable 'h2' [-Wunused-variable]
ntt.c:   562 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                         ^~
ntt.c: ntt.c:562:44: warning: unused variable 'h3' [-Wunused-variable]
ntt.c:   562 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                            ^~
ntt.c: ntt.c:864:35: warning: unused variable 'h0' [-Wunused-variable]
ntt.c:   864 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                   ^~
ntt.c: ntt.c:864:38: warning: unused variable 'h1' [-Wunused-variable]
ntt.c:   864 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                      ^~
ntt.c: ntt.c:864:41: warning: unused variable 'h2' [-Wunused-variable]
ntt.c:   864 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                         ^~
ntt.c: ntt.c:864:44: warning: unused variable 'h3' [-Wunused-variable]
ntt.c:   864 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                            ^~
ntt.c: ntt.c:865:10: warning: unused variable 'origf' [-Wunused-variable]
ntt.c: ...

Number of similar (implementation,compiler) pairs: 4, namely:

Implementation	Compiler
`round2`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`round2`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`round2`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`round2`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`

Compiler output

mult768.c: mult768.c:268:7: error: always_inline function '_mm256_set1_epi16' requires target feature 'avx', but would be inlined into function 'crypto_core_multsntrup761_round2_constbranchindex' that is compiled without support for 'avx'
mult768.c:   268 |   x = const_x16(0);
mult768.c:       |       ^
mult768.c: mult768.c:11:19: note: expanded from macro 'const_x16'
mult768.c:    11 | #define const_x16 _mm256_set1_epi16
mult768.c:       |                   ^
mult768.c: mult768.c:268:7: error: AVX vector return of type '__m256i' (vector of 4 'long long' values) without 'avx' enabled changes the ABI
mult768.c: mult768.c:11:19: note: expanded from macro 'const_x16'
mult768.c:    11 | #define const_x16 _mm256_set1_epi16
mult768.c:       |                   ^
mult768.c: mult768.c:269:35: error: always_inline function '_mm256_storeu_si256' requires target feature 'avx', but would be inlined into function 'crypto_core_multsntrup761_round2_constbranchindex' that is compiled without support for 'avx'
mult768.c:   269 |   for (i = p&~15;i < 768;i += 16) store_x16(&f[i],x);
mult768.c:       |                                   ^
mult768.c: mult768.c:10:24: note: expanded from macro 'store_x16'
mult768.c:    10 | #define store_x16(p,v) _mm256_storeu_si256((int16x16 *) (p),(v))
mult768.c:       |                        ^
mult768.c: mult768.c:269:35: error: AVX vector argument of type '__m256i' (vector of 4 'long long' values) without 'avx' enabled changes the ABI
mult768.c: mult768.c:10:24: note: expanded from macro 'store_x16'
mult768.c:    10 | #define store_x16(p,v) _mm256_storeu_si256((int16x16 *) (p),(v))
mult768.c:       |                        ^
mult768.c: mult768.c:270:35: error: always_inline function '_mm256_storeu_si256' requires target feature 'avx', but would be inlined into function 'crypto_core_multsntrup761_round2_constbranchindex' that is compiled without support for 'avx'
mult768.c:   270 |   for (i = p&~15;i < 768;i += 16) store_x16(&g[i],x);
mult768.c:       |                                   ^
mult768.c: mult768.c:10:24: note: expanded from macro 'store_x16'
mult768.c:    10 | #define store_x16(p,v) _mm256_storeu_si256((int16x16 *) (p),(v))
mult768.c: ...

Number of similar (implementation,compiler) pairs: 1, namely:

Implementation	Compiler
`round2`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`

Compiler output

ntt.c: ntt.c: In function 'ntt512':
ntt.c: ntt.c:562:44: warning: unused variable 'h3' [-Wunused-variable]
ntt.c:   562 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                            ^~
ntt.c: ntt.c:562:41: warning: unused variable 'h2' [-Wunused-variable]
ntt.c:   562 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                         ^~
ntt.c: ntt.c:562:38: warning: unused variable 'h1' [-Wunused-variable]
ntt.c:   562 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                      ^~
ntt.c: ntt.c:562:35: warning: unused variable 'h0' [-Wunused-variable]
ntt.c:   562 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                   ^~
ntt.c: ntt.c: In function 'invntt512':
ntt.c: ntt.c:865:10: warning: unused variable 'origf' [-Wunused-variable]
ntt.c:   865 |   int16 *origf = f;
ntt.c:       |          ^~~~~
ntt.c: ntt.c:864:44: warning: unused variable 'h3' [-Wunused-variable]
ntt.c:   864 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                            ^~
ntt.c: ntt.c:864:41: warning: unused variable 'h2' [-Wunused-variable]
ntt.c:   864 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c:       |                                         ^~
ntt.c: ntt.c:864:38: warning: unused variable 'h1' [-Wunused-variable]
ntt.c:   864 |   __m256i f0,f1,f2,f3,g0,g1,g2,g3,h0,h1,h2,h3;
ntt.c: ...

Number of similar (implementation,compiler) pairs: 4, namely:

Implementation	Compiler
`round2`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round2`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round2`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round2`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`

Passed TIMECOP

TIMECOP iterations: 1

Number of similar (implementation,compiler) pairs: 50, namely:

Implementation	Compiler
`avx`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`avx`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`avx`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`avx`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`avx`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`avx`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`avx`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`avx`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`avx800`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`avx800`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`avx800`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`avx800`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`avx800`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`avx800`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`avx800`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`avx800`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`compact`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`compact`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`compact`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`compact`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`compact`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`compact`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`compact`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`compact`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`compact`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`ref`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`ref`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`ref`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`ref`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`ref`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`ref`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`ref`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`ref`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`ref`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round1`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`round1`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`round1`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`round1`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`round1`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round1`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round1`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round1`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round2`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`round2`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`round2`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`round2`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_19.1.7_(1+b1))`
`round2`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round2`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round2`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`
`round2`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (14.2.0)`