Test results for amd64, cubi10, crypto_sort/int64

[Page version: 20260703 17:10:59]

Measurements for amd64, cubi10, crypto_sort | Test results for amd64, cubi10, crypto_sort | Test results for crypto_sort/int64

Computer: cubi10
Microarchitecture: amd64; Comet Lake (806ec)
Architecture: amd64
CPU ID: GenuineIntel-000806ec-bfebfbff
SUPERCOP version: 20260627
Operation: crypto_sort
Primitive: int64

Time	Object size	Test size	Implementation	Compiler	Benchmark date	SUPERCOP version
16599	31711 0 0	55504 1272 1472	`2026avx2`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
17076	30930 0 0	51366 1264 1504	`2026avx2`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
17385	33919 0 0	58184 1272 1504	`2026avx2`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
17664	30767 0 0	50712 1272 1472	`2026avx2`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
17698	35501 0 0	58599 1200 1536	`2026avx2`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
17865	31764 0 0	52062 1192 1536	`2026avx2`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
17967	32277 0 0	53183 1200 1536	`2026avx2`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
18779	34462 0 0	53674 1176 1504	`2026avx2`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
29939	35388 0 0	59984 1272 1504	`sse42`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
30109	35388 0 0	59512 1272 1472	`sse42`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
30331	34633 0 0	55414 1264 1504	`sse42`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
30979	34500 0 0	54736 1272 1472	`sse42`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
31691	35461 0 0	56319 1200 1536	`sse42`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
31803	36394 0 0	59471 1200 1536	`sse42`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
32806	34580 0 0	54862 1192 1536	`sse42`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
33578	38133 0 0	57330 1176 1504	`sse42`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
44799	8807 0 0	29670 1264 1504	`x863`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
46399	10056 0 0	34288 1272 1472	`x863`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
46546	9690 0 0	30032 1272 1472	`x863`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
47714	11689 0 0	34472 1272 1472	`x863`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
47809	11704 0 0	36408 1272 1504	`x863`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
50090	11236 0 0	34127 1200 1536	`x863`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
50216	10437 0 0	30542 1192 1536	`x863`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
50782	10756 0 0	31423 1200 1536	`x863`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
52325	676 0 0	21550 1264 1504	`portable4`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
53884	3876 0 0	22842 1176 1504	`x863`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
54669	837 0 0	21208 1272 1472	`portable4`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
54751	837 0 0	25064 1272 1472	`portable4`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
55618	918 0 0	23696 1272 1472	`portable4`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
55836	917 0 0	25616 1272 1504	`portable4`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
60865	865 0 0	23759 1200 1536	`portable4`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
61013	865 0 0	21535 1200 1536	`portable4`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
81849	954 0 0	21022 1192 1536	`portable4`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217
86458	1313 0 0	24725 1296 1568	`T:stdsort`	`g++ -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260330	20260330
86596	1331 0 0	24833 1352 1504	`T:stdsort`	`clang++ -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260330	20260330
87176	1365 0 0	26205 1296 1568	`T:stdsort`	`g++ -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260330	20260330
87785	1653 0 0	27820 1352 1472	`T:stdsort`	`clang++ -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260330	20260330
88060	1892 0 0	28640 1352 1504	`T:stdsort`	`clang++ -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260330	20260330
89008	1588 0 0	24447 1360 1472	`T:stdsort`	`clang++ -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall`	20260330	20260330
89353	936 0 0	22282 1272 1536	`T:stdsort`	`g++ -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260330	20260330
92280	1173 0 0	23906 1288 1568	`T:stdsort`	`g++ -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260330	20260330
122901	664 0 0	19642 1176 1504	`portable4`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall`	20260302	20260217

Compiler output

sort.c: sort.c:123:8: error: always_inline function '_mm256_loadu_si256' requires target feature 'avx', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'avx'
sort.c:   x0 = int64x4_load(x+0); // 0 4 8 12
sort.c:        ^
sort.c: sort.c:17:25: note: expanded from macro 'int64x4_load'
sort.c: #define int64x4_load(z) _mm256_loadu_si256((__m256i *) (z))
sort.c:                         ^
sort.c: sort.c:123:8: error: AVX vector return of type '__m256i' (vector of 4 'long long' values) without 'avx' enabled changes the ABI
sort.c: sort.c:17:25: note: expanded from macro 'int64x4_load'
sort.c: #define int64x4_load(z) _mm256_loadu_si256((__m256i *) (z))
sort.c:                         ^
sort.c: sort.c:124:8: error: always_inline function '_mm256_loadu_si256' requires target feature 'avx', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'avx'
sort.c:   x1 = int64x4_load(x+4); // 1 5 9 13
sort.c:        ^
sort.c: sort.c:17:25: note: expanded from macro 'int64x4_load'
sort.c: #define int64x4_load(z) _mm256_loadu_si256((__m256i *) (z))
sort.c:                         ^
sort.c: sort.c:124:8: error: AVX vector return of type '__m256i' (vector of 4 'long long' values) without 'avx' enabled changes the ABI
sort.c: sort.c:17:25: note: expanded from macro 'int64x4_load'
sort.c: #define int64x4_load(z) _mm256_loadu_si256((__m256i *) (z))
sort.c:                         ^
sort.c: sort.c:125:11: error: always_inline function '_mm256_set1_epi64x' requires target feature 'avx', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'avx'
sort.c:   infty = int64x4_broadcast(int64_largest);
sort.c:           ^
sort.c: sort.c:41:27: note: expanded from macro 'int64x4_broadcast'
sort.c: #define int64x4_broadcast _mm256_set1_epi64x
sort.c: ...

Number of similar (implementation,compiler) pairs: 1, namely:

Implementation	Compiler
`2026avx2`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`

Compiler output

sort.c: sort.c:130:93: error: always_inline function '_mm_shuffle_epi8' requires target feature 'ssse3', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'ssse3'
sort.c:   x4 = int8x16_iftopthenelse(int64x2_smaller_mask(int64x2_set(8,9),int64x2_broadcast(pos4)),int8x16_varextract(int64x2_load(x+pos4-2),int8x16_sub(int8x16_set(16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31),int8x16_broadcast(8*(pos4&1)))),infty); // 4 12
sort.c:                                                                                             ^
sort.c: sort.c:39:28: note: expanded from macro 'int8x16_varextract'
sort.c: #define int8x16_varextract _mm_shuffle_epi8
sort.c:                            ^
sort.c: sort.c:130:30: error: always_inline function '_mm_cmpgt_epi64' requires target feature 'sse4.2', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'sse4.2'
sort.c:   x4 = int8x16_iftopthenelse(int64x2_smaller_mask(int64x2_set(8,9),int64x2_broadcast(pos4)),int8x16_varextract(int64x2_load(x+pos4-2),int8x16_sub(int8x16_set(16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31),int8x16_broadcast(8*(pos4&1)))),infty); // 4 12
sort.c:                              ^
sort.c: sort.c:20:35: note: expanded from macro 'int64x2_smaller_mask'
sort.c: #define int64x2_smaller_mask(a,b) _mm_cmpgt_epi64(b,a)
sort.c:                                   ^
sort.c: sort.c:130:8: error: always_inline function '_mm_blendv_epi8' requires target feature 'sse4.1', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'sse4.1'
sort.c:   x4 = int8x16_iftopthenelse(int64x2_smaller_mask(int64x2_set(8,9),int64x2_broadcast(pos4)),int8x16_varextract(int64x2_load(x+pos4-2),int8x16_sub(int8x16_set(16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31),int8x16_broadcast(8*(pos4&1)))),infty); // 4 12
sort.c:        ^
sort.c: sort.c:23:38: note: expanded from macro 'int8x16_iftopthenelse'
sort.c: #define int8x16_iftopthenelse(c,t,e) _mm_blendv_epi8(e,t,c)
sort.c:                                      ^
sort.c: sort.c:132:95: error: always_inline function '_mm_shuffle_epi8' requires target feature 'ssse3', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'ssse3'
sort.c:   x5 = int8x16_iftopthenelse(int64x2_smaller_mask(int64x2_set(10,11),int64x2_broadcast(pos5)),int8x16_varextract(int64x2_load(x+pos5-2),int8x16_sub(int8x16_set(16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31),int8x16_broadcast(8*(pos5&1)))),infty); // 5 13
sort.c:                                                                                               ^
sort.c: sort.c:39:28: note: expanded from macro 'int8x16_varextract'
sort.c: #define int8x16_varextract _mm_shuffle_epi8
sort.c:                            ^
sort.c: sort.c:132:30: error: always_inline function '_mm_cmpgt_epi64' requires target feature 'sse4.2', but would be inlined into function 'int64_sort_8through16' that is compiled without support for 'sse4.2'
sort.c: ...

Number of similar (implementation,compiler) pairs: 1, namely:

Implementation	Compiler
`sse42`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`

Compiler output

try.cpp: In file included from try-anything.cpp:22:
try.cpp: .../supercop-data/cubi10/amd64/include/stq.h:32:13: warning: unused function 'stq_sort' [-Wunused-function]
try.cpp: static void stq_sort(stq_doublearray S,long long n)
try.cpp:             ^
try.cpp: 1 warning generated.
try.cpp: In file included from try-anything.cpp:22:
try.cpp: .../supercop-data/cubi10/amd64/include/stq.h:32:13: warning: unused function 'stq_sort' [-Wunused-function]
try.cpp: static void stq_sort(stq_doublearray S,long long n)
try.cpp:             ^
try.cpp: 1 warning generated.
measure.cpp: In file included from measure-anything.cpp:19:
measure.cpp: .../supercop-data/cubi10/amd64/include/stq.h:32:13: warning: unused function 'stq_sort' [-Wunused-function]
measure.cpp: static void stq_sort(stq_doublearray S,long long n)
measure.cpp:             ^
measure.cpp: 1 warning generated.

Number of similar (implementation,compiler) pairs: 4, namely:

Implementation	Compiler
`T:stdsort`	`clang++ -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`T:stdsort`	`clang++ -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`T:stdsort`	`clang++ -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`T:stdsort`	`clang++ -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`

Compiler output

try.cpp: In file included from try-anything.cpp:22:
try.cpp: .../supercop-data/cubi10/amd64/include/stq.h:32:13: warning: 'void stq_sort(std::vector<double>, long long int)' defined but not used [-Wunused-function]
try.cpp:    32 | static void stq_sort(stq_doublearray S,long long n)
try.cpp:       |             ^~~~~~~~
try.cpp: In file included from try-anything.cpp:22:
try.cpp: .../supercop-data/cubi10/amd64/include/stq.h:32:13: warning: 'void stq_sort(std::vector<double>, long long int)' defined but not used [-Wunused-function]
try.cpp:    32 | static void stq_sort(stq_doublearray S,long long n)
try.cpp:       |             ^~~~~~~~
measure.cpp: In file included from measure-anything.cpp:19:
measure.cpp: .../supercop-data/cubi10/amd64/include/stq.h:32:13: warning: 'void stq_sort(std::vector<double>, long long int)' defined but not used [-Wunused-function]
measure.cpp:    32 | static void stq_sort(stq_doublearray S,long long n)
measure.cpp:       |             ^~~~~~~~

Number of similar (implementation,compiler) pairs: 4, namely:

Implementation	Compiler
`T:stdsort`	`g++ -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`T:stdsort`	`g++ -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`T:stdsort`	`g++ -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`T:stdsort`	`g++ -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`

Passed TIMECOP

TIMECOP iterations: 10

Number of similar (implementation,compiler) pairs: 34, namely:

Implementation	Compiler
`2026avx2`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`2026avx2`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`2026avx2`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`2026avx2`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`2026avx2`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`2026avx2`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`2026avx2`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`2026avx2`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`portable4`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`portable4`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`portable4`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`portable4`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`portable4`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`portable4`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`portable4`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`portable4`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`portable4`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`sse42`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`sse42`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`sse42`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`sse42`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`sse42`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`sse42`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`sse42`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`sse42`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`x863`	`clang -march=native -O2 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`x863`	`clang -march=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`x863`	`clang -march=native -O -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`x863`	`clang -march=native -Os -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`x863`	`clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6)`
`x863`	`gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`x863`	`gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`x863`	`gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`
`x863`	`gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0)`