Test results for aarch64, pi5, crypto_kem/ntskem1380
[Page version: 20250609 19:52:35]
Measurements for aarch64, pi5, crypto_kem
Test results for aarch64, pi5, crypto_kem
Test results for crypto_kem/ntskem1380
Computer: pi5
Microarchitecture: aarch64; Cortex-A76 (414fd0b1)
Architecture: aarch64
CPU ID: 414fd0b1 
SUPERCOP version: 20250415
Operation: crypto_kem
Primitive: ntskem1380
| Time | Object size | Test size | Implementation | Compiler | Benchmark date | SUPERCOP version | 
|---|---|---|---|---|---|---|
| 1312692 | 73056 84 16 | 90962 904 1584 | T:opt | gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20250602 | 20250415 | 
| 1325544 | 110469 84 16 | 129787 952 1568 | T:opt | clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall | 20250602 | 20250415 | 
| 1337308 | 61380 84 16 | 78426 904 1584 | T:opt | gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20250602 | 20250415 | 
| 1401559 | 59976 84 16 | 76810 896 1568 | T:opt | gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20250602 | 20250415 | 
| 1442442 | 57777 84 16 | 73481 880 1552 | T:opt | gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20250602 | 20250415 | 
| 9542388 | 34261 76 16 | 53699 944 1568 | T:ref | clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall | 20250602 | 20250415 | 
| 11384672 | 30376 76 16 | 48202 888 1584 | T:ref | gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20250602 | 20250415 | 
| 12730944 | 24336 76 16 | 41314 888 1584 | T:ref | gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20250602 | 20250415 | 
| 13739034 | 23520 76 16 | 40282 888 1568 | T:ref | gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20250602 | 20250415 | 
| 13940407 | 20789 76 16 | 36417 872 1552 | T:ref | gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall | 20250602 | 20250415 | 
Compiler output
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:
bitslice_bma_128.c: In file included from ./bitslice_bma_128.h:18:
bitslice_bma_128.c: /usr/lib/llvm-14/lib/clang/14.0.6/include/immintrin.h:14:2: error: "This header is only meant to be used on x86 and x64 architecture"
bitslice_bma_128.c: #error "This header is only meant to be used on x86 and x64 architecture"
bitslice_bma_128.c:  ^
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:
bitslice_bma_128.c: In file included from ./bitslice_bma_128.h:18:
bitslice_bma_128.c: In file included from /usr/lib/llvm-14/lib/clang/14.0.6/include/immintrin.h:17:
bitslice_bma_128.c: In file included from /usr/lib/llvm-14/lib/clang/14.0.6/include/x86gprintrin.h:15:
bitslice_bma_128.c: /usr/lib/llvm-14/lib/clang/14.0.6/include/hresetintrin.h:42:27: error: invalid input constraint 'a' in asm
bitslice_bma_128.c:   __asm__ ("hreset $0" :: "a"(__eax));
bitslice_bma_128.c:                           ^
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:
bitslice_bma_128.c: In file included from ./bitslice_bma_128.h:18:
bitslice_bma_128.c: In file included from /usr/lib/llvm-14/lib/clang/14.0.6/include/immintrin.h:21:
bitslice_bma_128.c: /usr/lib/llvm-14/lib/clang/14.0.6/include/mmintrin.h:14:2: error: "This header is only meant to be used on x86 and x64 architecture"
bitslice_bma_128.c: #error "This header is only meant to be used on x86 and x64 architecture"
bitslice_bma_128.c:  ^
bitslice_bma_128.c: /usr/lib/llvm-14/lib/clang/14.0.6/include/mmintrin.h:54:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c:     return (__m64)__builtin_ia32_vec_init_v2si(__i, 0);
bitslice_bma_128.c:            ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-14/lib/clang/14.0.6/include/mmintrin.h:133:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c:     return (__m64)__builtin_ia32_packsswb((__v4hi)__m1, (__v4hi)__m2);
bitslice_bma_128.c:            ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: /usr/lib/llvm-14/lib/clang/14.0.6/include/mmintrin.h:163:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
bitslice_bma_128.c: ...
Number of similar (implementation,compiler) pairs: 1, namely:
| Implementation | Compiler | 
| T:avx2 | clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6) | 
Compiler output
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.h:18:10: fatal error: immintrin.h: No such file or directory
bitslice_bma_128.c:    18 | #include <immintrin.h>
bitslice_bma_128.c:       |          ^~~~~~~~~~~~~
bitslice_bma_128.c: compilation terminated.
Number of similar (implementation,compiler) pairs: 4, namely:
| Implementation | Compiler | 
| T:avx2 | gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
| T:avx2 | gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
| T:avx2 | gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
| T:avx2 | gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
Compiler output
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:
bitslice_bma_128.c: ./bits.h:47:9: error: unknown type name '__m128i'
bitslice_bma_128.c: typedef __m128i     vector;
bitslice_bma_128.c:         ^
bitslice_bma_128.c: ./bits.h:98:11: error: unknown type name '__m128i'
bitslice_bma_128.c:     const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c:           ^
bitslice_bma_128.c: ./bits.h:98:26: warning: implicit declaration of function '_mm_unpackhi_epi64' is invalid in C99 [-Wimplicit-function-declaration]
bitslice_bma_128.c:     const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c:                          ^
bitslice_bma_128.c: ./bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64' is invalid in C99 [-Wimplicit-function-declaration]
bitslice_bma_128.c:     return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c:                     ^
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:
bitslice_bma_128.c: In file included from ./bitslice_bma_128.h:18:
bitslice_bma_128.c: /usr/lib/llvm-14/lib/clang/14.0.6/include/immintrin.h:14:2: error: "This header is only meant to be used on x86 and x64 architecture"
bitslice_bma_128.c: #error "This header is only meant to be used on x86 and x64 architecture"
bitslice_bma_128.c:  ^
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:
bitslice_bma_128.c: In file included from ./bitslice_bma_128.h:18:
bitslice_bma_128.c: In file included from /usr/lib/llvm-14/lib/clang/14.0.6/include/immintrin.h:17:
bitslice_bma_128.c: In file included from /usr/lib/llvm-14/lib/clang/14.0.6/include/x86gprintrin.h:15:
bitslice_bma_128.c: /usr/lib/llvm-14/lib/clang/14.0.6/include/hresetintrin.h:42:27: error: invalid input constraint 'a' in asm
bitslice_bma_128.c:   __asm__ ("hreset $0" :: "a"(__eax));
bitslice_bma_128.c:                           ^
bitslice_bma_128.c: ...
Number of similar (implementation,compiler) pairs: 1, namely:
| Implementation | Compiler | 
| T:sse2 | clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6) | 
Compiler output
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:
bitslice_bma_128.c: bits.h:47:9: error: unknown type name '__m128i'
bitslice_bma_128.c:    47 | typedef __m128i     vector;
bitslice_bma_128.c:       |         ^~~~~~~
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:98:11: error: unknown type name '__m128i'
bitslice_bma_128.c:    98 |     const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c:       |           ^~~~~~~
bitslice_bma_128.c: bits.h:98:26: warning: implicit declaration of function '_mm_unpackhi_epi64' [-Wimplicit-function-declaration]
bitslice_bma_128.c:    98 |     const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c:       |                          ^~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64' [-Wimplicit-function-declaration]
bitslice_bma_128.c:    99 |     return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c:       |                     ^~~~~~~~~~~~~~~~~
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c:    93 | #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c:       |                                          ^
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:
bitslice_bma_128.c: bitslice_bma_128.h: At top level:
bitslice_bma_128.c: bitslice_bma_128.h:18:10: fatal error: immintrin.h: No such file or directory
bitslice_bma_128.c:    18 | #include <immintrin.h>
bitslice_bma_128.c:       |          ^~~~~~~~~~~~~
bitslice_bma_128.c: compilation terminated.
Number of similar (implementation,compiler) pairs: 4, namely:
| Implementation | Compiler | 
| T:sse2 | gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
| T:sse2 | gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
| T:sse2 | gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
| T:sse2 | gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
Namespace violations
bitslice_bma_64.o bitslice_bma T
bitslice_fft_64.o _twist_factors13_80_64 R
bitslice_fft_64.o bitslice_fft13_64 T
bitslice_fft_64.o twiddle_factors R
bitslice_fft_64.o twist_factors D
ff.o bitslice_mul13_64 T
ff.o ff_add_m T
ff.o ff_create T
ff.o ff_inv_13 T
ff.o ff_mul_13 T
ff.o ff_reduce_13 T
ff.o ff_release T
ff.o ff_sqr_13 T
ff.o vector_ff_inv_13 T
ff.o vector_ff_mul_13 T
ff.o vector_ff_pow16_13 T
ff.o vector_ff_pow4_13 T
ff.o vector_ff_pow8_13 T
ff.o vector_ff_sqr_13 T
ff.o vector_ff_sqr_inv_13 T
ff.o vector_ff_transpose_xor_13 T
keccak.o shake_256 T
m4r.o _gray_codes_lut D
m4r.o _gray_codes_lut2 R
m4r.o _gray_codes_lut3 R
m4r.o _gray_codes_lut4 R
m4r.o _gray_codes_lut5 R
m4r.o _gray_codes_lut6 R
m4r.o _gray_codes_lut7 R
m4r.o _gray_codes_lut8 R
m4r.o _m4ri_gauss_submatrix T
m4r.o _m4ri_make_table_rev T
m4r.o m4r_rref T
matrix_ff2.o alloc_matrix_ff2 T
matrix_ff2.o calloc_matrix_ff2 T
matrix_ff2.o clone_matrix_ff2 T
matrix_ff2.o column_swap_matrix_ff2 T
matrix_ff2.o free_matrix_ff2 T
matrix_ff2.o is_equal_matrix_ff2 T
matrix_ff2.o reduce_row_echelon_matrix_ff2 T
matrix_ff2.o zero_matrix_ff2 T
nts_kem.o compute_syndrome T
nts_kem.o correct_error_and_recover_ke T
nts_kem.o create_matrix_G T
nts_kem.o create_random_goppa_polynomial T
nts_kem.o deserialise_private_key T
nts_kem.o fisher_yates_shuffle T
nts_kem.o is_valid_goppa_polynomial T
nts_kem.o load_input_ciphertext T
nts_kem.o nts_kem_ciphertext_size T
nts_kem.o nts_kem_create T
nts_kem.o nts_kem_decapsulate T
nts_kem.o nts_kem_encapsulate T
nts_kem.o nts_kem_init_from_private_key T
nts_kem.o nts_kem_key_size T
nts_kem.o nts_kem_release T
nts_kem.o pack_buffer T
nts_kem.o random_vector T
nts_kem.o serialise_private_key T
nts_kem.o serialise_public_key T
nts_kem.o unpack_buffer T
polynomial.o clone_poly T
polynomial.o create_random_poly T
polynomial.o evaluate_poly T
polynomial.o formal_derivative_poly T
polynomial.o free_poly T
polynomial.o gcd_poly T
polynomial.o init_poly T
polynomial.o is_equal_poly T
polynomial.o modulo_reduce_poly T
polynomial.o poly_from_roots T
polynomial.o update_poly_degree T
polynomial.o zero_poly T
random.o random_uint16_bounded T
random.o randombit T
vector_utils.o vector_ff_or_64 T
vector_utils.o vector_load_1d_64 T
vector_utils.o vector_load_2d_64 T
vector_utils.o vector_store_1d_64 T
vector_utils.o vector_store_2d_64 T
Number of similar (implementation,compiler) pairs: 5, namely:
| Implementation | Compiler | 
| T:opt | clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6) | 
| T:opt | gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
| T:opt | gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
| T:opt | gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
| T:opt | gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
Namespace violations
additive_fft.o _additive_fft_construct_basis T
additive_fft.o _additive_fft_core T
additive_fft.o _additive_fft_ff_value T
additive_fft.o additive_fft T
additive_fft.o ff_poly_taylor_expansion T
berlekamp_massey.o berlekamp_massey T
ff.o ff_add_m T
ff.o ff_create T
ff.o ff_inv_13 T
ff.o ff_mul_13 T
ff.o ff_reduce_13 T
ff.o ff_release T
ff.o ff_sqr_13 T
keccak.o Keccak T
keccak.o KeccakF1600_StatePermute T
keccak.o LFSR86540 T
keccak.o sha3_256 T
keccak.o sha3_384 T
keccak.o sha3_512 T
keccak.o shake_256 T
m4r.o _gray_codes_lut D
m4r.o _gray_codes_lut2 R
m4r.o _gray_codes_lut3 R
m4r.o _gray_codes_lut4 R
m4r.o _gray_codes_lut5 R
m4r.o _gray_codes_lut6 R
m4r.o _gray_codes_lut7 R
m4r.o _gray_codes_lut8 R
m4r.o _m4ri_gauss_submatrix T
m4r.o _m4ri_make_table_rev T
m4r.o m4r_rref T
matrix_ff2.o alloc_matrix_ff2 T
matrix_ff2.o calloc_matrix_ff2 T
matrix_ff2.o clone_matrix_ff2 T
matrix_ff2.o column_swap_matrix_ff2 T
matrix_ff2.o free_matrix_ff2 T
matrix_ff2.o is_equal_matrix_ff2 T
matrix_ff2.o reduce_row_echelon_matrix_ff2 T
matrix_ff2.o zero_matrix_ff2 T
nts_kem.o compute_syndrome T
nts_kem.o correct_error_and_recover_ke T
nts_kem.o create_matrix_G T
nts_kem.o create_random_goppa_polynomial T
nts_kem.o deserialise_private_key T
nts_kem.o fisher_yates_shuffle T
nts_kem.o is_valid_goppa_polynomial T
nts_kem.o nts_kem_ciphertext_size T
nts_kem.o nts_kem_create T
nts_kem.o nts_kem_decapsulate T
nts_kem.o nts_kem_encapsulate T
nts_kem.o nts_kem_init_from_private_key T
nts_kem.o nts_kem_key_size T
nts_kem.o nts_kem_release T
nts_kem.o pack_buffer T
nts_kem.o random_vector T
nts_kem.o serialise_private_key T
nts_kem.o serialise_public_key T
nts_kem.o unpack_buffer T
polynomial.o clone_poly T
polynomial.o create_random_poly T
polynomial.o evaluate_poly T
polynomial.o formal_derivative_poly T
polynomial.o free_poly T
polynomial.o gcd_poly T
polynomial.o init_poly T
polynomial.o is_equal_poly T
polynomial.o modulo_reduce_poly T
polynomial.o poly_from_roots T
polynomial.o update_poly_degree T
polynomial.o zero_poly T
random.o random_uint16_bounded T
random.o randombit T
stack.o stack_create T
stack.o stack_free T
stack.o stack_pop T
stack.o stack_push T
stack.o stack_size T
Number of similar (implementation,compiler) pairs: 5, namely:
| Implementation | Compiler | 
| T:ref | clang -mcpu=native -O3 -fwrapv -Qunused-arguments -fPIC -fPIE -gdwarf-4 -Wall (Debian_Clang_14.0.6) | 
| T:ref | gcc -march=native -mtune=native -O2 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
| T:ref | gcc -march=native -mtune=native -O3 -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
| T:ref | gcc -march=native -mtune=native -O -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) | 
| T:ref | gcc -march=native -mtune=native -Os -fwrapv -fPIC -fPIE -gdwarf-4 -Wall (12.2.0) |