Implementation notes: armeabi, novena, crypto_core/aes256encrypt

Computer: novena
Architecture: armeabi
CPU ID: unknown CPU ID
SUPERCOP version: 20220506
Operation: crypto_core
Primitive: aes256encrypt
Time | Object size | Test size | Implementation | Compiler | Benchmark date | SUPERCOP version
200176 0 011137 424 712T:opensslclang_-march=native_-O_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
200176 0 020867 428 728T:opensslclang_-mcpu=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
24002924 0 011291 416 712T:dolbeau/std-1ftgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
24003944 0 012307 416 712T:dolbeau/std-2ftgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
240076 0 012755 428 712T:opensslclang_-march=native_-O2_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
240076 0 012347 428 720T:opensslclang_-march=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
240076 0 011009 424 712T:opensslclang_-march=native_-Os_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
240040 0 08570 432 712T:opensslgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
240040 0 09834 432 712T:opensslgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
240040 0 08385 428 712T:opensslgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
240040 0 07922 424 712T:opensslgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
24016556 0 016179 416 712T:dolbeau/std-4ftgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
27994532 0 014155 416 712T:dolbeau/std-2ftgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
28002916 0 015413 420 712T:dolbeau/std-1ftclang_-march=native_-O2_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
28002916 0 015005 420 720T:dolbeau/std-1ftclang_-march=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
28002916 0 013667 416 712T:dolbeau/std-1ftclang_-march=native_-Os_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
28002876 0 023485 420 728T:dolbeau/std-1ftclang_-mcpu=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
28003532 0 013155 416 712T:dolbeau/std-1ftgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
28002896 0 010611 408 712T:dolbeau/std-1ftgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
28003920 0 024533 420 728T:dolbeau/std-2ftclang_-mcpu=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
28003920 0 011635 408 712T:dolbeau/std-2ftgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
28006060 0 018557 420 712T:dolbeau/std-4ftclang_-march=native_-O2_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
28006060 0 018149 420 720T:dolbeau/std-4ftclang_-march=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
28006060 0 016811 416 712T:dolbeau/std-4ftclang_-march=native_-Os_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
28005980 0 013699 408 712T:dolbeau/std-4ftgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
28013956 0 016453 420 712T:dolbeau/std-2ftclang_-march=native_-O2_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
28013956 0 016045 420 720T:dolbeau/std-2ftclang_-march=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
28013956 0 014707 416 712T:dolbeau/std-2ftclang_-march=native_-Os_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
28016196 0 017051 416 712T:dolbeau/std-4ftclang_-march=native_-O_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
28016012 0 026621 420 728T:dolbeau/std-4ftclang_-mcpu=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
28015960 0 014138 412 712T:dolbeau/std-4ftgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
32002872 0 011050 412 712T:dolbeau/std-1ftgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
32004248 0 015107 416 712T:dolbeau/std-2ftclang_-march=native_-O_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
32005976 0 014339 416 712T:dolbeau/std-4ftgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
32013228 0 014083 416 712T:dolbeau/std-1ftclang_-march=native_-O_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
32013896 0 012074 412 712T:dolbeau/std-2ftgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
6144492668 0 012279 416 712refgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
7920633468 0 024049 420 728refclang_-mcpu=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
8384673468 0 015529 420 720refclang_-march=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
11236912908 0 015377 420 712refclang_-march=native_-O2_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
17137381112 0 09463 416 712refgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
17565421548 0 012271 416 712refclang_-march=native_-Os_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
17669431074 0 08783 408 712refgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506
20493661556 0 012391 416 712refclang_-march=native_-O_-fomit-frame-pointer_-fwrapv_-Qunused-arguments_-fPIC_-fPIE2022060320220506
24970021114 0 09278 412 712refgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2022060320220506

Compiler output

Implementation: T:dolbeau/armv8crypto
Security model: timingleaks
Compiler: clang -march=native -O2 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE
core.c: In file included from core.c:9:
core.c: /usr/lib/llvm-11/lib/clang/11.0.1/include/arm_neon.h:32:2: error: "NEON support not enabled"
core.c: #error "NEON support not enabled"
core.c: ^
core.c: core.c:22:3: error: use of undeclared identifier 'uint8x16_t'
core.c: uint8x16_t vzero = vreinterpretq_u8_u32(vdupq_n_u32(0));
core.c: ^
core.c: core.c:47:16: warning: implicit declaration of function 'vgetq_lane_u32' is invalid in C99 [-Wimplicit-function-declaration]
core.c: temp_lds = armv8_aese_sbox(rotl_aes_edrk);
core.c: ^
core.c: core.c:24:2: note: expanded from macro 'armv8_aese_sbox'
core.c: vgetq_lane_u32(vreinterpretq_u32_u8(vaeseq_u8(vreinterpretq_u8_u32(vdupq_n_u32(input)), vzero)),0)
core.c: ^
core.c: core.c:47:16: warning: implicit declaration of function 'vreinterpretq_u32_u8' is invalid in C99 [-Wimplicit-function-declaration]
core.c: core.c:24:17: note: expanded from macro 'armv8_aese_sbox'
core.c: vgetq_lane_u32(vreinterpretq_u32_u8(vaeseq_u8(vreinterpretq_u8_u32(vdupq_n_u32(input)), vzero)),0)
core.c: ^
core.c: core.c:47:16: warning: implicit declaration of function 'vaeseq_u8' is invalid in C99 [-Wimplicit-function-declaration]
core.c: core.c:24:38: note: expanded from macro 'armv8_aese_sbox'
core.c: vgetq_lane_u32(vreinterpretq_u32_u8(vaeseq_u8(vreinterpretq_u8_u32(vdupq_n_u32(input)), vzero)),0)
core.c: ^
core.c: core.c:47:16: warning: implicit declaration of function 'vreinterpretq_u8_u32' is invalid in C99 [-Wimplicit-function-declaration]
core.c: core.c:24:48: note: expanded from macro 'armv8_aese_sbox'
core.c: vgetq_lane_u32(vreinterpretq_u32_u8(vaeseq_u8(vreinterpretq_u8_u32(vdupq_n_u32(input)), vzero)),0)
core.c: ^
core.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
clang -march=native -O2 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE T:dolbeau/armv8crypto
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE T:dolbeau/armv8crypto
clang -march=native -O -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE T:dolbeau/armv8crypto
clang -march=native -Os -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE T:dolbeau/armv8crypto

Compiler output

Implementation: T:dolbeau/armv8crypto
Security model: timingleaks
Compiler: clang -mcpu=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE
core.c: core.c:47:16: warning: implicit declaration of function 'vaeseq_u8' is invalid in C99 [-Wimplicit-function-declaration]
core.c: temp_lds = armv8_aese_sbox(rotl_aes_edrk);
core.c: ^
core.c: core.c:24:38: note: expanded from macro 'armv8_aese_sbox'
core.c: vgetq_lane_u32(vreinterpretq_u32_u8(vaeseq_u8(vreinterpretq_u8_u32(vdupq_n_u32(input)), vzero)),0)
core.c: ^
core.c: core.c:47:16: error: passing 'int' to parameter of incompatible type 'uint8x16_t' (vector of 16 'uint8_t' values)
core.c: temp_lds = armv8_aese_sbox(rotl_aes_edrk);
core.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
core.c: core.c:24:38: note: expanded from macro 'armv8_aese_sbox'
core.c: vgetq_lane_u32(vreinterpretq_u32_u8(vaeseq_u8(vreinterpretq_u8_u32(vdupq_n_u32(input)), vzero)),0)
core.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
core.c: /usr/lib/llvm-11/lib/clang/11.0.1/include/arm_neon.h:7509:21: note: expanded from macro 'vgetq_lane_u32'
core.c: uint32x4_t __s0 = __p0; \
core.c: ^~~~
core.c: /usr/lib/llvm-11/lib/clang/11.0.1/include/arm_neon.h:32650:49: note: passing argument to parameter '__p0' here
core.c: __ai uint32x4_t vreinterpretq_u32_u8(uint8x16_t __p0) {
core.c: ^
core.c: core.c:60:16: warning: implicit declaration of function 'vaeseq_u8' is invalid in C99 [-Wimplicit-function-declaration]
core.c: temp_lds = armv8_aese_sbox(tmp11);
core.c: ^
core.c: core.c:24:38: note: expanded from macro 'armv8_aese_sbox'
core.c: vgetq_lane_u32(vreinterpretq_u32_u8(vaeseq_u8(vreinterpretq_u8_u32(vdupq_n_u32(input)), vzero)),0)
core.c: ^
core.c: core.c:60:16: error: passing 'int' to parameter of incompatible type 'uint8x16_t' (vector of 16 'uint8_t' values)
core.c: ...

Number of similar (compiler,implementation) pairs: 1, namely:
Compiler | Implementations
clang -mcpu=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE T:dolbeau/armv8crypto

Compiler output

Implementation: T:dolbeau/armv8crypto
Security model: timingleaks
Compiler: gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv -fPIC -fPIE
core.c: In file included from core.c:9:
core.c: core.c: In function ‘aes256_armv8_encrypt’:
core.c: /usr/lib/gcc/arm-linux-gnueabihf/10/include/arm_neon.h:10403:1: error: inlining failed in call to ‘always_inline’ ‘vld1q_u8’: target specific option mismatch
core.c: 10403 | vld1q_u8 (const uint8_t * __a)
core.c: | ^~~~~~~~
core.c: core.c:91:21: note: called from here
core.c: 91 | uint8x16_t temp = vld1q_u8(n);
core.c: | ^~~~~~~~~~~
core.c: In file included from core.c:9:
core.c: /usr/lib/gcc/arm-linux-gnueabihf/10/include/arm_neon.h:10417:1: error: inlining failed in call to ‘always_inline’ ‘vld1q_u32’: target specific option mismatch
core.c: 10417 | vld1q_u32 (const uint32_t * __a)
core.c: | ^~~~~~~~~
core.c: core.c:106:9: note: called from here
core.c: 106 | t = vld1q_u32((unsigned int*)(rkeys+i*16));\
core.c: | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
core.c: In file included from core.c:9:
core.c: /usr/lib/gcc/arm-linux-gnueabihf/10/include/arm_neon.h:10981:1: error: inlining failed in call to ‘always_inline’ ‘vst1q_u8’: target specific option mismatch
core.c: 10981 | vst1q_u8 (uint8_t * __a, uint8x16_t __b)
core.c: | ^~~~~~~~
core.c: core.c:125:3: note: called from here
core.c: 125 | vst1q_u8(out, temp);
core.c: | ^~~~~~~~~~~~~~~~~~~
core.c: In file included from core.c:9:
core.c: /usr/lib/gcc/arm-linux-gnueabihf/10/include/arm_neon.h:14048:1: error: inlining failed in call to ‘always_inline’ ‘veorq_u8’: target specific option mismatch
core.c: 14048 | veorq_u8 (uint8x16_t __a, uint8x16_t __b)
core.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv -fPIC -fPIE T:dolbeau/armv8crypto
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv -fPIC -fPIE T:dolbeau/armv8crypto
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv -fPIC -fPIE T:dolbeau/armv8crypto
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv -fPIC -fPIE T:dolbeau/armv8crypto