Implementation notes: aarch64, hikey960, crypto_sign/picnicl1ur

Computer: hikey960
Architecture: aarch64
CPU ID: 410fd034
SUPERCOP version: 20190816
Operation: crypto_sign
Primitive: picnicl1ur
Time | Object size | Test size | Implementation | Compiler | Benchmark date | SUPERCOP version
4443885094651 2600 16129003 3616 1608optimizedct/cgcc_-O_-fomit-frame-pointer2019120320190816
48074796102414 2056 16135852 2928 1624optimizedct/cclang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019120320190816
5124870084737 2600 16118151 3600 1608optimizedct/cgcc_-Os_-fomit-frame-pointer2019120320190816
5388772595159 2600 16129515 3616 1608optimizedct/cgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019120320190816
57377551102414 2056 16135852 2928 1624optimizedct/cclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019120320190816
6279141084685 2600 16118095 3600 1608optimizedct/cgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019120320190816
6280310394743 2600 16129139 3616 1608optimizedct/cgcc_-O2_-fomit-frame-pointer2019120320190816
67398452102414 2056 16135852 2928 1624optimizedct/cclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019120320190816
6767047084737 2600 16118151 3600 1608optimizedct/cgcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019120320190816
67912944102562 2056 16135980 2928 1624optimizedct/cclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019120320190816
70368474123819 2600 16161203 3616 1608optimizedct/cgcc_-funroll-loops_-O2_-fomit-frame-pointer2019120320190816
70508790106819 2600 16142819 3616 1640optimizedct/cgcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019120320190816
70824501106891 2600 16142947 3616 1640optimizedct/cgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019120320190816
71035300106435 2600 16142499 3616 1640optimizedct/cgcc_-O3_-fomit-frame-pointer2019120320190816
75139218120931 2600 16158483 3616 1608optimizedct/cgcc_-funroll-loops_-O_-fomit-frame-pointer2019120320190816
75349692120931 2600 16158483 3616 1608optimizedct/cgcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019120320190816
76834703140687 2600 16178387 3616 1640optimizedct/cgcc_-funroll-loops_-O3_-fomit-frame-pointer2019120320190816
7776496084801 2600 16118239 3600 1608optimizedct/cgcc_-funroll-loops_-Os_-fomit-frame-pointer2019120320190816
81558675140843 2600 16178475 3616 1640optimizedct/cgcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019120320190816
9679284494967 2600 16129363 3616 1608optimizedct/cgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019120320190816
9914242595175 2600 16129499 3616 1608optimizedct/cgcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019120320190816
10230592594651 2600 16129003 3616 1608optimizedct/cgcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019120320190816
11362075984801 2600 16118239 3600 1608optimizedct/cgcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019120320190816
117906975124207 2600 16161587 3616 1608optimizedct/cgcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019120320190816
1249305121034029 4 01066392 1008 1592refgcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019120320190816
131628101135040 2600 16173591 3600 1608optimizedct/ccc2019120320190816
135340940135040 2600 16173591 3600 1608optimizedct/cgcc_-funroll-loops2019120320190816
2327586751036814 4 01069168 1008 1592refgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2019120320190816
238494600135040 2600 16173591 3600 1608optimizedct/cgcc2019120320190816
2390773501046057 4 01079000 888 1608refclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019120320190816
2395352251057671 4 01091616 1008 1624refgcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019120320190816
2523973501030922 4 01062388 992 1592refgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2019120320190816
2721276001057271 4 01091272 1008 1624refgcc_-O3_-fomit-frame-pointer2019120320190816
2749997251057316 4 01091304 1008 1624refgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2019120320190816
2775721501034401 4 01066768 1008 1592refgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2019120320190816
2804025001046057 4 01079016 888 1608refclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019120320190816
3016147501050397 4 01085960 1008 1592refgcc_-funroll-loops_-O_-fomit-frame-pointer2019120320190816
3182133021046057 4 01079016 888 1608refclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019120320190816
3370126501030962 4 01062428 992 1592refgcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019120320190816
3518116701036565 4 01068920 1008 1592refgcc_-O2_-fomit-frame-pointer2019120320190816
4093719301034029 4 01066392 1008 1592refgcc_-O_-fomit-frame-pointer2019120320190816
4499246251036717 4 01068992 1008 1592refgcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019120320190816
4661339401062153 4 01097496 1008 1592refgcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019120320190816
5276810651030982 4 01062476 992 1592refgcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019120320190816
5516311501093611 4 01129256 1008 1624refgcc_-funroll-loops_-O3_-fomit-frame-pointer2019120320190816
5944533001093831 4 01129408 1008 1624refgcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019120320190816
6455871001050397 4 01085960 1008 1592refgcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019120320190816
6909030501046057 4 01079016 888 1608refclang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019120320190816
7931310751030982 4 01062476 992 1592refgcc_-funroll-loops_-Os_-fomit-frame-pointer2019120320190816
8624956101062029 4 01097376 1008 1592refgcc_-funroll-loops_-O2_-fomit-frame-pointer2019120320190816
10385852401060091 292 01096404 1280 1592refgcc_-funroll-loops2019120320190816
13929995201030962 4 01062428 992 1592refgcc_-Os_-fomit-frame-pointer2019120320190816
14573452601060091 292 01096404 1280 1592refgcc2019120320190816
15835058001060091 292 01096404 1280 1592refcc2019120320190816

Compiler output

Implementation: optimizedct/neon
Security model: unknown
Compiler: cc
picnic2_simulate_mul.c: picnic2_simulate_mul.c: In function 'transpose_64_64_s128':
picnic2_simulate_mul.c: picnic2_simulate_mul.c:316:24: warning: implicit declaration of function '_mm_set1_epi64x' [-Wimplicit-function-declaration]
picnic2_simulate_mul.c: word128 mask = _mm_set1_epi64x(TRANSPOSE_MASKS64[i]);
picnic2_simulate_mul.c: ^~~~~~~~~~~~~~~
picnic2_simulate_mul.c: picnic2_simulate_mul.c:316:24: error: incompatible types when initializing type 'word128' using type 'int'
picnic2_simulate_mul.c: In file included from mzd_additional.h:24:0,
picnic2_simulate_mul.c: from lowmc_pars.h:15,
picnic2_simulate_mul.c: from lowmc.h:13,
picnic2_simulate_mul.c: from picnic_impl.h:13,
picnic2_simulate_mul.c: from picnic2_impl.h:18,
picnic2_simulate_mul.c: from picnic2_types.h:16,
picnic2_simulate_mul.c: from picnic2_simulate_mul.h:13,
picnic2_simulate_mul.c: from picnic2_simulate_mul.c:14:
picnic2_simulate_mul.c: picnic2_simulate_mul.c:317:40: error: incompatible type for argument 2 of 'veorq_u64'
picnic2_simulate_mul.c: word128 inv_mask = mm128_xor(mask, _mm_set1_epi64x(UINT64_C(0xFFFFFFFFFFFFFFFF)));
picnic2_simulate_mul.c: ^
picnic2_simulate_mul.c: simd.h:103:38: note: in definition of macro 'mm128_xor'
picnic2_simulate_mul.c: #define mm128_xor(l, r) veorq_u64(l, r)
picnic2_simulate_mul.c: ^
picnic2_simulate_mul.c: In file included from simd.h:21:0,
picnic2_simulate_mul.c: from mzd_additional.h:24,
picnic2_simulate_mul.c: from lowmc_pars.h:15,
picnic2_simulate_mul.c: from lowmc.h:13,
picnic2_simulate_mul.c: from picnic_impl.h:13,
picnic2_simulate_mul.c: from picnic2_impl.h:18,
picnic2_simulate_mul.c: ...

Number of similar (compiler,implementation) pairs: 23, namely:
Compiler | Implementations
cc optimizedct/neon
gcc optimizedct/neon
gcc -O2 -fomit-frame-pointer optimizedct/neon
gcc -O3 -fomit-frame-pointer optimizedct/neon
gcc -O -fomit-frame-pointer optimizedct/neon
gcc -Os -fomit-frame-pointer optimizedct/neon
gcc -fno-schedule-insns -O2 -fomit-frame-pointer optimizedct/neon
gcc -fno-schedule-insns -O3 -fomit-frame-pointer optimizedct/neon
gcc -fno-schedule-insns -O -fomit-frame-pointer optimizedct/neon
gcc -fno-schedule-insns -Os -fomit-frame-pointer optimizedct/neon
gcc -funroll-loops optimizedct/neon
gcc -funroll-loops -O2 -fomit-frame-pointer optimizedct/neon
gcc -funroll-loops -O3 -fomit-frame-pointer optimizedct/neon
gcc -funroll-loops -O -fomit-frame-pointer optimizedct/neon
gcc -funroll-loops -Os -fomit-frame-pointer optimizedct/neon
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer optimizedct/neon
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer optimizedct/neon
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer optimizedct/neon
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer optimizedct/neon
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv optimizedct/neon
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv optimizedct/neon
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv optimizedct/neon
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv optimizedct/neon

Compiler output

Implementation: optimizedct/neon
Security model: unknown
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
picnic2_simulate_mul.c: picnic2_simulate_mul.c:316:24: warning: implicit declaration of function '_mm_set1_epi64x' is invalid in C99 [-Wimplicit-function-declaration]
picnic2_simulate_mul.c: word128 mask = _mm_set1_epi64x(TRANSPOSE_MASKS64[i]);
picnic2_simulate_mul.c: ^
picnic2_simulate_mul.c: picnic2_simulate_mul.c:316:13: error: initializing 'word128' (aka 'uint64x2_t') with an expression of incompatible type 'int'
picnic2_simulate_mul.c: word128 mask = _mm_set1_epi64x(TRANSPOSE_MASKS64[i]);
picnic2_simulate_mul.c: ^ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
picnic2_simulate_mul.c: picnic2_simulate_mul.c:329:57: warning: implicit declaration of function '_mm_srli_epi64' is invalid in C99 [-Wimplicit-function-declaration]
picnic2_simulate_mul.c: out128[i1 / 2] = mm128_xor(mm128_and(t1, mask), _mm_srli_epi64(mm128_and(t2, mask), width));
picnic2_simulate_mul.c: ^
picnic2_simulate_mul.c: picnic2_simulate_mul.c:331:48: warning: implicit declaration of function '_mm_slli_epi64' is invalid in C99 [-Wimplicit-function-declaration]
picnic2_simulate_mul.c: mm128_xor(mm128_and(t2, inv_mask), _mm_slli_epi64(mm128_and(t1, inv_mask), width));
picnic2_simulate_mul.c: ^
picnic2_simulate_mul.c: picnic2_simulate_mul.c:331:48: error: passing 'int' to parameter of incompatible type 'uint64x2_t' (vector of 2 'uint64_t' values)
picnic2_simulate_mul.c: mm128_xor(mm128_and(t2, inv_mask), _mm_slli_epi64(mm128_and(t1, inv_mask), width));
picnic2_simulate_mul.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
picnic2_simulate_mul.c: ./simd.h:103:38: note: expanded from macro 'mm128_xor'
picnic2_simulate_mul.c: #define mm128_xor(l, r) veorq_u64(l, r)
picnic2_simulate_mul.c: ^
picnic2_simulate_mul.c: /usr/lib/llvm-3.8/bin/../lib/clang/3.8.1/include/arm_neon.h:5463:55: note: passing argument to parameter '__p1' here
picnic2_simulate_mul.c: __ai uint64x2_t veorq_u64(uint64x2_t __p0, uint64x2_t __p1) {
picnic2_simulate_mul.c: ^
picnic2_simulate_mul.c: 3 warnings and 2 errors generated.

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
clang -O3 -fomit-frame-pointer -Qunused-arguments optimizedct/neon
clang -O3 -fwrapv -mavx2 -fomit-frame-pointer -Qunused-arguments optimizedct/neon
clang -O3 -fwrapv -mavx -fomit-frame-pointer -Qunused-arguments optimizedct/neon
clang -O3 -fwrapv -mavx -maes -mpclmul -fomit-frame-pointer -Qunused-arguments optimizedct/neon