Implementation notes: aarch64, supercoplxc, crypto_decode/761x1531

Computer: supercoplxc
Architecture: aarch64
CPU ID: 410fd034
SUPERCOP version: 20190816
Operation: crypto_decode
Primitive: 761x1531
Time | Object size | Test size | Implementation | Compiler | Benchmark date | SUPERCOP version
89605228 0 017790 800 760int16clang_-mcpu=native_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019082820190816
96005216 0 017702 800 760int16clang_-O3_-fomit-frame-pointer_-Qunused-arguments2019082820190816
96005204 0 017742 800 760int16clang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019082820190816
96005204 0 017742 800 760int16clang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019082820190816
96005204 0 017742 800 760int16clang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019082820190816
157607384 0 019942 800 760portableclang_-mcpu=native_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019082820190816
172007388 0 019870 800 760portableclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019082820190816
172007376 0 019910 800 760portableclang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019082820190816
172007376 0 019910 800 760portableclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019082820190816
172007376 0 019910 800 760portableclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019082820190816
333604576 0 016848 880 736int16gcc_-funroll-loops_-O2_-fomit-frame-pointer2019082820190816
333604576 0 017425 888 752int16gcc_-funroll-loops_-O3_-fomit-frame-pointer2019082820190816
343202276 0 011680 864 728int16gcc_-funroll-loops_-Os_-fomit-frame-pointer2019082820190816
343202276 0 011680 864 728int16gcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019082820190816
350404176 0 016488 880 736int16gcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019082820190816
350404176 0 016945 888 752int16gcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019082820190816
356004120 0 015337 888 752int16gcc_-O3_-fomit-frame-pointer2019082820190816
361602376 0 012320 880 736int16gcc_-O2_-fomit-frame-pointer2019082820190816
364802280 0 011616 864 728int16gcc_-Os_-fomit-frame-pointer2019082820190816
364802280 0 011616 864 728int16gcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019082820190816
390403784 0 014985 888 752int16gcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019082820190816
392002280 0 012176 880 736int16gcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019082820190816
420804280 0 017888 880 736int16gcc_-funroll-loops_-O_-fomit-frame-pointer2019082820190816
420804280 0 017888 880 736int16gcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019082820190816
422402400 0 012576 880 736int16gcc_-O_-fomit-frame-pointer2019082820190816
422402400 0 012576 880 736int16gcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019082820190816
452003312 0 015576 880 736portablegcc_-funroll-loops_-O2_-fomit-frame-pointer2019082820190816
452003304 0 016153 888 752portablegcc_-funroll-loops_-O3_-fomit-frame-pointer2019082820190816
460803256 0 015560 880 736portablegcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019082820190816
460803256 0 016017 888 752portablegcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019082820190816
461602880 0 014105 888 752portablegcc_-O3_-fomit-frame-pointer2019082820190816
464002780 0 013993 888 752portablegcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019082820190816
464802400 0 012344 880 736portablegcc_-O2_-fomit-frame-pointer2019082820190816
465602308 0 012208 880 736portablegcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019082820190816
772001588 0 011016 864 728portablegcc_-funroll-loops_-Os_-fomit-frame-pointer2019082820190816
772001588 0 011016 864 728portablegcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019082820190816
788001524 0 010880 864 728portablegcc_-Os_-fomit-frame-pointer2019082820190816
788001524 0 010880 864 728portablegcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019082820190816
865601364 0 012601 888 752refgcc_-O3_-fomit-frame-pointer2019082820190816
868001364 0 012585 888 752refgcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2019082820190816
874402788 0 015553 888 752refgcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2019082820190816
887202784 0 015633 888 752refgcc_-funroll-loops_-O3_-fomit-frame-pointer2019082820190816
890401332 0 013806 800 760refclang_-O3_-fomit-frame-pointer_-Qunused-arguments2019082820190816
899203056 0 016680 880 736portablegcc_-funroll-loops_-O_-fomit-frame-pointer2019082820190816
899203056 0 016680 880 736portablegcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019082820190816
902401720 0 011904 880 736portablegcc_-O_-fomit-frame-pointer2019082820190816
902401720 0 011904 880 736portablegcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019082820190816
908002620 0 014920 880 736refgcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2019082820190816
920002616 0 014880 880 736refgcc_-funroll-loops_-O2_-fomit-frame-pointer2019082820190816
962401392 0 013950 800 760refclang_-mcpu=native_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2019082820190816
964801300 0 011256 880 736refgcc_-O2_-fomit-frame-pointer2019082820190816
968801300 0 011200 880 736refgcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2019082820190816
985601388 0 013918 800 760refclang_-O3_-fwrapv_-mavx2_-fomit-frame-pointer_-Qunused-arguments2019082820190816
985601388 0 013918 800 760refclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2019082820190816
986401388 0 013918 800 760refclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2019082820190816
1088801064 0 010392 864 728refgcc_-Os_-fomit-frame-pointer2019082820190816
1088801064 0 010392 864 728refgcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2019082820190816
1088801064 0 010456 864 728refgcc_-funroll-loops_-Os_-fomit-frame-pointer2019082820190816
1088801064 0 010456 864 728refgcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2019082820190816
1220801968 0 015576 880 736refgcc_-funroll-loops_-O_-fomit-frame-pointer2019082820190816
1220801968 0 015576 880 736refgcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2019082820190816
1231201144 0 011320 880 736refgcc_-O_-fomit-frame-pointer2019082820190816
1231201144 0 011320 880 736refgcc_-fno-schedule-insns_-O_-fomit-frame-pointer2019082820190816
1907206680 0 019144 864 736int16cc2019082820190816
1907206680 0 019144 864 736int16gcc2019082820190816
1907206680 0 019144 864 736int16gcc_-funroll-loops2019082820190816
2965603220 0 015696 864 736portablecc2019082820190816
2965603220 0 015696 864 736portablegcc2019082820190816
2965603220 0 015696 864 736portablegcc_-funroll-loops2019082820190816
4342402776 0 015224 864 736refcc2019082820190816
4342402776 0 015224 864 736refgcc2019082820190816
4343202776 0 015224 864 736refgcc_-funroll-loops2019082820190816

Compiler output

Implementation: avx
Security model: unknown
Compiler: cc
decode.c: decode.c:3:10: fatal error: immintrin.h: No such file or directory
decode.c: #include <immintrin.h>
decode.c: ^~~~~~~~~~~~~
decode.c: compilation terminated.

Number of similar (compiler,implementation) pairs: 19, namely:
Compiler Implementations
cc avx
gcc avx
gcc -O2 -fomit-frame-pointer avx
gcc -O3 -fomit-frame-pointer avx
gcc -O -fomit-frame-pointer avx
gcc -Os -fomit-frame-pointer avx
gcc -fno-schedule-insns -O2 -fomit-frame-pointer avx
gcc -fno-schedule-insns -O3 -fomit-frame-pointer avx
gcc -fno-schedule-insns -O -fomit-frame-pointer avx
gcc -fno-schedule-insns -Os -fomit-frame-pointer avx
gcc -funroll-loops avx
gcc -funroll-loops -O2 -fomit-frame-pointer avx
gcc -funroll-loops -O3 -fomit-frame-pointer avx
gcc -funroll-loops -O -fomit-frame-pointer avx
gcc -funroll-loops -Os -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer avx
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
decode.c: In file included from decode.c:3:
decode.c: In file included from /usr/lib/llvm-7/lib/clang/7.0.1/include/immintrin.h:28:
decode.c: /usr/lib/llvm-7/lib/clang/7.0.1/include/mmintrin.h:64:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_vec_init_v2si(__i, 0);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-7/lib/clang/7.0.1/include/mmintrin.h:143:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_packsswb((__v4hi)__m1, (__v4hi)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-7/lib/clang/7.0.1/include/mmintrin.h:173:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_packssdw((__v2si)__m1, (__v2si)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-7/lib/clang/7.0.1/include/mmintrin.h:203:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_packuswb((__v4hi)__m1, (__v4hi)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-7/lib/clang/7.0.1/include/mmintrin.h:230:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_punpckhbw((__v8qi)__m1, (__v8qi)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-7/lib/clang/7.0.1/include/mmintrin.h:253:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_punpckhwd((__v4hi)__m1, (__v4hi)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-7/lib/clang/7.0.1/include/mmintrin.h:274:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_punpckhdq((__v2si)__m1, (__v2si)__m2);
decode.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
decode.c: /usr/lib/llvm-7/lib/clang/7.0.1/include/mmintrin.h:301:12: error: invalid conversion between vector type '__m64' (vector of 1 'long long' value) and integer type 'int' of different size
decode.c: return (__m64)__builtin_ia32_punpcklbw((__v8qi)__m1, (__v8qi)__m2);
decode.c: ...

Number of similar (compiler,implementation) pairs: 5, namely:
Compiler Implementations
clang -O3 -fomit-frame-pointer -Qunused-arguments avx
clang -O3 -fwrapv -mavx2 -fomit-frame-pointer -Qunused-arguments avx
clang -O3 -fwrapv -mavx -fomit-frame-pointer -Qunused-arguments avx
clang -O3 -fwrapv -mavx -maes -mpclmul -fomit-frame-pointer -Qunused-arguments avx
clang -mcpu=native -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments avx