Implementation notes: amd64, waldorf, crypto_hash/keccakc768

Computer: waldorf
Architecture: amd64
CPU ID: GenuineIntel-000106e5-bfebfbff
SUPERCOP version: 20160715
Operation: crypto_hash
Primitive: keccakc768
Time | Implementation | Compiler | Benchmark date | SUPERCOP version
53884 | opt64lcu6 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
53968 | opt64u6 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
55344 | opt64lcu24shld | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
55412 | opt64lcu6 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
56008 | opt64lcu24shld | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
56280 | opt64lcu6 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
56424 | inplace | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
56484 | opt64lcu24 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
57680 | x86_64_asm | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
57984 | x86_64_asm | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
58140 | x86_64_asm | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
58208 | inplace | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
58332 | opt64lcu24 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
58828 | x86_64_shld | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
59104 | x86_64_shld | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
59136 | opt64lcu6 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
59372 | x86_64_asm | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
59460 | x86_64_shld | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
59608 | inplace | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
59608 | simple | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
59632 | opt64u6 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
59700 | x86_64_shld | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
59868 | simple | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
60108 | opt64lcu24 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
60196 | opt64lcu24 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
60552 | opt64lcu24shld | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
60748 | opt64lcu6 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
60992 | inplace | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
61492 | opt64lcu24 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
61616 | sseu2 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
61884 | sseu2 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
62344 | opt64lcu24shld | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
62348 | opt64u6 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
62600 | inplace | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
63312 | sseu2 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
63328 | opt64lcu24shld | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
64228 | sseu2 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
65108 | simple | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
65404 | simple | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
65504 | opt64u6 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
65584 | opt64u6 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
66132 | simple | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
72832 | mmxu1 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
75288 | mmxu1 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
79168 | sseu2 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
79616 | mmxu1 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
84164 | mmxu1 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
84952 | mmxu1 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
113812 | opt32bi-s2lcu4 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
117980 | opt32bi-s2lcu4 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
125876 | opt32biT-s2lcu4 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
126188 | opt32bi-rvku2 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
126324 | inplace32bi | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
127508 | opt32biT-s2lcu4 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
129336 | opt32biT-s2lcu4 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
129828 | opt32bi-s2lcu4 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
131604 | inplace32bi | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
131920 | compact | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
131980 | opt32bi-s2lcu4 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
132360 | simple32bi | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
132828 | opt32biT-s2lcu4 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
135296 | opt32biT-s2lcu4 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
136268 | opt32bi-s2lcu4 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
137468 | simple32bi | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
137604 | opt32bi-rvku2 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
143464 | simple32bi | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
144660 | opt32bi-rvku2 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
145192 | inplace32bi | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
145788 | opt32bi-rvku2 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
148148 | simple32bi | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
149516 | opt32bi-rvku2 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
152720 | inplace32bi | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
156048 | compact | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
156056 | simple32bi | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
156260 | inplace32bi | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
243940 | compact | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
258872 | compact | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
260200 | compact | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
516480 | compact8 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
570700 | compact8 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
582616 | compact8 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
601532 | compact8 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
1084788 | compact8 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715

Compiler output

Implementation: crypto_hash/keccakc768/xopu24
Compiler: clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c:185:5: warning: implicit declaration of function '_mm_roti_epi64' is invalid in C99 [-Wimplicit-function-declaration]
KeccakF-1600-opt64.c: rounds
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: ./KeccakF-1600-unrolling.macros:17:5: note: expanded from macro 'rounds'
KeccakF-1600-opt64.c: thetaRhoPiChiIotaPrepareTheta( 0, A, E) \
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: ./KeccakF-1600-xop.macros:53:5: note: expanded from macro 'thetaRhoPiChiIotaPrepareTheta'
KeccakF-1600-opt64.c: computeD \
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: ./KeccakF-1600-xop.macros:40:23: note: expanded from macro 'computeD'
KeccakF-1600-opt64.c: Dei = XOR128(Cae, ROL6464same(Cio, 1)); \
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c:102:33: note: expanded from macro 'ROL6464same'
KeccakF-1600-opt64.c: #define ROL6464same(a, o) _mm_roti_epi64(a, o)
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c:90:50: note: expanded from macro 'XOR128'
KeccakF-1600-opt64.c: #define XOR128(a, b) _mm_xor_si128(a, b)
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c:185:5: error: passing 'int' to parameter of incompatible type '__m128i' (vector of 2 'long long' values)
KeccakF-1600-opt64.c: rounds
KeccakF-1600-opt64.c: ^~~~~~
KeccakF-1600-opt64.c: ./KeccakF-1600-unrolling.macros:17:5: note: expanded from macro 'rounds'
KeccakF-1600-opt64.c: thetaRhoPiChiIotaPrepareTheta( 0, A, E) \
KeccakF-1600-opt64.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
KeccakF-1600-opt64.c: ./KeccakF-1600-xop.macros:53:5: note: expanded from macro 'thetaRhoPiChiIotaPrepareTheta'
KeccakF-1600-opt64.c: ...

Number of similar (compiler,implementation) pairs: 1, namely:
Compiler | Implementations
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | xopu24

Compiler output

Implementation: crypto_hash/keccakc768/x86_64_asm
Compiler: clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:50:16: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ apState, %rdi
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:51:16: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ apInput, %rsi
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:52:18: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ aNbrWords, %rdx
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:55:16: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ xpState, %r9
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:58:12: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ rT1, %rax
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:59:16: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ rpState, %rdi
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:60:16: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ rpStack, %rsp
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:62:12: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ rDa, %rbx
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:63:12: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: ...

Number of similar (compiler,implementation) pairs: 1, namely:
Compiler | Implementations
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | x86_64_asm

Compiler output

Implementation: crypto_hash/keccakc768/x86_64_shld
Compiler: clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:50:16: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ apState, %rdi
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:51:16: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ apInput, %rsi
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:52:18: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ aNbrWords, %rdx
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:55:16: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ xpState, %r9
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:58:12: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ rT1, %rax
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:59:16: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ rpState, %rdi
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:60:16: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ rpStack, %rsp
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:62:12: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ rDa, %rbx
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:63:12: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: ...

Number of similar (compiler,implementation) pairs: 1, namely:
Compiler | Implementations
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | x86_64_shld

Compiler output

Implementation: crypto_hash/keccakc768/xopu24
Compiler: gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv
KeccakF-1600-opt64.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/x86intrin.h:52:0,
KeccakF-1600-opt64.c: from KeccakF-1600-opt64.c:74:
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c: In function 'KeccakPermutationOnWords':
KeccakF-1600-opt64.c: /usr/lib/gcc/x86_64-linux-gnu/4.9/include/xopintrin.h:266:1: error: inlining failed in call to always_inline '_mm_roti_epi64': target specific option mismatch
KeccakF-1600-opt64.c: _mm_roti_epi64(__m128i __A, const int __B)
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c:90:33: error: called from here
KeccakF-1600-opt64.c: #define XOR128(a, b) _mm_xor_si128(a, b)
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-xop.macros:40:11: note: in expansion of macro 'XOR128'
KeccakF-1600-opt64.c: Dei = XOR128(Cae, ROL6464same(Cio, 1)); \
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-xop.macros:53:5: note: in expansion of macro 'computeD'
KeccakF-1600-opt64.c: computeD \
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-unrolling.macros:17:5: note: in expansion of macro 'thetaRhoPiChiIotaPrepareTheta'
KeccakF-1600-opt64.c: thetaRhoPiChiIotaPrepareTheta( 0, A, E) \
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c:185:5: note: in expansion of macro 'rounds'
KeccakF-1600-opt64.c: rounds
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/x86intrin.h:52:0,
KeccakF-1600-opt64.c: from KeccakF-1600-opt64.c:74:
KeccakF-1600-opt64.c: /usr/lib/gcc/x86_64-linux-gnu/4.9/include/xopintrin.h:266:1: error: inlining failed in call to always_inline '_mm_roti_epi64': target specific option mismatch
KeccakF-1600-opt64.c: _mm_roti_epi64(__m128i __A, const int __B)
KeccakF-1600-opt64.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | xopu24
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | xopu24
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | xopu24
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | xopu24