Implementation notes: amd64, waldorf, crypto_hash/keccak

Computer: waldorf
Architecture: amd64
CPU ID: GenuineIntel-000106e5-bfebfbff
SUPERCOP version: 20160715
Operation: crypto_hash
Primitive: keccak
Time | Implementation | Compiler | Benchmark date | SUPERCOP version
45780 | opt64lcu24shld | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
46176 | opt64lcu6 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
47500 | x86_64_asm | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
47848 | opt64lcu24 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
47928 | opt64lcu6 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
48920 | x86_64_shld | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
49016 | opt64u6 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
49424 | opt64lcu6 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
49636 | opt64lcu24 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
50116 | x86_64_asm | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
50120 | opt64lcu24 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
50496 | x86_64_shld | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
50536 | opt64lcu24shld | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
50624 | opt64lcu24 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
50720 | x86_64_shld | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
50956 | simple | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
51508 | opt64lcu24shld | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
51708 | opt64lcu24 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
51876 | x86_64_asm | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
52028 | simple | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
52700 | opt64lcu6 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
52708 | inplace | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
53020 | x86_64_asm | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
53032 | opt64u6 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
53212 | x86_64_shld | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
53716 | opt64u6 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
53728 | opt64u6 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
53804 | inplace | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
53892 | simple | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
54320 | opt64lcu6 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
54488 | sseu2 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
54640 | inplace | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
54872 | sseu2 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
55412 | inplace | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
55456 | inplace | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
55632 | sseu2 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
55768 | opt64lcu24shld | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
55972 | sseu2 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
57972 | simple | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
58152 | opt64lcu24shld | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
58328 | opt64u6 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
58580 | simple | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
61884 | mmxu1 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
63128 | sseu2 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
64792 | mmxu1 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
65980 | mmxu1 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
68736 | mmxu1 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
83032 | mmxu1 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
100908 | opt32biT-s2lcu4 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
104900 | opt32biT-s2lcu4 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
107760 | opt32bi-rvku2 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
110512 | opt32bi-s2lcu4 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
111828 | opt32biT-s2lcu4 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
112372 | opt32bi-s2lcu4 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
113644 | inplace32bi | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
116600 | opt32biT-s2lcu4 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
118736 | opt32biT-s2lcu4 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
119920 | simple32bi | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
119976 | compact | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
120428 | opt32bi-s2lcu4 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
121540 | opt32bi-s2lcu4 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
121920 | inplace32bi | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
122256 | opt32bi-rvku2 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
123976 | opt32bi-rvku2 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
127344 | simple32bi | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
129188 | opt32bi-rvku2 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
130192 | opt32bi-s2lcu4 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
130252 | simple32bi | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
130568 | opt32bi-rvku2 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
131880 | inplace32bi | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
132852 | simple32bi | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
132884 | simple32bi | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
134808 | inplace32bi | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
135832 | compact | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
140508 | inplace32bi | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
213576 | compact | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715
222240 | compact | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
228204 | compact | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
397852 | compact8 | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
476768 | compact8 | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20160718 | 20160715
491180 | compact8 | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20160718 | 20160715
504612 | compact8 | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20160718 | 20160715
937500 | compact8 | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20160718 | 20160715

Compiler output

Implementation: crypto_hash/keccak/xopu24
Compiler: clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c:185:5: warning: implicit declaration of function '_mm_roti_epi64' is invalid in C99 [-Wimplicit-function-declaration]
KeccakF-1600-opt64.c: rounds
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: ./KeccakF-1600-unrolling.macros:17:5: note: expanded from macro 'rounds'
KeccakF-1600-opt64.c: thetaRhoPiChiIotaPrepareTheta( 0, A, E) \
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: ./KeccakF-1600-xop.macros:53:5: note: expanded from macro 'thetaRhoPiChiIotaPrepareTheta'
KeccakF-1600-opt64.c: computeD \
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: ./KeccakF-1600-xop.macros:40:23: note: expanded from macro 'computeD'
KeccakF-1600-opt64.c: Dei = XOR128(Cae, ROL6464same(Cio, 1)); \
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c:102:33: note: expanded from macro 'ROL6464same'
KeccakF-1600-opt64.c: #define ROL6464same(a, o) _mm_roti_epi64(a, o)
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c:90:50: note: expanded from macro 'XOR128'
KeccakF-1600-opt64.c: #define XOR128(a, b) _mm_xor_si128(a, b)
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c:185:5: error: passing 'int' to parameter of incompatible type '__m128i' (vector of 2 'long long' values)
KeccakF-1600-opt64.c: rounds
KeccakF-1600-opt64.c: ^~~~~~
KeccakF-1600-opt64.c: ./KeccakF-1600-unrolling.macros:17:5: note: expanded from macro 'rounds'
KeccakF-1600-opt64.c: thetaRhoPiChiIotaPrepareTheta( 0, A, E) \
KeccakF-1600-opt64.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
KeccakF-1600-opt64.c: ./KeccakF-1600-xop.macros:53:5: note: expanded from macro 'thetaRhoPiChiIotaPrepareTheta'
KeccakF-1600-opt64.c: ...

Number of similar (compiler,implementation) pairs: 1, namely:
Compiler | Implementations
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | xopu24

Compiler output

Implementation: crypto_hash/keccak/x86_64_asm
Compiler: clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:50:16: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ apState, %rdi
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:51:16: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ apInput, %rsi
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:52:18: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ aNbrWords, %rdx
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:55:16: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ xpState, %r9
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:58:12: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ rT1, %rax
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:59:16: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ rpState, %rdi
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:60:16: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ rpStack, %rsp
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:62:12: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: .equ rDa, %rbx
KeccakF-1600-x86-64-gas.s: ^
KeccakF-1600-x86-64-gas.s: KeccakF-1600-x86-64-gas.s:63:12: error: unknown token in expression
KeccakF-1600-x86-64-gas.s: ...

Number of similar (compiler,implementation) pairs: 1, namely:
Compiler | Implementations
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | x86_64_asm

Compiler output

Implementation: crypto_hash/keccak/x86_64_shld
Compiler: clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:50:16: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ apState, %rdi
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:51:16: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ apInput, %rsi
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:52:18: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ aNbrWords, %rdx
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:55:16: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ xpState, %r9
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:58:12: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ rT1, %rax
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:59:16: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ rpState, %rdi
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:60:16: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ rpStack, %rsp
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:62:12: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: .equ rDa, %rbx
KeccakF-1600-x86-64-shld-gas.s: ^
KeccakF-1600-x86-64-shld-gas.s: KeccakF-1600-x86-64-shld-gas.s:63:12: error: unknown token in expression
KeccakF-1600-x86-64-shld-gas.s: ...

Number of similar (compiler,implementation) pairs: 1, namely:
Compiler | Implementations
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | x86_64_shld

Compiler output

Implementation: crypto_hash/keccak/xopu24
Compiler: gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv
KeccakF-1600-opt64.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/x86intrin.h:52:0,
KeccakF-1600-opt64.c: from KeccakF-1600-opt64.c:74:
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c: In function 'KeccakPermutationOnWords':
KeccakF-1600-opt64.c: /usr/lib/gcc/x86_64-linux-gnu/4.9/include/xopintrin.h:266:1: error: inlining failed in call to always_inline '_mm_roti_epi64': target specific option mismatch
KeccakF-1600-opt64.c: _mm_roti_epi64(__m128i __A, const int __B)
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c:90:33: error: called from here
KeccakF-1600-opt64.c: #define XOR128(a, b) _mm_xor_si128(a, b)
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-xop.macros:40:11: note: in expansion of macro 'XOR128'
KeccakF-1600-opt64.c: Dei = XOR128(Cae, ROL6464same(Cio, 1)); \
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-xop.macros:53:5: note: in expansion of macro 'computeD'
KeccakF-1600-opt64.c: computeD \
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-unrolling.macros:17:5: note: in expansion of macro 'thetaRhoPiChiIotaPrepareTheta'
KeccakF-1600-opt64.c: thetaRhoPiChiIotaPrepareTheta( 0, A, E) \
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: KeccakF-1600-opt64.c:185:5: note: in expansion of macro 'rounds'
KeccakF-1600-opt64.c: rounds
KeccakF-1600-opt64.c: ^
KeccakF-1600-opt64.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/x86intrin.h:52:0,
KeccakF-1600-opt64.c: from KeccakF-1600-opt64.c:74:
KeccakF-1600-opt64.c: /usr/lib/gcc/x86_64-linux-gnu/4.9/include/xopintrin.h:266:1: error: inlining failed in call to always_inline '_mm_roti_epi64': target specific option mismatch
KeccakF-1600-opt64.c: _mm_roti_epi64(__m128i __A, const int __B)
KeccakF-1600-opt64.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | xopu24
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | xopu24
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | xopu24
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | xopu24