Implementation notes: amd64, waldorf, crypto_hash/bmw256

Computer: waldorf
Architecture: amd64
CPU ID: GenuineIntel-000106e5-bfebfbff
SUPERCOP version: 20160715
Operation: crypto_hash
Primitive: bmw256
TimeImplementationCompilerBenchmark dateSUPERCOP version
14704opt29_v5_ssse3_asm64gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
15440opt29_v5_ssse3_asm64clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
15516core_i7_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
15764core_2_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
15832core_i7_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
15832core_i7_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
15912core_i7_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
16268opt29_v5_ssse3_asm64gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
16376amd_k10/x86-64/sse2gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
16456core_2_65nm/x86-64/ssse3_v1gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
16480opt29_v5_ssse3_asm64gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
16568core_2_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
16772opt31ssse3_asm64gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
16864core_2_65nm/x86-64/ssse3_v1gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
16896core_2_45nm/x86-64/sse4_v1clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
16928core_2_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
16988core_i7_45nm/x86-64/sse4_v1clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
17272amd_k10/x86-64/sse2gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
17304core_2_65nm/x86-64/ssse3_v1gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
17316amd_k10/x86-64/sse2gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
17532core_2_65nm/x86-64/ssse3_v1gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
17584amd_k10/x86-64/sse2clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
17588core_2_65nm/x86-64/ssse3_v1clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
17636amd_k10/x86-64/sse2gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
17648core_2_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
17876opt29_v5_ssse3_asm64gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
18328opt31ssse3_asm64gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
19280opt31ssse3_asm64clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
19752opt31ssse3_asm64gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
20252opt31ssse3_asm64gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
23580amd_k8/x86-64/noSSEgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
24140amd_k8/x86-64/noSSEclang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
25080amd_k8/x86-64/noSSEgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
26268amd_k8/x86-64/noSSEgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
26436amd_k8/x86-64/noSSEgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
26704optc03gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
26960optc04gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
27376optbbegcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
27404optc01gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
27532optabegcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
27600optc01gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
27796optc04gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
28188optc02gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
28324optabegcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
28612optabegcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
28692optbbegcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
29268optc02gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
29300optabeclang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
29540optabegcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
29696optbbegcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
29968optbbeclang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
30204optc02gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
30316sphlibgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
30360optc03gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
30572sphlibgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
30772optc01gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
30852optc04gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
30920optbgbegcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
30924optbbegcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
30936optc03gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
31000optc03gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
31276optc04gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
31344optc01clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
31508optc03clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
31660sphlibclang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
31912optbgbegcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
31992optbgbegcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
32000optc02gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
32004sphlib-smallgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
32404sphlib-smallgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
32456optbgbeclang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
32576optbgbegcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
33040sphlib-smallgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
33136optc02clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
33544sphlibgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
34796sphlibgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
34988optc01gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
35632optc04clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
35956sphlib-smallgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
38240sphlib-smallclang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715
48420refgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016071820160715
48568refgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016071820160715
51760refgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016071820160715
55192refgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016071820160715
61696refclang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2016071820160715

Compiler output

Implementation: crypto_hash/bmw256/optc31ssse3
Compiler: clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments
Compress256_sse_31.c: Compress256_sse_31.c:374:18: warning: incompatible pointer types passing 'u_int32_t *' (aka 'unsigned int *') to parameter of type '__m128i *' [-Wincompatible-pointer-types]
Compress256_sse_31.c: _mm_store_si128(&p256[00], copyTemp);
Compress256_sse_31.c: ^~~~~~~~~
Compress256_sse_31.c: /usr/include/clang/3.5.0/include/emmintrin.h:1177:26: note: passing argument to parameter '__p' here
Compress256_sse_31.c: _mm_store_si128(__m128i *__p, __m128i __b)
Compress256_sse_31.c: ^
Compress256_sse_31.c: Compress256_sse_31.c:377:28: warning: incompatible pointer types passing 'u_int32_t *' (aka 'unsigned int *') to parameter of type 'const __m128i *' [-Wincompatible-pointer-types]
Compress256_sse_31.c: copyTemp = _mm_load_si128(&hashState256(state)->gt;DoublePipe[ 4]);
Compress256_sse_31.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
Compress256_sse_31.c: /usr/include/clang/3.5.0/include/emmintrin.h:1063:31: note: passing argument to parameter '__p' here
Compress256_sse_31.c: _mm_load_si128(__m128i const *__p)
Compress256_sse_31.c: ^
Compress256_sse_31.c: Compress256_sse_31.c:378:18: warning: incompatible pointer types passing 'u_int32_t *' (aka 'unsigned int *') to parameter of type '__m128i *' [-Wincompatible-pointer-types]
Compress256_sse_31.c: _mm_store_si128(&p256[04], copyTemp);
Compress256_sse_31.c: ^~~~~~~~~
Compress256_sse_31.c: /usr/include/clang/3.5.0/include/emmintrin.h:1177:26: note: passing argument to parameter '__p' here
Compress256_sse_31.c: _mm_store_si128(__m128i *__p, __m128i __b)
Compress256_sse_31.c: ^
Compress256_sse_31.c: Compress256_sse_31.c:379:28: warning: incompatible pointer types passing 'u_int32_t *' (aka 'unsigned int *') to parameter of type 'const __m128i *' [-Wincompatible-pointer-types]
Compress256_sse_31.c: copyTemp = _mm_load_si128(&hashState256(state)->gt;DoublePipe[ 8]);
Compress256_sse_31.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
Compress256_sse_31.c: /usr/include/clang/3.5.0/include/emmintrin.h:1063:31: note: passing argument to parameter '__p' here
Compress256_sse_31.c: _mm_load_si128(__m128i const *__p)
Compress256_sse_31.c: ^
Compress256_sse_31.c: Compress256_sse_31.c:380:18: warning: incompatible pointer types passing 'u_int32_t *' (aka 'unsigned int *') to parameter of type '__m128i *' [-Wincompatible-pointer-types]
Compress256_sse_31.c: ...

Number of similar (compiler,implementation) pairs: 1, namely:
CompilerImplementations
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments optc31ssse3

Compiler output

Implementation: crypto_hash/bmw256/opt31ssse3_asm64
Compiler: clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments
wrapper.c: wrapper.c:37:9: warning: 'crypto_hash_BYTES' macro redefined [-Wmacro-redefined]
wrapper.c: #define crypto_hash_BYTES 32
wrapper.c: ^
wrapper.c: ./crypto_hash.h:7:9: note: previous definition is here
wrapper.c: #define crypto_hash_BYTES crypto_hash_bmw256_BYTES
wrapper.c: ^
wrapper.c: wrapper.c:39:8: warning: type specifier missing, defaults to 'int' [-Wimplicit-int]
wrapper.c: extern Compress256(u_int32_t *data32, u_int32_t *data32_end, hashState *state);
wrapper.c: ~~~~~~ ^
wrapper.c: wrapper.c:238:34: warning: incompatible pointer types passing 'u_int32_t *' (aka 'unsigned int *') to parameter of type 'hashState *' [-Wincompatible-pointer-types]
wrapper.c: Compress256(data32, data32 +16, CONST32final-4); // TODO: This is a HACK...
wrapper.c: ^~~~~~~~~~~~~~
wrapper.c: wrapper.c:39:73: note: passing argument to parameter 'state' here
wrapper.c: extern Compress256(u_int32_t *data32, u_int32_t *data32_end, hashState *state);
wrapper.c: ^
wrapper.c: 3 warnings generated.

Number of similar (compiler,implementation) pairs: 1, namely:
CompilerImplementations
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments opt31ssse3_asm64

Compiler output

Implementation: crypto_hash/bmw256/optc31ssse3
Compiler: gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv
Compress256_sse_31.c: Compress256_sse_31.c: In function 'Compress256':
Compress256_sse_31.c: Compress256_sse_31.c:374:18: warning: passing argument 1 of '_mm_store_si128' from incompatible pointer type
Compress256_sse_31.c: _mm_store_si128(&p256[00], copyTemp);
Compress256_sse_31.c: ^
Compress256_sse_31.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/pmmintrin.h:31:0,
Compress256_sse_31.c: from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/tmmintrin.h:31,
Compress256_sse_31.c: from Compress256_sse_31.c:12:
Compress256_sse_31.c: /usr/lib/gcc/x86_64-linux-gnu/4.9/include/emmintrin.h:704:1: note: expected '__vector(2) long long int *' but argument is of type 'u_int32_t *'
Compress256_sse_31.c: _mm_store_si128 (__m128i *__P, __m128i __B)
Compress256_sse_31.c: ^
Compress256_sse_31.c: Compress256_sse_31.c:377:28: warning: passing argument 1 of '_mm_load_si128' from incompatible pointer type
Compress256_sse_31.c: copyTemp = _mm_load_si128(&hashState256(state)->gt;DoublePipe[ 4]);
Compress256_sse_31.c: ^
Compress256_sse_31.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/pmmintrin.h:31:0,
Compress256_sse_31.c: from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/tmmintrin.h:31,
Compress256_sse_31.c: from Compress256_sse_31.c:12:
Compress256_sse_31.c: /usr/lib/gcc/x86_64-linux-gnu/4.9/include/emmintrin.h:686:1: note: expected 'const __vector(2) long long int *' but argument is of type 'u_int32_t *'
Compress256_sse_31.c: _mm_load_si128 (__m128i const *__P)
Compress256_sse_31.c: ^
Compress256_sse_31.c: Compress256_sse_31.c:378:18: warning: passing argument 1 of '_mm_store_si128' from incompatible pointer type
Compress256_sse_31.c: _mm_store_si128(&p256[04], copyTemp);
Compress256_sse_31.c: ^
Compress256_sse_31.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/pmmintrin.h:31:0,
Compress256_sse_31.c: from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/tmmintrin.h:31,
Compress256_sse_31.c: from Compress256_sse_31.c:12:
Compress256_sse_31.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv optc31ssse3
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv optc31ssse3
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv optc31ssse3
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv optc31ssse3

Compiler output

Implementation: crypto_hash/bmw256/opt31ssse3_asm64
Compiler: gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv
wrapper.c: wrapper.c:37:0: warning: "crypto_hash_BYTES" redefined
wrapper.c: #define crypto_hash_BYTES 32
wrapper.c: ^
wrapper.c: In file included from wrapper.c:20:0:
wrapper.c: crypto_hash.h:7:0: note: this is the location of the previous definition
wrapper.c: #define crypto_hash_BYTES crypto_hash_bmw256_BYTES
wrapper.c: ^
wrapper.c: wrapper.c: In function 'crypto_hash_bmw256_opt31ssse3_asm64':
wrapper.c: wrapper.c:238:34: warning: passing argument 3 of 'Compress256' from incompatible pointer type
wrapper.c: Compress256(data32, data32 +16, CONST32final-4); // TODO: This is a HACK...
wrapper.c: ^
wrapper.c: wrapper.c:39:8: note: expected 'struct hashState *' but argument is of type 'u_int32_t *'
wrapper.c: extern Compress256(u_int32_t *data32, u_int32_t *data32_end, hashState *state);
wrapper.c: ^

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv opt31ssse3_asm64
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv opt31ssse3_asm64
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv opt31ssse3_asm64
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv opt31ssse3_asm64