Implementation notes: amd64, utrecht, crypto_hash/bmw256

Computer: utrecht
Architecture: amd64
CPU ID: GenuineIntel-000006fb-bfebfbff
SUPERCOP version: 20160806
Operation: crypto_hash
Primitive: bmw256
TimeImplementationCompilerBenchmark dateSUPERCOP version
9693core_2_65nm/x86-64/ssse3_v1gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
9954core_2_65nm/x86-64/ssse3_v1gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
10881opt31ssse3_asm64gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
10890opt31ssse3_asm64gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
10899opt31ssse3_asm64gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
10980opt31ssse3_asm64gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
12411amd_k10/x86-64/sse2gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
12429amd_k10/x86-64/sse2gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
12537amd_k10/x86-64/sse2gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
12888amd_k8/x86-64/noSSEgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
13032amd_k8/x86-64/noSSEgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
13878optc01gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
14112optc01gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
14121optabegcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
14157optc01gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
14184optbbegcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
14193optc03gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
14247optc04gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
14283optc02gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
14346optc01gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
14409optbgbegcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
14616optbgbegcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
14706optbgbegcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
14859core_2_65nm/x86-64/ssse3_v1gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
15129core_2_65nm/x86-64/ssse3_v1gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
15201optbbegcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
15219optbbegcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
15219optabegcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
15273opt29_v5_ssse3_asm64gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
15300optabegcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
15300opt29_v5_ssse3_asm64gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
15327opt29_v5_ssse3_asm64gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
15336sphlibgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
15345optabegcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
15426optbbegcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
15480optc03gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
15480optbgbegcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
15489optc03gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
15489sphlibgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
15534sphlibgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
15606optc04gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
15642opt29_v5_ssse3_asm64gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
15687optc04gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
15849optc02gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
15894optc04gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
15975sphlib-smallgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
16029optc02gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
16029optc02gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
16146optc03gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
16326sphlib-smallgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
16578sphlib-smallgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
17955amd_k10/x86-64/sse2gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
18441sphlibgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
18828sphlib-smallgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731
19386amd_k8/x86-64/noSSEgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
19476amd_k8/x86-64/noSSEgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
27054refgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016080420160731
27225refgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016080420160731
27234refgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016080420160731
33156refgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016080420160731

Test failure

Implementation: crypto_hash/bmw256/core_2_45nm/x86-64/sse4_v1
Compiler: gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv
error 111

Number of similar (compiler,implementation) pairs: 8, namely:
CompilerImplementations
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv core_2_45nm/x86-64/sse4_v1 core_i7_45nm/x86-64/sse4_v1
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv core_2_45nm/x86-64/sse4_v1 core_i7_45nm/x86-64/sse4_v1
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv core_2_45nm/x86-64/sse4_v1 core_i7_45nm/x86-64/sse4_v1
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv core_2_45nm/x86-64/sse4_v1 core_i7_45nm/x86-64/sse4_v1

Compiler output

Implementation: crypto_hash/bmw256/optc31ssse3
Compiler: gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv
Compress256_sse_31.c: Compress256_sse_31.c: In function 'Compress256':
Compress256_sse_31.c: Compress256_sse_31.c:374:2: warning: passing argument 1 of '_mm_store_si128' from incompatible pointer type [enabled by default]
Compress256_sse_31.c: _mm_store_si128(&p256[00], copyTemp);
Compress256_sse_31.c: ^
Compress256_sse_31.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/4.8/include/pmmintrin.h:35:0,
Compress256_sse_31.c: from /usr/lib/gcc/x86_64-linux-gnu/4.8/include/tmmintrin.h:35,
Compress256_sse_31.c: from Compress256_sse_31.c:12:
Compress256_sse_31.c: /usr/lib/gcc/x86_64-linux-gnu/4.8/include/emmintrin.h:694:1: note: expected '__vector(2) long long int *' but argument is of type 'u_int32_t *'
Compress256_sse_31.c: _mm_store_si128 (__m128i *__P, __m128i __B)
Compress256_sse_31.c: ^
Compress256_sse_31.c: Compress256_sse_31.c:377:2: warning: passing argument 1 of '_mm_load_si128' from incompatible pointer type [enabled by default]
Compress256_sse_31.c: copyTemp = _mm_load_si128(&hashState256(state)->gt;DoublePipe[ 4]);
Compress256_sse_31.c: ^
Compress256_sse_31.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/4.8/include/pmmintrin.h:35:0,
Compress256_sse_31.c: from /usr/lib/gcc/x86_64-linux-gnu/4.8/include/tmmintrin.h:35,
Compress256_sse_31.c: from Compress256_sse_31.c:12:
Compress256_sse_31.c: /usr/lib/gcc/x86_64-linux-gnu/4.8/include/emmintrin.h:676:1: note: expected 'const __vector(2) long long int *' but argument is of type 'u_int32_t *'
Compress256_sse_31.c: _mm_load_si128 (__m128i const *__P)
Compress256_sse_31.c: ^
Compress256_sse_31.c: Compress256_sse_31.c:378:2: warning: passing argument 1 of '_mm_store_si128' from incompatible pointer type [enabled by default]
Compress256_sse_31.c: _mm_store_si128(&p256[04], copyTemp);
Compress256_sse_31.c: ^
Compress256_sse_31.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/4.8/include/pmmintrin.h:35:0,
Compress256_sse_31.c: from /usr/lib/gcc/x86_64-linux-gnu/4.8/include/tmmintrin.h:35,
Compress256_sse_31.c: from Compress256_sse_31.c:12:
Compress256_sse_31.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv optc31ssse3
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv optc31ssse3
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv optc31ssse3
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv optc31ssse3

Compiler output

Implementation: crypto_hash/bmw256/opt31ssse3_asm64
Compiler: gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv
wrapper.c: wrapper.c:37:0: warning: "crypto_hash_BYTES" redefined [enabled by default]
wrapper.c: #define crypto_hash_BYTES 32
wrapper.c: ^
wrapper.c: In file included from wrapper.c:20:0:
wrapper.c: crypto_hash.h:7:0: note: this is the location of the previous definition
wrapper.c: #define crypto_hash_BYTES crypto_hash_bmw256_BYTES
wrapper.c: ^
wrapper.c: wrapper.c: In function 'crypto_hash_bmw256_opt31ssse3_asm64':
wrapper.c: wrapper.c:238:2: warning: passing argument 3 of 'Compress256' from incompatible pointer type [enabled by default]
wrapper.c: Compress256(data32, data32 +16, CONST32final-4); // TODO: This is a HACK...
wrapper.c: ^
wrapper.c: wrapper.c:39:8: note: expected 'struct hashState *' but argument is of type 'u_int32_t *'
wrapper.c: extern Compress256(u_int32_t *data32, u_int32_t *data32_end, hashState *state);
wrapper.c: ^

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv opt31ssse3_asm64
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv opt31ssse3_asm64
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv opt31ssse3_asm64
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv opt31ssse3_asm64