Implementation notes: amd64, slide, crypto_hash/bmw256

Computer: slide
Architecture: amd64
CPU ID: GenuineIntel-00040651-bfebfbff
SUPERCOP version: 20160806
Operation: crypto_hash
Primitive: bmw256
TimeImplementationCompilerBenchmark dateSUPERCOP version
7620amd_k10/x86-64/sse2gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
7884core_i7_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
7904core_2_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
7912core_i7_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
7928core_i7_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
7940core_2_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
7940core_2_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
7952core_2_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
8352core_2_65nm/x86-64/ssse3_v1gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
8392opt29_v5_ssse3_asm64gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
8392core_2_65nm/x86-64/ssse3_v1gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
8400core_2_65nm/x86-64/ssse3_v1gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
8400core_2_65nm/x86-64/ssse3_v1gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
8420opt29_v5_ssse3_asm64gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
8420opt29_v5_ssse3_asm64gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
8428opt29_v5_ssse3_asm64gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
8544amd_k10/x86-64/sse2gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
8556amd_k10/x86-64/sse2gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
8568amd_k10/x86-64/sse2gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
8656opt31ssse3_asm64gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
8660opt31ssse3_asm64gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
8740opt31ssse3_asm64gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
8808core_i7_45nm/x86-64/sse4_v1gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
8860opt31ssse3_asm64gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
9330amd_k8/x86-64/noSSEgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
10516amd_k8/x86-64/noSSEgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
10516amd_k8/x86-64/noSSEgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
10736amd_k8/x86-64/noSSEgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
11193optabegcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
11684optabegcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
11748optbbegcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
11820optc01gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
11968optc01gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
11972optbbegcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
12064optc01gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
12112optabegcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
12204optabegcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
12240optc03gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
12264optc03gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
12288optc02gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
12292optc04gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
12296optbbegcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
12308optc03gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
12412optc04gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
12424optc02gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
12428optc04gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
12452optbbegcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
12592optc02gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
13008sphlibgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
13036optbgbegcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
13068optbgbegcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
13096optc01gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
13100sphlibgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
13152optbgbegcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
13160sphlibgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
13209sphlibgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
13712optbgbegcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
14260optc03gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
14320optc04gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
14568sphlib-smallgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
14720sphlib-smallgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
14740optc02gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
14908sphlib-smallgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
15292sphlib-smallgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806
19088refgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2016090620160806
19160refgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2016090620160806
19188refgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2016090620160806
32836refgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2016090620160806

Compiler output

Implementation: crypto_hash/bmw256/optc31ssse3
Compiler: gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv
Compress256_sse_31.c: Compress256_sse_31.c: In function 'Compress256':
Compress256_sse_31.c: Compress256_sse_31.c:374:18: warning: passing argument 1 of '_mm_store_si128' from incompatible pointer type
Compress256_sse_31.c: _mm_store_si128(&p256[00], copyTemp);
Compress256_sse_31.c: ^
Compress256_sse_31.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/pmmintrin.h:31:0,
Compress256_sse_31.c: from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/tmmintrin.h:31,
Compress256_sse_31.c: from Compress256_sse_31.c:12:
Compress256_sse_31.c: /usr/lib/gcc/x86_64-linux-gnu/4.9/include/emmintrin.h:704:1: note: expected '__vector(2) long long int *' but argument is of type 'u_int32_t *'
Compress256_sse_31.c: _mm_store_si128 (__m128i *__P, __m128i __B)
Compress256_sse_31.c: ^
Compress256_sse_31.c: Compress256_sse_31.c:377:28: warning: passing argument 1 of '_mm_load_si128' from incompatible pointer type
Compress256_sse_31.c: copyTemp = _mm_load_si128(&hashState256(state)->gt;DoublePipe[ 4]);
Compress256_sse_31.c: ^
Compress256_sse_31.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/pmmintrin.h:31:0,
Compress256_sse_31.c: from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/tmmintrin.h:31,
Compress256_sse_31.c: from Compress256_sse_31.c:12:
Compress256_sse_31.c: /usr/lib/gcc/x86_64-linux-gnu/4.9/include/emmintrin.h:686:1: note: expected 'const __vector(2) long long int *' but argument is of type 'u_int32_t *'
Compress256_sse_31.c: _mm_load_si128 (__m128i const *__P)
Compress256_sse_31.c: ^
Compress256_sse_31.c: Compress256_sse_31.c:378:18: warning: passing argument 1 of '_mm_store_si128' from incompatible pointer type
Compress256_sse_31.c: _mm_store_si128(&p256[04], copyTemp);
Compress256_sse_31.c: ^
Compress256_sse_31.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/pmmintrin.h:31:0,
Compress256_sse_31.c: from /usr/lib/gcc/x86_64-linux-gnu/4.9/include/tmmintrin.h:31,
Compress256_sse_31.c: from Compress256_sse_31.c:12:
Compress256_sse_31.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv optc31ssse3
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv optc31ssse3
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv optc31ssse3
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv optc31ssse3

Compiler output

Implementation: crypto_hash/bmw256/opt31ssse3_asm64
Compiler: gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv
wrapper.c: wrapper.c:37:0: warning: "crypto_hash_BYTES" redefined
wrapper.c: #define crypto_hash_BYTES 32
wrapper.c: ^
wrapper.c: In file included from wrapper.c:20:0:
wrapper.c: crypto_hash.h:7:0: note: this is the location of the previous definition
wrapper.c: #define crypto_hash_BYTES crypto_hash_bmw256_BYTES
wrapper.c: ^
wrapper.c: wrapper.c: In function 'crypto_hash_bmw256_opt31ssse3_asm64':
wrapper.c: wrapper.c:238:34: warning: passing argument 3 of 'Compress256' from incompatible pointer type
wrapper.c: Compress256(data32, data32 +16, CONST32final-4); // TODO: This is a HACK...
wrapper.c: ^
wrapper.c: wrapper.c:39:8: note: expected 'struct hashState *' but argument is of type 'u_int32_t *'
wrapper.c: extern Compress256(u_int32_t *data32, u_int32_t *data32_end, hashState *state);
wrapper.c: ^

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv opt31ssse3_asm64
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv opt31ssse3_asm64
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv opt31ssse3_asm64
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv opt31ssse3_asm64