Implementation notes: amd64, hydra1, crypto_aead/tiaoxinv2

Computer: hydra1
Architecture: amd64
CPU ID: AuthenticAMD-00100fa0-178bfbff
SUPERCOP version: 20161220
Operation: crypto_aead
Primitive: tiaoxinv2
Time | Implementation | Compiler | Benchmark date | SUPERCOP version
50446 | ref | gcc -funroll-loops -Os -fomit-frame-pointer | 20161023 | 20161009
50466 | ref | gcc -funroll-loops -m64 -march=k8 -Os -fomit-frame-pointer | 20161023 | 20161009
50501 | ref | gcc -funroll-loops -m64 -Os -fomit-frame-pointer | 20161023 | 20161009
50531 | ref | gcc -funroll-loops -march=k8 -Os -fomit-frame-pointer | 20161023 | 20161009
50553 | ref | gcc -funroll-loops -m64 -march=barcelona -Os -fomit-frame-pointer | 20161023 | 20161009
50560 | ref | gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer | 20161023 | 20161009
50625 | ref | gcc -funroll-loops -march=barcelona -Os -fomit-frame-pointer | 20161023 | 20161009
51932 | ref | gcc -funroll-loops -O2 -fomit-frame-pointer | 20161023 | 20161009
51997 | ref | gcc -funroll-loops -m64 -O2 -fomit-frame-pointer | 20161023 | 20161009
52029 | ref | gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer | 20161023 | 20161009
52085 | ref | gcc -funroll-loops -m64 -march=k8 -O2 -fomit-frame-pointer | 20161023 | 20161009
52150 | ref | gcc -funroll-loops -O3 -fomit-frame-pointer | 20161023 | 20161009
52173 | ref | gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer | 20161023 | 20161009
52202 | ref | gcc -funroll-loops -m64 -march=k8 -O3 -fomit-frame-pointer | 20161023 | 20161009
52210 | ref | gcc -funroll-loops -m64 -march=barcelona -O2 -fomit-frame-pointer | 20161023 | 20161009
52224 | ref | gcc -funroll-loops -march=k8 -O3 -fomit-frame-pointer | 20161023 | 20161009
52251 | ref | gcc -funroll-loops -march=barcelona -O2 -fomit-frame-pointer | 20161023 | 20161009
52269 | ref | gcc -funroll-loops -m64 -O3 -fomit-frame-pointer | 20161023 | 20161009
52272 | ref | gcc -funroll-loops -m64 -march=barcelona -O3 -fomit-frame-pointer | 20161023 | 20161009
52333 | ref | gcc -funroll-loops -march=k8 -O2 -fomit-frame-pointer | 20161023 | 20161009
52345 | ref | gcc -funroll-loops -march=barcelona -O3 -fomit-frame-pointer | 20161023 | 20161009
54443 | ref | gcc -m64 -march=core2 -msse4.1 -Os -fomit-frame-pointer | 20161023 | 20161009
54456 | ref | gcc -m64 -march=corei7 -Os -fomit-frame-pointer | 20161023 | 20161009
54457 | ref | gcc -m64 -march=core2 -msse4 -Os -fomit-frame-pointer | 20161023 | 20161009
54459 | ref | gcc -m64 -march=core2 -Os -fomit-frame-pointer | 20161023 | 20161009
54507 | ref | gcc -Os -fomit-frame-pointer | 20161023 | 20161009
54556 | ref | gcc -march=barcelona -Os -fomit-frame-pointer | 20161023 | 20161009
54596 | ref | gcc -fno-schedule-insns -Os -fomit-frame-pointer | 20161023 | 20161009
54611 | ref | gcc -m64 -Os -fomit-frame-pointer | 20161023 | 20161009
54718 | ref | gcc -march=k8 -Os -fomit-frame-pointer | 20161023 | 20161009
54789 | ref | gcc -m64 -march=k8 -Os -fomit-frame-pointer | 20161023 | 20161009
54867 | ref | gcc -m64 -march=native -mtune=native -Os -fomit-frame-pointer | 20161023 | 20161009
55003 | ref | gcc -funroll-loops -m64 -march=nocona -Os -fomit-frame-pointer | 20161023 | 20161009
55151 | ref | gcc -march=nocona -Os -fomit-frame-pointer | 20161023 | 20161009
55173 | ref | gcc -funroll-loops -march=nocona -Os -fomit-frame-pointer | 20161023 | 20161009
55213 | ref | gcc -m64 -march=nocona -Os -fomit-frame-pointer | 20161023 | 20161009
55346 | ref | gcc -fno-schedule-insns -O -fomit-frame-pointer | 20161023 | 20161009
55367 | ref | gcc -O -fomit-frame-pointer | 20161023 | 20161009
55380 | ref | gcc -m64 -march=barcelona -Os -fomit-frame-pointer | 20161023 | 20161009
55397 | ref | gcc -m64 -O -fomit-frame-pointer | 20161023 | 20161009
55535 | ref | gcc -m64 -march=k8 -O -fomit-frame-pointer | 20161023 | 20161009
55577 | ref | gcc -m64 -march=corei7 -O -fomit-frame-pointer | 20161023 | 20161009
55657 | ref | gcc -funroll-loops -m64 -O -fomit-frame-pointer | 20161023 | 20161009
55659 | ref | gcc -m64 -march=core2 -msse4.1 -O -fomit-frame-pointer | 20161023 | 20161009
55661 | ref | gcc -march=k8 -O -fomit-frame-pointer | 20161023 | 20161009
55703 | ref | gcc -m64 -march=barcelona -O -fomit-frame-pointer | 20161023 | 20161009
55705 | ref | gcc -m64 -march=core2 -O -fomit-frame-pointer | 20161023 | 20161009
55728 | ref | gcc -m64 -march=native -mtune=native -O -fomit-frame-pointer | 20161023 | 20161009
55736 | ref | gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv | 20161023 | 20161009
55741 | ref | gcc -funroll-loops -O -fomit-frame-pointer | 20161023 | 20161009
55766 | ref | gcc -m64 -march=core2 -msse4 -O -fomit-frame-pointer | 20161023 | 20161009
55786 | ref | gcc -march=nocona -O -fomit-frame-pointer | 20161023 | 20161009
55792 | ref | gcc -march=barcelona -O -fomit-frame-pointer | 20161023 | 20161009
55800 | ref | gcc -funroll-loops -march=k8 -O -fomit-frame-pointer | 20161023 | 20161009
55806 | ref | gcc -m64 -O3 -fomit-frame-pointer | 20161023 | 20161009
55815 | ref | gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer | 20161023 | 20161009
55832 | ref | gcc -funroll-loops -m64 -march=k8 -O -fomit-frame-pointer | 20161023 | 20161009
55863 | ref | gcc -funroll-loops -march=nocona -O -fomit-frame-pointer | 20161023 | 20161009
55866 | ref | gcc -m64 -march=nocona -O -fomit-frame-pointer | 20161023 | 20161009
55901 | ref | gcc -O2 -fomit-frame-pointer | 20161023 | 20161009
55910 | ref | gcc -m64 -march=nocona -O3 -fomit-frame-pointer | 20161023 | 20161009
55921 | ref | gcc -O3 -fomit-frame-pointer | 20161023 | 20161009
55923 | ref | gcc -fno-schedule-insns -O3 -fomit-frame-pointer | 20161023 | 20161009
55958 | ref | gcc -m64 -O2 -fomit-frame-pointer | 20161023 | 20161009
55990 | ref | gcc -funroll-loops -march=barcelona -O -fomit-frame-pointer | 20161023 | 20161009
55998 | ref | gcc -march=nocona -O3 -fomit-frame-pointer | 20161023 | 20161009
56008 | ref | gcc -funroll-loops -m64 -march=nocona -O -fomit-frame-pointer | 20161023 | 20161009
56021 | ref | gcc -funroll-loops -m64 -march=barcelona -O -fomit-frame-pointer | 20161023 | 20161009
56022 | ref | gcc -m64 -march=barcelona -O3 -fomit-frame-pointer | 20161023 | 20161009
56059 | ref | gcc -m64 -march=corei7 -O2 -fomit-frame-pointer | 20161023 | 20161009
56072 | ref | gcc -m64 -march=native -mtune=native -O3 -fomit-frame-pointer | 20161023 | 20161009
56084 | ref | gcc -m64 -march=core2 -msse4.1 -O2 -fomit-frame-pointer | 20161023 | 20161009
56091 | ref | gcc -march=nocona -O2 -fomit-frame-pointer | 20161023 | 20161009
56093 | ref | gcc -m64 -march=core2 -msse4 -O2 -fomit-frame-pointer | 20161023 | 20161009
56094 | ref | gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv | 20161023 | 20161009
56124 | ref | gcc -funroll-loops -march=nocona -O3 -fomit-frame-pointer | 20161023 | 20161009
56128 | ref | gcc -m64 -march=nocona -O2 -fomit-frame-pointer | 20161023 | 20161009
56143 | ref | gcc -march=barcelona -O3 -fomit-frame-pointer | 20161023 | 20161009
56182 | ref | gcc -m64 -march=core2 -O2 -fomit-frame-pointer | 20161023 | 20161009
56186 | ref | gcc -m64 -march=native -mtune=native -O2 -fomit-frame-pointer | 20161023 | 20161009
56194 | ref | gcc -m64 -march=barcelona -O2 -fomit-frame-pointer | 20161023 | 20161009
56208 | ref | gcc -fno-schedule-insns -O2 -fomit-frame-pointer | 20161023 | 20161009
56209 | ref | gcc -m64 -march=k8 -O3 -fomit-frame-pointer | 20161023 | 20161009
56256 | ref | gcc -funroll-loops -m64 -march=nocona -O3 -fomit-frame-pointer | 20161023 | 20161009
56268 | ref | gcc -march=k8 -O3 -fomit-frame-pointer | 20161023 | 20161009
56274 | ref | gcc -march=barcelona -O2 -fomit-frame-pointer | 20161023 | 20161009
56497 | ref | gcc -march=k8 -O2 -fomit-frame-pointer | 20161023 | 20161009
56573 | ref | gcc -m64 -march=k8 -O2 -fomit-frame-pointer | 20161023 | 20161009
56594 | ref | gcc -funroll-loops -m64 -march=nocona -O2 -fomit-frame-pointer | 20161023 | 20161009
56704 | ref | gcc -funroll-loops -march=nocona -O2 -fomit-frame-pointer | 20161023 | 20161009
57173 | ref | gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv | 20161023 | 20161009
57398 | ref | gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv | 20161023 | 20161009
86227 | ref | clang -O3 -fwrapv -march=native -fomit-frame-pointer -Qunused-arguments | 20161023 | 20161009
86274 | ref | clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20161023 | 20161009
88443 | ref | clang -O3 -fomit-frame-pointer -Qunused-arguments | 20161023 | 20161009
88451 | ref | clang -mcpu=cortex-a9 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20161023 | 20161009
88467 | ref | clang -mcpu=cortex-a8 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20161023 | 20161009
88485 | ref | clang -mcpu=native -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments | 20161023 | 20161009
112769 | ref | gcc | 20161023 | 20161009
112773 | ref | gcc -funroll-loops | 20161023 | 20161009
112818 | ref | cc | 20161023 | 20161009

Test failure

Implementation: crypto_aead/tiaoxinv2/ref
Compiler: gcc -m64 -march=core2 -O3 -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 1, namely:
Compiler Implementations
gcc -m64 -march=core2 -O3 -fomit-frame-pointer ref

Compiler output

Implementation: crypto_aead/tiaoxinv2/nim
Compiler: cc
tiaoxin-optimized.c: In file included from tiaoxin-optimized.c:22:0:
tiaoxin-optimized.c: tiaoxin-optimized.c: In function 'tiaoxin_optimized_encrypt':
tiaoxin-optimized.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/wmmintrin.h:61:1: error: inlining failed in call to always_inline '_mm_aesenc_si128': target specific option mismatch
tiaoxin-optimized.c: _mm_aesenc_si128 (__m128i __X, __m128i __Y)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: error: called from here
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:42:108: note: in expansion of macro 'enc'
tiaoxin-optimized.c: #define RT6( T , M ) tmp = T[0];T[0] = enc(T[5],M);T[5] = T[4];T[4] = T[3];T[3] = T[2];T[2] = T[1];T[1] = enc(tmp,Z0);T[0] = xor(T[0], tmp);
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:50:1: note: in expansion of macro 'RT6'
tiaoxin-optimized.c: RT6( T6, M2 );
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:151:2: note: in expansion of macro 'UPDATE'
tiaoxin-optimized.c: UPDATE( T3 , T4 , T6, Z0 , Z1 , Z0 );
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: In file included from tiaoxin-optimized.c:22:0:
tiaoxin-optimized.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/wmmintrin.h:61:1: error: inlining failed in call to always_inline '_mm_aesenc_si128': target specific option mismatch
tiaoxin-optimized.c: _mm_aesenc_si128 (__m128i __X, __m128i __Y)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: error: called from here
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:42:41: note: in expansion of macro 'enc'
tiaoxin-optimized.c: ...

Number of similar (compiler,implementation) pairs: 92, namely:
Compiler Implementations
cc nim
gcc nim
gcc -O2 -fomit-frame-pointer nim
gcc -O3 -fomit-frame-pointer nim
gcc -O -fomit-frame-pointer nim
gcc -Os -fomit-frame-pointer nim
gcc -fno-schedule-insns -O2 -fomit-frame-pointer nim
gcc -fno-schedule-insns -O3 -fomit-frame-pointer nim
gcc -fno-schedule-insns -O -fomit-frame-pointer nim
gcc -fno-schedule-insns -Os -fomit-frame-pointer nim
gcc -funroll-loops nim
gcc -funroll-loops -O2 -fomit-frame-pointer nim
gcc -funroll-loops -O3 -fomit-frame-pointer nim
gcc -funroll-loops -O -fomit-frame-pointer nim
gcc -funroll-loops -Os -fomit-frame-pointer nim
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer nim
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer nim
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer nim
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer nim
gcc -funroll-loops -m64 -O2 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -O3 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -O -fomit-frame-pointer nim
gcc -funroll-loops -m64 -Os -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=barcelona -O2 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=barcelona -O3 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=barcelona -O -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=barcelona -Os -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=k8 -O2 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=k8 -O3 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=k8 -O -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=k8 -Os -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=nocona -O2 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=nocona -O3 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=nocona -O -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=nocona -Os -fomit-frame-pointer nim
gcc -funroll-loops -march=barcelona -O2 -fomit-frame-pointer nim
gcc -funroll-loops -march=barcelona -O3 -fomit-frame-pointer nim
gcc -funroll-loops -march=barcelona -O -fomit-frame-pointer nim
gcc -funroll-loops -march=barcelona -Os -fomit-frame-pointer nim
gcc -funroll-loops -march=k8 -O2 -fomit-frame-pointer nim
gcc -funroll-loops -march=k8 -O3 -fomit-frame-pointer nim
gcc -funroll-loops -march=k8 -O -fomit-frame-pointer nim
gcc -funroll-loops -march=k8 -Os -fomit-frame-pointer nim
gcc -funroll-loops -march=nocona -O2 -fomit-frame-pointer nim
gcc -funroll-loops -march=nocona -O3 -fomit-frame-pointer nim
gcc -funroll-loops -march=nocona -O -fomit-frame-pointer nim
gcc -funroll-loops -march=nocona -Os -fomit-frame-pointer nim
gcc -m64 -O2 -fomit-frame-pointer nim
gcc -m64 -O3 -fomit-frame-pointer nim
gcc -m64 -O -fomit-frame-pointer nim
gcc -m64 -Os -fomit-frame-pointer nim
gcc -m64 -march=core2 -O2 -fomit-frame-pointer nim
gcc -m64 -march=core2 -O3 -fomit-frame-pointer nim
gcc -m64 -march=core2 -O -fomit-frame-pointer nim
gcc -m64 -march=core2 -Os -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4.1 -O2 -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4.1 -O -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4.1 -Os -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4 -O2 -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4 -O -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4 -Os -fomit-frame-pointer nim
gcc -m64 -march=corei7 -O2 -fomit-frame-pointer nim
gcc -m64 -march=corei7 -O -fomit-frame-pointer nim
gcc -m64 -march=corei7 -Os -fomit-frame-pointer nim
gcc -m64 -march=k8 -O2 -fomit-frame-pointer nim
gcc -m64 -march=k8 -O3 -fomit-frame-pointer nim
gcc -m64 -march=k8 -O -fomit-frame-pointer nim
gcc -m64 -march=k8 -Os -fomit-frame-pointer nim
gcc -m64 -march=native -mtune=native -O2 -fomit-frame-pointer nim
gcc -m64 -march=native -mtune=native -O3 -fomit-frame-pointer nim
gcc -m64 -march=native -mtune=native -O -fomit-frame-pointer nim
gcc -m64 -march=native -mtune=native -Os -fomit-frame-pointer nim
gcc -m64 -march=nocona -O2 -fomit-frame-pointer nim
gcc -m64 -march=nocona -O3 -fomit-frame-pointer nim
gcc -m64 -march=nocona -O -fomit-frame-pointer nim
gcc -m64 -march=nocona -Os -fomit-frame-pointer nim
gcc -march=barcelona -O2 -fomit-frame-pointer nim
gcc -march=barcelona -O3 -fomit-frame-pointer nim
gcc -march=barcelona -O -fomit-frame-pointer nim
gcc -march=barcelona -Os -fomit-frame-pointer nim
gcc -march=k8 -O2 -fomit-frame-pointer nim
gcc -march=k8 -O3 -fomit-frame-pointer nim
gcc -march=k8 -O -fomit-frame-pointer nim
gcc -march=k8 -Os -fomit-frame-pointer nim
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv nim
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv nim
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv nim
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv nim
gcc -march=nocona -O2 -fomit-frame-pointer nim
gcc -march=nocona -O3 -fomit-frame-pointer nim
gcc -march=nocona -O -fomit-frame-pointer nim
gcc -march=nocona -Os -fomit-frame-pointer nim

Compiler output

Implementation: crypto_aead/tiaoxinv2/nim
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
tiaoxin-optimized.c: tiaoxin-optimized.c:126:7: error: always_inline function '_mm_shuffle_epi8' requires target feature 'ssse3', but would be inlined into function 'tiaoxin_optimized_encrypt' that is compiled without support for 'ssse3'
tiaoxin-optimized.c: W0 = _mm_shuffle_epi8( W0 , perm );
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:127:7: error: always_inline function '_mm_shuffle_epi8' requires target feature 'ssse3', but would be inlined into function 'tiaoxin_optimized_encrypt' that is compiled without support for 'ssse3'
tiaoxin-optimized.c: W1 = _mm_shuffle_epi8( W1 , perm );
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:137:2: error: always_inline function '_mm_aesenc_si128' requires target feature 'aes', but would be inlined into function 'tiaoxin_optimized_encrypt' that is compiled without support for 'aes'
tiaoxin-optimized.c: UPDATE( T3 , T4 , T6, Z0 , Z1 , Z0 );
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:47:46: note: expanded from macro 'UPDATE'
tiaoxin-optimized.c: #define UPDATE( T3 , T4 , T6 , M0 , M1 , M2 )\
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:40:41: note: expanded from macro '\
tiaoxin-optimized.c: RT3'
tiaoxin-optimized.c: #define RT3( T , M ) tmp = T[0];T[0] = enc(T[2],M);T[2] = T[1];T[1] = enc(tmp,Z0);T[0] = xor(T[0], tmp);
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: note: expanded from macro 'enc'
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:137:2: error: always_inline function '_mm_aesenc_si128' requires target feature 'aes', but would be inlined into function 'tiaoxin_optimized_encrypt' that is compiled without support for 'aes'
tiaoxin-optimized.c: tiaoxin-optimized.c:47:46: note: expanded from macro 'UPDATE'
tiaoxin-optimized.c: #define UPDATE( T3 , T4 , T6 , M0 , M1 , M2 )\
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:40:72: note: expanded from macro '\
tiaoxin-optimized.c: RT3'
tiaoxin-optimized.c: ...

Number of similar (compiler,implementation) pairs: 6, namely:
Compiler Implementations
clang -O3 -fomit-frame-pointer -Qunused-arguments nim
clang -O3 -fwrapv -march=native -fomit-frame-pointer -Qunused-arguments nim
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments nim
clang -mcpu=cortex-a8 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments nim
clang -mcpu=cortex-a9 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments nim
clang -mcpu=native -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments nim

Compiler output

Implementation: crypto_aead/tiaoxinv2/ref
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
tiaoxin-tablebased.c: tiaoxin-tablebased.c:257:12: warning: comparison of unsigned expression < 0 is always false [-Wtautological-compare]
tiaoxin-tablebased.c: if( clen < 0 ...
tiaoxin-tablebased.c: ~~~~ ^ ~
tiaoxin-tablebased.c: 1 warning generated.

Number of similar (compiler,implementation) pairs: 6, namely:
Compiler Implementations
clang -O3 -fomit-frame-pointer -Qunused-arguments ref
clang -O3 -fwrapv -march=native -fomit-frame-pointer -Qunused-arguments ref
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments ref
clang -mcpu=cortex-a8 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments ref
clang -mcpu=cortex-a9 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments ref
clang -mcpu=native -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments ref

Compiler output

Implementation: crypto_aead/tiaoxinv2/nim
Compiler: gcc -m64 -march=barcelona -O2 -fomit-frame-pointer
tiaoxin-optimized.c: In file included from tiaoxin-optimized.c:22:0:
tiaoxin-optimized.c: tiaoxin-optimized.c: In function 'tiaoxin_optimized_encrypt':
tiaoxin-optimized.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/wmmintrin.h:61:1: error: inlining failed in call to always_inline '_mm_aesenc_si128': target specific option mismatch
tiaoxin-optimized.c: _mm_aesenc_si128 (__m128i __X, __m128i __Y)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: error: called from here
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:42:108: note: in expansion of macro 'enc'
tiaoxin-optimized.c: #define RT6( T , M ) tmp = T[0];T[0] = enc(T[5],M);T[5] = T[4];T[4] = T[3];T[3] = T[2];T[2] = T[1];T[1] = enc(tmp,Z0);T[0] = xor(T[0], tmp);
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:50:1: note: in expansion of macro 'RT6'
tiaoxin-optimized.c: RT6( T6, M2 );
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:151:2: note: in expansion of macro 'UPDATE'
tiaoxin-optimized.c: UPDATE( T3 , T4 , T6, Z0 , Z1 , Z0 );
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: In file included from tiaoxin-optimized.c:22:0:
tiaoxin-optimized.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/wmmintrin.h:61:1: error: inlining failed in call to always_inline '_mm_aesenc_si128': target specific option mismatch
tiaoxin-optimized.c: _mm_aesenc_si128 (__m128i __X, __m128i __Y)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: error: called from here
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:42:41: note: in expansion of macro 'enc'
tiaoxin-optimized.c: ...
tiaoxin-optimized.c: In file included from tiaoxin-optimized.c:22:0:
tiaoxin-optimized.c: tiaoxin-optimized.c: In function 'tiaoxin_optimized_encrypt':
tiaoxin-optimized.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/wmmintrin.h:61:1: error: inlining failed in call to always_inline '_mm_aesenc_si128': target specific option mismatch
tiaoxin-optimized.c: _mm_aesenc_si128 (__m128i __X, __m128i __Y)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: error: called from here
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:42:108: note: in expansion of macro 'enc'
tiaoxin-optimized.c: #define RT6( T , M ) tmp = T[0];T[0] = enc(T[5],M);T[5] = T[4];T[4] = T[3];T[3] = T[2];T[2] = T[1];T[1] = enc(tmp,Z0);T[0] = xor(T[0], tmp);
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:50:1: note: in expansion of macro 'RT6'
tiaoxin-optimized.c: RT6( T6, M2 );
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:151:2: note: in expansion of macro 'UPDATE'
tiaoxin-optimized.c: UPDATE( T3 , T4 , T6, Z0 , Z1 , Z0 );
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: In file included from tiaoxin-optimized.c:22:0:
tiaoxin-optimized.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/wmmintrin.h:61:1: error: inlining failed in call to always_inline '_mm_aesenc_si128': target specific option mismatch
tiaoxin-optimized.c: _mm_aesenc_si128 (__m128i __X, __m128i __Y)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: error: called from here
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:42:41: note: in expansion of macro 'enc'
tiaoxin-optimized.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
gcc -m64 -march=barcelona -O2 -fomit-frame-pointer nim
gcc -m64 -march=barcelona -O3 -fomit-frame-pointer nim
gcc -m64 -march=barcelona -O -fomit-frame-pointer nim
gcc -m64 -march=barcelona -Os -fomit-frame-pointer nim