Implementation notes: amd64, glyme, crypto_aead/tiaoxinv2

Computer: glyme
Architecture: amd64
CPU ID: GenuineIntel-00020652-bfebfbff
SUPERCOP version: 20170105
Operation: crypto_aead
Primitive: tiaoxinv2
Time | Implementation | Compiler | Benchmark date | SUPERCOP version
3972nimgcc -m64 -march=native -mtune=native -O2 -fomit-frame-pointer2017020520170105
3972nimgcc -m64 -march=native -mtune=native -O3 -fomit-frame-pointer2017020520170105
3972nimgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2017020520170105
3972nimgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2017020520170105
4164nimgcc -m64 -march=native -mtune=native -O -fomit-frame-pointer2017020520170105
4164nimgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2017020520170105
4176nimclang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2017020520170105
4180nimclang -O3 -fwrapv -march=native -fomit-frame-pointer -Qunused-arguments2017020520170105
4880nimgcc -m64 -march=native -mtune=native -Os -fomit-frame-pointer2017020520170105
4880nimgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2017020520170105
53100refgcc -m64 -march=core2 -O3 -fomit-frame-pointer2017020520170105
53140refgcc -funroll-loops -march=nocona -O3 -fomit-frame-pointer2017020520170105
53144refgcc -funroll-loops -m64 -march=nocona -O3 -fomit-frame-pointer2017020520170105
53392refgcc -march=nocona -O3 -fomit-frame-pointer2017020520170105
54072refgcc -m64 -march=nocona -O3 -fomit-frame-pointer2017020520170105
55180refgcc -m64 -march=barcelona -O3 -fomit-frame-pointer2017020520170105
55180refgcc -march=barcelona -O3 -fomit-frame-pointer2017020520170105
55196refgcc -funroll-loops -m64 -march=k8 -O3 -fomit-frame-pointer2017020520170105
55200refgcc -funroll-loops -march=k8 -O3 -fomit-frame-pointer2017020520170105
55224refgcc -funroll-loops -m64 -march=barcelona -O3 -fomit-frame-pointer2017020520170105
55224refgcc -funroll-loops -march=barcelona -O3 -fomit-frame-pointer2017020520170105
55272refgcc -march=k8 -O3 -fomit-frame-pointer2017020520170105
55288refgcc -m64 -march=k8 -O3 -fomit-frame-pointer2017020520170105
55440refgcc -m64 -O -fomit-frame-pointer2017020520170105
55448refgcc -fno-schedule-insns -O -fomit-frame-pointer2017020520170105
55448refgcc -m64 -march=core2 -O -fomit-frame-pointer2017020520170105
55448refgcc -m64 -march=nocona -O -fomit-frame-pointer2017020520170105
55460refgcc -O -fomit-frame-pointer2017020520170105
55460refgcc -march=nocona -O -fomit-frame-pointer2017020520170105
55484refgcc -m64 -march=k8 -O -fomit-frame-pointer2017020520170105
55488refgcc -march=k8 -O -fomit-frame-pointer2017020520170105
55532refgcc -m64 -march=core2 -Os -fomit-frame-pointer2017020520170105
55540refgcc -funroll-loops -O -fomit-frame-pointer2017020520170105
55544refgcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer2017020520170105
55544refgcc -m64 -march=barcelona -O -fomit-frame-pointer2017020520170105
55544refgcc -march=barcelona -O -fomit-frame-pointer2017020520170105
55552refgcc -funroll-loops -m64 -march=nocona -O -fomit-frame-pointer2017020520170105
55552refgcc -funroll-loops -march=nocona -O -fomit-frame-pointer2017020520170105
55560refgcc -funroll-loops -m64 -march=nocona -Os -fomit-frame-pointer2017020520170105
55564refgcc -funroll-loops -m64 -O -fomit-frame-pointer2017020520170105
55588refgcc -funroll-loops -march=k8 -O -fomit-frame-pointer2017020520170105
55592refgcc -funroll-loops -march=nocona -Os -fomit-frame-pointer2017020520170105
55612refgcc -funroll-loops -m64 -march=barcelona -O -fomit-frame-pointer2017020520170105
55632refgcc -funroll-loops -m64 -march=k8 -O -fomit-frame-pointer2017020520170105
55632refgcc -funroll-loops -march=barcelona -O -fomit-frame-pointer2017020520170105
55644refgcc -m64 -march=nocona -Os -fomit-frame-pointer2017020520170105
55656refgcc -funroll-loops -march=barcelona -Os -fomit-frame-pointer2017020520170105
55660refgcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer2017020520170105
55664refgcc -funroll-loops -m64 -march=barcelona -Os -fomit-frame-pointer2017020520170105
55664refgcc -funroll-loops -march=k8 -Os -fomit-frame-pointer2017020520170105
55668refgcc -funroll-loops -Os -fomit-frame-pointer2017020520170105
55684refgcc -m64 -Os -fomit-frame-pointer2017020520170105
55684refgcc -march=nocona -Os -fomit-frame-pointer2017020520170105
55700refgcc -fno-schedule-insns -Os -fomit-frame-pointer2017020520170105
55700refgcc -m64 -march=barcelona -Os -fomit-frame-pointer2017020520170105
55700refgcc -m64 -march=k8 -Os -fomit-frame-pointer2017020520170105
55700refgcc -march=barcelona -Os -fomit-frame-pointer2017020520170105
55724refgcc -march=k8 -Os -fomit-frame-pointer2017020520170105
55788refgcc -funroll-loops -m64 -march=k8 -Os -fomit-frame-pointer2017020520170105
55940refgcc -Os -fomit-frame-pointer2017020520170105
56160refgcc -funroll-loops -m64 -Os -fomit-frame-pointer2017020520170105
56244refgcc -funroll-loops -march=barcelona -O2 -fomit-frame-pointer2017020520170105
56252refgcc -funroll-loops -m64 -march=barcelona -O2 -fomit-frame-pointer2017020520170105
56372refgcc -funroll-loops -m64 -march=k8 -O2 -fomit-frame-pointer2017020520170105
56372refgcc -funroll-loops -march=k8 -O2 -fomit-frame-pointer2017020520170105
56400refgcc -m64 -march=core2 -O2 -fomit-frame-pointer2017020520170105
56416refgcc -march=nocona -O2 -fomit-frame-pointer2017020520170105
56428refgcc -m64 -march=nocona -O2 -fomit-frame-pointer2017020520170105
56444refgcc -m64 -march=corei7 -O3 -fomit-frame-pointer2017020520170105
56448refgcc -m64 -O2 -fomit-frame-pointer2017020520170105
56448refgcc -m64 -march=native -mtune=native -O3 -fomit-frame-pointer2017020520170105
56452refgcc -O2 -fomit-frame-pointer2017020520170105
56452refgcc -fno-schedule-insns -O2 -fomit-frame-pointer2017020520170105
56460refgcc -funroll-loops -march=nocona -O2 -fomit-frame-pointer2017020520170105
56504refgcc -march=barcelona -O2 -fomit-frame-pointer2017020520170105
56508refgcc -funroll-loops -m64 -march=nocona -O2 -fomit-frame-pointer2017020520170105
56556refgcc -funroll-loops -m64 -O2 -fomit-frame-pointer2017020520170105
56560refgcc -funroll-loops -O2 -fomit-frame-pointer2017020520170105
56584refgcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer2017020520170105
56672refgcc -m64 -march=barcelona -O2 -fomit-frame-pointer2017020520170105
56676refgcc -march=k8 -O2 -fomit-frame-pointer2017020520170105
56688refgcc -m64 -march=k8 -O2 -fomit-frame-pointer2017020520170105
56892refgcc -m64 -march=core2 -msse4.1 -Os -fomit-frame-pointer2017020520170105
56892refgcc -m64 -march=core2 -msse4 -Os -fomit-frame-pointer2017020520170105
56908refgcc -m64 -march=corei7 -Os -fomit-frame-pointer2017020520170105
56908refgcc -m64 -march=native -mtune=native -Os -fomit-frame-pointer2017020520170105
56924refgcc -m64 -march=core2 -msse4.1 -O3 -fomit-frame-pointer2017020520170105
56924refgcc -m64 -march=core2 -msse4 -O3 -fomit-frame-pointer2017020520170105
57772refgcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv2017020520170105
58056refgcc -m64 -march=core2 -msse4 -O2 -fomit-frame-pointer2017020520170105
58076refgcc -m64 -march=native -mtune=native -O2 -fomit-frame-pointer2017020520170105
58080refgcc -m64 -march=core2 -msse4.1 -O2 -fomit-frame-pointer2017020520170105
58080refgcc -m64 -march=corei7 -O2 -fomit-frame-pointer2017020520170105
58220refgcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv2017020520170105
58436refgcc -m64 -march=corei7 -O -fomit-frame-pointer2017020520170105
58440refgcc -m64 -march=core2 -msse4.1 -O -fomit-frame-pointer2017020520170105
58464refgcc -m64 -march=native -mtune=native -O -fomit-frame-pointer2017020520170105
58468refgcc -m64 -march=core2 -msse4 -O -fomit-frame-pointer2017020520170105
58560refgcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv2017020520170105
58584refgcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv2017020520170105
59040refgcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer2017020520170105
59040refgcc -funroll-loops -m64 -O3 -fomit-frame-pointer2017020520170105
59044refgcc -funroll-loops -O3 -fomit-frame-pointer2017020520170105
59636refgcc -fno-schedule-insns -O3 -fomit-frame-pointer2017020520170105
59816refgcc -m64 -O3 -fomit-frame-pointer2017020520170105
60228refgcc -O3 -fomit-frame-pointer2017020520170105
78728refcc2017020520170105
79120refclang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2017020520170105
79652refclang -O3 -fwrapv -march=native -fomit-frame-pointer -Qunused-arguments2017020520170105
80192refclang -O3 -fomit-frame-pointer -Qunused-arguments2017020520170105
80456refclang -mcpu=cortex-a8 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2017020520170105
80728refclang -mcpu=native -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2017020520170105
81092refclang -mcpu=cortex-a9 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments2017020520170105
82112refgcc2017020520170105
82412refgcc -funroll-loops2017020520170105

Compiler output

Implementation: crypto_aead/tiaoxinv2/nim
Compiler: cc
tiaoxin-optimized.c: tiaoxin-optimized.c:126:7: error: always_inline function '_mm_shuffle_epi8' requires target feature 'ssse3', but would be inlined into function 'tiaoxin_optimized_encrypt' that is compiled without support for 'ssse3'
tiaoxin-optimized.c: W0 = _mm_shuffle_epi8( W0 , perm );
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:127:7: error: always_inline function '_mm_shuffle_epi8' requires target feature 'ssse3', but would be inlined into function 'tiaoxin_optimized_encrypt' that is compiled without support for 'ssse3'
tiaoxin-optimized.c: W1 = _mm_shuffle_epi8( W1 , perm );
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:137:2: error: always_inline function '_mm_aesenc_si128' requires target feature 'aes', but would be inlined into function 'tiaoxin_optimized_encrypt' that is compiled without support for 'aes'
tiaoxin-optimized.c: UPDATE( T3 , T4 , T6, Z0 , Z1 , Z0 );
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:47:46: note: expanded from macro 'UPDATE'
tiaoxin-optimized.c: #define UPDATE( T3 , T4 , T6 , M0 , M1 , M2 )\
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:40:41: note: expanded from macro '\
tiaoxin-optimized.c: RT3'
tiaoxin-optimized.c: #define RT3( T , M ) tmp = T[0];T[0] = enc(T[2],M);T[2] = T[1];T[1] = enc(tmp,Z0);T[0] = xor(T[0], tmp);
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: note: expanded from macro 'enc'
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:137:2: error: always_inline function '_mm_aesenc_si128' requires target feature 'aes', but would be inlined into function 'tiaoxin_optimized_encrypt' that is compiled without support for 'aes'
tiaoxin-optimized.c: tiaoxin-optimized.c:47:46: note: expanded from macro 'UPDATE'
tiaoxin-optimized.c: #define UPDATE( T3 , T4 , T6 , M0 , M1 , M2 )\
tiaoxin-optimized.c: ^
tiaoxin-optimized.c: tiaoxin-optimized.c:40:72: note: expanded from macro '\
tiaoxin-optimized.c: RT3'
tiaoxin-optimized.c: ...

Number of similar (compiler,implementation) pairs: 5, namely:
Compiler Implementations
cc nim
clang -O3 -fomit-frame-pointer -Qunused-arguments nim
clang -mcpu=cortex-a8 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments nim
clang -mcpu=cortex-a9 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments nim
clang -mcpu=native -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments nim

Compiler output

Implementation: crypto_aead/tiaoxinv2/ref
Compiler: cc
tiaoxin-tablebased.c: tiaoxin-tablebased.c:257:12: warning: comparison of unsigned expression < 0 is always false
tiaoxin-tablebased.c: if( clen < 0 ...
tiaoxin-tablebased.c: ~~~~ ^ ~
tiaoxin-tablebased.c: 1 warning generated.

Number of similar (compiler,implementation) pairs: 7, namely:
Compiler Implementations
cc ref
clang -O3 -fomit-frame-pointer -Qunused-arguments ref
clang -O3 -fwrapv -march=native -fomit-frame-pointer -Qunused-arguments ref
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments ref
clang -mcpu=cortex-a8 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments ref
clang -mcpu=cortex-a9 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments ref
clang -mcpu=native -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments ref

Compiler output

Implementation: crypto_aead/tiaoxinv2/nim
Compiler: clang -O3 -fwrapv -march=native -fomit-frame-pointer -Qunused-arguments
tiaoxin-optimized.c: tiaoxin-optimized.c:375:11: warning: comparison of unsigned expression < 0 is always false
tiaoxin-optimized.c: if( clen < 0 ...
tiaoxin-optimized.c: ~~~~ ^ ~
tiaoxin-optimized.c: 1 warning generated.

Number of similar (compiler,implementation) pairs: 2, namely:
Compiler Implementations
clang -O3 -fwrapv -march=native -fomit-frame-pointer -Qunused-arguments nim
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments nim

Compiler output

Implementation: crypto_aead/tiaoxinv2/nim
Compiler: gcc
tiaoxin-optimized.c: In file included from tiaoxin-optimized.c:22:0:
tiaoxin-optimized.c: tiaoxin-optimized.c: In function 'tiaoxin_optimized_encrypt':
tiaoxin-optimized.c: /usr/local/lib/gcc6/gcc/x86_64-portbld-freebsd11.0/6.3.0/include/wmmintrin.h:61:1: error: inlining failed in call to always_inline '_mm_aesenc_si128': target specific option mismatch
tiaoxin-optimized.c: _mm_aesenc_si128 (__m128i __X, __m128i __Y)
tiaoxin-optimized.c: ^~~~~~~~~~~~~~~~
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: note: called from here
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^~~~~~~~~~~~~~~~~~~~~
tiaoxin-optimized.c: tiaoxin-optimized.c:42:108: note: in expansion of macro 'enc'
tiaoxin-optimized.c: #define RT6( T , M ) tmp = T[0];T[0] = enc(T[5],M);T[5] = T[4];T[4] = T[3];T[3] = T[2];T[2] = T[1];T[1] = enc(tmp,Z0);T[0] = xor(T[0], tmp);
tiaoxin-optimized.c: ^~~
tiaoxin-optimized.c: tiaoxin-optimized.c:50:1: note: in expansion of macro 'RT6'
tiaoxin-optimized.c: RT6( T6, M2 );
tiaoxin-optimized.c: ^~~
tiaoxin-optimized.c: tiaoxin-optimized.c:151:2: note: in expansion of macro 'UPDATE'
tiaoxin-optimized.c: UPDATE( T3 , T4 , T6, Z0 , Z1 , Z0 );
tiaoxin-optimized.c: ^~~~~~
tiaoxin-optimized.c: In file included from tiaoxin-optimized.c:22:0:
tiaoxin-optimized.c: /usr/local/lib/gcc6/gcc/x86_64-portbld-freebsd11.0/6.3.0/include/wmmintrin.h:61:1: error: inlining failed in call to always_inline '_mm_aesenc_si128': target specific option mismatch
tiaoxin-optimized.c: _mm_aesenc_si128 (__m128i __X, __m128i __Y)
tiaoxin-optimized.c: ^~~~~~~~~~~~~~~~
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: note: called from here
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^~~~~~~~~~~~~~~~~~~~~
tiaoxin-optimized.c: tiaoxin-optimized.c:42:41: note: in expansion of macro 'enc'
tiaoxin-optimized.c: ...

Number of similar (compiler,implementation) pairs: 86, namely:
Compiler Implementations
gcc nim
gcc -O2 -fomit-frame-pointer nim
gcc -O3 -fomit-frame-pointer nim
gcc -O -fomit-frame-pointer nim
gcc -Os -fomit-frame-pointer nim
gcc -fno-schedule-insns -O2 -fomit-frame-pointer nim
gcc -fno-schedule-insns -O3 -fomit-frame-pointer nim
gcc -fno-schedule-insns -O -fomit-frame-pointer nim
gcc -fno-schedule-insns -Os -fomit-frame-pointer nim
gcc -funroll-loops nim
gcc -funroll-loops -O2 -fomit-frame-pointer nim
gcc -funroll-loops -O3 -fomit-frame-pointer nim
gcc -funroll-loops -O -fomit-frame-pointer nim
gcc -funroll-loops -Os -fomit-frame-pointer nim
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer nim
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer nim
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer nim
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer nim
gcc -funroll-loops -m64 -O2 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -O3 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -O -fomit-frame-pointer nim
gcc -funroll-loops -m64 -Os -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=barcelona -O2 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=barcelona -O3 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=barcelona -O -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=barcelona -Os -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=k8 -O2 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=k8 -O3 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=k8 -O -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=k8 -Os -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=nocona -O2 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=nocona -O3 -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=nocona -O -fomit-frame-pointer nim
gcc -funroll-loops -m64 -march=nocona -Os -fomit-frame-pointer nim
gcc -funroll-loops -march=barcelona -O2 -fomit-frame-pointer nim
gcc -funroll-loops -march=barcelona -O3 -fomit-frame-pointer nim
gcc -funroll-loops -march=barcelona -O -fomit-frame-pointer nim
gcc -funroll-loops -march=barcelona -Os -fomit-frame-pointer nim
gcc -funroll-loops -march=k8 -O2 -fomit-frame-pointer nim
gcc -funroll-loops -march=k8 -O3 -fomit-frame-pointer nim
gcc -funroll-loops -march=k8 -O -fomit-frame-pointer nim
gcc -funroll-loops -march=k8 -Os -fomit-frame-pointer nim
gcc -funroll-loops -march=nocona -O2 -fomit-frame-pointer nim
gcc -funroll-loops -march=nocona -O3 -fomit-frame-pointer nim
gcc -funroll-loops -march=nocona -O -fomit-frame-pointer nim
gcc -funroll-loops -march=nocona -Os -fomit-frame-pointer nim
gcc -m64 -O2 -fomit-frame-pointer nim
gcc -m64 -O3 -fomit-frame-pointer nim
gcc -m64 -O -fomit-frame-pointer nim
gcc -m64 -Os -fomit-frame-pointer nim
gcc -m64 -march=core2 -O2 -fomit-frame-pointer nim
gcc -m64 -march=core2 -O3 -fomit-frame-pointer nim
gcc -m64 -march=core2 -O -fomit-frame-pointer nim
gcc -m64 -march=core2 -Os -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4.1 -O2 -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4.1 -O3 -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4.1 -O -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4.1 -Os -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4 -O2 -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4 -O3 -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4 -O -fomit-frame-pointer nim
gcc -m64 -march=core2 -msse4 -Os -fomit-frame-pointer nim
gcc -m64 -march=corei7 -O2 -fomit-frame-pointer nim
gcc -m64 -march=corei7 -O3 -fomit-frame-pointer nim
gcc -m64 -march=corei7 -O -fomit-frame-pointer nim
gcc -m64 -march=corei7 -Os -fomit-frame-pointer nim
gcc -m64 -march=k8 -O2 -fomit-frame-pointer nim
gcc -m64 -march=k8 -O3 -fomit-frame-pointer nim
gcc -m64 -march=k8 -O -fomit-frame-pointer nim
gcc -m64 -march=k8 -Os -fomit-frame-pointer nim
gcc -m64 -march=nocona -O2 -fomit-frame-pointer nim
gcc -m64 -march=nocona -O3 -fomit-frame-pointer nim
gcc -m64 -march=nocona -O -fomit-frame-pointer nim
gcc -m64 -march=nocona -Os -fomit-frame-pointer nim
gcc -march=barcelona -O2 -fomit-frame-pointer nim
gcc -march=barcelona -O3 -fomit-frame-pointer nim
gcc -march=barcelona -O -fomit-frame-pointer nim
gcc -march=barcelona -Os -fomit-frame-pointer nim
gcc -march=k8 -O2 -fomit-frame-pointer nim
gcc -march=k8 -O3 -fomit-frame-pointer nim
gcc -march=k8 -O -fomit-frame-pointer nim
gcc -march=k8 -Os -fomit-frame-pointer nim
gcc -march=nocona -O2 -fomit-frame-pointer nim
gcc -march=nocona -O3 -fomit-frame-pointer nim
gcc -march=nocona -O -fomit-frame-pointer nim
gcc -march=nocona -Os -fomit-frame-pointer nim

Compiler output

Implementation: crypto_aead/tiaoxinv2/nim
Compiler: gcc -m64 -march=barcelona -O2 -fomit-frame-pointer
tiaoxin-optimized.c: In file included from tiaoxin-optimized.c:22:0:
tiaoxin-optimized.c: tiaoxin-optimized.c: In function 'tiaoxin_optimized_encrypt':
tiaoxin-optimized.c: /usr/local/lib/gcc6/gcc/x86_64-portbld-freebsd11.0/6.3.0/include/wmmintrin.h:61:1: error: inlining failed in call to always_inline '_mm_aesenc_si128': target specific option mismatch
tiaoxin-optimized.c: _mm_aesenc_si128 (__m128i __X, __m128i __Y)
tiaoxin-optimized.c: ^~~~~~~~~~~~~~~~
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: note: called from here
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^~~~~~~~~~~~~~~~~~~~~
tiaoxin-optimized.c: tiaoxin-optimized.c:42:108: note: in expansion of macro 'enc'
tiaoxin-optimized.c: #define RT6( T , M ) tmp = T[0];T[0] = enc(T[5],M);T[5] = T[4];T[4] = T[3];T[3] = T[2];T[2] = T[1];T[1] = enc(tmp,Z0);T[0] = xor(T[0], tmp);
tiaoxin-optimized.c: ^~~
tiaoxin-optimized.c: tiaoxin-optimized.c:50:1: note: in expansion of macro 'RT6'
tiaoxin-optimized.c: RT6( T6, M2 );
tiaoxin-optimized.c: ^~~
tiaoxin-optimized.c: tiaoxin-optimized.c:151:2: note: in expansion of macro 'UPDATE'
tiaoxin-optimized.c: UPDATE( T3 , T4 , T6, Z0 , Z1 , Z0 );
tiaoxin-optimized.c: ^~~~~~
tiaoxin-optimized.c: In file included from tiaoxin-optimized.c:22:0:
tiaoxin-optimized.c: /usr/local/lib/gcc6/gcc/x86_64-portbld-freebsd11.0/6.3.0/include/wmmintrin.h:61:1: error: inlining failed in call to always_inline '_mm_aesenc_si128': target specific option mismatch
tiaoxin-optimized.c: _mm_aesenc_si128 (__m128i __X, __m128i __Y)
tiaoxin-optimized.c: ^~~~~~~~~~~~~~~~
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: note: called from here
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^~~~~~~~~~~~~~~~~~~~~
tiaoxin-optimized.c: tiaoxin-optimized.c:42:41: note: in expansion of macro 'enc'
tiaoxin-optimized.c: ...
tiaoxin-optimized.c: In file included from tiaoxin-optimized.c:22:0:
tiaoxin-optimized.c: tiaoxin-optimized.c: In function 'tiaoxin_optimized_encrypt':
tiaoxin-optimized.c: /usr/local/lib/gcc6/gcc/x86_64-portbld-freebsd11.0/6.3.0/include/wmmintrin.h:61:1: error: inlining failed in call to always_inline '_mm_aesenc_si128': target specific option mismatch
tiaoxin-optimized.c: _mm_aesenc_si128 (__m128i __X, __m128i __Y)
tiaoxin-optimized.c: ^~~~~~~~~~~~~~~~
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: note: called from here
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^~~~~~~~~~~~~~~~~~~~~
tiaoxin-optimized.c: tiaoxin-optimized.c:42:108: note: in expansion of macro 'enc'
tiaoxin-optimized.c: #define RT6( T , M ) tmp = T[0];T[0] = enc(T[5],M);T[5] = T[4];T[4] = T[3];T[3] = T[2];T[2] = T[1];T[1] = enc(tmp,Z0);T[0] = xor(T[0], tmp);
tiaoxin-optimized.c: ^~~
tiaoxin-optimized.c: tiaoxin-optimized.c:50:1: note: in expansion of macro 'RT6'
tiaoxin-optimized.c: RT6( T6, M2 );
tiaoxin-optimized.c: ^~~
tiaoxin-optimized.c: tiaoxin-optimized.c:151:2: note: in expansion of macro 'UPDATE'
tiaoxin-optimized.c: UPDATE( T3 , T4 , T6, Z0 , Z1 , Z0 );
tiaoxin-optimized.c: ^~~~~~
tiaoxin-optimized.c: In file included from tiaoxin-optimized.c:22:0:
tiaoxin-optimized.c: /usr/local/lib/gcc6/gcc/x86_64-portbld-freebsd11.0/6.3.0/include/wmmintrin.h:61:1: error: inlining failed in call to always_inline '_mm_aesenc_si128': target specific option mismatch
tiaoxin-optimized.c: _mm_aesenc_si128 (__m128i __X, __m128i __Y)
tiaoxin-optimized.c: ^~~~~~~~~~~~~~~~
tiaoxin-optimized.c: tiaoxin-optimized.c:30:19: note: called from here
tiaoxin-optimized.c: #define enc(a,b) _mm_aesenc_si128(a,b)
tiaoxin-optimized.c: ^~~~~~~~~~~~~~~~~~~~~
tiaoxin-optimized.c: tiaoxin-optimized.c:42:41: note: in expansion of macro 'enc'
tiaoxin-optimized.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
gcc -m64 -march=barcelona -O2 -fomit-frame-pointer nim
gcc -m64 -march=barcelona -O3 -fomit-frame-pointer nim
gcc -m64 -march=barcelona -O -fomit-frame-pointer nim
gcc -m64 -march=barcelona -Os -fomit-frame-pointer nim