Implementation notes: x86, titan0, crypto_sign/sphincsf256shake256robust

Computer: titan0
Architecture: x86
CPU ID: GenuineIntel-000306c3-bfebfbff
SUPERCOP version: 20190803
Operation: crypto_sign
Primitive: sphincsf256shake256robust
Time | Implementation | Compiler | Benchmark date | SUPERCOP version
1071675836avx2gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer2019080920190803
1072019048avx2gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer2019080920190803
1801300364avx2gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer2019080920190803
1801818780avx2gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer2019080920190803
1808964432avx2gcc -m32 -march=core-avx2 -O -fomit-frame-pointer2019080920190803
1812372548avx2gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer2019080920190803
1877697076avx2gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer2019080920190803
1880174208avx2gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer2019080920190803
3661824776refgcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer2019080920190803
3665413796refgcc -m32 -march=corei7 -O3 -fomit-frame-pointer2019080920190803
3670860868refgcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer2019080920190803
3715518640refgcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer2019080920190803
3731023960refgcc -m32 -march=core2 -O3 -fomit-frame-pointer2019080920190803
3801685784refgcc -m32 -march=pentium-m -O3 -fomit-frame-pointer2019080920190803
3884853948refgcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer2019080920190803
3885049840refgcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer2019080920190803
4003949928refgcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer2019080920190803
4192468576refgcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer2019080920190803
4198232044refgcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer2019080920190803
4208976860refgcc -m32 -march=prescott -O3 -fomit-frame-pointer2019080920190803
4209558572refgcc -m32 -march=nocona -O3 -fomit-frame-pointer2019080920190803
4228383256refgcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer2019080920190803
4275004824refgcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer2019080920190803
4278114556refgcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer2019080920190803
4291725996refgcc -m32 -march=pentium4 -O3 -fomit-frame-pointer2019080920190803
4332639592refgcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer2019080920190803
4335811796refgcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer2019080920190803
4381490408refgcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer2019080920190803
4392513988refgcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer2019080920190803
4401689408refgcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer2019080920190803
4405239316refgcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer2019080920190803
4407566140refgcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer2019080920190803
4445761964refgcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer2019080920190803
4545105920refgcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer2019080920190803
4700659432refgcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer2019080920190803
4701120680refgcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer2019080920190803
4719595060refgcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer2019080920190803
4724237824refgcc -m32 -march=core-avx2 -Os -fomit-frame-pointer2019080920190803
4783766676refgcc -m32 -march=corei7-avx -Os -fomit-frame-pointer2019080920190803
4813019040refgcc -m32 -march=core-avx-i -Os -fomit-frame-pointer2019080920190803
4877991328refgcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer2019080920190803
4901085384refgcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer2019080920190803
4916411240refgcc -m32 -march=pentium-m -O2 -fomit-frame-pointer2019080920190803
4967567160refgcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer2019080920190803
4972443348refgcc -m32 -march=corei7 -O2 -fomit-frame-pointer2019080920190803
4974684824refgcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer2019080920190803
5253959520refgcc -m32 -O3 -fomit-frame-pointer2019080920190803
5276902808refgcc -funroll-loops -m32 -O3 -fomit-frame-pointer2019080920190803
5279565992refgcc -m32 -march=athlon -O3 -fomit-frame-pointer2019080920190803
5287925820refgcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer2019080920190803
5288391608refgcc -m32 -march=core-avx2 -O -fomit-frame-pointer2019080920190803
5306255912refgcc -m32 -march=native -mtune=native -O -fomit-frame-pointer2019080920190803
5310785276refgcc -m32 -march=core2 -O2 -fomit-frame-pointer2019080920190803
5315317152refgcc -m32 -march=k6 -O3 -fomit-frame-pointer2019080920190803
5321086068refgcc -m32 -march=k6-3 -O3 -fomit-frame-pointer2019080920190803
5323105860refgcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer2019080920190803
5324020012refgcc -m32 -march=k6-2 -O3 -fomit-frame-pointer2019080920190803
5324773464refgcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer2019080920190803
5326589772refgcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer2019080920190803
5403506000refgcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer2019080920190803
5403580232refgcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer2019080920190803
5406574756refgcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer2019080920190803
5412652620refgcc -funroll-loops -m32 -O2 -fomit-frame-pointer2019080920190803
5441523760refgcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer2019080920190803
5455460028refgcc -funroll-loops -m32 -O -fomit-frame-pointer2019080920190803
5458181220refgcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer2019080920190803
5461507272refgcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer2019080920190803
5470512216refgcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer2019080920190803
5471892896refgcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer2019080920190803
5483775736refgcc -m32 -march=pentium4 -O2 -fomit-frame-pointer2019080920190803
5492925136refgcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer2019080920190803
5493026204refgcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer2019080920190803
5493311548refgcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer2019080920190803
5525378180refgcc -m32 -march=pentium4 -O -fomit-frame-pointer2019080920190803
5529605700refgcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer2019080920190803
5546891772refgcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer2019080920190803
5551843096refgcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer2019080920190803
5555656540refgcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer2019080920190803
5575781344refgcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer2019080920190803
5591040096refgcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer2019080920190803
5603811268refgcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer2019080920190803
5614921160refgcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer2019080920190803
5622206088refgcc -m32 -march=pentium2 -O3 -fomit-frame-pointer2019080920190803
5641569628refgcc -m32 -march=i486 -O3 -fomit-frame-pointer2019080920190803
5650630652refgcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer2019080920190803
5651376888refgcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer2019080920190803
5657349628refgcc -m32 -march=nocona -O2 -fomit-frame-pointer2019080920190803
5662957420refgcc -m32 -march=prescott -O2 -fomit-frame-pointer2019080920190803
5663525432refgcc -m32 -march=i386 -O3 -fomit-frame-pointer2019080920190803
5671248340refgcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer2019080920190803
5676264616refgcc -m32 -march=pentium3 -O3 -fomit-frame-pointer2019080920190803
5677752716refgcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer2019080920190803
5710896780refgcc -m32 -march=pentium-m -O -fomit-frame-pointer2019080920190803
5728822196refgcc -m32 -march=nocona -O -fomit-frame-pointer2019080920190803
5759804288refgcc -m32 -march=k8 -O -fomit-frame-pointer2019080920190803
5760622924refgcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer2019080920190803
5761301348refgcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer2019080920190803
5763070876refgcc -m32 -march=core2 -O -fomit-frame-pointer2019080920190803
5771362128refgcc -m32 -march=prescott -O -fomit-frame-pointer2019080920190803
5779654920refgcc -m32 -march=corei7 -O -fomit-frame-pointer2019080920190803
5780728924refgcc -m32 -march=core2 -Os -fomit-frame-pointer2019080920190803
5781259976refgcc -m32 -march=corei7-avx -O -fomit-frame-pointer2019080920190803
5781381344refgcc -m32 -march=core-avx-i -O -fomit-frame-pointer2019080920190803
5786924876refgcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer2019080920190803
5789106768refgcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer2019080920190803
5793451212refgcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer2019080920190803
5806899740refgcc -m32 -march=barcelona -O -fomit-frame-pointer2019080920190803
5852250556refgcc -m32 -march=pentium-m -Os -fomit-frame-pointer2019080920190803
5857757716refgcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer2019080920190803
5861252616refgcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2019080920190803
5867619172refgcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer2019080920190803
5900497848refgcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer2019080920190803
5908237400refgcc -m32 -march=corei7 -Os -fomit-frame-pointer2019080920190803
5909815232refgcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer2019080920190803
5910180956refgcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer2019080920190803
5921545064refgcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2019080920190803
5941743888refgcc -m32 -march=pentium4 -Os -fomit-frame-pointer2019080920190803
5944276956refgcc -m32 -march=prescott -Os -fomit-frame-pointer2019080920190803
5949365896refgcc -m32 -march=nocona -Os -fomit-frame-pointer2019080920190803
5976338128refgcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer2019080920190803
5992284488refgcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer2019080920190803
5998988556refgcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer2019080920190803
6004706504refgcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2019080920190803
6020577252refgcc -m32 -march=pentium -O3 -fomit-frame-pointer2019080920190803
6126204972refgcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer2019080920190803
6134612368refgcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer2019080920190803
6168460408refgcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer2019080920190803
6190879944refgcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer2019080920190803
6192749684refgcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer2019080920190803
6193025232refgcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer2019080920190803
6193550036refgcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer2019080920190803
6218195764refgcc -m32 -march=i386 -Os -fomit-frame-pointer2019080920190803
6224861256refgcc -funroll-loops -m32 -Os -fomit-frame-pointer2019080920190803
6226970512refgcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer2019080920190803
6238682132refgcc -m32 -march=k6 -Os -fomit-frame-pointer2019080920190803
6238903112refgcc -m32 -march=k6-2 -Os -fomit-frame-pointer2019080920190803
6243138984refgcc -m32 -march=k6-3 -Os -fomit-frame-pointer2019080920190803
6254233212refgcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer2019080920190803
6254367720refgcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer2019080920190803
6262995464refgcc -m32 -march=pentium -Os -fomit-frame-pointer2019080920190803
6270715324refgcc -m32 -march=pentiumpro -Os -fomit-frame-pointer2019080920190803
6271597912refgcc -m32 -march=pentium2 -Os -fomit-frame-pointer2019080920190803
6277239012refgcc -m32 -march=pentium3 -Os -fomit-frame-pointer2019080920190803
6334590672refgcc -m32 -march=athlon -Os -fomit-frame-pointer2019080920190803
6336313496refgcc -m32 -Os -fomit-frame-pointer2019080920190803
6358086432refgcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer2019080920190803
6409746936refgcc -m32 -march=i486 -Os -fomit-frame-pointer2019080920190803
6418481192refgcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer2019080920190803
6604057232refgcc -m32 -march=pentiumpro -O -fomit-frame-pointer2019080920190803
6604072980refgcc -m32 -march=pentium3 -O -fomit-frame-pointer2019080920190803
6636765828refgcc -m32 -march=k6 -O -fomit-frame-pointer2019080920190803
6646507804refgcc -m32 -march=pentium2 -O -fomit-frame-pointer2019080920190803
6661687876refgcc -m32 -march=k6-3 -O -fomit-frame-pointer2019080920190803
6664030580refgcc -m32 -march=k6 -O2 -fomit-frame-pointer2019080920190803
6670658864refgcc -m32 -march=k6-2 -O2 -fomit-frame-pointer2019080920190803
6672028308refgcc -m32 -march=k6-3 -O2 -fomit-frame-pointer2019080920190803
6689510620refgcc -m32 -march=k6-2 -O -fomit-frame-pointer2019080920190803
6711834996refgcc -m32 -march=athlon -O2 -fomit-frame-pointer2019080920190803
6731233672refgcc -m32 -march=i486 -O -fomit-frame-pointer2019080920190803
6742347464refgcc -m32 -march=i386 -O2 -fomit-frame-pointer2019080920190803
6752793804refgcc -m32 -march=i486 -O2 -fomit-frame-pointer2019080920190803
6810814248refgcc -m32 -march=athlon -O -fomit-frame-pointer2019080920190803
6825184400refgcc -m32 -march=i386 -O -fomit-frame-pointer2019080920190803
6853726592refgcc -m32 -O -fomit-frame-pointer2019080920190803
6888687268refgcc -m32 -O2 -fomit-frame-pointer2019080920190803
6926348396refgcc -m32 -march=pentium-mmx -O -fomit-frame-pointer2019080920190803
6929882120refgcc -m32 -march=pentium -O -fomit-frame-pointer2019080920190803
7071210868refgcc -m32 -march=pentium3 -O2 -fomit-frame-pointer2019080920190803
7082265308refgcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer2019080920190803
7082738224refgcc -m32 -march=pentium2 -O2 -fomit-frame-pointer2019080920190803
7473712688refgcc -m32 -march=pentium -O2 -fomit-frame-pointer2019080920190803
7473971916refgcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2019080920190803
11815112600refgcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer2019080920190803
11995709020refgcc -m32 -march=barcelona -O3 -fomit-frame-pointer2019080920190803
12658828392refgcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer2019080920190803
12791898548refgcc -m32 -march=k8 -O3 -fomit-frame-pointer2019080920190803
13207807460refgcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer2019080920190803
13345880064refgcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer2019080920190803
13759419880refgcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer2019080920190803
13996290032refgcc -m32 -march=barcelona -Os -fomit-frame-pointer2019080920190803
14253201140refgcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer2019080920190803
14311554220refgcc -m32 -march=k8 -Os -fomit-frame-pointer2019080920190803
14472018448refgcc -m32 -march=k8 -O2 -fomit-frame-pointer2019080920190803
14621389228refgcc -m32 -march=barcelona -O2 -fomit-frame-pointer2019080920190803

Compiler output

Implementation: crypto_sign/sphincsf256shake256robust/avx2
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c: In function 'KeccakP1600times4_AddLanesAll':
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:135:40: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
KeccakP-1600-times4-SIMD256.c: #define Xor_In4( argIndex ) lanes0 = LOAD256u( curData0[argIndex]),\
KeccakP-1600-times4-SIMD256.c: ^
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:146:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 0 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:55:41: note: called from here
KeccakP-1600-times4-SIMD256.c: #define XOReq256(a, b) a = _mm256_xor_si256(a, b)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:143:33: note: in expansion of macro 'XOReq256'
KeccakP-1600-times4-SIMD256.c: XOReq256( stateAsLanes[argIndex+3], lanes3 )
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:149:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 12 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ...

Number of similar (compiler,implementation) pairs: 156, namely:
Compiler | Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer avx2
gcc -m32 -O2 -fomit-frame-pointer avx2
gcc -m32 -O3 -fomit-frame-pointer avx2
gcc -m32 -O -fomit-frame-pointer avx2
gcc -m32 -Os -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O2 -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O3 -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O -fomit-frame-pointer avx2
gcc -m32 -march=athlon -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -Os -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O -fomit-frame-pointer avx2
gcc -m32 -march=i386 -Os -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O -fomit-frame-pointer avx2
gcc -m32 -march=i486 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O -fomit-frame-pointer avx2
gcc -m32 -march=k8 -Os -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O -fomit-frame-pointer avx2
gcc -m32 -march=nocona -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O2 -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O3 -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O -fomit-frame-pointer avx2
gcc -m32 -march=prescott -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_sign/sphincsf256shake256robust/avx2
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c: In function 'KeccakP1600times4_AddLanesAll':
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:135:40: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
KeccakP-1600-times4-SIMD256.c: #define Xor_In4( argIndex ) lanes0 = LOAD256u( curData0[argIndex]),\
KeccakP-1600-times4-SIMD256.c: ^
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:146:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 0 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:55:41: note: called from here
KeccakP-1600-times4-SIMD256.c: #define XOReq256(a, b) a = _mm256_xor_si256(a, b)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:143:33: note: in expansion of macro 'XOReq256'
KeccakP-1600-times4-SIMD256.c: XOReq256( stateAsLanes[argIndex+3], lanes3 )
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:149:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 12 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ...
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c: In function 'KeccakP1600times4_AddLanesAll':
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:135:40: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
KeccakP-1600-times4-SIMD256.c: #define Xor_In4( argIndex ) lanes0 = LOAD256u( curData0[argIndex]),\
KeccakP-1600-times4-SIMD256.c: ^
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:146:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 0 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:55:41: note: called from here
KeccakP-1600-times4-SIMD256.c: #define XOReq256(a, b) a = _mm256_xor_si256(a, b)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:143:33: note: in expansion of macro 'XOReq256'
KeccakP-1600-times4-SIMD256.c: XOReq256( stateAsLanes[argIndex+3], lanes3 )
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:149:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 12 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -O -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_sign/sphincsf256shake256robust/avx2
Compiler: gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c: In function 'KeccakP1600times4_AddLanesAll':
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:55:41: note: called from here
KeccakP-1600-times4-SIMD256.c: #define XOReq256(a, b) a = _mm256_xor_si256(a, b)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:143:33: note: in expansion of macro 'XOReq256'
KeccakP-1600-times4-SIMD256.c: XOReq256( stateAsLanes[argIndex+3], lanes3 )
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:149:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 12 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:55:41: note: called from here
KeccakP-1600-times4-SIMD256.c: #define XOReq256(a, b) a = _mm256_xor_si256(a, b)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:142:33: note: in expansion of macro 'XOReq256'
KeccakP-1600-times4-SIMD256.c: XOReq256( stateAsLanes[argIndex+2], lanes2 ),\
KeccakP-1600-times4-SIMD256.c: ...

Number of similar (compiler,implementation) pairs: 8, namely:
Compiler | Implementations
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer avx2