Implementation notes: x86, samba, crypto_sign/sphincsf256shake256robust

Computer: samba
Architecture: x86
CPU ID: GenuineIntel-000506e3-bfebfbff
SUPERCOP version: 20190803
Operation: crypto_sign
Primitive: sphincsf256shake256robust
Time | Implementation | Compiler | Benchmark date | SUPERCOP version
1020871976avx2gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer2019080820190803
1021133332avx2gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer2019080820190803
1708860044avx2gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer2019080820190803
1710890446avx2gcc -m32 -march=core-avx2 -O -fomit-frame-pointer2019080820190803
1723904813avx2gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer2019080820190803
1730358254avx2gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer2019080820190803
1776379571avx2gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer2019080820190803
1776462597avx2gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer2019080820190803
3572105950refgcc -m32 -march=corei7 -O3 -fomit-frame-pointer2019080820190803
3574020492refgcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer2019080820190803
3584837000refgcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer2019080820190803
3603879677refgcc -m32 -march=core2 -O3 -fomit-frame-pointer2019080820190803
3646710651refgcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer2019080920190803
3650749149refgcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer2019080820190803
3650986274refgcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer2019080820190803
3736000899refgcc -m32 -march=pentium-m -O3 -fomit-frame-pointer2019080820190803
3983584640refgcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer2019080920190803
4039919299refgcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer2019080920190803
4042633926refgcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer2019080820190803
4042782174refgcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer2019080820190803
4135406065refgcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer2019080920190803
4135627679refgcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer2019080920190803
4141320032refgcc -m32 -march=nocona -O3 -fomit-frame-pointer2019080820190803
4141489619refgcc -m32 -march=prescott -O3 -fomit-frame-pointer2019080820190803
4173018034refgcc -m32 -march=pentium4 -O3 -fomit-frame-pointer2019080820190803
4228289030refgcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer2019080920190803
4228342639refgcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer2019080920190803
4269383162refgcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer2019080920190803
4271943494refgcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer2019080920190803
4281439071refgcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer2019080920190803
4285858032refgcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer2019080920190803
4309023621refgcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer2019080920190803
4309262149refgcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer2019080920190803
4401403516refgcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer2019080920190803
4415029569refgcc -m32 -march=core-avx2 -Os -fomit-frame-pointer2019080820190803
4415195151refgcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer2019080820190803
4424255627refgcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer2019080820190803
4424569518refgcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer2019080820190803
4448563952refgcc -m32 -march=corei7 -Os -fomit-frame-pointer2019080820190803
4448564218refgcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer2019080820190803
4454913432refgcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer2019080820190803
4488020431refgcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer2019080820190803
4499568337refgcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer2019080820190803
4502561298refgcc -m32 -march=corei7-avx -Os -fomit-frame-pointer2019080820190803
4502781863refgcc -m32 -march=core-avx-i -Os -fomit-frame-pointer2019080820190803
4527738121refgcc -m32 -march=core2 -Os -fomit-frame-pointer2019080820190803
4543017022refgcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer2019080920190803
4543021885refgcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer2019080920190803
4543070962refgcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer2019080920190803
4580589183refgcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer2019080820190803
4580611582refgcc -m32 -march=corei7 -O2 -fomit-frame-pointer2019080820190803
4581267087refgcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer2019080820190803
4616360333refgcc -m32 -march=pentium4 -Os -fomit-frame-pointer2019080820190803
4616451578refgcc -m32 -march=prescott -Os -fomit-frame-pointer2019080820190803
4616761964refgcc -m32 -march=nocona -Os -fomit-frame-pointer2019080820190803
4674401573refgcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer2019080920190803
4692205988refgcc -m32 -march=pentium-m -O2 -fomit-frame-pointer2019080820190803
4751976272refgcc -m32 -march=pentium-m -Os -fomit-frame-pointer2019080820190803
4968016992refgcc -m32 -march=core2 -O2 -fomit-frame-pointer2019080820190803
5034480900refgcc -m32 -march=native -mtune=native -O -fomit-frame-pointer2019080820190803
5034485796refgcc -m32 -march=core-avx2 -O -fomit-frame-pointer2019080820190803
5055718424refgcc -m32 -march=athlon -O3 -fomit-frame-pointer2019080820190803
5056764180refgcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer2019080920190803
5057707309refgcc -m32 -O3 -fomit-frame-pointer2019080820190803
5074924211refgcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer2019080920190803
5077050960refgcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer2019080920190803
5078865149refgcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer2019080920190803
5093478649refgcc -funroll-loops -m32 -O3 -fomit-frame-pointer2019080920190803
5093876407refgcc -m32 -march=pentium4 -O2 -fomit-frame-pointer2019080820190803
5101566141refgcc -m32 -march=k6 -O3 -fomit-frame-pointer2019080820190803
5130345121refgcc -m32 -march=k6-2 -O3 -fomit-frame-pointer2019080820190803
5132501280refgcc -m32 -march=k6-3 -O3 -fomit-frame-pointer2019080820190803
5195075058refgcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer2019080920190803
5203102956refgcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer2019080920190803
5203210145refgcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer2019080920190803
5204102836refgcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer2019080920190803
5227718500refgcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer2019080920190803
5231369828refgcc -funroll-loops -m32 -O2 -fomit-frame-pointer2019080920190803
5239345135refgcc -m32 -march=nocona -O2 -fomit-frame-pointer2019080820190803
5239409264refgcc -m32 -march=prescott -O2 -fomit-frame-pointer2019080820190803
5241469726refgcc -funroll-loops -m32 -O -fomit-frame-pointer2019080920190803
5245657145refgcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer2019080920190803
5246482190refgcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer2019080920190803
5246535381refgcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer2019080920190803
5246563607refgcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer2019080920190803
5246761686refgcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer2019080920190803
5246851827refgcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer2019080920190803
5256900771refgcc -m32 -march=pentium-m -O -fomit-frame-pointer2019080820190803
5330840069refgcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer2019080920190803
5331736115refgcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer2019080920190803
5341020377refgcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer2019080920190803
5341407313refgcc -m32 -march=pentium4 -O -fomit-frame-pointer2019080820190803
5392345393refgcc -m32 -march=i386 -O3 -fomit-frame-pointer2019080920190803
5392643971refgcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer2019080920190803
5405004780refgcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer2019080820190803
5405139687refgcc -m32 -march=core2 -O -fomit-frame-pointer2019080820190803
5405512526refgcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer2019080820190803
5412691730refgcc -m32 -march=nocona -O -fomit-frame-pointer2019080820190803
5412720165refgcc -m32 -march=prescott -O -fomit-frame-pointer2019080820190803
5424091708refgcc -m32 -march=core-avx-i -O -fomit-frame-pointer2019080820190803
5424360512refgcc -m32 -march=corei7 -O -fomit-frame-pointer2019080820190803
5424485568refgcc -m32 -march=corei7-avx -O -fomit-frame-pointer2019080820190803
5428603185refgcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer2019080920190803
5428721992refgcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer2019080920190803
5435817049refgcc -m32 -march=i486 -O3 -fomit-frame-pointer2019080820190803
5441284137refgcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer2019080920190803
5462824708refgcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer2019080920190803
5471864896refgcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer2019080920190803
5481027738refgcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer2019080820190803
5481164680refgcc -m32 -march=pentium2 -O3 -fomit-frame-pointer2019080820190803
5493675229refgcc -m32 -march=barcelona -O -fomit-frame-pointer2019080820190803
5495844915refgcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer2019080920190803
5495993123refgcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer2019080920190803
5501327445refgcc -m32 -march=k8 -O -fomit-frame-pointer2019080820190803
5528360921refgcc -m32 -march=pentium3 -O3 -fomit-frame-pointer2019080820190803
5614112167refgcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer2019080920190803
5614192303refgcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer2019080920190803
5614453000refgcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer2019080920190803
5715431554refgcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2019080920190803
5715638656refgcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer2019080920190803
5716034710refgcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2019080920190803
5716787141refgcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer2019080920190803
5732192357refgcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer2019080920190803
5732208597refgcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer2019080920190803
5733010089refgcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer2019080920190803
5735030129refgcc -m32 -march=i386 -Os -fomit-frame-pointer2019080920190803
5761296166refgcc -m32 -march=k6-2 -Os -fomit-frame-pointer2019080820190803
5761652539refgcc -m32 -march=k6-3 -Os -fomit-frame-pointer2019080820190803
5762143579refgcc -m32 -march=k6 -Os -fomit-frame-pointer2019080820190803
5763643508refgcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer2019080920190803
5763737098refgcc -funroll-loops -m32 -Os -fomit-frame-pointer2019080920190803
5779322849refgcc -m32 -march=pentium3 -Os -fomit-frame-pointer2019080820190803
5779351550refgcc -m32 -march=pentium2 -Os -fomit-frame-pointer2019080820190803
5779772365refgcc -m32 -march=pentiumpro -Os -fomit-frame-pointer2019080820190803
5793785180refgcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer2019080920190803
5793810308refgcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer2019080920190803
5794108220refgcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer2019080920190803
5803542571refgcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer2019080920190803
5803744675refgcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer2019080920190803
5808000569refgcc -m32 -march=pentium -Os -fomit-frame-pointer2019080820190803
5809315232refgcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer2019080820190803
5814894184refgcc -m32 -march=pentium -O3 -fomit-frame-pointer2019080820190803
5815968117refgcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2019080820190803
5845457678refgcc -m32 -march=i486 -Os -fomit-frame-pointer2019080820190803
5875262446refgcc -m32 -march=athlon -Os -fomit-frame-pointer2019080820190803
5875723895refgcc -m32 -Os -fomit-frame-pointer2019080820190803
5914167591refgcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer2019080920190803
5952890798refgcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer2019080920190803
6201077109refgcc -m32 -march=pentium2 -O -fomit-frame-pointer2019080820190803
6201080355refgcc -m32 -march=pentiumpro -O -fomit-frame-pointer2019080820190803
6201279833refgcc -m32 -march=pentium3 -O -fomit-frame-pointer2019080820190803
6232579720refgcc -m32 -march=k6-3 -O -fomit-frame-pointer2019080820190803
6232599020refgcc -m32 -march=k6-2 -O -fomit-frame-pointer2019080820190803
6232943367refgcc -m32 -march=k6 -O -fomit-frame-pointer2019080820190803
6268102337refgcc -m32 -march=k6-3 -O2 -fomit-frame-pointer2019080820190803
6268403296refgcc -m32 -march=k6 -O2 -fomit-frame-pointer2019080820190803
6268513170refgcc -m32 -march=k6-2 -O2 -fomit-frame-pointer2019080820190803
6318056843refgcc -m32 -march=athlon -O2 -fomit-frame-pointer2019080820190803
6337070959refgcc -m32 -march=i386 -O2 -fomit-frame-pointer2019080920190803
6341330843refgcc -m32 -march=i486 -O2 -fomit-frame-pointer2019080920190803
6346554167refgcc -m32 -march=athlon -O -fomit-frame-pointer2019080820190803
6348980208refgcc -m32 -O -fomit-frame-pointer2019080820190803
6446493930refgcc -m32 -march=i386 -O -fomit-frame-pointer2019080920190803
6463045807refgcc -m32 -O2 -fomit-frame-pointer2019080820190803
6491371464refgcc -m32 -march=i486 -O -fomit-frame-pointer2019080920190803
6575469502refgcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer2019080820190803
6575813877refgcc -m32 -march=pentium2 -O2 -fomit-frame-pointer2019080820190803
6576091228refgcc -m32 -march=pentium3 -O2 -fomit-frame-pointer2019080820190803
6661683690refgcc -m32 -march=pentium-mmx -O -fomit-frame-pointer2019080820190803
6661773046refgcc -m32 -march=pentium -O -fomit-frame-pointer2019080820190803
6896224956refgcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2019080820190803
6896568729refgcc -m32 -march=pentium -O2 -fomit-frame-pointer2019080820190803
11682191109refgcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer2019080920190803
11829309545refgcc -m32 -march=barcelona -O3 -fomit-frame-pointer2019080820190803
12640057732refgcc -m32 -march=k8 -O3 -fomit-frame-pointer2019080820190803
12654679706refgcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer2019080920190803
13245235919refgcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer2019080920190803
13306087469refgcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer2019080920190803
13646299060refgcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer2019080920190803
13692262971refgcc -m32 -march=barcelona -Os -fomit-frame-pointer2019080820190803
14255273375refgcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer2019080920190803
14341316262refgcc -m32 -march=k8 -Os -fomit-frame-pointer2019080820190803
14408334224refgcc -m32 -march=barcelona -O2 -fomit-frame-pointer2019080820190803
14608888558refgcc -m32 -march=k8 -O2 -fomit-frame-pointer2019080820190803

Compiler output

Implementation: crypto_sign/sphincsf256shake256robust/avx2
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c: In function 'KeccakP1600times4_AddLanesAll':
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:135:40: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
KeccakP-1600-times4-SIMD256.c: #define Xor_In4( argIndex ) lanes0 = LOAD256u( curData0[argIndex]),\
KeccakP-1600-times4-SIMD256.c: ^
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:146:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 0 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:55:41: note: called from here
KeccakP-1600-times4-SIMD256.c: #define XOReq256(a, b) a = _mm256_xor_si256(a, b)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:143:33: note: in expansion of macro 'XOReq256'
KeccakP-1600-times4-SIMD256.c: XOReq256( stateAsLanes[argIndex+3], lanes3 )
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:149:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 12 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ...

Number of similar (compiler,implementation) pairs: 156, namely:
Compiler | Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer avx2
gcc -m32 -O2 -fomit-frame-pointer avx2
gcc -m32 -O3 -fomit-frame-pointer avx2
gcc -m32 -O -fomit-frame-pointer avx2
gcc -m32 -Os -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O2 -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O3 -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O -fomit-frame-pointer avx2
gcc -m32 -march=athlon -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -Os -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O -fomit-frame-pointer avx2
gcc -m32 -march=i386 -Os -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O -fomit-frame-pointer avx2
gcc -m32 -march=i486 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O -fomit-frame-pointer avx2
gcc -m32 -march=k8 -Os -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O -fomit-frame-pointer avx2
gcc -m32 -march=nocona -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O2 -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O3 -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O -fomit-frame-pointer avx2
gcc -m32 -march=prescott -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_sign/sphincsf256shake256robust/avx2
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c: In function 'KeccakP1600times4_AddLanesAll':
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:135:40: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
KeccakP-1600-times4-SIMD256.c: #define Xor_In4( argIndex ) lanes0 = LOAD256u( curData0[argIndex]),\
KeccakP-1600-times4-SIMD256.c: ^
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:146:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 0 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:55:41: note: called from here
KeccakP-1600-times4-SIMD256.c: #define XOReq256(a, b) a = _mm256_xor_si256(a, b)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:143:33: note: in expansion of macro 'XOReq256'
KeccakP-1600-times4-SIMD256.c: XOReq256( stateAsLanes[argIndex+3], lanes3 )
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:149:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 12 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ...
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c: In function 'KeccakP1600times4_AddLanesAll':
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:135:40: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
KeccakP-1600-times4-SIMD256.c: #define Xor_In4( argIndex ) lanes0 = LOAD256u( curData0[argIndex]),\
KeccakP-1600-times4-SIMD256.c: ^
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:146:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 0 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:55:41: note: called from here
KeccakP-1600-times4-SIMD256.c: #define XOReq256(a, b) a = _mm256_xor_si256(a, b)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:143:33: note: in expansion of macro 'XOReq256'
KeccakP-1600-times4-SIMD256.c: XOReq256( stateAsLanes[argIndex+3], lanes3 )
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:149:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 12 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -O -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_sign/sphincsf256shake256robust/avx2
Compiler: gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c: In function 'KeccakP1600times4_AddLanesAll':
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:55:41: note: called from here
KeccakP-1600-times4-SIMD256.c: #define XOReq256(a, b) a = _mm256_xor_si256(a, b)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:143:33: note: in expansion of macro 'XOReq256'
KeccakP-1600-times4-SIMD256.c: XOReq256( stateAsLanes[argIndex+3], lanes3 )
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:149:9: note: in expansion of macro 'Xor_In4'
KeccakP-1600-times4-SIMD256.c: Xor_In4( 12 );
KeccakP-1600-times4-SIMD256.c: ^~~~~~~
KeccakP-1600-times4-SIMD256.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
KeccakP-1600-times4-SIMD256.c: from KeccakP-1600-times4-SIMD256.c:21:
KeccakP-1600-times4-SIMD256.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
KeccakP-1600-times4-SIMD256.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:55:41: note: called from here
KeccakP-1600-times4-SIMD256.c: #define XOReq256(a, b) a = _mm256_xor_si256(a, b)
KeccakP-1600-times4-SIMD256.c: ^~~~~~~~~~~~~~~~~~~~~~
KeccakP-1600-times4-SIMD256.c: KeccakP-1600-times4-SIMD256.c:142:33: note: in expansion of macro 'XOReq256'
KeccakP-1600-times4-SIMD256.c: XOReq256( stateAsLanes[argIndex+2], lanes2 ),\
KeccakP-1600-times4-SIMD256.c: ...

Number of similar (compiler,implementation) pairs: 8, namely:
Compiler | Implementations
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer avx2