Implementation notes: x86, kizomba, crypto_kem/ntskem13136

Computer: kizomba
Architecture: x86
CPU ID: GenuineIntel-000906e9-bfebfbff
SUPERCOP version: 20181216
Operation: crypto_kem
Primitive: ntskem13136
Time | Implementation | Compiler | Benchmark date | SUPERCOP version
5480293optgcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer2018111820181113
5534269optgcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer2018111820181113
5540166optgcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer2018111820181113
5594228optgcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer2018111820181113
5603184optgcc -m32 -march=corei7 -O3 -fomit-frame-pointer2018111820181113
5625804optgcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer2018111820181113
5672320optgcc -m32 -march=core2 -O3 -fomit-frame-pointer2018111820181113
5699073optgcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer2018111820181113
5765401optgcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer2018111820181113
5792385optgcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer2018111820181113
5793823optgcc -m32 -march=core2 -O2 -fomit-frame-pointer2018111820181113
5826463optgcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer2018111820181113
5849047optgcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer2018111820181113
5849994optgcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer2018111820181113
5860925optgcc -m32 -march=pentium-m -O3 -fomit-frame-pointer2018111820181113
5875782optgcc -m32 -march=corei7 -O2 -fomit-frame-pointer2018111820181113
5907639optgcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer2018111820181113
5923541optgcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer2018111820181113
5933827optgcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer2018111820181113
6008094optgcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer2018111820181113
6042841optgcc -m32 -march=core-avx2 -Os -fomit-frame-pointer2018111820181113
6069395optgcc -m32 -march=pentium-m -O2 -fomit-frame-pointer2018111820181113
6099813optgcc -m32 -march=pentium4 -O3 -fomit-frame-pointer2018111820181113
6105693optgcc -m32 -march=corei7-avx -Os -fomit-frame-pointer2018111820181113
6106379optgcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer2018111820181113
6120061optgcc -m32 -march=nocona -Os -fomit-frame-pointer2018111820181113
6121138optgcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer2018111820181113
6121796optgcc -m32 -march=core-avx-i -Os -fomit-frame-pointer2018111820181113
6132055optgcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer2018111820181113
6140117optgcc -m32 -march=pentium4 -Os -fomit-frame-pointer2018111820181113
6158161optgcc -m32 -march=pentium4 -O2 -fomit-frame-pointer2018111820181113
6162463optgcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer2018111820181113
6169015optgcc -m32 -march=prescott -Os -fomit-frame-pointer2018111820181113
6180244optgcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer2018111820181113
6210825optgcc -m32 -march=nocona -O3 -fomit-frame-pointer2018111820181113
6218399optgcc -m32 -march=corei7 -Os -fomit-frame-pointer2018111820181113
6223407optgcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer2018111820181113
6223961optgcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer2018111820181113
6229429optgcc -m32 -march=prescott -O3 -fomit-frame-pointer2018111820181113
6232180optgcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer2018111820181113
6240075optgcc -m32 -march=pentium-m -Os -fomit-frame-pointer2018111820181113
6252087optgcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer2018111820181113
6285540optgcc -m32 -march=core2 -Os -fomit-frame-pointer2018111820181113
6556202optgcc -m32 -march=nocona -O2 -fomit-frame-pointer2018111820181113
6571915optgcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer2018111820181113
6589022optgcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer2018111820181113
6606355optgcc -m32 -march=prescott -O2 -fomit-frame-pointer2018111820181113
6748548optgcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer2018111820181113
6752659optgcc -m32 -march=k8 -O3 -fomit-frame-pointer2018111820181113
6771099optgcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer2018111820181113
6859477optgcc -m32 -march=barcelona -O3 -fomit-frame-pointer2018111820181113
7068704optgcc -m32 -march=k8 -O2 -fomit-frame-pointer2018111820181113
7114835optgcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer2018111820181113
7668135optgcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer2018111820181113
7793946optgcc -m32 -march=barcelona -O2 -fomit-frame-pointer2018111820181113
8242177optgcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer2018111820181113
8276015optgcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer2018111820181113
8292234optgcc -funroll-loops -m32 -O3 -fomit-frame-pointer2018111820181113
8302721optgcc -m32 -march=athlon -O3 -fomit-frame-pointer2018111820181113
8303921optgcc -m32 -march=pentium -Os -fomit-frame-pointer2018111820181113
8311780optgcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer2018111820181113
8314560optgcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer2018111820181113
8329337optgcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer2018111820181113
8330593optgcc -m32 -O3 -fomit-frame-pointer2018111820181113
8331369optgcc -m32 -march=athlon -Os -fomit-frame-pointer2018111820181113
8333475optgcc -funroll-loops -m32 -Os -fomit-frame-pointer2018111820181113
8334139optgcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer2018111820181113
8338762optgcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer2018111820181113
8339584optgcc -m32 -march=i386 -Os -fomit-frame-pointer2018111820181113
8342133optgcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer2018111820181113
8356978optgcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer2018111820181113
8359054optgcc -m32 -Os -fomit-frame-pointer2018111820181113
8371347optgcc -funroll-loops -m32 -O -fomit-frame-pointer2018111820181113
8380224optgcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer2018111820181113
8380659optgcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer2018111820181113
8384865optgcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer2018111820181113
8388740optgcc -m32 -march=k6-2 -Os -fomit-frame-pointer2018111820181113
8391508optgcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer2018111820181113
8403467optgcc -funroll-loops -m32 -O2 -fomit-frame-pointer2018111820181113
8405050optgcc -m32 -march=athlon -O2 -fomit-frame-pointer2018111820181113
8406085optgcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer2018111820181113
8407284optgcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer2018111820181113
8421786optgcc -m32 -march=i486 -Os -fomit-frame-pointer2018111820181113
8432301optgcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer2018111820181113
8433280optgcc -m32 -march=pentium3 -Os -fomit-frame-pointer2018111820181113
8433923optgcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer2018111820181113
8444819optgcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer2018111820181113
8453721optgcc -m32 -march=pentiumpro -Os -fomit-frame-pointer2018111820181113
8454996optgcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer2018111820181113
8472353optgcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer2018111820181113
8481258optgcc -m32 -march=k6-3 -Os -fomit-frame-pointer2018111820181113
8496776optgcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer2018111820181113
8498236optgcc -m32 -march=k6 -Os -fomit-frame-pointer2018111820181113
8509099optgcc -m32 -march=pentium2 -Os -fomit-frame-pointer2018111820181113
8511470optgcc -m32 -O2 -fomit-frame-pointer2018111820181113
8518971optgcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer2018111820181113
8519415optgcc -m32 -march=core-avx-i -O -fomit-frame-pointer2018111820181113
8528778optgcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer2018111820181113
8539659optgcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer2018111820181113
8543569optgcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer2018111820181113
8544189optgcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer2018111820181113
8554111optgcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer2018111820181113
8557627optgcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer2018111820181113
8567629optgcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer2018111820181113
8577677optgcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer2018111820181113
8585155optgcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer2018111820181113
8589432optgcc -m32 -march=core2 -O -fomit-frame-pointer2018111820181113
8589779optgcc -m32 -march=corei7 -O -fomit-frame-pointer2018111820181113
8604187optgcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer2018111820181113
8607625optgcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer2018111820181113
8610832optgcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer2018111820181113
8613051optgcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer2018111820181113
8614347optgcc -m32 -march=pentium4 -O -fomit-frame-pointer2018111820181113
8615391optgcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer2018111820181113
8620105optgcc -m32 -march=k6 -O3 -fomit-frame-pointer2018111820181113
8620984optgcc -m32 -march=corei7-avx -O -fomit-frame-pointer2018111820181113
8625877optgcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer2018111820181113
8628329optgcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer2018111820181113
8630325optgcc -m32 -march=prescott -O -fomit-frame-pointer2018111820181113
8633615optgcc -m32 -march=k6-2 -O3 -fomit-frame-pointer2018111820181113
8637450optgcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer2018111820181113
8637798optgcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer2018111820181113
8643526optgcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer2018111820181113
8648355optgcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer2018111820181113
8650525optgcc -m32 -march=nocona -O -fomit-frame-pointer2018111820181113
8659107optgcc -m32 -march=k6-3 -O3 -fomit-frame-pointer2018111820181113
8666651optgcc -m32 -march=k8 -O -fomit-frame-pointer2018111820181113
8668548optgcc -m32 -march=barcelona -O -fomit-frame-pointer2018111820181113
8671903optgcc -m32 -march=k6-3 -O2 -fomit-frame-pointer2018111820181113
8683267optgcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer2018111820181113
8703083optgcc -m32 -march=core-avx2 -O -fomit-frame-pointer2018111820181113
8704551optgcc -m32 -march=athlon -O -fomit-frame-pointer2018111820181113
8718656optgcc -m32 -march=k6-2 -O2 -fomit-frame-pointer2018111820181113
8725486optgcc -m32 -O -fomit-frame-pointer2018111820181113
8745797optgcc -m32 -march=k6 -O2 -fomit-frame-pointer2018111820181113
8750381optgcc -m32 -march=native -mtune=native -O -fomit-frame-pointer2018111820181113
8763870optgcc -m32 -march=i386 -O3 -fomit-frame-pointer2018111820181113
8827552optgcc -m32 -march=k6-2 -O -fomit-frame-pointer2018111820181113
8832016optgcc -m32 -march=k6 -O -fomit-frame-pointer2018111820181113
8848425optgcc -m32 -march=i386 -O2 -fomit-frame-pointer2018111820181113
8850494optgcc -m32 -march=i486 -O3 -fomit-frame-pointer2018111820181113
8915040optgcc -m32 -march=k6-3 -O -fomit-frame-pointer2018111820181113
8925319optgcc -m32 -march=pentium3 -O -fomit-frame-pointer2018111820181113
8939780optgcc -m32 -march=i486 -O2 -fomit-frame-pointer2018111820181113
8958908optgcc -m32 -march=pentiumpro -O -fomit-frame-pointer2018111820181113
8972090optgcc -m32 -march=pentium-mmx -O -fomit-frame-pointer2018111820181113
8979115optgcc -m32 -march=pentium2 -O -fomit-frame-pointer2018111820181113
9007488optgcc -m32 -march=i386 -O -fomit-frame-pointer2018111820181113
9008210optgcc -m32 -march=pentium-m -O -fomit-frame-pointer2018111820181113
9025028optgcc -m32 -march=pentium -O -fomit-frame-pointer2018111820181113
9060552optgcc -m32 -march=i486 -O -fomit-frame-pointer2018111820181113
9335353optgcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer2018111820181113
9336526optgcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer2018111820181113
9337264optgcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer2018111820181113
9339260optgcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer2018111820181113
9343268optgcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer2018111820181113
9414831optgcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer2018111820181113
9497837optgcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2018111820181113
9547264optgcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2018111820181113
9573008optgcc -m32 -march=pentium3 -O3 -fomit-frame-pointer2018111820181113
9584959optgcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer2018111820181113
9590316optgcc -m32 -march=pentium2 -O3 -fomit-frame-pointer2018111820181113
9606562optgcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer2018111820181113
9623540optgcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer2018111820181113
9627172optgcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2018111820181113
9662345optgcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer2018111820181113
9683861optgcc -m32 -march=pentium2 -O2 -fomit-frame-pointer2018111820181113
9701607optgcc -m32 -march=pentium3 -O2 -fomit-frame-pointer2018111820181113
9706984optgcc -m32 -march=pentium -O3 -fomit-frame-pointer2018111820181113
9709543optgcc -m32 -march=pentium -O2 -fomit-frame-pointer2018111820181113
9711645optgcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2018111820181113
10615216optgcc -m32 -march=k8 -Os -fomit-frame-pointer2018111820181113
10709319optgcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer2018111820181113
10735994optgcc -m32 -march=barcelona -Os -fomit-frame-pointer2018111820181113
10873636optgcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer2018111820181113
10991520optgcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer2018111820181113

Test failure

Implementation: crypto_kem/ntskem13136/ref
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
error 111
crypto_kem_dec returns nonzero

Number of similar (compiler,implementation) pairs: 172, namely:
Compiler | Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer ref
gcc -m32 -O2 -fomit-frame-pointer ref
gcc -m32 -O3 -fomit-frame-pointer ref
gcc -m32 -O -fomit-frame-pointer ref
gcc -m32 -Os -fomit-frame-pointer ref
gcc -m32 -march=athlon -O2 -fomit-frame-pointer ref
gcc -m32 -march=athlon -O3 -fomit-frame-pointer ref
gcc -m32 -march=athlon -O -fomit-frame-pointer ref
gcc -m32 -march=athlon -Os -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer ref
gcc -m32 -march=core2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core2 -O -fomit-frame-pointer ref
gcc -m32 -march=core2 -Os -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer ref
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer ref
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer ref
gcc -m32 -march=corei7 -O -fomit-frame-pointer ref
gcc -m32 -march=corei7 -Os -fomit-frame-pointer ref
gcc -m32 -march=i386 -O2 -fomit-frame-pointer ref
gcc -m32 -march=i386 -O3 -fomit-frame-pointer ref
gcc -m32 -march=i386 -O -fomit-frame-pointer ref
gcc -m32 -march=i386 -Os -fomit-frame-pointer ref
gcc -m32 -march=i486 -O2 -fomit-frame-pointer ref
gcc -m32 -march=i486 -O3 -fomit-frame-pointer ref
gcc -m32 -march=i486 -O -fomit-frame-pointer ref
gcc -m32 -march=i486 -Os -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -O -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -O -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer ref
gcc -m32 -march=k6 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k6 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k6 -O -fomit-frame-pointer ref
gcc -m32 -march=k6 -Os -fomit-frame-pointer ref
gcc -m32 -march=k8 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k8 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k8 -O -fomit-frame-pointer ref
gcc -m32 -march=k8 -Os -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer ref
gcc -m32 -march=nocona -O2 -fomit-frame-pointer ref
gcc -m32 -march=nocona -O3 -fomit-frame-pointer ref
gcc -m32 -march=nocona -O -fomit-frame-pointer ref
gcc -m32 -march=nocona -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -O -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -O -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -O -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -O -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium -O -fomit-frame-pointer ref
gcc -m32 -march=pentium -Os -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer ref
gcc -m32 -march=prescott -O2 -fomit-frame-pointer ref
gcc -m32 -march=prescott -O3 -fomit-frame-pointer ref
gcc -m32 -march=prescott -O -fomit-frame-pointer ref
gcc -m32 -march=prescott -Os -fomit-frame-pointer ref

Test failure

Implementation: crypto_kem/ntskem13136/ref
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
error 111
crypto_kem_dec returns nonzero
error 111
crypto_kem_dec returns nonzero

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer ref
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer ref
gcc -m32 -march=barcelona -O -fomit-frame-pointer ref
gcc -m32 -march=barcelona -Os -fomit-frame-pointer ref

Compiler output

Implementation: crypto_kem/ntskem13136/sse2
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h:47:9: error: unknown type name '__m128i'
bitslice_bma_128.c: typedef __m128i vector;
bitslice_bma_128.c: ^~~~~~~
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:98:11: error: unknown type name '__m128i'
bitslice_bma_128.c: const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c: ^~~~~~~
bitslice_bma_128.c: bits.h:98:26: warning: implicit declaration of function '_mm_unpackhi_epi64' [-Wimplicit-function-declaration]
bitslice_bma_128.c: const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64' [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:18:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h: At top level:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:985:1: error: conflicting types for '_mm_unpackhi_epi64'
bitslice_bma_128.c: _mm_unpackhi_epi64 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 96, namely:
Compiler | Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer sse2
gcc -m32 -O2 -fomit-frame-pointer sse2
gcc -m32 -O3 -fomit-frame-pointer sse2
gcc -m32 -O -fomit-frame-pointer sse2
gcc -m32 -Os -fomit-frame-pointer sse2
gcc -m32 -march=athlon -O2 -fomit-frame-pointer sse2
gcc -m32 -march=athlon -O3 -fomit-frame-pointer sse2
gcc -m32 -march=athlon -O -fomit-frame-pointer sse2
gcc -m32 -march=athlon -Os -fomit-frame-pointer sse2
gcc -m32 -march=i386 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=i386 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=i386 -O -fomit-frame-pointer sse2
gcc -m32 -march=i386 -Os -fomit-frame-pointer sse2
gcc -m32 -march=i486 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=i486 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=i486 -O -fomit-frame-pointer sse2
gcc -m32 -march=i486 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -O -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -O -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k6 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k6 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k6 -O -fomit-frame-pointer sse2
gcc -m32 -march=k6 -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem13136/avx2
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: bitslice_bma_128.c:44:1: warning: SSE vector return without SSE enabled changes the ABI [-Wpsabi]
bitslice_bma_128.c: {
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:53:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:18:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:1290:1: error: inlining failed in call to always_inline '_mm_xor_si128': target specific option mismatch
bitslice_bma_128.c: _mm_xor_si128 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:45:12: note: called from here
bitslice_bma_128.c: return _mm_xor_si128(b,
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_and_si128(_mm_set1_epi64x(-ctl),
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 88, namely:
Compiler Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer avx2
gcc -m32 -O2 -fomit-frame-pointer avx2
gcc -m32 -O3 -fomit-frame-pointer avx2
gcc -m32 -O -fomit-frame-pointer avx2
gcc -m32 -Os -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O2 -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O3 -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O -fomit-frame-pointer avx2
gcc -m32 -march=athlon -Os -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O -fomit-frame-pointer avx2
gcc -m32 -march=i386 -Os -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O -fomit-frame-pointer avx2
gcc -m32 -march=i486 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem13136/avx2
Compiler: gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:26,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bit_reverse':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: return _mm_shuffle_epi8(x, _mm_set_epi8(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15));
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:26,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 44, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O -fomit-frame-pointer avx2
gcc -m32 -march=k8 -Os -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O -fomit-frame-pointer avx2
gcc -m32 -march=nocona -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O2 -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O3 -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O -fomit-frame-pointer avx2
gcc -m32 -march=prescott -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem13136/sse2
Compiler: gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:28,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bit_reverse':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: return _mm_shuffle_epi8(x, _mm_set_epi8(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15));
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:28,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 44, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer sse2
gcc -m32 -march=k8 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k8 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k8 -O -fomit-frame-pointer sse2
gcc -m32 -march=k8 -Os -fomit-frame-pointer sse2
gcc -m32 -march=nocona -O2 -fomit-frame-pointer sse2
gcc -m32 -march=nocona -O3 -fomit-frame-pointer sse2
gcc -m32 -march=nocona -O -fomit-frame-pointer sse2
gcc -m32 -march=nocona -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer sse2
gcc -m32 -march=prescott -O2 -fomit-frame-pointer sse2
gcc -m32 -march=prescott -O3 -fomit-frame-pointer sse2
gcc -m32 -march=prescott -O -fomit-frame-pointer sse2
gcc -m32 -march=prescott -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem13136/avx2
Compiler: gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:53:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:18:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:1290:1: error: inlining failed in call to always_inline '_mm_xor_si128': target specific option mismatch
bitslice_bma_128.c: _mm_xor_si128 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:45:12: note: called from here
bitslice_bma_128.c: return _mm_xor_si128(b,
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_and_si128(_mm_set1_epi64x(-ctl),
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_xor_si128(a, b)));
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 8, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem13136/avx2
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:26,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bit_reverse':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: return _mm_shuffle_epi8(x, _mm_set_epi8(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15));
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:26,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: ...
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:26,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bit_reverse':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: return _mm_shuffle_epi8(x, _mm_set_epi8(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15));
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:26,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -O -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem13136/sse2
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:28,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bit_reverse':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: return _mm_shuffle_epi8(x, _mm_set_epi8(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15));
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:28,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: ...
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:28,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bit_reverse':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: return _mm_shuffle_epi8(x, _mm_set_epi8(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15));
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:28,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer sse2
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer sse2
gcc -m32 -march=barcelona -O -fomit-frame-pointer sse2
gcc -m32 -march=barcelona -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem13136/avx2
Compiler: gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:323:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:323:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:301: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 18, namely:
Compiler Implementations
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem13136/sse2
Compiler: gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:323:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:323:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:301: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 24, namely:
Compiler Implementations
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer sse2
gcc -m32 -march=core2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -O -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -O -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem13136/avx2
Compiler: gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:323:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:301: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 6, namely:
Compiler Implementations
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem13136/sse2
Compiler: gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:323:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:301: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 8, namely:
Compiler Implementations
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=core2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -Os -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem13136/avx2
Compiler: gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:118:22: warning: implicit declaration of function '_mm256_extract_epi64'; did you mean '_mm256_extract_epi8'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return (int32_t)(_mm256_extract_epi64(popcnt, 3) +
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm256_extract_epi8
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:53:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:323:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:323:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:301: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 6, namely:
Compiler Implementations
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem13136/avx2
Compiler: gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:118:22: warning: implicit declaration of function '_mm256_extract_epi64'; did you mean '_mm256_extract_epi8'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return (int32_t)(_mm256_extract_epi64(popcnt, 3) +
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm256_extract_epi8
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:53:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:323:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:301: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 2, namely:
Compiler Implementations
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer avx2