Implementation notes: x86, kizomba, crypto_kem/ntskem1380

Computer: kizomba
Architecture: x86
CPU ID: GenuineIntel-000906e9-bfebfbff
SUPERCOP version: 20181216
Operation: crypto_kem
Primitive: ntskem1380
Time | Implementation | Compiler | Benchmark date | SUPERCOP version
2565784optgcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer2018111820181113
2617190optgcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer2018111820181113
2620663optgcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer2018111820181113
2634744optgcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer2018111820181113
2651054optgcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer2018111820181113
2659186optgcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer2018111820181113
2665104optgcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer2018111820181113
2668954optgcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer2018111820181113
2675951optgcc -m32 -march=corei7 -O3 -fomit-frame-pointer2018111820181113
2704589optgcc -m32 -march=core2 -O3 -fomit-frame-pointer2018111820181113
2715415optgcc -m32 -march=core2 -O2 -fomit-frame-pointer2018111820181113
2715470optgcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer2018111820181113
2724845optgcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer2018111820181113
2738268optgcc -m32 -march=corei7 -O2 -fomit-frame-pointer2018111820181113
2755420optgcc -m32 -march=core-avx2 -Os -fomit-frame-pointer2018111820181113
2768821optgcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer2018111820181113
2773228optgcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer2018111820181113
2783103optgcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer2018111820181113
2785988optgcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer2018111820181113
2829818optgcc -m32 -march=core-avx-i -Os -fomit-frame-pointer2018111820181113
2832137optgcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer2018111820181113
2833020optgcc -m32 -march=nocona -Os -fomit-frame-pointer2018111820181113
2837440optgcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer2018111820181113
2841879optgcc -m32 -march=pentium-m -O3 -fomit-frame-pointer2018111820181113
2843494optgcc -m32 -march=prescott -O3 -fomit-frame-pointer2018111820181113
2848950optgcc -m32 -march=prescott -Os -fomit-frame-pointer2018111820181113
2849970optgcc -m32 -march=corei7-avx -Os -fomit-frame-pointer2018111820181113
2851617optgcc -m32 -march=pentium4 -Os -fomit-frame-pointer2018111820181113
2870041optgcc -m32 -march=core2 -Os -fomit-frame-pointer2018111820181113
2881163optgcc -m32 -march=pentium4 -O2 -fomit-frame-pointer2018111820181113
2882377optgcc -m32 -march=nocona -O3 -fomit-frame-pointer2018111820181113
2885244optgcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer2018111820181113
2885938optgcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer2018111820181113
2886433optgcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer2018111820181113
2888268optgcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer2018111820181113
2891402optgcc -m32 -march=pentium4 -O3 -fomit-frame-pointer2018111820181113
2894383optgcc -m32 -march=pentium-m -O2 -fomit-frame-pointer2018111820181113
2896243optgcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer2018111820181113
2897333optgcc -m32 -march=pentium-m -Os -fomit-frame-pointer2018111820181113
2900570optgcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer2018111820181113
2909468optgcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer2018111820181113
2923373optgcc -m32 -march=corei7 -Os -fomit-frame-pointer2018111820181113
2926587optgcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer2018111820181113
3039171optgcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer2018111820181113
3040180optgcc -m32 -march=nocona -O2 -fomit-frame-pointer2018111820181113
3042554optgcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer2018111820181113
3063784optgcc -m32 -march=prescott -O2 -fomit-frame-pointer2018111820181113
3379046optgcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer2018111820181113
3388518optgcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer2018111820181113
3424549optgcc -m32 -march=k8 -O3 -fomit-frame-pointer2018111820181113
3443863optgcc -m32 -march=barcelona -O3 -fomit-frame-pointer2018111820181113
3528399optgcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer2018111820181113
3563490optgcc -m32 -march=k8 -O2 -fomit-frame-pointer2018111820181113
3733867optgcc -m32 -march=pentium -Os -fomit-frame-pointer2018111820181113
3753109optgcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer2018111820181113
3769567optgcc -m32 -march=core-avx2 -O -fomit-frame-pointer2018111820181113
3770542optgcc -m32 -march=i386 -Os -fomit-frame-pointer2018111820181113
3772589optgcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer2018111820181113
3773177optgcc -funroll-loops -m32 -O2 -fomit-frame-pointer2018111820181113
3774748optgcc -m32 -march=i486 -Os -fomit-frame-pointer2018111820181113
3776827optgcc -m32 -O3 -fomit-frame-pointer2018111820181113
3780527optgcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer2018111820181113
3781443optgcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer2018111820181113
3783437optgcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer2018111820181113
3788014optgcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer2018111820181113
3788444optgcc -funroll-loops -m32 -O3 -fomit-frame-pointer2018111820181113
3789563optgcc -m32 -O2 -fomit-frame-pointer2018111820181113
3790008optgcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer2018111820181113
3790040optgcc -m32 -march=pentium2 -Os -fomit-frame-pointer2018111820181113
3790950optgcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer2018111820181113
3792040optgcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer2018111820181113
3792639optgcc -m32 -march=athlon -O3 -fomit-frame-pointer2018111820181113
3793292optgcc -m32 -march=core-avx-i -O -fomit-frame-pointer2018111820181113
3796165optgcc -funroll-loops -m32 -O -fomit-frame-pointer2018111820181113
3798122optgcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer2018111820181113
3798492optgcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer2018111820181113
3800595optgcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer2018111820181113
3800929optgcc -m32 -march=pentiumpro -Os -fomit-frame-pointer2018111820181113
3805613optgcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer2018111820181113
3806438optgcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer2018111820181113
3809082optgcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer2018111820181113
3809792optgcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer2018111820181113
3811711optgcc -m32 -march=native -mtune=native -O -fomit-frame-pointer2018111820181113
3814601optgcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer2018111820181113
3815623optgcc -funroll-loops -m32 -Os -fomit-frame-pointer2018111820181113
3817689optgcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer2018111820181113
3821050optgcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer2018111820181113
3821625optgcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer2018111820181113
3821677optgcc -m32 -march=athlon -O2 -fomit-frame-pointer2018111820181113
3821738optgcc -m32 -march=pentium3 -Os -fomit-frame-pointer2018111820181113
3824234optgcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer2018111820181113
3824444optgcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer2018111820181113
3825220optgcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer2018111820181113
3827815optgcc -m32 -march=corei7-avx -O -fomit-frame-pointer2018111820181113
3830869optgcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer2018111820181113
3836447optgcc -m32 -march=corei7 -O -fomit-frame-pointer2018111820181113
3839204optgcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer2018111820181113
3842395optgcc -m32 -march=core2 -O -fomit-frame-pointer2018111820181113
3846071optgcc -m32 -march=k6-3 -Os -fomit-frame-pointer2018111820181113
3847371optgcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer2018111820181113
3851588optgcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer2018111820181113
3852133optgcc -m32 -Os -fomit-frame-pointer2018111820181113
3855895optgcc -m32 -march=pentium4 -O -fomit-frame-pointer2018111820181113
3861167optgcc -m32 -march=k8 -O -fomit-frame-pointer2018111820181113
3861218optgcc -m32 -march=k6 -Os -fomit-frame-pointer2018111820181113
3865780optgcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer2018111820181113
3865910optgcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer2018111820181113
3870732optgcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer2018111820181113
3873000optgcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer2018111820181113
3873861optgcc -m32 -march=k6-3 -O3 -fomit-frame-pointer2018111820181113
3875328optgcc -m32 -march=k6-2 -O3 -fomit-frame-pointer2018111820181113
3877307optgcc -m32 -march=barcelona -O -fomit-frame-pointer2018111820181113
3879270optgcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer2018111820181113
3880527optgcc -m32 -march=k6-2 -Os -fomit-frame-pointer2018111820181113
3881006optgcc -m32 -march=prescott -O -fomit-frame-pointer2018111820181113
3884230optgcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer2018111820181113
3889276optgcc -m32 -march=athlon -Os -fomit-frame-pointer2018111820181113
3892708optgcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer2018111820181113
3896972optgcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer2018111820181113
3905930optgcc -m32 -march=k6 -O3 -fomit-frame-pointer2018111820181113
3906103optgcc -m32 -O -fomit-frame-pointer2018111820181113
3916172optgcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer2018111820181113
3917943optgcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer2018111820181113
3926226optgcc -m32 -march=nocona -O -fomit-frame-pointer2018111820181113
3928587optgcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer2018111820181113
3930218optgcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer2018111820181113
3932521optgcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer2018111820181113
3935474optgcc -m32 -march=athlon -O -fomit-frame-pointer2018111820181113
3935887optgcc -m32 -march=k6 -O2 -fomit-frame-pointer2018111820181113
3935955optgcc -m32 -march=k6-2 -O2 -fomit-frame-pointer2018111820181113
3937083optgcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer2018111820181113
3943982optgcc -m32 -march=k6-3 -O2 -fomit-frame-pointer2018111820181113
3944582optgcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer2018111820181113
3945975optgcc -m32 -march=i486 -O3 -fomit-frame-pointer2018111820181113
3949780optgcc -m32 -march=i386 -O2 -fomit-frame-pointer2018111820181113
3952371optgcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer2018111820181113
3957530optgcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer2018111820181113
3968012optgcc -m32 -march=i386 -O3 -fomit-frame-pointer2018111820181113
3993206optgcc -m32 -march=pentium-mmx -O -fomit-frame-pointer2018111820181113
3996558optgcc -m32 -march=k6-3 -O -fomit-frame-pointer2018111820181113
3997524optgcc -m32 -march=k6 -O -fomit-frame-pointer2018111820181113
4001992optgcc -m32 -march=pentium -O -fomit-frame-pointer2018111820181113
4003859optgcc -m32 -march=k6-2 -O -fomit-frame-pointer2018111820181113
4030197optgcc -m32 -march=pentium2 -O -fomit-frame-pointer2018111820181113
4031109optgcc -m32 -march=pentium3 -O -fomit-frame-pointer2018111820181113
4036522optgcc -m32 -march=pentium-m -O -fomit-frame-pointer2018111820181113
4042219optgcc -m32 -march=pentiumpro -O -fomit-frame-pointer2018111820181113
4044774optgcc -m32 -march=i486 -O2 -fomit-frame-pointer2018111820181113
4052966optgcc -m32 -march=barcelona -O2 -fomit-frame-pointer2018111820181113
4056490optgcc -m32 -march=i386 -O -fomit-frame-pointer2018111820181113
4066556optgcc -m32 -march=i486 -O -fomit-frame-pointer2018111820181113
4243266optgcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer2018111820181113
4244427optgcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer2018111820181113
4248554optgcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer2018111820181113
4251225optgcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2018111820181113
4255258optgcc -m32 -march=pentium -O3 -fomit-frame-pointer2018111820181113
4262907optgcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer2018111820181113
4264865optgcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2018111820181113
4266762optgcc -m32 -march=pentium3 -O3 -fomit-frame-pointer2018111820181113
4275609optgcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer2018111820181113
4277294optgcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer2018111820181113
4287809optgcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer2018111820181113
4290280optgcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer2018111820181113
4328438optgcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2018111820181113
4334869optgcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer2018111820181113
4339397optgcc -m32 -march=pentium2 -O3 -fomit-frame-pointer2018111820181113
4352189optgcc -m32 -march=pentium -O2 -fomit-frame-pointer2018111820181113
4382262optgcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2018111820181113
4383026optgcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer2018111820181113
4393512optgcc -m32 -march=pentium3 -O2 -fomit-frame-pointer2018111820181113
4414355optgcc -m32 -march=pentium2 -O2 -fomit-frame-pointer2018111820181113
4951744optgcc -m32 -march=k8 -Os -fomit-frame-pointer2018111820181113
4990434optgcc -m32 -march=barcelona -Os -fomit-frame-pointer2018111820181113
5018105optgcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer2018111820181113
5018331optgcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer2018111820181113
5051131optgcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer2018111820181113

Test failure

Implementation: crypto_kem/ntskem1380/ref
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
error 111
crypto_kem_dec returns nonzero

Number of similar (compiler,implementation) pairs: 172, namely:
Compiler | Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer ref
gcc -m32 -O2 -fomit-frame-pointer ref
gcc -m32 -O3 -fomit-frame-pointer ref
gcc -m32 -O -fomit-frame-pointer ref
gcc -m32 -Os -fomit-frame-pointer ref
gcc -m32 -march=athlon -O2 -fomit-frame-pointer ref
gcc -m32 -march=athlon -O3 -fomit-frame-pointer ref
gcc -m32 -march=athlon -O -fomit-frame-pointer ref
gcc -m32 -march=athlon -Os -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer ref
gcc -m32 -march=core2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core2 -O -fomit-frame-pointer ref
gcc -m32 -march=core2 -Os -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer ref
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer ref
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer ref
gcc -m32 -march=corei7 -O -fomit-frame-pointer ref
gcc -m32 -march=corei7 -Os -fomit-frame-pointer ref
gcc -m32 -march=i386 -O2 -fomit-frame-pointer ref
gcc -m32 -march=i386 -O3 -fomit-frame-pointer ref
gcc -m32 -march=i386 -O -fomit-frame-pointer ref
gcc -m32 -march=i386 -Os -fomit-frame-pointer ref
gcc -m32 -march=i486 -O2 -fomit-frame-pointer ref
gcc -m32 -march=i486 -O3 -fomit-frame-pointer ref
gcc -m32 -march=i486 -O -fomit-frame-pointer ref
gcc -m32 -march=i486 -Os -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -O -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -O -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer ref
gcc -m32 -march=k6 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k6 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k6 -O -fomit-frame-pointer ref
gcc -m32 -march=k6 -Os -fomit-frame-pointer ref
gcc -m32 -march=k8 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k8 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k8 -O -fomit-frame-pointer ref
gcc -m32 -march=k8 -Os -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer ref
gcc -m32 -march=nocona -O2 -fomit-frame-pointer ref
gcc -m32 -march=nocona -O3 -fomit-frame-pointer ref
gcc -m32 -march=nocona -O -fomit-frame-pointer ref
gcc -m32 -march=nocona -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -O -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -O -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -O -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -O -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium -O -fomit-frame-pointer ref
gcc -m32 -march=pentium -Os -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer ref
gcc -m32 -march=prescott -O2 -fomit-frame-pointer ref
gcc -m32 -march=prescott -O3 -fomit-frame-pointer ref
gcc -m32 -march=prescott -O -fomit-frame-pointer ref
gcc -m32 -march=prescott -Os -fomit-frame-pointer ref

Test failure

Implementation: crypto_kem/ntskem1380/ref
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
error 111
crypto_kem_dec returns nonzero
error 111
crypto_kem_dec returns nonzero

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer ref
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer ref
gcc -m32 -march=barcelona -O -fomit-frame-pointer ref
gcc -m32 -march=barcelona -Os -fomit-frame-pointer ref

Compiler output

Implementation: crypto_kem/ntskem1380/sse2
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h:47:9: error: unknown type name '__m128i'
bitslice_bma_128.c: typedef __m128i vector;
bitslice_bma_128.c: ^~~~~~~
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:98:11: error: unknown type name '__m128i'
bitslice_bma_128.c: const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c: ^~~~~~~
bitslice_bma_128.c: bits.h:98:26: warning: implicit declaration of function '_mm_unpackhi_epi64' [-Wimplicit-function-declaration]
bitslice_bma_128.c: const __m128i a_hi = _mm_unpackhi_epi64(a, a);
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64' [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:18:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h: At top level:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:985:1: error: conflicting types for '_mm_unpackhi_epi64'
bitslice_bma_128.c: _mm_unpackhi_epi64 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 96, namely:
Compiler | Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer sse2
gcc -m32 -O2 -fomit-frame-pointer sse2
gcc -m32 -O3 -fomit-frame-pointer sse2
gcc -m32 -O -fomit-frame-pointer sse2
gcc -m32 -Os -fomit-frame-pointer sse2
gcc -m32 -march=athlon -O2 -fomit-frame-pointer sse2
gcc -m32 -march=athlon -O3 -fomit-frame-pointer sse2
gcc -m32 -march=athlon -O -fomit-frame-pointer sse2
gcc -m32 -march=athlon -Os -fomit-frame-pointer sse2
gcc -m32 -march=i386 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=i386 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=i386 -O -fomit-frame-pointer sse2
gcc -m32 -march=i386 -Os -fomit-frame-pointer sse2
gcc -m32 -march=i486 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=i486 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=i486 -O -fomit-frame-pointer sse2
gcc -m32 -march=i486 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -O -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -O -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k6 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k6 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k6 -O -fomit-frame-pointer sse2
gcc -m32 -march=k6 -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1380/avx2
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: bitslice_bma_128.c:44:1: warning: SSE vector return without SSE enabled changes the ABI [-Wpsabi]
bitslice_bma_128.c: {
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:53:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:1290:1: error: inlining failed in call to always_inline '_mm_xor_si128': target specific option mismatch
bitslice_bma_128.c: _mm_xor_si128 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:45:12: note: called from here
bitslice_bma_128.c: return _mm_xor_si128(b,
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_and_si128(_mm_set1_epi64x(-ctl),
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 88, namely:
Compiler Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer avx2
gcc -m32 -O2 -fomit-frame-pointer avx2
gcc -m32 -O3 -fomit-frame-pointer avx2
gcc -m32 -O -fomit-frame-pointer avx2
gcc -m32 -Os -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O2 -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O3 -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O -fomit-frame-pointer avx2
gcc -m32 -march=athlon -Os -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O -fomit-frame-pointer avx2
gcc -m32 -march=i386 -Os -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O -fomit-frame-pointer avx2
gcc -m32 -march=i486 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1380/sse2
Compiler: gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:28,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bit_reverse':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: return _mm_shuffle_epi8(x, _mm_set_epi8(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15));
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:28,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 44, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer sse2
gcc -m32 -march=k8 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k8 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k8 -O -fomit-frame-pointer sse2
gcc -m32 -march=k8 -Os -fomit-frame-pointer sse2
gcc -m32 -march=nocona -O2 -fomit-frame-pointer sse2
gcc -m32 -march=nocona -O3 -fomit-frame-pointer sse2
gcc -m32 -march=nocona -O -fomit-frame-pointer sse2
gcc -m32 -march=nocona -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer sse2
gcc -m32 -march=prescott -O2 -fomit-frame-pointer sse2
gcc -m32 -march=prescott -O3 -fomit-frame-pointer sse2
gcc -m32 -march=prescott -O -fomit-frame-pointer sse2
gcc -m32 -march=prescott -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1380/avx2
Compiler: gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bit_reverse':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: return _mm_shuffle_epi8(x, _mm_set_epi8(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15));
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 44, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O -fomit-frame-pointer avx2
gcc -m32 -march=k8 -Os -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O -fomit-frame-pointer avx2
gcc -m32 -march=nocona -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O2 -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O3 -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O -fomit-frame-pointer avx2
gcc -m32 -march=prescott -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1380/avx2
Compiler: gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:53:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:1290:1: error: inlining failed in call to always_inline '_mm_xor_si128': target specific option mismatch
bitslice_bma_128.c: _mm_xor_si128 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:45:12: note: called from here
bitslice_bma_128.c: return _mm_xor_si128(b,
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_and_si128(_mm_set1_epi64x(-ctl),
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_xor_si128(a, b)));
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 8, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1380/sse2
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:28,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bit_reverse':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: return _mm_shuffle_epi8(x, _mm_set_epi8(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15));
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:28,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: ...
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:28,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bit_reverse':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: return _mm_shuffle_epi8(x, _mm_set_epi8(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15));
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bits.h:28,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer sse2
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer sse2
gcc -m32 -march=barcelona -O -fomit-frame-pointer sse2
gcc -m32 -march=barcelona -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1380/avx2
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bit_reverse':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: return _mm_shuffle_epi8(x, _mm_set_epi8(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15));
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: ...
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bit_reverse':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: return _mm_shuffle_epi8(x, _mm_set_epi8(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15));
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:35:0,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/tmmintrin.h:136:1: error: inlining failed in call to always_inline '_mm_shuffle_epi8': target specific option mismatch
bitslice_bma_128.c: _mm_shuffle_epi8 (__m128i __X, __m128i __Y)
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:92:12: note: called from here
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -O -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1380/sse2
Compiler: gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:210:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:210:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:205: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 16, namely:
Compiler Implementations
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer sse2
gcc -m32 -march=core2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -O -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -O -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1380/avx2
Compiler: gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:210:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:210:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:205: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 12, namely:
Compiler Implementations
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1380/sse2
Compiler: gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:17:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:210:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:205: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 16, namely:
Compiler Implementations
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=core2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -Os -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1380/avx2
Compiler: gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:210:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:205: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 12, namely:
Compiler Implementations
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1380/avx2
Compiler: gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:118:22: warning: implicit declaration of function '_mm256_extract_epi64'; did you mean '_mm256_extract_epi8'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return (int32_t)(_mm256_extract_epi64(popcnt, 3) +
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm256_extract_epi8
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:53:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:210:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:210:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:205: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1380/avx2
Compiler: gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:118:22: warning: implicit declaration of function '_mm256_extract_epi64'; did you mean '_mm256_extract_epi8'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return (int32_t)(_mm256_extract_epi64(popcnt, 3) +
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm256_extract_epi8
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:53:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:210:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:205: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer avx2