Implementation notes: x86, kizomba, crypto_kem/ntskem1264

Computer: kizomba
Architecture: x86
CPU ID: GenuineIntel-000906e9-bfebfbff
SUPERCOP version: 20181216
Operation: crypto_kem
Primitive: ntskem1264
Time | Implementation | Compiler | Benchmark date | SUPERCOP version
1530666optgcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer2018111820181113
1531442optgcc -m32 -march=core-avx2 -Os -fomit-frame-pointer2018111820181113
1568287optgcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer2018111820181113
1575193optgcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer2018111820181113
1577135optgcc -m32 -march=pentium4 -O3 -fomit-frame-pointer2018111820181113
1628427optgcc -m32 -march=corei7-avx -Os -fomit-frame-pointer2018111820181113
1629232optgcc -m32 -march=corei7 -O3 -fomit-frame-pointer2018111820181113
1629266optgcc -m32 -march=core-avx-i -Os -fomit-frame-pointer2018111820181113
1631080optgcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer2018111820181113
1631508optgcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer2018111820181113
1631855optgcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer2018111820181113
1637927optgcc -m32 -march=core2 -O3 -fomit-frame-pointer2018111820181113
1645113optgcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer2018111820181113
1648970optgcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer2018111820181113
1650339optgcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer2018111820181113
1651605optgcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer2018111820181113
1651776optgcc -m32 -march=pentium4 -Os -fomit-frame-pointer2018111820181113
1655474optgcc -m32 -march=core2 -O2 -fomit-frame-pointer2018111820181113
1658788optgcc -m32 -march=prescott -Os -fomit-frame-pointer2018111820181113
1662686optgcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer2018111820181113
1663328optgcc -m32 -march=nocona -Os -fomit-frame-pointer2018111820181113
1666724optgcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer2018111820181113
1669250optgcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer2018111820181113
1672367optgcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer2018111820181113
1673149optgcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer2018111820181113
1674162optgcc -m32 -march=corei7 -O2 -fomit-frame-pointer2018111820181113
1676579optgcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer2018111820181113
1676754optgcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer2018111820181113
1679540optgcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer2018111820181113
1682518optgcc -m32 -march=prescott -O3 -fomit-frame-pointer2018111820181113
1683353optgcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer2018111820181113
1684998optgcc -m32 -march=pentium-m -O3 -fomit-frame-pointer2018111820181113
1690300optgcc -m32 -march=nocona -O3 -fomit-frame-pointer2018111820181113
1690849optgcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer2018111820181113
1694028optgcc -m32 -march=pentium4 -O2 -fomit-frame-pointer2018111820181113
1710665optgcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer2018111820181113
1718135optgcc -m32 -march=pentium-m -O2 -fomit-frame-pointer2018111820181113
1740357optgcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer2018111820181113
1742857optgcc -m32 -march=prescott -O2 -fomit-frame-pointer2018111820181113
1748492optgcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer2018111820181113
1753726optgcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer2018111820181113
1754442optgcc -m32 -march=nocona -O2 -fomit-frame-pointer2018111820181113
1782756optgcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer2018111820181113
1785649optgcc -m32 -march=corei7 -Os -fomit-frame-pointer2018111820181113
1787152optgcc -m32 -march=pentium-m -Os -fomit-frame-pointer2018111820181113
1797653optgcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer2018111820181113
1800362optgcc -m32 -march=core2 -Os -fomit-frame-pointer2018111820181113
1954640optgcc -m32 -march=core-avx2 -O -fomit-frame-pointer2018111820181113
1956822optgcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer2018111820181113
1957853optgcc -m32 -march=native -mtune=native -O -fomit-frame-pointer2018111820181113
1959145optgcc -m32 -O3 -fomit-frame-pointer2018111820181113
1960525optgcc -m32 -march=athlon -O3 -fomit-frame-pointer2018111820181113
1966385optgcc -funroll-loops -m32 -O3 -fomit-frame-pointer2018111820181113
1968262optgcc -m32 -O2 -fomit-frame-pointer2018111820181113
1968915optgcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer2018111820181113
1970853optgcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer2018111820181113
1972873optgcc -m32 -march=athlon -O2 -fomit-frame-pointer2018111820181113
1974112optgcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer2018111820181113
1974817optgcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer2018111820181113
1976928optgcc -funroll-loops -m32 -O2 -fomit-frame-pointer2018111820181113
1978662optgcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer2018111820181113
1980032optgcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer2018111820181113
1980306optgcc -m32 -march=pentium -Os -fomit-frame-pointer2018111820181113
1981652optgcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer2018111820181113
1981733optgcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer2018111820181113
1982169optgcc -funroll-loops -m32 -O -fomit-frame-pointer2018111820181113
1983060optgcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer2018111820181113
1984339optgcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer2018111820181113
1985291optgcc -m32 -march=barcelona -O -fomit-frame-pointer2018111820181113
1985594optgcc -m32 -march=k8 -O -fomit-frame-pointer2018111820181113
1987313optgcc -m32 -Os -fomit-frame-pointer2018111820181113
1990020optgcc -m32 -march=pentium3 -Os -fomit-frame-pointer2018111820181113
1990437optgcc -m32 -march=pentiumpro -Os -fomit-frame-pointer2018111820181113
1990613optgcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer2018111820181113
1991238optgcc -m32 -march=athlon -Os -fomit-frame-pointer2018111820181113
1991698optgcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer2018111820181113
1992063optgcc -m32 -march=pentium2 -Os -fomit-frame-pointer2018111820181113
1992085optgcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer2018111820181113
1994448optgcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer2018111820181113
1995566optgcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer2018111820181113
1996155optgcc -funroll-loops -m32 -Os -fomit-frame-pointer2018111820181113
2000420optgcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer2018111820181113
2000539optgcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer2018111820181113
2002292optgcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer2018111820181113
2002732optgcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer2018111820181113
2002913optgcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer2018111820181113
2004252optgcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer2018111820181113
2004994optgcc -m32 -march=nocona -O -fomit-frame-pointer2018111820181113
2005435optgcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer2018111820181113
2005899optgcc -m32 -march=prescott -O -fomit-frame-pointer2018111820181113
2010345optgcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer2018111820181113
2010591optgcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer2018111820181113
2010887optgcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer2018111820181113
2011621optgcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer2018111820181113
2012494optgcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer2018111820181113
2015522optgcc -m32 -march=i486 -Os -fomit-frame-pointer2018111820181113
2016496optgcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer2018111820181113
2016635optgcc -m32 -march=i386 -Os -fomit-frame-pointer2018111820181113
2021365optgcc -m32 -march=k6-2 -O3 -fomit-frame-pointer2018111820181113
2021966optgcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer2018111820181113
2022153optgcc -m32 -march=k6-3 -O3 -fomit-frame-pointer2018111820181113
2024005optgcc -m32 -march=k6 -Os -fomit-frame-pointer2018111820181113
2026609optgcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer2018111820181113
2026665optgcc -m32 -march=k6-3 -Os -fomit-frame-pointer2018111820181113
2032238optgcc -m32 -march=k6-2 -Os -fomit-frame-pointer2018111820181113
2032777optgcc -m32 -march=k6-2 -O2 -fomit-frame-pointer2018111820181113
2033627optgcc -m32 -march=k6 -O3 -fomit-frame-pointer2018111820181113
2035357optgcc -m32 -march=athlon -O -fomit-frame-pointer2018111820181113
2036127optgcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer2018111820181113
2039548optgcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer2018111820181113
2040617optgcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer2018111820181113
2043594optgcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer2018111820181113
2043645optgcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer2018111820181113
2050296optgcc -m32 -march=k6-3 -O2 -fomit-frame-pointer2018111820181113
2052782optgcc -m32 -march=i486 -O3 -fomit-frame-pointer2018111820181113
2053665optgcc -m32 -march=k6 -O2 -fomit-frame-pointer2018111820181113
2053859optgcc -m32 -march=i386 -O2 -fomit-frame-pointer2018111820181113
2055988optgcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer2018111820181113
2056968optgcc -m32 -march=core-avx-i -O -fomit-frame-pointer2018111820181113
2057035optgcc -m32 -march=core2 -O -fomit-frame-pointer2018111820181113
2057166optgcc -m32 -march=pentium4 -O -fomit-frame-pointer2018111820181113
2057720optgcc -m32 -march=corei7 -O -fomit-frame-pointer2018111820181113
2058152optgcc -m32 -march=i386 -O3 -fomit-frame-pointer2018111820181113
2059812optgcc -m32 -march=corei7-avx -O -fomit-frame-pointer2018111820181113
2060722optgcc -m32 -march=i486 -O -fomit-frame-pointer2018111820181113
2061257optgcc -m32 -march=k6-2 -O -fomit-frame-pointer2018111820181113
2061282optgcc -m32 -march=k6-3 -O -fomit-frame-pointer2018111820181113
2061420optgcc -m32 -march=k6 -O -fomit-frame-pointer2018111820181113
2064938optgcc -m32 -O -fomit-frame-pointer2018111820181113
2064970optgcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer2018111820181113
2068641optgcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer2018111820181113
2070387optgcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer2018111820181113
2071799optgcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer2018111820181113
2074137optgcc -m32 -march=pentiumpro -O -fomit-frame-pointer2018111820181113
2074371optgcc -m32 -march=pentium3 -O -fomit-frame-pointer2018111820181113
2081222optgcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer2018111820181113
2082075optgcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer2018111820181113
2082935optgcc -m32 -march=pentium2 -O -fomit-frame-pointer2018111820181113
2100895optgcc -m32 -march=i486 -O2 -fomit-frame-pointer2018111820181113
2106796optgcc -m32 -march=pentium-m -O -fomit-frame-pointer2018111820181113
2114738optgcc -m32 -march=pentium-mmx -O -fomit-frame-pointer2018111820181113
2117274optgcc -m32 -march=pentium -O -fomit-frame-pointer2018111820181113
2119871optgcc -m32 -march=i386 -O -fomit-frame-pointer2018111820181113
2122970optgcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer2018111820181113
2130502optgcc -m32 -march=k8 -O3 -fomit-frame-pointer2018111820181113
2150148optgcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer2018111820181113
2153706optgcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer2018111820181113
2154077optgcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer2018111820181113
2182678optgcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer2018111820181113
2182929optgcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer2018111820181113
2186646optgcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer2018111820181113
2191222optgcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer2018111820181113
2194173optgcc -m32 -march=barcelona -O3 -fomit-frame-pointer2018111820181113
2194428optgcc -m32 -march=pentium3 -O3 -fomit-frame-pointer2018111820181113
2207097optgcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer2018111820181113
2212339optgcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer2018111820181113
2223332optgcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2018111820181113
2232946optgcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer2018111820181113
2232974optgcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer2018111820181113
2236552optgcc -m32 -march=pentium3 -O2 -fomit-frame-pointer2018111820181113
2236976optgcc -m32 -march=k8 -O2 -fomit-frame-pointer2018111820181113
2238357optgcc -m32 -march=pentium2 -O2 -fomit-frame-pointer2018111820181113
2249415optgcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer2018111820181113
2251982optgcc -m32 -march=pentium -O3 -fomit-frame-pointer2018111820181113
2253994optgcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2018111820181113
2264256optgcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2018111820181113
2267621optgcc -m32 -march=pentium2 -O3 -fomit-frame-pointer2018111820181113
2271742optgcc -m32 -march=pentium -O2 -fomit-frame-pointer2018111820181113
2278183optgcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2018111820181113
2433810optgcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer2018111820181113
2498100optgcc -m32 -march=barcelona -O2 -fomit-frame-pointer2018111820181113
2917144optgcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer2018111820181113
2959952optgcc -m32 -march=k8 -Os -fomit-frame-pointer2018111820181113
2977728optgcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer2018111820181113
3025764optgcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer2018111820181113
3036738optgcc -m32 -march=barcelona -Os -fomit-frame-pointer2018111820181113

Test failure

Implementation: crypto_kem/ntskem1264/ref
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
error 111
crypto_kem_dec returns nonzero

Number of similar (compiler,implementation) pairs: 172, namely:
Compiler | Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer ref
gcc -m32 -O2 -fomit-frame-pointer ref
gcc -m32 -O3 -fomit-frame-pointer ref
gcc -m32 -O -fomit-frame-pointer ref
gcc -m32 -Os -fomit-frame-pointer ref
gcc -m32 -march=athlon -O2 -fomit-frame-pointer ref
gcc -m32 -march=athlon -O3 -fomit-frame-pointer ref
gcc -m32 -march=athlon -O -fomit-frame-pointer ref
gcc -m32 -march=athlon -Os -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer ref
gcc -m32 -march=core2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core2 -O -fomit-frame-pointer ref
gcc -m32 -march=core2 -Os -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer ref
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer ref
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer ref
gcc -m32 -march=corei7 -O -fomit-frame-pointer ref
gcc -m32 -march=corei7 -Os -fomit-frame-pointer ref
gcc -m32 -march=i386 -O2 -fomit-frame-pointer ref
gcc -m32 -march=i386 -O3 -fomit-frame-pointer ref
gcc -m32 -march=i386 -O -fomit-frame-pointer ref
gcc -m32 -march=i386 -Os -fomit-frame-pointer ref
gcc -m32 -march=i486 -O2 -fomit-frame-pointer ref
gcc -m32 -march=i486 -O3 -fomit-frame-pointer ref
gcc -m32 -march=i486 -O -fomit-frame-pointer ref
gcc -m32 -march=i486 -Os -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -O -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -O -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer ref
gcc -m32 -march=k6 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k6 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k6 -O -fomit-frame-pointer ref
gcc -m32 -march=k6 -Os -fomit-frame-pointer ref
gcc -m32 -march=k8 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k8 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k8 -O -fomit-frame-pointer ref
gcc -m32 -march=k8 -Os -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer ref
gcc -m32 -march=nocona -O2 -fomit-frame-pointer ref
gcc -m32 -march=nocona -O3 -fomit-frame-pointer ref
gcc -m32 -march=nocona -O -fomit-frame-pointer ref
gcc -m32 -march=nocona -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -O -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -O -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -O -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -O -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium -O -fomit-frame-pointer ref
gcc -m32 -march=pentium -Os -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer ref
gcc -m32 -march=prescott -O2 -fomit-frame-pointer ref
gcc -m32 -march=prescott -O3 -fomit-frame-pointer ref
gcc -m32 -march=prescott -O -fomit-frame-pointer ref
gcc -m32 -march=prescott -Os -fomit-frame-pointer ref

Test failure

Implementation: crypto_kem/ntskem1264/ref
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
error 111
crypto_kem_dec returns nonzero
error 111
crypto_kem_dec returns nonzero

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer ref
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer ref
gcc -m32 -march=barcelona -O -fomit-frame-pointer ref
gcc -m32 -march=barcelona -Os -fomit-frame-pointer ref

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: bitslice_bma_128.c:47:1: warning: SSE vector return without SSE enabled changes the ABI [-Wpsabi]
bitslice_bma_128.c: {
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:18:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:1290:1: error: inlining failed in call to always_inline '_mm_xor_si128': target specific option mismatch
bitslice_bma_128.c: _mm_xor_si128 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:48:12: note: called from here
bitslice_bma_128.c: return _mm_xor_si128(b,
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_and_si128(_mm_set1_epi64x(-ctl),
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_xor_si128(a, b)));
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 88, namely:
Compiler | Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer sse2
gcc -m32 -O2 -fomit-frame-pointer sse2
gcc -m32 -O3 -fomit-frame-pointer sse2
gcc -m32 -O -fomit-frame-pointer sse2
gcc -m32 -Os -fomit-frame-pointer sse2
gcc -m32 -march=athlon -O2 -fomit-frame-pointer sse2
gcc -m32 -march=athlon -O3 -fomit-frame-pointer sse2
gcc -m32 -march=athlon -O -fomit-frame-pointer sse2
gcc -m32 -march=athlon -Os -fomit-frame-pointer sse2
gcc -m32 -march=i386 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=i386 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=i386 -O -fomit-frame-pointer sse2
gcc -m32 -march=i386 -Os -fomit-frame-pointer sse2
gcc -m32 -march=i486 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=i486 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=i486 -O -fomit-frame-pointer sse2
gcc -m32 -march=i486 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -O -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -O -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k6 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k6 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k6 -O -fomit-frame-pointer sse2
gcc -m32 -march=k6 -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: bitslice_bma_128.c:46:1: warning: SSE vector return without SSE enabled changes the ABI [-Wpsabi]
bitslice_bma_128.c: {
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:55:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:1290:1: error: inlining failed in call to always_inline '_mm_xor_si128': target specific option mismatch
bitslice_bma_128.c: _mm_xor_si128 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:47:12: note: called from here
bitslice_bma_128.c: return _mm_xor_si128(b,
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_and_si128(_mm_set1_epi64x(-ctl),
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 88, namely:
Compiler Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer avx2
gcc -m32 -O2 -fomit-frame-pointer avx2
gcc -m32 -O3 -fomit-frame-pointer avx2
gcc -m32 -O -fomit-frame-pointer avx2
gcc -m32 -Os -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O2 -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O3 -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O -fomit-frame-pointer avx2
gcc -m32 -march=athlon -Os -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O -fomit-frame-pointer avx2
gcc -m32 -march=i386 -Os -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O -fomit-frame-pointer avx2
gcc -m32 -march=i486 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 35, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O2 -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O3 -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 41, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer sse2
gcc -m32 -march=core2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -O -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -O -fomit-frame-pointer sse2
gcc -m32 -march=k8 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k8 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k8 -O -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer sse2
gcc -m32 -march=nocona -O2 -fomit-frame-pointer sse2
gcc -m32 -march=nocona -O3 -fomit-frame-pointer sse2
gcc -m32 -march=nocona -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -O -fomit-frame-pointer sse2
gcc -m32 -march=prescott -O2 -fomit-frame-pointer sse2
gcc -m32 -march=prescott -O3 -fomit-frame-pointer sse2
gcc -m32 -march=prescott -O -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 14, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 14, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 19, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k8 -Os -fomit-frame-pointer avx2
gcc -m32 -march=nocona -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer avx2
gcc -m32 -march=prescott -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 21, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer sse2
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=core2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k8 -Os -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer sse2
gcc -m32 -march=nocona -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer sse2
gcc -m32 -march=prescott -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:55:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:1290:1: error: inlining failed in call to always_inline '_mm_xor_si128': target specific option mismatch
bitslice_bma_128.c: _mm_xor_si128 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:47:12: note: called from here
bitslice_bma_128.c: return _mm_xor_si128(b,
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_and_si128(_mm_set1_epi64x(-ctl),
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_xor_si128(a, b)));
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 8, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:18:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:1290:1: error: inlining failed in call to always_inline '_mm_xor_si128': target specific option mismatch
bitslice_bma_128.c: _mm_xor_si128 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:48:12: note: called from here
bitslice_bma_128.c: return _mm_xor_si128(b,
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_and_si128(_mm_set1_epi64x(-ctl),
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_xor_si128(a, b)));
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 8, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 3, namely:
Compiler Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 3, namely:
Compiler Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer sse2
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer sse2
gcc -m32 -march=barcelona -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -m32 -march=barcelona -O -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 1, namely:
Compiler Implementations
gcc -m32 -march=barcelona -O -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -m32 -march=barcelona -O -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 1, namely:
Compiler Implementations
gcc -m32 -march=barcelona -O -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:118:22: warning: implicit declaration of function '_mm256_extract_epi64'; did you mean '_mm256_extract_epi8'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return (int32_t)(_mm256_extract_epi64(popcnt, 3) +
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm256_extract_epi8
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:55:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 6, namely:
Compiler Implementations
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:118:22: warning: implicit declaration of function '_mm256_extract_epi64'; did you mean '_mm256_extract_epi8'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return (int32_t)(_mm256_extract_epi64(popcnt, 3) +
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm256_extract_epi8
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:55:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 2, namely:
Compiler Implementations
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer avx2