Implementation notes: x86, titan0, crypto_kem/ntskem1264

Computer: titan0
Architecture: x86
CPU ID: GenuineIntel-000306c3-bfebfbff
SUPERCOP version: 20190803
Operation: crypto_kem
Primitive: ntskem1264
TimeImplementationCompilerBenchmark dateSUPERCOP version
1565288optgcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer2019072320190110
1577684optgcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer2019072320190110
1606120optgcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer2019072320190110
1615668optgcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer2019072320190110
1628368optgcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer2019072320190110
1636616optgcc -m32 -march=core-avx2 -Os -fomit-frame-pointer2019072320190110
1639376optgcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer2019072320190110
1677348optgcc -m32 -march=pentium4 -O3 -fomit-frame-pointer2019072320190110
1698072optgcc -m32 -march=core2 -O3 -fomit-frame-pointer2019072320190110
1702852optgcc -m32 -march=corei7 -O3 -fomit-frame-pointer2019072320190110
1703536optgcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer2019072320190110
1709596optgcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer2019072320190110
1711000optgcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer2019072320190110
1717856optgcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer2019072320190110
1726688optgcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer2019072320190110
1731304optgcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer2019072320190110
1732720optgcc -m32 -march=core2 -O2 -fomit-frame-pointer2019072320190110
1733724optgcc -m32 -march=corei7-avx -Os -fomit-frame-pointer2019072320190110
1742776optgcc -m32 -march=core-avx-i -Os -fomit-frame-pointer2019072320190110
1752840optgcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer2019072320190110
1758560optgcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer2019072320190110
1776360optgcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer2019072320190110
1783040optgcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer2019072320190110
1785700optgcc -m32 -march=pentium4 -O2 -fomit-frame-pointer2019072320190110
1788196optgcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer2019072320190110
1791016optgcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer2019072320190110
1791688optgcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer2019072320190110
1792688optgcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer2019072320190110
1793460optgcc -m32 -march=corei7 -O2 -fomit-frame-pointer2019072320190110
1828056optgcc -m32 -march=prescott -O3 -fomit-frame-pointer2019072320190110
1847776optgcc -m32 -march=nocona -O3 -fomit-frame-pointer2019072320190110
1857308optgcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer2019072320190110
1858760optgcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer2019072320190110
1866888optgcc -m32 -march=pentium-m -O3 -fomit-frame-pointer2019072320190110
1876508optgcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer2019072320190110
1894552optgcc -m32 -march=nocona -O2 -fomit-frame-pointer2019072320190110
1900936optgcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer2019072320190110
1901160optgcc -m32 -march=pentium4 -Os -fomit-frame-pointer2019072320190110
1904800optgcc -m32 -march=prescott -O2 -fomit-frame-pointer2019072320190110
1920208optgcc -m32 -march=pentium-m -O2 -fomit-frame-pointer2019072320190110
1933896optgcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer2019072320190110
1950516optgcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer2019072320190110
1953064optgcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer2019072320190110
1964208optgcc -m32 -march=nocona -Os -fomit-frame-pointer2019072320190110
1971284optgcc -m32 -march=prescott -Os -fomit-frame-pointer2019072320190110
2014628optgcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer2019072320190110
2018764optgcc -m32 -march=corei7 -Os -fomit-frame-pointer2019072320190110
2022504optgcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer2019072320190110
2062768optgcc -m32 -march=core2 -Os -fomit-frame-pointer2019072320190110
2069348optgcc -m32 -march=pentium-m -Os -fomit-frame-pointer2019072320190110
2125928optgcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer2019072320190110
2126824optgcc -m32 -march=core-avx2 -O -fomit-frame-pointer2019072320190110
2128164optgcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer2019072320190110
2131000optgcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer2019072320190110
2140620optgcc -m32 -march=native -mtune=native -O -fomit-frame-pointer2019072320190110
2145972optgcc -m32 -march=prescott -O -fomit-frame-pointer2019072320190110
2148480optgcc -m32 -march=nocona -O -fomit-frame-pointer2019072320190110
2155084optgcc -m32 -march=k8 -O3 -fomit-frame-pointer2019072320190110
2161872optgcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer2019072320190110
2162340optgcc -m32 -march=athlon -O3 -fomit-frame-pointer2019072320190110
2165660optgcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer2019072320190110
2167324optgcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer2019072320190110
2169108optgcc -m32 -march=pentium3 -Os -fomit-frame-pointer2019072320190110
2169372optgcc -m32 -march=k8 -O -fomit-frame-pointer2019072320190110
2169880optgcc -m32 -march=pentiumpro -Os -fomit-frame-pointer2019072320190110
2170376optgcc -m32 -Os -fomit-frame-pointer2019072320190110
2172296optgcc -m32 -march=pentium2 -Os -fomit-frame-pointer2019072320190110
2175252optgcc -m32 -march=barcelona -O -fomit-frame-pointer2019072320190110
2184560optgcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer2019072320190110
2184820optgcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer2019072320190110
2186080optgcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer2019072320190110
2186244optgcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer2019072320190110
2186720optgcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer2019072320190110
2188004optgcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer2019072320190110
2188740optgcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer2019072320190110
2189180optgcc -m32 -march=athlon -Os -fomit-frame-pointer2019072320190110
2189664optgcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer2019072320190110
2197988optgcc -funroll-loops -m32 -O3 -fomit-frame-pointer2019072320190110
2198740optgcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer2019072320190110
2198756optgcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer2019072320190110
2198908optgcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer2019072320190110
2199492optgcc -m32 -march=athlon -O2 -fomit-frame-pointer2019072320190110
2201816optgcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer2019072320190110
2205584optgcc -m32 -O3 -fomit-frame-pointer2019072320190110
2206456optgcc -m32 -march=pentium -Os -fomit-frame-pointer2019072320190110
2206576optgcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer2019072320190110
2212380optgcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer2019072320190110
2213996optgcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer2019072320190110
2215128optgcc -m32 -march=k6-3 -O3 -fomit-frame-pointer2019072320190110
2216100optgcc -m32 -march=k6-2 -O3 -fomit-frame-pointer2019072320190110
2217192optgcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer2019072320190110
2219992optgcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer2019072320190110
2222052optgcc -m32 -O2 -fomit-frame-pointer2019072320190110
2222588optgcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer2019072320190110
2224244optgcc -m32 -march=k6 -O3 -fomit-frame-pointer2019072320190110
2224780optgcc -m32 -march=k6-3 -O2 -fomit-frame-pointer2019072320190110
2227952optgcc -funroll-loops -m32 -O2 -fomit-frame-pointer2019072320190110
2229816optgcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer2019072320190110
2233308optgcc -m32 -march=i486 -Os -fomit-frame-pointer2019072320190110
2237020optgcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer2019072320190110
2237280optgcc -m32 -march=i386 -Os -fomit-frame-pointer2019072320190110
2238464optgcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer2019072320190110
2238812optgcc -funroll-loops -m32 -Os -fomit-frame-pointer2019072320190110
2239584optgcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer2019072320190110
2239720optgcc -funroll-loops -m32 -O -fomit-frame-pointer2019072320190110
2246536optgcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer2019072320190110
2248596optgcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer2019072320190110
2250260optgcc -m32 -march=k6-2 -O -fomit-frame-pointer2019072320190110
2251072optgcc -m32 -march=i386 -O2 -fomit-frame-pointer2019072320190110
2251160optgcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer2019072320190110
2251180optgcc -m32 -march=k6 -O -fomit-frame-pointer2019072320190110
2251740optgcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer2019072320190110
2252464optgcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer2019072320190110
2252844optgcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer2019072320190110
2253868optgcc -m32 -march=k6-3 -O -fomit-frame-pointer2019072320190110
2256040optgcc -m32 -march=k6-3 -Os -fomit-frame-pointer2019072320190110
2257736optgcc -m32 -march=k6 -O2 -fomit-frame-pointer2019072320190110
2257996optgcc -m32 -march=barcelona -O3 -fomit-frame-pointer2019072320190110
2259692optgcc -m32 -march=k6 -Os -fomit-frame-pointer2019072320190110
2262256optgcc -m32 -march=k6-2 -O2 -fomit-frame-pointer2019072320190110
2266196optgcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer2019072320190110
2267524optgcc -m32 -march=pentium4 -O -fomit-frame-pointer2019072320190110
2269456optgcc -m32 -march=corei7 -O -fomit-frame-pointer2019072320190110
2271184optgcc -m32 -march=athlon -O -fomit-frame-pointer2019072320190110
2271268optgcc -m32 -march=corei7-avx -O -fomit-frame-pointer2019072320190110
2272264optgcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer2019072320190110
2272976optgcc -m32 -march=core2 -O -fomit-frame-pointer2019072320190110
2272988optgcc -m32 -march=core-avx-i -O -fomit-frame-pointer2019072320190110
2274664optgcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer2019072320190110
2275376optgcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer2019072320190110
2276152optgcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer2019072320190110
2278212optgcc -m32 -march=k8 -O2 -fomit-frame-pointer2019072320190110
2278356optgcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer2019072320190110
2278964optgcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer2019072320190110
2279616optgcc -m32 -march=i486 -O -fomit-frame-pointer2019072320190110
2282164optgcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer2019072320190110
2282556optgcc -m32 -march=i386 -O3 -fomit-frame-pointer2019072320190110
2284256optgcc -m32 -O -fomit-frame-pointer2019072320190110
2285316optgcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer2019072320190110
2285612optgcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer2019072320190110
2294416optgcc -m32 -march=k6-2 -Os -fomit-frame-pointer2019072320190110
2314280optgcc -m32 -march=pentium -O -fomit-frame-pointer2019072320190110
2314996optgcc -m32 -march=pentium-mmx -O -fomit-frame-pointer2019072320190110
2317324optgcc -m32 -march=pentium3 -O -fomit-frame-pointer2019072320190110
2319236optgcc -m32 -march=pentiumpro -O -fomit-frame-pointer2019072320190110
2320076optgcc -m32 -march=pentium2 -O -fomit-frame-pointer2019072320190110
2322160optgcc -m32 -march=pentium-m -O -fomit-frame-pointer2019072320190110
2338484optgcc -m32 -march=i486 -O3 -fomit-frame-pointer2019072320190110
2343996optgcc -m32 -march=i486 -O2 -fomit-frame-pointer2019072320190110
2359576optgcc -m32 -march=i386 -O -fomit-frame-pointer2019072320190110
2369560optgcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer2019072320190110
2378984optgcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer2019072320190110
2386444optgcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer2019072320190110
2387628optgcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer2019072320190110
2397280optgcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer2019072320190110
2402436optgcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer2019072320190110
2414700optgcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2019072320190110
2415460optgcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer2019072320190110
2427880optgcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer2019072320190110
2429288optgcc -m32 -march=pentium2 -O3 -fomit-frame-pointer2019072320190110
2430128optgcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer2019072320190110
2434020optgcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2019072320190110
2449576optgcc -m32 -march=pentium -O2 -fomit-frame-pointer2019072320190110
2452724optgcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2019072320190110
2453372optgcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer2019072320190110
2454104optgcc -m32 -march=pentium2 -O2 -fomit-frame-pointer2019072320190110
2461428optgcc -m32 -march=pentium3 -O2 -fomit-frame-pointer2019072320190110
2463252optgcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer2019072320190110
2464412optgcc -m32 -march=pentium -O3 -fomit-frame-pointer2019072320190110
2465688optgcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2019072320190110
2467468optgcc -m32 -march=pentium3 -O3 -fomit-frame-pointer2019072320190110
2576792optgcc -m32 -march=barcelona -O2 -fomit-frame-pointer2019072320190110
3172316optgcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer2019072320190110
3206812optgcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer2019072320190110
3222780optgcc -m32 -march=barcelona -Os -fomit-frame-pointer2019072320190110
3240588optgcc -m32 -march=k8 -Os -fomit-frame-pointer2019072320190110

Test failure

Implementation: crypto_kem/ntskem1264/ref
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
error 111
crypto_kem_dec returns nonzero

Number of similar (compiler,implementation) pairs: 172, namely:
CompilerImplementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer ref
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer ref
gcc -m32 -O2 -fomit-frame-pointer ref
gcc -m32 -O3 -fomit-frame-pointer ref
gcc -m32 -O -fomit-frame-pointer ref
gcc -m32 -Os -fomit-frame-pointer ref
gcc -m32 -march=athlon -O2 -fomit-frame-pointer ref
gcc -m32 -march=athlon -O3 -fomit-frame-pointer ref
gcc -m32 -march=athlon -O -fomit-frame-pointer ref
gcc -m32 -march=athlon -Os -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer ref
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer ref
gcc -m32 -march=core2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core2 -O -fomit-frame-pointer ref
gcc -m32 -march=core2 -Os -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer ref
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer ref
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer ref
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer ref
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer ref
gcc -m32 -march=corei7 -O -fomit-frame-pointer ref
gcc -m32 -march=corei7 -Os -fomit-frame-pointer ref
gcc -m32 -march=i386 -O2 -fomit-frame-pointer ref
gcc -m32 -march=i386 -O3 -fomit-frame-pointer ref
gcc -m32 -march=i386 -O -fomit-frame-pointer ref
gcc -m32 -march=i386 -Os -fomit-frame-pointer ref
gcc -m32 -march=i486 -O2 -fomit-frame-pointer ref
gcc -m32 -march=i486 -O3 -fomit-frame-pointer ref
gcc -m32 -march=i486 -O -fomit-frame-pointer ref
gcc -m32 -march=i486 -Os -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -O -fomit-frame-pointer ref
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -O -fomit-frame-pointer ref
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer ref
gcc -m32 -march=k6 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k6 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k6 -O -fomit-frame-pointer ref
gcc -m32 -march=k6 -Os -fomit-frame-pointer ref
gcc -m32 -march=k8 -O2 -fomit-frame-pointer ref
gcc -m32 -march=k8 -O3 -fomit-frame-pointer ref
gcc -m32 -march=k8 -O -fomit-frame-pointer ref
gcc -m32 -march=k8 -Os -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer ref
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer ref
gcc -m32 -march=nocona -O2 -fomit-frame-pointer ref
gcc -m32 -march=nocona -O3 -fomit-frame-pointer ref
gcc -m32 -march=nocona -O -fomit-frame-pointer ref
gcc -m32 -march=nocona -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -O -fomit-frame-pointer ref
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer ref
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -O -fomit-frame-pointer ref
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -O -fomit-frame-pointer ref
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -O -fomit-frame-pointer ref
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer ref
gcc -m32 -march=pentium -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentium -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentium -O -fomit-frame-pointer ref
gcc -m32 -march=pentium -Os -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer ref
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer ref
gcc -m32 -march=prescott -O2 -fomit-frame-pointer ref
gcc -m32 -march=prescott -O3 -fomit-frame-pointer ref
gcc -m32 -march=prescott -O -fomit-frame-pointer ref
gcc -m32 -march=prescott -Os -fomit-frame-pointer ref

Test failure

Implementation: crypto_kem/ntskem1264/ref
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
error 111
crypto_kem_dec returns nonzero
error 111
crypto_kem_dec returns nonzero

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer ref
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer ref
gcc -m32 -march=barcelona -O -fomit-frame-pointer ref
gcc -m32 -march=barcelona -Os -fomit-frame-pointer ref

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: bitslice_bma_128.c:47:1: warning: SSE vector return without SSE enabled changes the ABI [-Wpsabi]
bitslice_bma_128.c: {
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:18:
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:1291:1: error: inlining failed in call to always_inline '_mm_xor_si128': target specific option mismatch
bitslice_bma_128.c: _mm_xor_si128 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:48:12: note: called from here
bitslice_bma_128.c: return _mm_xor_si128(b,
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_and_si128(_mm_set1_epi64x(-ctl),
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_xor_si128(a, b)));
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 88, namely:
CompilerImplementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer sse2
gcc -m32 -O2 -fomit-frame-pointer sse2
gcc -m32 -O3 -fomit-frame-pointer sse2
gcc -m32 -O -fomit-frame-pointer sse2
gcc -m32 -Os -fomit-frame-pointer sse2
gcc -m32 -march=athlon -O2 -fomit-frame-pointer sse2
gcc -m32 -march=athlon -O3 -fomit-frame-pointer sse2
gcc -m32 -march=athlon -O -fomit-frame-pointer sse2
gcc -m32 -march=athlon -Os -fomit-frame-pointer sse2
gcc -m32 -march=i386 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=i386 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=i386 -O -fomit-frame-pointer sse2
gcc -m32 -march=i386 -Os -fomit-frame-pointer sse2
gcc -m32 -march=i486 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=i486 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=i486 -O -fomit-frame-pointer sse2
gcc -m32 -march=i486 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -O -fomit-frame-pointer sse2
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -O -fomit-frame-pointer sse2
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k6 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k6 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k6 -O -fomit-frame-pointer sse2
gcc -m32 -march=k6 -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer sse2
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: bitslice_bma_128.c:46:1: warning: SSE vector return without SSE enabled changes the ABI [-Wpsabi]
bitslice_bma_128.c: {
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:55:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:1291:1: error: inlining failed in call to always_inline '_mm_xor_si128': target specific option mismatch
bitslice_bma_128.c: _mm_xor_si128 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:47:12: note: called from here
bitslice_bma_128.c: return _mm_xor_si128(b,
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_and_si128(_mm_set1_epi64x(-ctl),
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 88, namely:
CompilerImplementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer avx2
gcc -m32 -O2 -fomit-frame-pointer avx2
gcc -m32 -O3 -fomit-frame-pointer avx2
gcc -m32 -O -fomit-frame-pointer avx2
gcc -m32 -Os -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O2 -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O3 -fomit-frame-pointer avx2
gcc -m32 -march=athlon -O -fomit-frame-pointer avx2
gcc -m32 -march=athlon -Os -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=i386 -O -fomit-frame-pointer avx2
gcc -m32 -march=i386 -Os -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=i486 -O -fomit-frame-pointer avx2
gcc -m32 -march=i486 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k6 -O -fomit-frame-pointer avx2
gcc -m32 -march=k6 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer avx2
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 35, namely:
CompilerImplementations
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -O -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=k8 -O -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -m32 -march=nocona -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -O -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O2 -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O3 -fomit-frame-pointer avx2
gcc -m32 -march=prescott -O -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 41, namely:
CompilerImplementations
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer sse2
gcc -m32 -march=core2 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -O -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -O -fomit-frame-pointer sse2
gcc -m32 -march=k8 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=k8 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=k8 -O -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer sse2
gcc -m32 -march=nocona -O2 -fomit-frame-pointer sse2
gcc -m32 -march=nocona -O3 -fomit-frame-pointer sse2
gcc -m32 -march=nocona -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -O -fomit-frame-pointer sse2
gcc -m32 -march=prescott -O2 -fomit-frame-pointer sse2
gcc -m32 -march=prescott -O3 -fomit-frame-pointer sse2
gcc -m32 -march=prescott -O -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 14, namely:
CompilerImplementations
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 14, namely:
CompilerImplementations
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 19, namely:
CompilerImplementations
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer avx2
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer avx2
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer avx2
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer avx2
gcc -m32 -march=corei7 -Os -fomit-frame-pointer avx2
gcc -m32 -march=k8 -Os -fomit-frame-pointer avx2
gcc -m32 -march=nocona -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer avx2
gcc -m32 -march=prescott -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 21, namely:
CompilerImplementations
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer sse2
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer sse2
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=core2 -Os -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer sse2
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer sse2
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer sse2
gcc -m32 -march=corei7 -Os -fomit-frame-pointer sse2
gcc -m32 -march=k8 -Os -fomit-frame-pointer sse2
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer sse2
gcc -m32 -march=nocona -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer sse2
gcc -m32 -march=prescott -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:55:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:17:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:1291:1: error: inlining failed in call to always_inline '_mm_xor_si128': target specific option mismatch
bitslice_bma_128.c: _mm_xor_si128 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:47:12: note: called from here
bitslice_bma_128.c: return _mm_xor_si128(b,
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_and_si128(_mm_set1_epi64x(-ctl),
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_xor_si128(a, b)));
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 8, namely:
CompilerImplementations
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer avx2
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -O -fomit-frame-pointer avx2
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: from bitslice_bma_128.h:18,
bitslice_bma_128.c: from bitslice_bma_128.c:18:
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vMUX':
bitslice_bma_128.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/emmintrin.h:1291:1: error: inlining failed in call to always_inline '_mm_xor_si128': target specific option mismatch
bitslice_bma_128.c: _mm_xor_si128 (__m128i __A, __m128i __B)
bitslice_bma_128.c: ^~~~~~~~~~~~~
bitslice_bma_128.c: bitslice_bma_128.c:48:12: note: called from here
bitslice_bma_128.c: return _mm_xor_si128(b,
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_and_si128(_mm_set1_epi64x(-ctl),
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm_xor_si128(a, b)));
bitslice_bma_128.c: ~~~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/xmmintrin.h:1252:0,
bitslice_bma_128.c: from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:29,
bitslice_bma_128.c: ...

Number of similar (compiler,implementation) pairs: 8, namely:
CompilerImplementations
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer sse2
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -O -fomit-frame-pointer sse2
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 3, namely:
CompilerImplementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer avx2
gcc -m32 -march=barcelona -Os -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 3, namely:
CompilerImplementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer sse2
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer sse2
gcc -m32 -march=barcelona -Os -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -m32 -march=barcelona -O -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:124:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 1, namely:
CompilerImplementations
gcc -m32 -march=barcelona -O -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/sse2
Compiler: gcc -m32 -march=barcelona -O -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'
bitslice_bma_128.c: In file included from bitslice_bma_128.c:20:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:99:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:93:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:181:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:166: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 1, namely:
CompilerImplementations
gcc -m32 -march=barcelona -O -fomit-frame-pointer sse2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:118:22: warning: implicit declaration of function '_mm256_extract_epi64'; did you mean '_mm256_extract_epi8'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return (int32_t)(_mm256_extract_epi64(popcnt, 3) +
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm256_extract_epi8
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:55:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 6, namely:
CompilerImplementations
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer avx2
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer avx2

Compiler output

Implementation: crypto_kem/ntskem1264/avx2
Compiler: gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer
bitslice_bma_128.c: In file included from bitslice_bma_128.c:18:0:
bitslice_bma_128.c: bits.h: In function 'vector_popcount':
bitslice_bma_128.c: bits.h:118:22: warning: implicit declaration of function '_mm256_extract_epi64'; did you mean '_mm256_extract_epi8'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return (int32_t)(_mm256_extract_epi64(popcnt, 3) +
bitslice_bma_128.c: ^~~~~~~~~~~~~~~~~~~~
bitslice_bma_128.c: _mm256_extract_epi8
bitslice_bma_128.c: bitslice_bma_128.c: In function 'vector_popcount_128':
bitslice_bma_128.c: bitslice_bma_128.c:55:21: warning: implicit declaration of function '_mm_cvtsi128_si64'; did you mean '_mm_cvtsi128_si32'? [-Wimplicit-function-declaration]
bitslice_bma_128.c: return popcount(_mm_cvtsi128_si64(a_hi)) + popcount(_mm_cvtsi128_si64(a));
bitslice_bma_128.c: ^
bitslice_bma_128.c: bits.h:97:42: note: in definition of macro 'popcount'
bitslice_bma_128.c: #define popcount(x) __builtin_popcountll(x)
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c: In function 'bitslice_bma':
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: }
bitslice_bma_128.c: ^
bitslice_bma_128.c: bitslice_bma_128.c:180:1: warning: unsupported size for integer register
bitslice_bma_128.c: bitslice_bma_128.c: Assembler messages:
bitslice_bma_128.c: bitslice_bma_128.c:165: Error: invalid instruction suffix for `bsr'

Number of similar (compiler,implementation) pairs: 2, namely:
CompilerImplementations
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer avx2
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer avx2