Implementation notes: x86, gpu, crypto_core/mult3sntrup857

Computer: gpu
Architecture: x86
CPU ID: GenuineIntel-000206d7-bfebfbff
SUPERCOP version: 20190816
Operation: crypto_core
Primitive: mult3sntrup857
Time | Object size | Test size | Implementation | Compiler | Benchmark date | SUPERCOP version
18139883006 0 019789 396 768refgcc_-funroll-loops_-m32_-march=nocona_-O3_-fomit-frame-pointer2019082220190816
18234632900 0 019669 396 768refgcc_-funroll-loops_-m32_-march=pentium4_-O3_-fomit-frame-pointer2019082220190816
18287011618 0 017856 392 768refgcc_-funroll-loops_-m32_-march=nocona_-O2_-fomit-frame-pointer2019082220190816
18676381641 0 017724 392 768refgcc_-funroll-loops_-m32_-march=pentium4_-O2_-fomit-frame-pointer2019082220190816
18832563006 0 019789 396 768refgcc_-funroll-loops_-m32_-march=prescott_-O3_-fomit-frame-pointer2019082220190816
18924061618 0 017856 392 768refgcc_-funroll-loops_-m32_-march=prescott_-O2_-fomit-frame-pointer2019082220190816
19116991744 0 018692 392 768refgcc_-funroll-loops_-m32_-march=barcelona_-O2_-fomit-frame-pointer2019082220190816
19136853623 0 021805 396 768refgcc_-funroll-loops_-m32_-march=k8_-O3_-fomit-frame-pointer2019082220190816
19191961666 0 018776 392 768refgcc_-funroll-loops_-m32_-march=pentiumpro_-O2_-fomit-frame-pointer2019082220190816
19200573663 0 022557 396 768refgcc_-funroll-loops_-m32_-march=barcelona_-O3_-fomit-frame-pointer2019082220190816
19308391743 0 017973 396 768refgcc_-funroll-loops_-m32_-march=athlon_-O2_-fomit-frame-pointer2019082220190816
19406431680 0 017856 392 768refgcc_-funroll-loops_-m32_-march=k8_-O2_-fomit-frame-pointer2019082220190816
19489861666 0 018776 392 768refgcc_-funroll-loops_-m32_-march=pentium3_-O2_-fomit-frame-pointer2019082220190816
19493041703 0 018141 396 768refgcc_-funroll-loops_-m32_-O2_-fomit-frame-pointer2019082220190816
19620932346 0 021564 392 768refgcc_-funroll-loops_-m32_-march=pentium3_-O3_-fomit-frame-pointer2019082220190816
19667731776 0 019282 400 768refgcc_-funroll-loops_-m32_-O3_-fomit-frame-pointer2019082220190816
19972281798 0 019494 400 768refgcc_-funroll-loops_-m32_-march=athlon_-O3_-fomit-frame-pointer2019082220190816
20094422346 0 021356 392 768refgcc_-funroll-loops_-m32_-march=pentium2_-O3_-fomit-frame-pointer2019082220190816
20122263404 0 022488 392 768refgcc_-funroll-loops_-m32_-march=pentium-m_-O3_-fomit-frame-pointer2019082220190816
20427962346 0 021356 392 768refgcc_-funroll-loops_-m32_-march=pentiumpro_-O3_-fomit-frame-pointer2019082220190816
20518981666 0 018776 392 768refgcc_-funroll-loops_-m32_-march=pentium2_-O2_-fomit-frame-pointer2019082220190816
20546071666 0 019588 392 768refgcc_-funroll-loops_-m32_-march=pentium-m_-O2_-fomit-frame-pointer2019082220190816
25359781714 0 017820 392 768refgcc_-funroll-loops_-m32_-march=i386_-O_-fomit-frame-pointer2019082220190816
29269952767 0 018422 400 768refgcc_-m32_-march=core2_-O3_-fomit-frame-pointer2019082220190816
2938770590 0 013397 396 768refgcc_-m32_-march=athlon_-O2_-fomit-frame-pointer2019082220190816
29475331308 0 014360 392 768refgcc_-m32_-march=barcelona_-O2_-fomit-frame-pointer2019082220190816
29619362467 0 018434 400 768refgcc_-m32_-march=corei7-avx_-O3_-fomit-frame-pointer2019082220190816
29653352572 0 018234 400 768refgcc_-m32_-march=corei7_-O3_-fomit-frame-pointer2019082220190816
2980347592 0 013713 396 768refgcc_-m32_-O2_-fomit-frame-pointer2019082220190816
2983368620 0 013340 392 768refgcc_-m32_-march=prescott_-O2_-fomit-frame-pointer2019082220190816
29863386478 0 019753 396 768refgcc_-m32_-march=barcelona_-O3_-fomit-frame-pointer2019082220190816
2991291592 0 013701 396 768refgcc_-m32_-march=core2_-msse4.1_-O2_-fomit-frame-pointer2019082220190816
2992838592 0 013685 396 768refgcc_-m32_-march=corei7-avx_-O2_-fomit-frame-pointer2019082220190816
3047103592 0 013685 396 768refgcc_-m32_-march=native_-mtune=native_-O2_-fomit-frame-pointer2019082220190816
30502243199 0 019225 396 768refgcc_-m32_-march=k8_-O3_-fomit-frame-pointer2019082220190816
3056946592 0 013701 396 768refgcc_-m32_-march=corei7_-O2_-fomit-frame-pointer2019082220190816
3070953592 0 013701 396 768refgcc_-m32_-march=core2_-msse4_-O2_-fomit-frame-pointer2019082220190816
3076836592 0 013685 396 768refgcc_-m32_-march=core-avx-i_-O2_-fomit-frame-pointer2019082220190816
30988681792 0 018105 396 768refgcc_-funroll-loops_-m32_-march=pentium-mmx_-O_-fomit-frame-pointer2019082220190816
31046551941 0 018285 396 768refgcc_-funroll-loops_-m32_-march=k6-3_-O_-fomit-frame-pointer2019082220190816
31129042467 0 018434 400 768refgcc_-m32_-march=core-avx-i_-O3_-fomit-frame-pointer2019082220190816
3114279592 0 013717 396 768refgcc_-m32_-march=core2_-O2_-fomit-frame-pointer2019082220190816
31169701941 0 018285 396 768refgcc_-funroll-loops_-m32_-march=k6-2_-O_-fomit-frame-pointer2019082220190816
31189291814 0 017161 396 768refgcc_-m32_-march=nocona_-O3_-fomit-frame-pointer2019082220190816
31277432572 0 018234 400 768refgcc_-m32_-march=core2_-msse4_-O3_-fomit-frame-pointer2019082220190816
31386921966 0 018305 396 768refgcc_-funroll-loops_-m32_-O_-fomit-frame-pointer2019082220190816
31404391711 0 017013 396 768refgcc_-m32_-march=pentium4_-O3_-fomit-frame-pointer2019082220190816
3140640856 0 016358 400 768refgcc_-m32_-march=athlon_-O3_-fomit-frame-pointer2019082220190816
31421071814 0 017161 396 768refgcc_-m32_-march=prescott_-O3_-fomit-frame-pointer2019082220190816
31569061927 0 018500 392 768refgcc_-funroll-loops_-m32_-march=barcelona_-O_-fomit-frame-pointer2019082220190816
3162138582 0 013552 392 768refgcc_-m32_-march=k8_-O2_-fomit-frame-pointer2019082220190816
31782241927 0 018320 392 768refgcc_-funroll-loops_-m32_-march=k8_-O_-fomit-frame-pointer2019082220190816
31894591792 0 018105 396 768refgcc_-funroll-loops_-m32_-march=pentium_-O_-fomit-frame-pointer2019082220190816
31898662467 0 018434 400 768refgcc_-m32_-march=native_-mtune=native_-O3_-fomit-frame-pointer2019082220190816
3192117620 0 013340 392 768refgcc_-m32_-march=nocona_-O2_-fomit-frame-pointer2019082220190816
31971331918 0 018548 392 768refgcc_-funroll-loops_-m32_-march=prescott_-O_-fomit-frame-pointer2019082220190816
3206169819 0 016434 400 768refgcc_-m32_-O3_-fomit-frame-pointer2019082220190816
32098441714 0 018140 392 768refgcc_-funroll-loops_-m32_-march=i486_-O_-fomit-frame-pointer2019082220190816
32346391941 0 018285 396 768refgcc_-funroll-loops_-m32_-march=k6_-O_-fomit-frame-pointer2019082220190816
32421061373 0 017256 392 768refgcc_-funroll-loops_-m32_-march=i386_-O2_-fomit-frame-pointer2019082220190816
32430751977 0 018596 392 768refgcc_-funroll-loops_-m32_-march=pentium4_-O_-fomit-frame-pointer2019082220190816
3273138558 0 013292 392 768refgcc_-m32_-march=pentium4_-O2_-fomit-frame-pointer2019082220190816
32751811587 0 018792 392 768refgcc_-funroll-loops_-m32_-march=i486_-O3_-fomit-frame-pointer2019082220190816
32999551810 0 019138 400 768refgcc_-funroll-loops_-m32_-march=k6_-O3_-fomit-frame-pointer2019082220190816
33030601979 0 018173 396 768refgcc_-funroll-loops_-m32_-march=athlon_-O_-fomit-frame-pointer2019082220190816
33115831810 0 019746 400 768refgcc_-funroll-loops_-m32_-march=k6-3_-O3_-fomit-frame-pointer2019082220190816
33263941918 0 018548 392 768refgcc_-funroll-loops_-m32_-march=nocona_-O_-fomit-frame-pointer2019082220190816
33424531634 0 017937 396 768refgcc_-funroll-loops_-m32_-march=k6_-O2_-fomit-frame-pointer2019082220190816
33546931433 0 018148 392 768refgcc_-funroll-loops_-m32_-march=i486_-O2_-fomit-frame-pointer2019082220190816
33746191634 0 017937 396 768refgcc_-funroll-loops_-m32_-march=k6-2_-O2_-fomit-frame-pointer2019082220190816
33930272572 0 018182 400 768refgcc_-m32_-march=core2_-msse4.1_-O3_-fomit-frame-pointer2019082220190816
34226311537 0 017376 392 768refgcc_-funroll-loops_-m32_-march=i386_-O3_-fomit-frame-pointer2019082220190816
34430191520 0 018093 396 768refgcc_-funroll-loops_-m32_-march=pentium-mmx_-O2_-fomit-frame-pointer2019082220190816
34498861810 0 019746 400 768refgcc_-funroll-loops_-m32_-march=k6-2_-O3_-fomit-frame-pointer2019082220190816
34507201230 0 013408 392 768refgcc_-m32_-march=barcelona_-O_-fomit-frame-pointer2019082220190816
34920571634 0 017937 396 768refgcc_-funroll-loops_-m32_-march=k6-3_-O2_-fomit-frame-pointer2019082220190816
35386861897 0 019441 396 768refgcc_-funroll-loops_-m32_-march=pentium_-O3_-fomit-frame-pointer2019082220190816
35669041520 0 018093 396 768refgcc_-funroll-loops_-m32_-march=pentium_-O2_-fomit-frame-pointer2019082220190816
35698471897 0 019441 396 768refgcc_-funroll-loops_-m32_-march=pentium-mmx_-O3_-fomit-frame-pointer2019082220190816
35946421835 0 019112 392 768refgcc_-funroll-loops_-m32_-march=pentiumpro_-O_-fomit-frame-pointer2019082220190816
3605406532 0 012196 384 768refgcc_-funroll-loops_-m32_-march=i486_-Os_-fomit-frame-pointer2019082220190816
3608691917 0 016680 392 768refgcc_-m32_-march=i486_-O3_-fomit-frame-pointer2019082220190816
36257011835 0 019232 392 768refgcc_-funroll-loops_-m32_-march=pentium-m_-O_-fomit-frame-pointer2019082220190816
3630861593 0 013164 392 768refgcc_-m32_-march=i386_-O2_-fomit-frame-pointer2019082220190816
36538591835 0 019112 392 768refgcc_-funroll-loops_-m32_-march=pentium3_-O_-fomit-frame-pointer2019082220190816
3669510883 0 017090 400 768refgcc_-m32_-march=k6-2_-O3_-fomit-frame-pointer2019082220190816
36831091835 0 019112 392 768refgcc_-funroll-loops_-m32_-march=pentium2_-O_-fomit-frame-pointer2019082220190816
3687996834 0 015244 392 768refgcc_-m32_-march=i386_-O3_-fomit-frame-pointer2019082220190816
3716049883 0 017090 400 768refgcc_-m32_-march=k6-3_-O3_-fomit-frame-pointer2019082220190816
3730965601 0 013837 396 768refgcc_-m32_-march=k6_-O2_-fomit-frame-pointer2019082220190816
3812538675 0 013412 392 768refgcc_-m32_-march=nocona_-O_-fomit-frame-pointer2019082220190816
3826815619 0 013301 396 768refgcc_-m32_-march=core2_-msse4_-O_-fomit-frame-pointer2019082220190816
3833100927 0 016957 396 768refgcc_-m32_-march=pentium-mmx_-O3_-fomit-frame-pointer2019082220190816
3856248621 0 013924 392 768refgcc_-m32_-march=i486_-O2_-fomit-frame-pointer2019082220190816
3857292601 0 013837 396 768refgcc_-m32_-march=k6-3_-O2_-fomit-frame-pointer2019082220190816
3858468927 0 016957 396 768refgcc_-m32_-march=pentium_-O3_-fomit-frame-pointer2019082220190816
3865842627 0 013417 396 768refgcc_-m32_-march=k6-2_-O_-fomit-frame-pointer2019082220190816
3870504591 0 012372 384 768refgcc_-m32_-march=k6-2_-Os_-fomit-frame-pointer2019082220190816
3881562629 0 013693 396 768refgcc_-m32_-march=pentium_-O2_-fomit-frame-pointer2019082220190816
3890349883 0 016898 400 768refgcc_-m32_-march=k6_-O3_-fomit-frame-pointer2019082220190816
3894714617 0 013037 396 768refgcc_-m32_-march=athlon_-O_-fomit-frame-pointer2019082220190816
3924123619 0 013301 396 768refgcc_-m32_-march=core-avx-i_-O_-fomit-frame-pointer2019082220190816
3928347601 0 013837 396 768refgcc_-m32_-march=k6-2_-O2_-fomit-frame-pointer2019082220190816
3933738629 0 013693 396 768refgcc_-m32_-march=pentium-mmx_-O2_-fomit-frame-pointer2019082220190816
3937056619 0 013301 396 768refgcc_-m32_-march=core2_-msse4.1_-O_-fomit-frame-pointer2019082220190816
3938130585 0 012340 384 768refgcc_-funroll-loops_-m32_-march=k6-3_-Os_-fomit-frame-pointer2019082220190816
3941367619 0 013301 396 768refgcc_-m32_-march=native_-mtune=native_-O_-fomit-frame-pointer2019082220190816
3949635619 0 013301 396 768refgcc_-m32_-march=core2_-O_-fomit-frame-pointer2019082220190816
3951786540 0 012260 384 768refgcc_-m32_-march=nocona_-Os_-fomit-frame-pointer2019082220190816
3965982619 0 013301 396 768refgcc_-m32_-march=corei7_-O_-fomit-frame-pointer2019082220190816
3969900652 0 013416 392 768refgcc_-m32_-march=i486_-O_-fomit-frame-pointer2019082220190816
3978738540 0 012244 384 768refgcc_-m32_-march=core2_-msse4_-Os_-fomit-frame-pointer2019082220190816
3985833540 0 012228 384 768refgcc_-m32_-march=pentium_-Os_-fomit-frame-pointer2019082220190816
3988404591 0 012372 384 768refgcc_-m32_-march=k6_-Os_-fomit-frame-pointer2019082220190816
3991098591 0 012372 384 768refgcc_-m32_-march=k6-3_-Os_-fomit-frame-pointer2019082220190816
4001145538 0 012196 384 768refgcc_-funroll-loops_-m32_-march=pentium_-Os_-fomit-frame-pointer2019082220190816
4002588540 0 012228 384 768refgcc_-m32_-march=pentium-mmx_-Os_-fomit-frame-pointer2019082220190816
4011032540 0 012228 384 768refgcc_-m32_-march=native_-mtune=native_-Os_-fomit-frame-pointer2019082220190816
4025538540 0 012228 384 768refgcc_-m32_-march=corei7-avx_-Os_-fomit-frame-pointer2019082220190816
4029057585 0 012340 384 768refgcc_-funroll-loops_-m32_-march=k6_-Os_-fomit-frame-pointer2019082220190816
4041519540 0 012244 384 768refgcc_-m32_-march=core2_-msse4.1_-Os_-fomit-frame-pointer2019082220190816
4047273652 0 013144 392 768refgcc_-m32_-march=i386_-O_-fomit-frame-pointer2019082220190816
4062456540 0 012244 384 768refgcc_-m32_-march=corei7_-Os_-fomit-frame-pointer2019082220190816
4070700675 0 013412 392 768refgcc_-m32_-march=prescott_-O_-fomit-frame-pointer2019082220190816
4070901538 0 012196 384 768refgcc_-funroll-loops_-m32_-march=pentium-mmx_-Os_-fomit-frame-pointer2019082220190816
4074888536 0 012212 384 768refgcc_-m32_-march=i486_-Os_-fomit-frame-pointer2019082220190816
4077837585 0 012340 384 768refgcc_-funroll-loops_-m32_-march=k6-2_-Os_-fomit-frame-pointer2019082220190816
4091901540 0 012260 384 768refgcc_-m32_-march=core2_-Os_-fomit-frame-pointer2019082220190816
4100898615 0 013152 392 768refgcc_-m32_-march=k8_-O_-fomit-frame-pointer2019082220190816
4105764619 0 013293 396 768refgcc_-m32_-O_-fomit-frame-pointer2019082220190816
4112061650 0 013317 396 768refgcc_-m32_-march=pentium-mmx_-O_-fomit-frame-pointer2019082220190816
4145415538 0 012244 384 768refgcc_-funroll-loops_-m32_-march=k8_-Os_-fomit-frame-pointer2019082220190816
4149552540 0 012260 384 768refgcc_-m32_-march=pentium4_-Os_-fomit-frame-pointer2019082220190816
4152378538 0 012228 384 768refgcc_-funroll-loops_-m32_-march=pentium4_-Os_-fomit-frame-pointer2019082220190816
4156974538 0 012196 384 768refgcc_-funroll-loops_-m32_-march=athlon_-Os_-fomit-frame-pointer2019082220190816
4162174627 0 013417 396 768refgcc_-m32_-march=k6-3_-O_-fomit-frame-pointer2019082220190816
4168048540 0 012228 384 768refgcc_-m32_-march=core-avx-i_-Os_-fomit-frame-pointer2019082220190816
4177299538 0 012228 384 768refgcc_-funroll-loops_-m32_-march=nocona_-Os_-fomit-frame-pointer2019082220190816
4189698538 0 012244 384 768refgcc_-funroll-loops_-m32_-march=barcelona_-Os_-fomit-frame-pointer2019082220190816
4203573540 0 012212 384 768refgcc_-m32_-march=athlon_-Os_-fomit-frame-pointer2019082220190816
4207827617 0 013364 392 768refgcc_-m32_-march=pentium4_-O_-fomit-frame-pointer2019082220190816
4213173540 0 012260 384 768refgcc_-m32_-march=prescott_-Os_-fomit-frame-pointer2019082220190816
4213410538 0 012228 384 768refgcc_-funroll-loops_-m32_-march=prescott_-Os_-fomit-frame-pointer2019082220190816
4220256619 0 013301 396 768refgcc_-m32_-march=corei7-avx_-O_-fomit-frame-pointer2019082220190816
4220766650 0 013317 396 768refgcc_-m32_-march=pentium_-O_-fomit-frame-pointer2019082220190816
4224912627 0 013417 396 768refgcc_-m32_-march=k6_-O_-fomit-frame-pointer2019082220190816
4232301538 0 012196 384 768refgcc_-funroll-loops_-m32_-Os_-fomit-frame-pointer2019082220190816
4235118540 0 012260 384 768refgcc_-m32_-march=k8_-Os_-fomit-frame-pointer2019082220190816
42806941080 0 012260 384 768refgcc_-m32_-march=barcelona_-Os_-fomit-frame-pointer2019082220190816
4284246532 0 012196 384 768refgcc_-funroll-loops_-m32_-march=i386_-Os_-fomit-frame-pointer2019082220190816
4336017536 0 012212 384 768refgcc_-m32_-march=i386_-Os_-fomit-frame-pointer2019082220190816
4352652540 0 012212 384 768refgcc_-m32_-Os_-fomit-frame-pointer2019082220190816
4390200961 0 017016 392 768refgcc_-m32_-march=pentiumpro_-O3_-fomit-frame-pointer2019082220190816
4398651606 0 013804 392 768refgcc_-m32_-march=pentium2_-O2_-fomit-frame-pointer2019082220190816
4666764606 0 013804 392 768refgcc_-m32_-march=pentium3_-O2_-fomit-frame-pointer2019082220190816
46803031879 0 018312 392 768refgcc_-m32_-march=pentium-m_-O3_-fomit-frame-pointer2019082220190816
4688316961 0 017224 392 768refgcc_-m32_-march=pentium3_-O3_-fomit-frame-pointer2019082220190816
4693863606 0 013804 392 768refgcc_-m32_-march=pentiumpro_-O2_-fomit-frame-pointer2019082220190816
4731798606 0 014160 392 768refgcc_-m32_-march=pentium-m_-O2_-fomit-frame-pointer2019082220190816
4755150961 0 017016 392 768refgcc_-m32_-march=pentium2_-O3_-fomit-frame-pointer2019082220190816
4828425606 0 013400 392 768refgcc_-m32_-march=pentium2_-O_-fomit-frame-pointer2019082220190816
4882884606 0 013400 392 768refgcc_-m32_-march=pentiumpro_-O_-fomit-frame-pointer2019082220190816
4927830606 0 013440 392 768refgcc_-m32_-march=pentium-m_-O_-fomit-frame-pointer2019082220190816
4928499606 0 013400 392 768refgcc_-m32_-march=pentium3_-O_-fomit-frame-pointer2019082220190816
5316033521 0 012132 384 768refgcc_-funroll-loops_-m32_-march=pentium3_-Os_-fomit-frame-pointer2019082220190816
5371872518 0 012180 384 768refgcc_-m32_-march=pentium-m_-Os_-fomit-frame-pointer2019082220190816
5516127521 0 012132 384 768refgcc_-funroll-loops_-m32_-march=pentiumpro_-Os_-fomit-frame-pointer2019082220190816
5673129518 0 012148 384 768refgcc_-m32_-march=pentium2_-Os_-fomit-frame-pointer2019082220190816
5687991521 0 012132 384 768refgcc_-funroll-loops_-m32_-march=pentium2_-Os_-fomit-frame-pointer2019082220190816
5706951518 0 012148 384 768refgcc_-m32_-march=pentiumpro_-Os_-fomit-frame-pointer2019082220190816
5800311521 0 012164 384 768refgcc_-funroll-loops_-m32_-march=pentium-m_-Os_-fomit-frame-pointer2019082220190816
5881458518 0 012148 384 768refgcc_-m32_-march=pentium3_-Os_-fomit-frame-pointer2019082220190816

Test failure

Implementation: avx
Security model: unknown
Compiler: gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 6, namely:
Compiler | Implementations
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer avx
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer avx
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer avx
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer ref
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer ref

Compiler output

Implementation: avx
Security model: unknown
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
mult1024.c: mult1024.c: In function 'squeeze_3_x16':
mult1024.c: mult1024.c:19:1: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
mult1024.c: {
mult1024.c: ^
mult1024.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
mult1024.c: from mult1024.c:2:
mult1024.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:808:1: error: inlining failed in call to always_inline '_mm256_sub_epi16': target specific option mismatch
mult1024.c: _mm256_sub_epi16 (__m256i __A, __m256i __B)
mult1024.c: ^~~~~~~~~~~~~~~~
mult1024.c: mult1024.c:12:17: note: called from here
mult1024.c: #define sub_x16 _mm256_sub_epi16
mult1024.c: ^
mult1024.c: mult1024.c:20:10: note: in expansion of macro 'sub_x16'
mult1024.c: return sub_x16(x,mullo_x16(mulhrs_x16(x,const_x16(10923)),const_x16(3)));
mult1024.c: ^~~~~~~
mult1024.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
mult1024.c: from mult1024.c:2:
mult1024.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:553:1: error: inlining failed in call to always_inline '_mm256_mullo_epi16': target specific option mismatch
mult1024.c: _mm256_mullo_epi16 (__m256i __A, __m256i __B)
mult1024.c: ^~~~~~~~~~~~~~~~~~
mult1024.c: mult1024.c:12:17: note: called from here
mult1024.c: #define sub_x16 _mm256_sub_epi16
mult1024.c: ^
mult1024.c: mult1024.c:20:10: note: in expansion of macro 'sub_x16'
mult1024.c: return sub_x16(x,mullo_x16(mulhrs_x16(x,const_x16(10923)),const_x16(3)));
mult1024.c: ...

Number of similar (compiler,implementation) pairs: 156, namely:
Compiler | Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer avx
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer avx
gcc -m32 -O2 -fomit-frame-pointer avx
gcc -m32 -O3 -fomit-frame-pointer avx
gcc -m32 -O -fomit-frame-pointer avx
gcc -m32 -Os -fomit-frame-pointer avx
gcc -m32 -march=athlon -O2 -fomit-frame-pointer avx
gcc -m32 -march=athlon -O3 -fomit-frame-pointer avx
gcc -m32 -march=athlon -O -fomit-frame-pointer avx
gcc -m32 -march=athlon -Os -fomit-frame-pointer avx
gcc -m32 -march=core2 -O2 -fomit-frame-pointer avx
gcc -m32 -march=core2 -O3 -fomit-frame-pointer avx
gcc -m32 -march=core2 -O -fomit-frame-pointer avx
gcc -m32 -march=core2 -Os -fomit-frame-pointer avx
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer avx
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer avx
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer avx
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer avx
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer avx
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer avx
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer avx
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer avx
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer avx
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer avx
gcc -m32 -march=corei7 -O -fomit-frame-pointer avx
gcc -m32 -march=corei7 -Os -fomit-frame-pointer avx
gcc -m32 -march=i386 -O2 -fomit-frame-pointer avx
gcc -m32 -march=i386 -O3 -fomit-frame-pointer avx
gcc -m32 -march=i386 -O -fomit-frame-pointer avx
gcc -m32 -march=i386 -Os -fomit-frame-pointer avx
gcc -m32 -march=i486 -O2 -fomit-frame-pointer avx
gcc -m32 -march=i486 -O3 -fomit-frame-pointer avx
gcc -m32 -march=i486 -O -fomit-frame-pointer avx
gcc -m32 -march=i486 -Os -fomit-frame-pointer avx
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer avx
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer avx
gcc -m32 -march=k6-2 -O -fomit-frame-pointer avx
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer avx
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer avx
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer avx
gcc -m32 -march=k6-3 -O -fomit-frame-pointer avx
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer avx
gcc -m32 -march=k6 -O2 -fomit-frame-pointer avx
gcc -m32 -march=k6 -O3 -fomit-frame-pointer avx
gcc -m32 -march=k6 -O -fomit-frame-pointer avx
gcc -m32 -march=k6 -Os -fomit-frame-pointer avx
gcc -m32 -march=k8 -O2 -fomit-frame-pointer avx
gcc -m32 -march=k8 -O3 -fomit-frame-pointer avx
gcc -m32 -march=k8 -O -fomit-frame-pointer avx
gcc -m32 -march=k8 -Os -fomit-frame-pointer avx
gcc -m32 -march=nocona -O2 -fomit-frame-pointer avx
gcc -m32 -march=nocona -O3 -fomit-frame-pointer avx
gcc -m32 -march=nocona -O -fomit-frame-pointer avx
gcc -m32 -march=nocona -Os -fomit-frame-pointer avx
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer avx
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer avx
gcc -m32 -march=pentium-m -O -fomit-frame-pointer avx
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer avx
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer avx
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer avx
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer avx
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer avx
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer avx
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer avx
gcc -m32 -march=pentium2 -O -fomit-frame-pointer avx
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer avx
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer avx
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer avx
gcc -m32 -march=pentium3 -O -fomit-frame-pointer avx
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer avx
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer avx
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer avx
gcc -m32 -march=pentium4 -O -fomit-frame-pointer avx
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer avx
gcc -m32 -march=pentium -O2 -fomit-frame-pointer avx
gcc -m32 -march=pentium -O3 -fomit-frame-pointer avx
gcc -m32 -march=pentium -O -fomit-frame-pointer avx
gcc -m32 -march=pentium -Os -fomit-frame-pointer avx
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer avx
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer avx
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer avx
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer avx
gcc -m32 -march=prescott -O2 -fomit-frame-pointer avx
gcc -m32 -march=prescott -O3 -fomit-frame-pointer avx
gcc -m32 -march=prescott -O -fomit-frame-pointer avx
gcc -m32 -march=prescott -Os -fomit-frame-pointer avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
mult1024.c: mult1024.c: In function 'squeeze_3_x16':
mult1024.c: mult1024.c:19:1: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
mult1024.c: {
mult1024.c: ^
mult1024.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
mult1024.c: from mult1024.c:2:
mult1024.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:808:1: error: inlining failed in call to always_inline '_mm256_sub_epi16': target specific option mismatch
mult1024.c: _mm256_sub_epi16 (__m256i __A, __m256i __B)
mult1024.c: ^~~~~~~~~~~~~~~~
mult1024.c: mult1024.c:12:17: note: called from here
mult1024.c: #define sub_x16 _mm256_sub_epi16
mult1024.c: ^
mult1024.c: mult1024.c:20:10: note: in expansion of macro 'sub_x16'
mult1024.c: return sub_x16(x,mullo_x16(mulhrs_x16(x,const_x16(10923)),const_x16(3)));
mult1024.c: ^~~~~~~
mult1024.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
mult1024.c: from mult1024.c:2:
mult1024.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:553:1: error: inlining failed in call to always_inline '_mm256_mullo_epi16': target specific option mismatch
mult1024.c: _mm256_mullo_epi16 (__m256i __A, __m256i __B)
mult1024.c: ^~~~~~~~~~~~~~~~~~
mult1024.c: mult1024.c:12:17: note: called from here
mult1024.c: #define sub_x16 _mm256_sub_epi16
mult1024.c: ^
mult1024.c: mult1024.c:20:10: note: in expansion of macro 'sub_x16'
mult1024.c: return sub_x16(x,mullo_x16(mulhrs_x16(x,const_x16(10923)),const_x16(3)));
mult1024.c: ...
mult1024.c: mult1024.c: In function 'squeeze_3_x16':
mult1024.c: mult1024.c:19:1: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
mult1024.c: {
mult1024.c: ^
mult1024.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
mult1024.c: from mult1024.c:2:
mult1024.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:808:1: error: inlining failed in call to always_inline '_mm256_sub_epi16': target specific option mismatch
mult1024.c: _mm256_sub_epi16 (__m256i __A, __m256i __B)
mult1024.c: ^~~~~~~~~~~~~~~~
mult1024.c: mult1024.c:12:17: note: called from here
mult1024.c: #define sub_x16 _mm256_sub_epi16
mult1024.c: ^
mult1024.c: mult1024.c:20:10: note: in expansion of macro 'sub_x16'
mult1024.c: return sub_x16(x,mullo_x16(mulhrs_x16(x,const_x16(10923)),const_x16(3)));
mult1024.c: ^~~~~~~
mult1024.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
mult1024.c: from mult1024.c:2:
mult1024.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:553:1: error: inlining failed in call to always_inline '_mm256_mullo_epi16': target specific option mismatch
mult1024.c: _mm256_mullo_epi16 (__m256i __A, __m256i __B)
mult1024.c: ^~~~~~~~~~~~~~~~~~
mult1024.c: mult1024.c:12:17: note: called from here
mult1024.c: #define sub_x16 _mm256_sub_epi16
mult1024.c: ^
mult1024.c: mult1024.c:20:10: note: in expansion of macro 'sub_x16'
mult1024.c: return sub_x16(x,mullo_x16(mulhrs_x16(x,const_x16(10923)),const_x16(3)));
mult1024.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer avx
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer avx
gcc -m32 -march=barcelona -O -fomit-frame-pointer avx
gcc -m32 -march=barcelona -Os -fomit-frame-pointer avx

Compiler output

Implementation: avx
Security model: unknown
Compiler: gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer
mult1024.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
mult1024.c: from mult1024.c:2:
mult1024.c: mult1024.c: In function 'squeeze_3_x16':
mult1024.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:808:1: error: inlining failed in call to always_inline '_mm256_sub_epi16': target specific option mismatch
mult1024.c: _mm256_sub_epi16 (__m256i __A, __m256i __B)
mult1024.c: ^~~~~~~~~~~~~~~~
mult1024.c: mult1024.c:12:17: note: called from here
mult1024.c: #define sub_x16 _mm256_sub_epi16
mult1024.c: ^
mult1024.c: mult1024.c:20:10: note: in expansion of macro 'sub_x16'
mult1024.c: return sub_x16(x,mullo_x16(mulhrs_x16(x,const_x16(10923)),const_x16(3)));
mult1024.c: ^~~~~~~
mult1024.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
mult1024.c: from mult1024.c:2:
mult1024.c: /usr/lib/gcc/x86_64-linux-gnu/7/include/avx2intrin.h:553:1: error: inlining failed in call to always_inline '_mm256_mullo_epi16': target specific option mismatch
mult1024.c: _mm256_mullo_epi16 (__m256i __A, __m256i __B)
mult1024.c: ^~~~~~~~~~~~~~~~~~
mult1024.c: mult1024.c:12:17: note: called from here
mult1024.c: #define sub_x16 _mm256_sub_epi16
mult1024.c: ^
mult1024.c: mult1024.c:20:10: note: in expansion of macro 'sub_x16'
mult1024.c: return sub_x16(x,mullo_x16(mulhrs_x16(x,const_x16(10923)),const_x16(3)));
mult1024.c: ^~~~~~~
mult1024.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/7/include/immintrin.h:43:0,
mult1024.c: from mult1024.c:2:
mult1024.c: ...

Number of similar (compiler,implementation) pairs: 12, namely:
Compiler | Implementations
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer avx
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer avx
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer avx
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer avx
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer avx
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer avx
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer avx
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer avx
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer avx
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer avx
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer avx
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer avx