Implementation notes: x86, hydra1, crypto_aead/norx6461v1

Computer: hydra1
Architecture: x86
CPU ID: AuthenticAMD-00100fa0-178bfbff
SUPERCOP version: 20161220
Operation: crypto_aead
Primitive: norx6461v1
Time | Implementation | Compiler | Benchmark date | SUPERCOP version
67803xmmgcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer2016102020161009
67805xmmgcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer2016102020161009
68285xmmgcc -m32 -march=prescott -O3 -fomit-frame-pointer2016102020161009
68299xmmgcc -m32 -march=nocona -O3 -fomit-frame-pointer2016102020161009
68313xmmgcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer2016102020161009
68359xmmgcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer2016102020161009
69689xmmgcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer2016102020161009
69804xmmgcc -m32 -march=nocona -O -fomit-frame-pointer2016102020161009
69826xmmgcc -m32 -march=prescott -O -fomit-frame-pointer2016102020161009
70175xmmgcc -m32 -march=native -mtune=native -O -fomit-frame-pointer2016102020161009
70181xmmgcc -m32 -march=barcelona -O -fomit-frame-pointer2016102020161009
70286xmmgcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer2016102020161009
70306xmmgcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer2016102020161009
70584xmmgcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer2016102020161009
71016xmmgcc -m32 -march=nocona -O2 -fomit-frame-pointer2016102020161009
71024xmmgcc -m32 -march=prescott -O2 -fomit-frame-pointer2016102020161009
71096xmmgcc -m32 -march=pentium4 -O -fomit-frame-pointer2016102020161009
71986xmmgcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer2016102020161009
72065xmmgcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer2016102020161009
72122xmmgcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer2016102020161009
72310xmmgcc -m32 -march=pentium4 -O2 -fomit-frame-pointer2016102020161009
72472xmmgcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer2016102020161009
72572xmmgcc -m32 -march=pentium4 -O3 -fomit-frame-pointer2016102020161009
73202xmmgcc -m32 -march=pentium-m -O -fomit-frame-pointer2016102020161009
73463xmmgcc -m32 -march=k8 -O -fomit-frame-pointer2016102020161009
78746xmmgcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer2016102020161009
79501xmmgcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer2016102020161009
79734xmmgcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer2016102020161009
79781xmmgcc -m32 -march=barcelona -O3 -fomit-frame-pointer2016102020161009
79947xmmgcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer2016102020161009
80051xmmgcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer2016102020161009
80072xmmgcc -m32 -march=barcelona -O2 -fomit-frame-pointer2016102020161009
80878xmmgcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer2016102020161009
82803xmmgcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer2016102020161009
83835xmmgcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer2016102020161009
85102xmmgcc -m32 -march=k8 -O3 -fomit-frame-pointer2016102020161009
85381xmmgcc -m32 -march=pentium-m -O3 -fomit-frame-pointer2016102020161009
85792xmmgcc -m32 -march=k8 -O2 -fomit-frame-pointer2016102020161009
86026xmmgcc -m32 -march=pentium-m -O2 -fomit-frame-pointer2016102020161009
91495xmmgcc -m32 -march=prescott -Os -fomit-frame-pointer2016102020161009
91504xmmgcc -m32 -march=pentium4 -Os -fomit-frame-pointer2016102020161009
91517xmmgcc -m32 -march=nocona -Os -fomit-frame-pointer2016102020161009
92678xmmgcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer2016102020161009
92721xmmgcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer2016102020161009
92779xmmgcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer2016102020161009
104111xmmgcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer2016102020161009
104139xmmgcc -m32 -march=barcelona -Os -fomit-frame-pointer2016102020161009
104590xmmgcc -m32 -march=pentium-m -Os -fomit-frame-pointer2016102020161009
104630xmmgcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer2016102020161009
105482xmmgcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer2016102020161009
107838xmmgcc -m32 -march=k8 -Os -fomit-frame-pointer2016102020161009
108448xmmgcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer2016102020161009
380618refgcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer2016102020161009
381740refgcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer2016102020161009
385195refgcc -m32 -march=i386 -O3 -fomit-frame-pointer2016102020161009
385475refgcc -m32 -march=i486 -O3 -fomit-frame-pointer2016102020161009
386893refgcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer2016102020161009
387763refgcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer2016102020161009
389805refgcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer2016102020161009
390977refgcc -m32 -march=i386 -O2 -fomit-frame-pointer2016102020161009
391624refgcc -funroll-loops -m32 -O3 -fomit-frame-pointer2016102020161009
391626refgcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer2016102020161009
392756refgcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer2016102020161009
393099refgcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer2016102020161009
393113refgcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2016102020161009
393216refgcc -funroll-loops -m32 -O2 -fomit-frame-pointer2016102020161009
393440refgcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer2016102020161009
393466refgcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2016102020161009
393496refgcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer2016102020161009
393795refgcc -m32 -march=pentium4 -O2 -fomit-frame-pointer2016102020161009
393835refgcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer2016102020161009
393930refgcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer2016102020161009
393938refgcc -m32 -march=pentium4 -O -fomit-frame-pointer2016102020161009
394400refgcc -m32 -march=i486 -O2 -fomit-frame-pointer2016102020161009
394550refgcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer2016102020161009
395369refgcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer2016102020161009
396254refgcc -m32 -march=k8 -O2 -fomit-frame-pointer2016102020161009
396393refgcc -m32 -march=athlon -O2 -fomit-frame-pointer2016102020161009
396563refgcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer2016102020161009
396648refgcc -m32 -march=barcelona -O2 -fomit-frame-pointer2016102020161009
396786refgcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer2016102020161009
396795refgcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer2016102020161009
397158refgcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer2016102020161009
397552refgcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer2016102020161009
397979refgcc -m32 -march=core2 -O2 -fomit-frame-pointer2016102020161009
398021refgcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer2016102020161009
398110refgcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer2016102020161009
398112refgcc -m32 -march=corei7 -O2 -fomit-frame-pointer2016102020161009
398485refgcc -m32 -march=pentium -O3 -fomit-frame-pointer2016102020161009
398571refgcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2016102020161009
398605refgcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer2016102020161009
398859refgcc -m32 -march=i486 -O -fomit-frame-pointer2016102020161009
399072refgcc -m32 -O3 -fomit-frame-pointer2016102020161009
399587refgcc -m32 -march=i386 -O -fomit-frame-pointer2016102020161009
400065refgcc -m32 -O2 -fomit-frame-pointer2016102020161009
400082refgcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer2016102020161009
400208refgcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer2016102020161009
400727refgcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer2016102020161009
402166refgcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer2016102020161009
402195refgcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer2016102020161009
402226refgcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer2016102020161009
402238refgcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer2016102020161009
402392refgcc -m32 -march=athlon -O3 -fomit-frame-pointer2016102020161009
402593refgcc -m32 -march=pentium -O2 -fomit-frame-pointer2016102020161009
402640refgcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2016102020161009
402727refgcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer2016102020161009
402812refgcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer2016102020161009
403572refgcc -m32 -march=pentium4 -O3 -fomit-frame-pointer2016102020161009
404560refgcc -m32 -march=k8 -O -fomit-frame-pointer2016102020161009
405016refgcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer2016102020161009
405019refgcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer2016102020161009
405053refgcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer2016102020161009
405126refgcc -m32 -march=athlon -O -fomit-frame-pointer2016102020161009
405979refgcc -m32 -march=nocona -O3 -fomit-frame-pointer2016102020161009
406089refgcc -m32 -march=prescott -O3 -fomit-frame-pointer2016102020161009
406500refgcc -funroll-loops -m32 -O -fomit-frame-pointer2016102020161009
406572refgcc -m32 -march=nocona -O2 -fomit-frame-pointer2016102020161009
406622refgcc -m32 -march=prescott -O2 -fomit-frame-pointer2016102020161009
406872refgcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer2016102020161009
407606refgcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer2016102020161009
407757refgcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer2016102020161009
407772refgcc -m32 -march=pentium -O -fomit-frame-pointer2016102020161009
407789refgcc -m32 -march=pentium-mmx -O -fomit-frame-pointer2016102020161009
408921refgcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer2016102020161009
408984refgcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer2016102020161009
409000refgcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer2016102020161009
409516refgcc -m32 -march=k8 -O3 -fomit-frame-pointer2016102020161009
409523refgcc -m32 -march=k6 -O2 -fomit-frame-pointer2016102020161009
409600refgcc -m32 -march=k6-2 -O2 -fomit-frame-pointer2016102020161009
409600refgcc -m32 -march=k6-3 -O2 -fomit-frame-pointer2016102020161009
409810refgcc -m32 -march=barcelona -O -fomit-frame-pointer2016102020161009
409965refgcc -m32 -march=native -mtune=native -O -fomit-frame-pointer2016102020161009
411218refgcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer2016102020161009
411241refgcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer2016102020161009
411322refgcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer2016102020161009
411332refgcc -m32 -march=k6 -O3 -fomit-frame-pointer2016102020161009
411408refgcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer2016102020161009
411747refgcc -m32 -march=pentium3 -O3 -fomit-frame-pointer2016102020161009
411791refgcc -m32 -march=pentium-m -O2 -fomit-frame-pointer2016102020161009
411851refgcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer2016102020161009
411924refgcc -m32 -march=pentium3 -O2 -fomit-frame-pointer2016102020161009
411960refgcc -m32 -march=pentium2 -O2 -fomit-frame-pointer2016102020161009
412472refgcc -m32 -march=k6-3 -O3 -fomit-frame-pointer2016102020161009
412650refgcc -m32 -march=k6-2 -O3 -fomit-frame-pointer2016102020161009
412683refgcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer2016102020161009
412752refgcc -m32 -march=pentium2 -O3 -fomit-frame-pointer2016102020161009
413114refgcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer2016102020161009
413170refgcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer2016102020161009
413184refgcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer2016102020161009
413205refgcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer2016102020161009
413251refgcc -m32 -march=barcelona -O3 -fomit-frame-pointer2016102020161009
413283refgcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer2016102020161009
413312refgcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer2016102020161009
413321refgcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer2016102020161009
413358refgcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer2016102020161009
413956refgcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer2016102020161009
413981refgcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer2016102020161009
414020refgcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer2016102020161009
414038refgcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer2016102020161009
414090refgcc -m32 -march=core2 -O -fomit-frame-pointer2016102020161009
414248refgcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer2016102020161009
414251refgcc -funroll-loops -m32 -Os -fomit-frame-pointer2016102020161009
414305refgcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer2016102020161009
414355refgcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer2016102020161009
414362refgcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer2016102020161009
414395refgcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer2016102020161009
414791refgcc -m32 -march=corei7 -O -fomit-frame-pointer2016102020161009
415062refgcc -m32 -march=pentium3 -O -fomit-frame-pointer2016102020161009
415101refgcc -m32 -march=pentium-m -O -fomit-frame-pointer2016102020161009
415133refgcc -m32 -O -fomit-frame-pointer2016102020161009
415552refgcc -m32 -march=pentiumpro -O -fomit-frame-pointer2016102020161009
415616refgcc -m32 -march=pentium2 -O -fomit-frame-pointer2016102020161009
415730refgcc -m32 -march=prescott -O -fomit-frame-pointer2016102020161009
415774refgcc -m32 -march=nocona -O -fomit-frame-pointer2016102020161009
416855refgcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer2016102020161009
418193refgcc -m32 -march=nocona -Os -fomit-frame-pointer2016102020161009
418214refgcc -m32 -march=prescott -Os -fomit-frame-pointer2016102020161009
418221refgcc -m32 -march=pentium4 -Os -fomit-frame-pointer2016102020161009
418260refgcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer2016102020161009
418362refgcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer2016102020161009
418826refgcc -m32 -march=pentium-m -O3 -fomit-frame-pointer2016102020161009
419442refgcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer2016102020161009
419615refgcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer2016102020161009
419627refgcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer2016102020161009
419629refgcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer2016102020161009
419642refgcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer2016102020161009
419723refgcc -m32 -march=k6 -O -fomit-frame-pointer2016102020161009
419776refgcc -m32 -march=k6-3 -O -fomit-frame-pointer2016102020161009
419779refgcc -m32 -march=k6-2 -O -fomit-frame-pointer2016102020161009
421338refgcc -m32 -march=pentium2 -Os -fomit-frame-pointer2016102020161009
421398refgcc -m32 -march=pentiumpro -Os -fomit-frame-pointer2016102020161009
421768refgcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer2016102020161009
421861refgcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer2016102020161009
421914refgcc -m32 -march=corei7 -Os -fomit-frame-pointer2016102020161009
422092refgcc -m32 -march=core2 -Os -fomit-frame-pointer2016102020161009
422510refgcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer2016102020161009
422515refgcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer2016102020161009
422528refgcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer2016102020161009
423880refgcc -m32 -march=pentium -Os -fomit-frame-pointer2016102020161009
423936refgcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer2016102020161009
424172refgcc -m32 -Os -fomit-frame-pointer2016102020161009
424278refgcc -m32 -march=athlon -Os -fomit-frame-pointer2016102020161009
424503refgcc -m32 -march=k6-2 -Os -fomit-frame-pointer2016102020161009
424507refgcc -m32 -march=k6-3 -Os -fomit-frame-pointer2016102020161009
424520refgcc -m32 -march=k6 -Os -fomit-frame-pointer2016102020161009
425954refgcc -m32 -march=i386 -Os -fomit-frame-pointer2016102020161009
425984refgcc -m32 -march=i486 -Os -fomit-frame-pointer2016102020161009
427232refgcc -m32 -march=k8 -Os -fomit-frame-pointer2016102020161009
427424refgcc -m32 -march=barcelona -Os -fomit-frame-pointer2016102020161009
427451refgcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer2016102020161009
430171refgcc -m32 -march=pentium-m -Os -fomit-frame-pointer2016102020161009
430208refgcc -m32 -march=pentium3 -Os -fomit-frame-pointer2016102020161009

Test failure

Implementation: crypto_aead/norx6461v1/ref
Compiler: gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 35, namely:
Compiler | Implementations
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer ref xmm
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer ref xmm
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer ref xmm
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer ref xmm ymm
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer ref xmm ymm
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer ref xmm ymm
gcc -m32 -march=core2 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=core2 -O3 -fomit-frame-pointer ref xmm
gcc -m32 -march=core2 -O -fomit-frame-pointer xmm
gcc -m32 -march=core2 -Os -fomit-frame-pointer xmm
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer xmm
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer xmm
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer xmm
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer xmm
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer ref xmm
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer ref xmm
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer ref xmm
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=corei7 -O -fomit-frame-pointer xmm
gcc -m32 -march=corei7 -Os -fomit-frame-pointer xmm

Compiler output

Implementation: crypto_aead/norx6461v1/xmm
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
norx.c: norx.c: In function 'crypto_aead_norx6461v1_xmm_encrypt':
norx.c: norx.c:411:19: warning: SSE vector return without SSE enabled changes the ABI [-Wpsabi]
norx.c: const __m128i N = LOADU(npub);
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/xmmintrin.h:1249:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:31,
norx.c: from norx.c:26:
norx.c: norx.c: In function 'block_copy':
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/emmintrin.h:714:1: error: inlining failed in call to always_inline '_mm_storeu_si128': target specific option mismatch
norx.c: _mm_storeu_si128 (__m128i *__P, __m128i __B)
norx.c: ^
norx.c: norx.c:48:24: error: called from here
norx.c: #define STOREU(out, x) _mm_storeu_si128((__m128i*)(out), (x))
norx.c: ^
norx.c: norx.c:364:9: note: in expansion of macro 'STOREU'
norx.c: STOREU(out + 48, LOADU(in + 48));
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/xmmintrin.h:1249:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:31,
norx.c: from norx.c:26:
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/emmintrin.h:696:1: error: inlining failed in call to always_inline '_mm_loadu_si128': target specific option mismatch
norx.c: _mm_loadu_si128 (__m128i const *__P)
norx.c: ^
norx.c: norx.c:48:24: error: called from here
norx.c: #define STOREU(out, x) _mm_storeu_si128((__m128i*)(out), (x))
norx.c: ...

Number of similar (compiler,implementation) pairs: 88, namely:
Compiler | Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer xmm
gcc -m32 -O2 -fomit-frame-pointer xmm
gcc -m32 -O3 -fomit-frame-pointer xmm
gcc -m32 -O -fomit-frame-pointer xmm
gcc -m32 -Os -fomit-frame-pointer xmm
gcc -m32 -march=athlon -O2 -fomit-frame-pointer xmm
gcc -m32 -march=athlon -O3 -fomit-frame-pointer xmm
gcc -m32 -march=athlon -O -fomit-frame-pointer xmm
gcc -m32 -march=athlon -Os -fomit-frame-pointer xmm
gcc -m32 -march=i386 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=i386 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=i386 -O -fomit-frame-pointer xmm
gcc -m32 -march=i386 -Os -fomit-frame-pointer xmm
gcc -m32 -march=i486 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=i486 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=i486 -O -fomit-frame-pointer xmm
gcc -m32 -march=i486 -Os -fomit-frame-pointer xmm
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=k6-2 -O -fomit-frame-pointer xmm
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer xmm
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=k6-3 -O -fomit-frame-pointer xmm
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer xmm
gcc -m32 -march=k6 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=k6 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=k6 -O -fomit-frame-pointer xmm
gcc -m32 -march=k6 -Os -fomit-frame-pointer xmm
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer xmm
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer xmm
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer xmm
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer xmm
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=pentium2 -O -fomit-frame-pointer xmm
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer xmm
gcc -m32 -march=pentium -O2 -fomit-frame-pointer xmm
gcc -m32 -march=pentium -O3 -fomit-frame-pointer xmm
gcc -m32 -march=pentium -O -fomit-frame-pointer xmm
gcc -m32 -march=pentium -Os -fomit-frame-pointer xmm
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer xmm
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer xmm
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer xmm
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer xmm

Compiler output

Implementation: crypto_aead/norx6461v1/ymm
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
norx.c: norx.c: In function 'crypto_aead_norx6461v1_ymm_encrypt':
norx.c: norx.c:349:19: warning: SSE vector return without SSE enabled changes the ABI [-Wpsabi]
norx.c: const __m128i N = LOADU128(npub);
norx.c: ^
norx.c: norx.c:350:19: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
norx.c: const __m256i K = LOADU(k + 0);
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/immintrin.h:41:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:46,
norx.c: from norx.c:26:
norx.c: norx.c: In function 'block_copy':
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/avxintrin.h:900:1: error: inlining failed in call to always_inline '_mm256_storeu_si256': target specific option mismatch
norx.c: _mm256_storeu_si256 (__m256i *__P, __m256i __A)
norx.c: ^
norx.c: norx.c:48:24: error: called from here
norx.c: #define STOREU(out, x) _mm256_storeu_si256((__m256i*)(out), (x))
norx.c: ^
norx.c: norx.c:303:9: note: in expansion of macro 'STOREU'
norx.c: STOREU(out + 32, LOADU(in + 32));
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/immintrin.h:41:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:46,
norx.c: from norx.c:26:
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/avxintrin.h:894:1: error: inlining failed in call to always_inline '_mm256_loadu_si256': target specific option mismatch
norx.c: _mm256_loadu_si256 (__m256i const *__P)
norx.c: ...

Number of similar (compiler,implementation) pairs: 88, namely:
Compiler | Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer ymm
gcc -m32 -O2 -fomit-frame-pointer ymm
gcc -m32 -O3 -fomit-frame-pointer ymm
gcc -m32 -O -fomit-frame-pointer ymm
gcc -m32 -Os -fomit-frame-pointer ymm
gcc -m32 -march=athlon -O2 -fomit-frame-pointer ymm
gcc -m32 -march=athlon -O3 -fomit-frame-pointer ymm
gcc -m32 -march=athlon -O -fomit-frame-pointer ymm
gcc -m32 -march=athlon -Os -fomit-frame-pointer ymm
gcc -m32 -march=i386 -O2 -fomit-frame-pointer ymm
gcc -m32 -march=i386 -O3 -fomit-frame-pointer ymm
gcc -m32 -march=i386 -O -fomit-frame-pointer ymm
gcc -m32 -march=i386 -Os -fomit-frame-pointer ymm
gcc -m32 -march=i486 -O2 -fomit-frame-pointer ymm
gcc -m32 -march=i486 -O3 -fomit-frame-pointer ymm
gcc -m32 -march=i486 -O -fomit-frame-pointer ymm
gcc -m32 -march=i486 -Os -fomit-frame-pointer ymm
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer ymm
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer ymm
gcc -m32 -march=k6-2 -O -fomit-frame-pointer ymm
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer ymm
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer ymm
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer ymm
gcc -m32 -march=k6-3 -O -fomit-frame-pointer ymm
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer ymm
gcc -m32 -march=k6 -O2 -fomit-frame-pointer ymm
gcc -m32 -march=k6 -O3 -fomit-frame-pointer ymm
gcc -m32 -march=k6 -O -fomit-frame-pointer ymm
gcc -m32 -march=k6 -Os -fomit-frame-pointer ymm
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer ymm
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer ymm
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer ymm
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer ymm
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer ymm
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer ymm
gcc -m32 -march=pentium2 -O -fomit-frame-pointer ymm
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer ymm
gcc -m32 -march=pentium -O2 -fomit-frame-pointer ymm
gcc -m32 -march=pentium -O3 -fomit-frame-pointer ymm
gcc -m32 -march=pentium -O -fomit-frame-pointer ymm
gcc -m32 -march=pentium -Os -fomit-frame-pointer ymm
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer ymm
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer ymm
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer ymm
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer ymm

Compiler output

Implementation: crypto_aead/norx6461v1/ymm
Compiler: gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer
norx.c: norx.c: In function 'crypto_aead_norx6461v1_ymm_encrypt':
norx.c: norx.c:350:19: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
norx.c: const __m256i K = LOADU(k + 0);
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/immintrin.h:41:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:46,
norx.c: from norx.c:26:
norx.c: norx.c: In function 'block_copy':
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/avxintrin.h:900:1: error: inlining failed in call to always_inline '_mm256_storeu_si256': target specific option mismatch
norx.c: _mm256_storeu_si256 (__m256i *__P, __m256i __A)
norx.c: ^
norx.c: norx.c:48:24: error: called from here
norx.c: #define STOREU(out, x) _mm256_storeu_si256((__m256i*)(out), (x))
norx.c: ^
norx.c: norx.c:303:9: note: in expansion of macro 'STOREU'
norx.c: STOREU(out + 32, LOADU(in + 32));
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/immintrin.h:41:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:46,
norx.c: from norx.c:26:
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/avxintrin.h:894:1: error: inlining failed in call to always_inline '_mm256_loadu_si256': target specific option mismatch
norx.c: _mm256_loadu_si256 (__m256i const *__P)
norx.c: ^
norx.c: norx.c:48:24: error: called from here
norx.c: #define STOREU(out, x) _mm256_storeu_si256((__m256i*)(out), (x))
norx.c: ...

Number of similar (compiler,implementation) pairs: 69, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer ymm
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer ymm
gcc -m32 -march=core2 -O2 -fomit-frame-pointer ymm
gcc -m32 -march=core2 -O3 -fomit-frame-pointer ymm
gcc -m32 -march=core2 -O -fomit-frame-pointer ymm
gcc -m32 -march=core2 -Os -fomit-frame-pointer ymm
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer ymm
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer ymm
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer ymm
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer ymm
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer ymm
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer ymm
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer ymm
gcc -m32 -march=corei7 -O -fomit-frame-pointer ymm
gcc -m32 -march=corei7 -Os -fomit-frame-pointer ymm
gcc -m32 -march=k8 -O2 -fomit-frame-pointer ymm
gcc -m32 -march=k8 -O3 -fomit-frame-pointer ymm
gcc -m32 -march=k8 -O -fomit-frame-pointer ymm
gcc -m32 -march=k8 -Os -fomit-frame-pointer ymm
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer ymm
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer ymm
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer ymm
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer ymm
gcc -m32 -march=nocona -O2 -fomit-frame-pointer ymm
gcc -m32 -march=nocona -O3 -fomit-frame-pointer ymm
gcc -m32 -march=nocona -O -fomit-frame-pointer ymm
gcc -m32 -march=nocona -Os -fomit-frame-pointer ymm
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer ymm
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer ymm
gcc -m32 -march=pentium-m -O -fomit-frame-pointer ymm
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer ymm
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer ymm
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer ymm
gcc -m32 -march=pentium3 -O -fomit-frame-pointer ymm
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer ymm
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer ymm
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer ymm
gcc -m32 -march=pentium4 -O -fomit-frame-pointer ymm
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer ymm
gcc -m32 -march=prescott -O2 -fomit-frame-pointer ymm
gcc -m32 -march=prescott -O3 -fomit-frame-pointer ymm
gcc -m32 -march=prescott -O -fomit-frame-pointer ymm
gcc -m32 -march=prescott -Os -fomit-frame-pointer ymm

Compiler output

Implementation: crypto_aead/norx6461v1/xmm
Compiler: gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/xmmintrin.h:1249:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:31,
norx.c: from norx.c:26:
norx.c: norx.c: In function 'block_copy':
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/emmintrin.h:714:1: error: inlining failed in call to always_inline '_mm_storeu_si128': target specific option mismatch
norx.c: _mm_storeu_si128 (__m128i *__P, __m128i __B)
norx.c: ^
norx.c: norx.c:48:24: error: called from here
norx.c: #define STOREU(out, x) _mm_storeu_si128((__m128i*)(out), (x))
norx.c: ^
norx.c: norx.c:364:9: note: in expansion of macro 'STOREU'
norx.c: STOREU(out + 48, LOADU(in + 48));
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/xmmintrin.h:1249:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:31,
norx.c: from norx.c:26:
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/emmintrin.h:696:1: error: inlining failed in call to always_inline '_mm_loadu_si128': target specific option mismatch
norx.c: _mm_loadu_si128 (__m128i const *__P)
norx.c: ^
norx.c: norx.c:48:24: error: called from here
norx.c: #define STOREU(out, x) _mm_storeu_si128((__m128i*)(out), (x))
norx.c: ^
norx.c: norx.c:364:9: note: in expansion of macro 'STOREU'
norx.c: STOREU(out + 48, LOADU(in + 48));
norx.c: ^
norx.c: ...

Number of similar (compiler,implementation) pairs: 8, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer xmm
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=pentium3 -O -fomit-frame-pointer xmm
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer xmm

Compiler output

Implementation: crypto_aead/norx6461v1/ymm
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
norx.c: norx.c: In function 'crypto_aead_norx6461v1_ymm_encrypt':
norx.c: norx.c:350:19: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
norx.c: const __m256i K = LOADU(k + 0);
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/immintrin.h:41:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:46,
norx.c: from norx.c:26:
norx.c: norx.c: In function 'block_copy':
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/avxintrin.h:900:1: error: inlining failed in call to always_inline '_mm256_storeu_si256': target specific option mismatch
norx.c: _mm256_storeu_si256 (__m256i *__P, __m256i __A)
norx.c: ^
norx.c: norx.c:48:24: error: called from here
norx.c: #define STOREU(out, x) _mm256_storeu_si256((__m256i*)(out), (x))
norx.c: ^
norx.c: norx.c:303:9: note: in expansion of macro 'STOREU'
norx.c: STOREU(out + 32, LOADU(in + 32));
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/immintrin.h:41:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:46,
norx.c: from norx.c:26:
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/avxintrin.h:894:1: error: inlining failed in call to always_inline '_mm256_loadu_si256': target specific option mismatch
norx.c: _mm256_loadu_si256 (__m256i const *__P)
norx.c: ^
norx.c: norx.c:48:24: error: called from here
norx.c: #define STOREU(out, x) _mm256_storeu_si256((__m256i*)(out), (x))
norx.c: ...
norx.c: norx.c: In function 'crypto_aead_norx6461v1_ymm_encrypt':
norx.c: norx.c:350:19: warning: AVX vector return without AVX enabled changes the ABI [-Wpsabi]
norx.c: const __m256i K = LOADU(k + 0);
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/immintrin.h:41:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:46,
norx.c: from norx.c:26:
norx.c: norx.c: In function 'block_copy':
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/avxintrin.h:900:1: error: inlining failed in call to always_inline '_mm256_storeu_si256': target specific option mismatch
norx.c: _mm256_storeu_si256 (__m256i *__P, __m256i __A)
norx.c: ^
norx.c: norx.c:48:24: error: called from here
norx.c: #define STOREU(out, x) _mm256_storeu_si256((__m256i*)(out), (x))
norx.c: ^
norx.c: norx.c:303:9: note: in expansion of macro 'STOREU'
norx.c: STOREU(out + 32, LOADU(in + 32));
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/immintrin.h:41:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:46,
norx.c: from norx.c:26:
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/avxintrin.h:894:1: error: inlining failed in call to always_inline '_mm256_loadu_si256': target specific option mismatch
norx.c: _mm256_loadu_si256 (__m256i const *__P)
norx.c: ^
norx.c: norx.c:48:24: error: called from here
norx.c: #define STOREU(out, x) _mm256_storeu_si256((__m256i*)(out), (x))
norx.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer ymm
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer ymm
gcc -m32 -march=barcelona -O -fomit-frame-pointer ymm
gcc -m32 -march=barcelona -Os -fomit-frame-pointer ymm

Compiler output

Implementation: crypto_aead/norx6461v1/ymm
Compiler: gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/immintrin.h:43:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:46,
norx.c: from norx.c:26:
norx.c: norx.c: In function 'crypto_aead_norx6461v1_ymm_encrypt':
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/avx2intrin.h:913:1: error: inlining failed in call to always_inline '_mm256_xor_si256': target specific option mismatch
norx.c: _mm256_xor_si256 (__m256i __A, __m256i __B)
norx.c: ^
norx.c: norx.c:276:7: error: called from here
norx.c: D = XOR(D, _mm256_set_epi64x(0, NORX_PARAMETER, 0, 0)); \
norx.c: ^
norx.c: norx.c:355:5: note: in expansion of macro 'INITIALIZE'
norx.c: INITIALIZE(A, B, C, D, N, K);
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/immintrin.h:43:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:46,
norx.c: from norx.c:26:
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/avx2intrin.h:1068:1: error: inlining failed in call to always_inline '_mm256_permute4x64_epi64': target specific option mismatch
norx.c: _mm256_permute4x64_epi64 (__m256i __X, const int __M)
norx.c: ^
norx.c: norx.c:272:7: error: called from here
norx.c: A = _mm256_permute4x64_epi64(A, _MM_SHUFFLE(3, 1, 0, 2)); \
norx.c: ^
norx.c: norx.c:355:5: note: in expansion of macro 'INITIALIZE'
norx.c: INITIALIZE(A, B, C, D, N, K);
norx.c: ^
norx.c: ...

Number of similar (compiler,implementation) pairs: 6, namely:
Compiler Implementations
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer ymm
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer ymm
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer ymm
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer ymm
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer ymm
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer ymm