Implementation notes: x86, h4e450, crypto_aead/norx3261v1

Computer: h4e450
Architecture: x86
CPU ID: AuthenticAMD-00500f20-178bfbff
SUPERCOP version: 20171218
Operation: crypto_aead
Primitive: norx3261v1
Time | Implementation | Compiler | Benchmark date | SUPERCOP version
98154xmmgcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer2017100120170725
98154xmmgcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer2017100120170725
98168xmmgcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer2017100120170725
98168xmmgcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer2017100120170725
98691xmmgcc -m32 -march=pentium4 -O3 -fomit-frame-pointer2017100120170725
98700xmmgcc -m32 -march=nocona -O2 -fomit-frame-pointer2017100120170725
98700xmmgcc -m32 -march=pentium4 -O2 -fomit-frame-pointer2017100120170725
98701xmmgcc -m32 -march=prescott -O2 -fomit-frame-pointer2017100120170725
98729xmmgcc -m32 -march=prescott -O3 -fomit-frame-pointer2017100120170725
98734xmmgcc -m32 -march=nocona -O3 -fomit-frame-pointer2017100120170725
98900xmmgcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer2017100120170725
98910xmmgcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer2017100120170725
99090xmmgcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer2017100120170725
99095xmmgcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer2017100120170725
99194xmmgcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer2017100120170725
99232xmmgcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer2017100120170725
99298xmmgcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer2017100120170725
99299xmmgcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer2017100120170725
99565xmmgcc -m32 -march=pentium-m -O3 -fomit-frame-pointer2017100120170725
99575xmmgcc -m32 -march=pentium-m -O2 -fomit-frame-pointer2017100120170725
99608xmmgcc -m32 -march=barcelona -O2 -fomit-frame-pointer2017100120170725
99612xmmgcc -m32 -march=k8 -O2 -fomit-frame-pointer2017100120170725
99712xmmgcc -m32 -march=barcelona -O3 -fomit-frame-pointer2017100120170725
99731xmmgcc -m32 -march=k8 -O3 -fomit-frame-pointer2017100120170725
108481xmmgcc -m32 -march=barcelona -O -fomit-frame-pointer2017100120170725
108675xmmgcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer2017100120170725
108775xmmgcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer2017100120170725
109003xmmgcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer2017100120170725
109060xmmgcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer2017100120170725
109112xmmgcc -m32 -march=k8 -O -fomit-frame-pointer2017100120170725
109127xmmgcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer2017100120170725
109141xmmgcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer2017100120170725
109269xmmgcc -m32 -march=pentium-m -O -fomit-frame-pointer2017100120170725
109288xmmgcc -m32 -march=nocona -O -fomit-frame-pointer2017100120170725
109322xmmgcc -m32 -march=prescott -O -fomit-frame-pointer2017100120170725
109911xmmgcc -m32 -march=pentium4 -O -fomit-frame-pointer2017100120170725
113563xmmgcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer2017100120170725
113563xmmgcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer2017100120170725
113591xmmgcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer2017100120170725
113939xmmgcc -m32 -march=nocona -Os -fomit-frame-pointer2017100120170725
113939xmmgcc -m32 -march=pentium4 -Os -fomit-frame-pointer2017100120170725
113977xmmgcc -m32 -march=prescott -Os -fomit-frame-pointer2017100120170725
115425xmmgcc -m32 -march=barcelona -Os -fomit-frame-pointer2017100120170725
115796xmmgcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer2017100120170725
115957xmmgcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer2017100120170725
116598xmmgcc -m32 -march=pentium-m -Os -fomit-frame-pointer2017100120170725
116684xmmgcc -m32 -march=k8 -Os -fomit-frame-pointer2017100120170725
117040xmmgcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer2017100120170725
167595refgcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer2017100120170725
167969refgcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer2017100120170725
167975refgcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer2017100120170725
167975refgcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer2017100120170725
168088refgcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer2017100120170725
168658refgcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer2017100120170725
168701refgcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer2017100120170725
168881refgcc -funroll-loops -m32 -O2 -fomit-frame-pointer2017100120170725
168938refgcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer2017100120170725
168962refgcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer2017100120170725
169019refgcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer2017100120170725
169394refgcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer2017100120170725
169518refgcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer2017100120170725
169561refgcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2017100120170725
170615refgcc -funroll-loops -m32 -O3 -fomit-frame-pointer2017100120170725
170843refgcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer2017100120170725
171167refgcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer2017100120170725
171442refgcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer2017100120170725
171612refgcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer2017100120170725
171632refgcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer2017100120170725
171665refgcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer2017100120170725
171670refgcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2017100120170725
171760refgcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer2017100120170725
171855refgcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer2017100120170725
171870refgcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer2017100120170725
171898refgcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer2017100120170725
171945refgcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer2017100120170725
172045refgcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer2017100120170725
172620refgcc -m32 -march=pentium2 -O2 -fomit-frame-pointer2017100120170725
172648refgcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer2017100120170725
172658refgcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer2017100120170725
172695refgcc -m32 -march=pentium-m -O2 -fomit-frame-pointer2017100120170725
172705refgcc -m32 -march=pentium3 -O2 -fomit-frame-pointer2017100120170725
172781refgcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer2017100120170725
173132refgcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer2017100120170725
173171refgcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer2017100120170725
173181refgcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer2017100120170725
173237refgcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer2017100120170725
173237refgcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer2017100120170725
173261refgcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer2017100120170725
173341refgcc -m32 -march=pentium2 -O3 -fomit-frame-pointer2017100120170725
173370refgcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer2017100120170725
173375refgcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer2017100120170725
173536refgcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer2017100120170725
173542refgcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer2017100120170725
173584refgcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer2017100120170725
173703refgcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer2017100120170725
173712refgcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer2017100120170725
173802refgcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer2017100120170725
173850refgcc -m32 -march=pentium3 -O3 -fomit-frame-pointer2017100120170725
173864refgcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer2017100120170725
173997refgcc -m32 -march=pentium-m -O3 -fomit-frame-pointer2017100120170725
174011refgcc -m32 -O2 -fomit-frame-pointer2017100120170725
174230refgcc -m32 -march=core2 -O2 -fomit-frame-pointer2017100120170725
174234refgcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer2017100120170725
174258refgcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer2017100120170725
174277refgcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer2017100120170725
174316refgcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer2017100120170725
174391refgcc -m32 -march=k6-2 -O2 -fomit-frame-pointer2017100120170725
174453refgcc -m32 -march=k6-3 -O2 -fomit-frame-pointer2017100120170725
174463refgcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer2017100120170725
174481refgcc -m32 -march=k6 -O2 -fomit-frame-pointer2017100120170725
174525refgcc -m32 -march=corei7 -O2 -fomit-frame-pointer2017100120170725
174534refgcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer2017100120170725
174553refgcc -m32 -march=k6 -O3 -fomit-frame-pointer2017100120170725
174709refgcc -funroll-loops -m32 -O -fomit-frame-pointer2017100120170725
174843refgcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2017100120170725
174923refgcc -m32 -march=pentium -O3 -fomit-frame-pointer2017100120170725
174986refgcc -m32 -march=core2 -O3 -fomit-frame-pointer2017100120170725
175094refgcc -m32 -O3 -fomit-frame-pointer2017100120170725
175147refgcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer2017100120170725
175175refgcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer2017100120170725
175227refgcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer2017100120170725
175361refgcc -m32 -march=athlon -O2 -fomit-frame-pointer2017100120170725
175460refgcc -m32 -march=k8 -O2 -fomit-frame-pointer2017100120170725
175484refgcc -m32 -march=athlon -O3 -fomit-frame-pointer2017100120170725
175769refgcc -m32 -march=k6-2 -O3 -fomit-frame-pointer2017100120170725
175940refgcc -m32 -march=barcelona -O2 -fomit-frame-pointer2017100120170725
176030refgcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer2017100120170725
176058refgcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer2017100120170725
176083refgcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer2017100120170725
176135refgcc -m32 -march=k6-3 -O3 -fomit-frame-pointer2017100120170725
176154refgcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer2017100120170725
176158refgcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer2017100120170725
176306refgcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2017100120170725
176311refgcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer2017100120170725
176311refgcc -m32 -march=pentium -O2 -fomit-frame-pointer2017100120170725
176358refgcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer2017100120170725
176386refgcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer2017100120170725
176657refgcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer2017100120170725
176662refgcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer2017100120170725
176700refgcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer2017100120170725
176710refgcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer2017100120170725
176724refgcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer2017100120170725
176799refgcc -m32 -march=k6 -Os -fomit-frame-pointer2017100120170725
176809refgcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer2017100120170725
176842refgcc -m32 -march=k6-2 -Os -fomit-frame-pointer2017100120170725
176866refgcc -m32 -march=k6-3 -Os -fomit-frame-pointer2017100120170725
176923refgcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer2017100120170725
176923refgcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer2017100120170725
177294refgcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer2017100120170725
177389refgcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer2017100120170725
177555refgcc -m32 -march=pentium -Os -fomit-frame-pointer2017100120170725
177564refgcc -m32 -march=core2 -Os -fomit-frame-pointer2017100120170725
177607refgcc -m32 -Os -fomit-frame-pointer2017100120170725
177607refgcc -m32 -march=corei7 -Os -fomit-frame-pointer2017100120170725
177612refgcc -m32 -march=athlon -Os -fomit-frame-pointer2017100120170725
177655refgcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer2017100120170725
177674refgcc -m32 -march=k8 -Os -fomit-frame-pointer2017100120170725
177683refgcc -m32 -march=barcelona -Os -fomit-frame-pointer2017100120170725
177683refgcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer2017100120170725
177821refgcc -m32 -march=barcelona -O3 -fomit-frame-pointer2017100120170725
177987refgcc -m32 -march=k8 -O3 -fomit-frame-pointer2017100120170725
178006refgcc -funroll-loops -m32 -Os -fomit-frame-pointer2017100120170725
178049refgcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer2017100120170725
178315refgcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer2017100120170725
178643refgcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer2017100120170725
179032refgcc -m32 -march=nocona -Os -fomit-frame-pointer2017100120170725
179056refgcc -m32 -march=prescott -Os -fomit-frame-pointer2017100120170725
179113refgcc -m32 -march=nocona -O2 -fomit-frame-pointer2017100120170725
179127refgcc -m32 -march=pentium4 -Os -fomit-frame-pointer2017100120170725
179185refgcc -m32 -march=prescott -O2 -fomit-frame-pointer2017100120170725
179313refgcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer2017100120170725
179398refgcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer2017100120170725
179569refgcc -m32 -march=pentium3 -Os -fomit-frame-pointer2017100120170725
179611refgcc -m32 -march=i486 -Os -fomit-frame-pointer2017100120170725
179621refgcc -m32 -march=i386 -Os -fomit-frame-pointer2017100120170725
179654refgcc -m32 -march=pentium-m -Os -fomit-frame-pointer2017100120170725
180305refgcc -m32 -march=pentiumpro -Os -fomit-frame-pointer2017100120170725
180320refgcc -m32 -march=corei7 -O -fomit-frame-pointer2017100120170725
180343refgcc -m32 -march=pentium2 -Os -fomit-frame-pointer2017100120170725
180386refgcc -m32 -march=athlon -O -fomit-frame-pointer2017100120170725
180462refgcc -m32 -march=k8 -O -fomit-frame-pointer2017100120170725
180519refgcc -m32 -O -fomit-frame-pointer2017100120170725
180519refgcc -m32 -march=prescott -O -fomit-frame-pointer2017100120170725
180523refgcc -m32 -march=nocona -O -fomit-frame-pointer2017100120170725
180538refgcc -m32 -march=native -mtune=native -O -fomit-frame-pointer2017100120170725
180818refgcc -m32 -march=core2 -O -fomit-frame-pointer2017100120170725
180885refgcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer2017100120170725
180894refgcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer2017100120170725
180942refgcc -m32 -march=barcelona -O -fomit-frame-pointer2017100120170725
181198refgcc -m32 -march=prescott -O3 -fomit-frame-pointer2017100120170725
181208refgcc -m32 -march=k6-3 -O -fomit-frame-pointer2017100120170725
181236refgcc -m32 -march=k6-2 -O -fomit-frame-pointer2017100120170725
181236refgcc -m32 -march=k6 -O -fomit-frame-pointer2017100120170725
181246refgcc -m32 -march=nocona -O3 -fomit-frame-pointer2017100120170725
181298refgcc -m32 -march=pentium-mmx -O -fomit-frame-pointer2017100120170725
181326refgcc -m32 -march=pentium -O -fomit-frame-pointer2017100120170725
181759refgcc -m32 -march=pentium-m -O -fomit-frame-pointer2017100120170725
181853refgcc -m32 -march=i386 -O3 -fomit-frame-pointer2017100120170725
181863refgcc -m32 -march=i386 -O2 -fomit-frame-pointer2017100120170725
181992refgcc -m32 -march=pentium2 -O -fomit-frame-pointer2017100120170725
182006refgcc -m32 -march=pentiumpro -O -fomit-frame-pointer2017100120170725
182020refgcc -m32 -march=pentium3 -O -fomit-frame-pointer2017100120170725
182248refgcc -m32 -march=i486 -O2 -fomit-frame-pointer2017100120170725
182281refgcc -m32 -march=i486 -O3 -fomit-frame-pointer2017100120170725
182328refgcc -m32 -march=pentium4 -O -fomit-frame-pointer2017100120170725
184143refgcc -m32 -march=i386 -O -fomit-frame-pointer2017100120170725
184262refgcc -m32 -march=i486 -O -fomit-frame-pointer2017100120170725
184419refgcc -m32 -march=pentium4 -O2 -fomit-frame-pointer2017100120170725
185406refgcc -m32 -march=pentium4 -O3 -fomit-frame-pointer2017100120170725

Test failure

Implementation: crypto_aead/norx3261v1/ref
Compiler: gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 27, namely:
Compiler | Implementations
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer ref xmm
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer ref xmm
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer ref xmm
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer ref xmm
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer ref xmm
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer ref xmm
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer xmm
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer xmm
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer xmm
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer xmm
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer ref xmm
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer ref xmm
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer ref xmm
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=corei7 -O -fomit-frame-pointer xmm
gcc -m32 -march=corei7 -Os -fomit-frame-pointer xmm

Compiler output

Implementation: crypto_aead/norx3261v1/xmm
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
norx.c: norx.c: In function 'crypto_aead_norx3261v1_xmm_encrypt':
norx.c: norx.c:346:19: warning: SSE vector return without SSE enabled changes the ABI [-Wpsabi]
norx.c: const __m128i K = LOADU(k + 0);
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/xmmintrin.h:1249:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:31,
norx.c: from norx.c:27:
norx.c: norx.c: In function 'block_copy':
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/emmintrin.h:714:1: error: inlining failed in call to always_inline '_mm_storeu_si128': target specific option mismatch
norx.c: _mm_storeu_si128 (__m128i *__P, __m128i __B)
norx.c: ^
norx.c: norx.c:50:24: error: called from here
norx.c: #define STOREU(out, x) _mm_storeu_si128((__m128i*)(out), (x))
norx.c: ^
norx.c: norx.c:304:9: note: in expansion of macro 'STOREU'
norx.c: STOREU(out + 16, LOADU(in + 16));
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/xmmintrin.h:1249:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:31,
norx.c: from norx.c:27:
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/emmintrin.h:696:1: error: inlining failed in call to always_inline '_mm_loadu_si128': target specific option mismatch
norx.c: _mm_loadu_si128 (__m128i const *__P)
norx.c: ^
norx.c: norx.c:50:24: error: called from here
norx.c: #define STOREU(out, x) _mm_storeu_si128((__m128i*)(out), (x))
norx.c: ...

Number of similar (compiler,implementation) pairs: 88, namely:
Compiler | Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer xmm
gcc -m32 -O2 -fomit-frame-pointer xmm
gcc -m32 -O3 -fomit-frame-pointer xmm
gcc -m32 -O -fomit-frame-pointer xmm
gcc -m32 -Os -fomit-frame-pointer xmm
gcc -m32 -march=athlon -O2 -fomit-frame-pointer xmm
gcc -m32 -march=athlon -O3 -fomit-frame-pointer xmm
gcc -m32 -march=athlon -O -fomit-frame-pointer xmm
gcc -m32 -march=athlon -Os -fomit-frame-pointer xmm
gcc -m32 -march=i386 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=i386 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=i386 -O -fomit-frame-pointer xmm
gcc -m32 -march=i386 -Os -fomit-frame-pointer xmm
gcc -m32 -march=i486 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=i486 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=i486 -O -fomit-frame-pointer xmm
gcc -m32 -march=i486 -Os -fomit-frame-pointer xmm
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=k6-2 -O -fomit-frame-pointer xmm
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer xmm
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=k6-3 -O -fomit-frame-pointer xmm
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer xmm
gcc -m32 -march=k6 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=k6 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=k6 -O -fomit-frame-pointer xmm
gcc -m32 -march=k6 -Os -fomit-frame-pointer xmm
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer xmm
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer xmm
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer xmm
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer xmm
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=pentium2 -O -fomit-frame-pointer xmm
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer xmm
gcc -m32 -march=pentium -O2 -fomit-frame-pointer xmm
gcc -m32 -march=pentium -O3 -fomit-frame-pointer xmm
gcc -m32 -march=pentium -O -fomit-frame-pointer xmm
gcc -m32 -march=pentium -Os -fomit-frame-pointer xmm
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer xmm
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer xmm
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer xmm
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer xmm

Compiler output

Implementation: crypto_aead/norx3261v1/xmm
Compiler: gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/xmmintrin.h:1249:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:31,
norx.c: from norx.c:27:
norx.c: norx.c: In function 'block_copy':
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/emmintrin.h:714:1: error: inlining failed in call to always_inline '_mm_storeu_si128': target specific option mismatch
norx.c: _mm_storeu_si128 (__m128i *__P, __m128i __B)
norx.c: ^
norx.c: norx.c:50:24: error: called from here
norx.c: #define STOREU(out, x) _mm_storeu_si128((__m128i*)(out), (x))
norx.c: ^
norx.c: norx.c:304:9: note: in expansion of macro 'STOREU'
norx.c: STOREU(out + 16, LOADU(in + 16));
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/xmmintrin.h:1249:0,
norx.c: from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:31,
norx.c: from norx.c:27:
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/emmintrin.h:696:1: error: inlining failed in call to always_inline '_mm_loadu_si128': target specific option mismatch
norx.c: _mm_loadu_si128 (__m128i const *__P)
norx.c: ^
norx.c: norx.c:50:24: error: called from here
norx.c: #define STOREU(out, x) _mm_storeu_si128((__m128i*)(out), (x))
norx.c: ^
norx.c: norx.c:304:9: note: in expansion of macro 'STOREU'
norx.c: STOREU(out + 16, LOADU(in + 16));
norx.c: ^
norx.c: ...

Number of similar (compiler,implementation) pairs: 8, namely:
Compiler | Implementations
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer xmm
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer xmm
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=pentium3 -O -fomit-frame-pointer xmm
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer xmm

Compiler output

Implementation: crypto_aead/norx3261v1/xmm
Compiler: gcc -m32 -march=core2 -O2 -fomit-frame-pointer
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:41:0,
norx.c: from norx.c:27:
norx.c: norx.c: In function 'crypto_aead_norx3261v1_xmm_decrypt':
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/smmintrin.h:166:1: error: inlining failed in call to always_inline '_mm_blend_epi16': target specific option mismatch
norx.c: _mm_blend_epi16 (__m128i __X, __m128i __Y, const int __M)
norx.c: ^
norx.c: norx.c:249:58: error: called from here
norx.c: W2 = LOADL(IN + 32); STOREL(OUT + 32, XOR(C, W2)); C = BLEND(C, W2); \
norx.c: ^
norx.c: norx.c:430:13: note: in expansion of macro 'DECRYPT_BLOCK'
norx.c: DECRYPT_BLOCK(A, B, C, D, c, m);
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:41:0,
norx.c: from norx.c:27:
norx.c: /usr/lib/gcc/x86_64-linux-gnu/5/include/smmintrin.h:166:1: error: inlining failed in call to always_inline '_mm_blend_epi16': target specific option mismatch
norx.c: _mm_blend_epi16 (__m128i __X, __m128i __Y, const int __M)
norx.c: ^
norx.c: norx.c:249:58: error: called from here
norx.c: W2 = LOADL(IN + 32); STOREL(OUT + 32, XOR(C, W2)); C = BLEND(C, W2); \
norx.c: ^
norx.c: norx.c:430:13: note: in expansion of macro 'DECRYPT_BLOCK'
norx.c: DECRYPT_BLOCK(A, B, C, D, c, m);
norx.c: ^
norx.c: In file included from /usr/lib/gcc/x86_64-linux-gnu/5/include/x86intrin.h:41:0,
norx.c: from norx.c:27:
norx.c: ...

Number of similar (compiler,implementation) pairs: 8, namely:
Compiler | Implementations
gcc -m32 -march=core2 -O2 -fomit-frame-pointer xmm
gcc -m32 -march=core2 -O3 -fomit-frame-pointer xmm
gcc -m32 -march=core2 -O -fomit-frame-pointer xmm
gcc -m32 -march=core2 -Os -fomit-frame-pointer xmm
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer xmm
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer xmm
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer xmm
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer xmm