Implementation notes: x86, kizomba, crypto_aead/scream10v1

Computer: kizomba
Architecture: x86
CPU ID: GenuineIntel-000906e9-bfebfbff
SUPERCOP version: 20181216
Operation: crypto_aead
Primitive: scream10v1
TimeImplementationCompilerBenchmark dateSUPERCOP version
331324refgcc -funroll-loops -m32 -O2 -fomit-frame-pointer2018082520180818
332834refgcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer2018082520180818
332835refgcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer2018082520180818
334853refgcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer2018082520180818
335066refgcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer2018082520180818
336369refgcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer2018082520180818
336456refgcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer2018082520180818
337363refgcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer2018082520180818
339327refgcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer2018082520180818
340336refgcc -funroll-loops -m32 -O -fomit-frame-pointer2018082520180818
342070refgcc -m32 -march=k8 -O3 -fomit-frame-pointer2018082520180818
346672refgcc -m32 -march=barcelona -O3 -fomit-frame-pointer2018082520180818
346720refgcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer2018082520180818
346730refgcc -m32 -march=athlon -O3 -fomit-frame-pointer2018082520180818
348088refgcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer2018082520180818
349323refgcc -funroll-loops -m32 -O3 -fomit-frame-pointer2018082520180818
351506refgcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer2018082520180818
354030refgcc -m32 -O3 -fomit-frame-pointer2018082520180818
355261refgcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer2018082520180818
355484refgcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer2018082520180818
356716refgcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer2018082520180818
356721refgcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer2018082520180818
361083refgcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer2018082520180818
361196refgcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer2018082520180818
363278refgcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer2018082520180818
364826refgcc -m32 -march=pentium4 -O3 -fomit-frame-pointer2018082520180818
365953refgcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer2018082520180818
366434refgcc -m32 -march=nocona -O3 -fomit-frame-pointer2018082520180818
367804refgcc -m32 -march=prescott -O3 -fomit-frame-pointer2018082520180818
368150refgcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer2018082520180818
370027refgcc -m32 -march=corei7 -O3 -fomit-frame-pointer2018082520180818
370115refgcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer2018082520180818
370264refgcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer2018082520180818
371456refgcc -m32 -march=core2 -O3 -fomit-frame-pointer2018082520180818
374883refgcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer2018082520180818
379691refgcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer2018082520180818
391238refgcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer2018082520180818
391496refgcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer2018082520180818
391694refgcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer2018082520180818
392081refgcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer2018082520180818
392546refgcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer2018082520180818
392843refgcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer2018082520180818
393136refgcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer2018082520180818
394938refgcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer2018082520180818
403183refgcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer2018082520180818
404242refgcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer2018082520180818
408593refgcc -m32 -march=pentium3 -O3 -fomit-frame-pointer2018082520180818
408863refgcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer2018082520180818
409788refgcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer2018082520180818
417228refgcc -m32 -march=pentium2 -O3 -fomit-frame-pointer2018082520180818
421787refgcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer2018082520180818
429013refgcc -m32 -march=pentium-m -O3 -fomit-frame-pointer2018082520180818
474481refgcc -m32 -march=pentium4 -O2 -fomit-frame-pointer2018082520180818
478040refgcc -m32 -march=athlon -O2 -fomit-frame-pointer2018082520180818
478161refgcc -m32 -march=barcelona -O2 -fomit-frame-pointer2018082520180818
478545refgcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer2018082520180818
478594refgcc -m32 -march=k8 -O2 -fomit-frame-pointer2018082520180818
479224refgcc -m32 -march=prescott -O -fomit-frame-pointer2018082520180818
480448refgcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer2018082520180818
480949refgcc -m32 -march=core2 -O2 -fomit-frame-pointer2018082520180818
480968refgcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer2018082520180818
481454refgcc -m32 -O2 -fomit-frame-pointer2018082520180818
481643refgcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer2018082520180818
481883refgcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer2018082520180818
482082refgcc -m32 -march=corei7 -O2 -fomit-frame-pointer2018082520180818
482159refgcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer2018082520180818
482964refgcc -m32 -march=prescott -O2 -fomit-frame-pointer2018082520180818
483278refgcc -m32 -march=nocona -O2 -fomit-frame-pointer2018082520180818
483605refgcc -m32 -march=nocona -O -fomit-frame-pointer2018082520180818
485351refgcc -m32 -march=athlon -O -fomit-frame-pointer2018082520180818
486091refgcc -m32 -march=core-avx2 -O -fomit-frame-pointer2018082520180818
487483refgcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer2018082520180818
487555refgcc -m32 -march=core2 -O -fomit-frame-pointer2018082520180818
487673refgcc -m32 -march=core-avx-i -O -fomit-frame-pointer2018082520180818
487972refgcc -m32 -march=k8 -O -fomit-frame-pointer2018082520180818
488228refgcc -m32 -march=corei7-avx -O -fomit-frame-pointer2018082520180818
488476refgcc -m32 -march=corei7 -O -fomit-frame-pointer2018082520180818
488716refgcc -m32 -march=native -mtune=native -O -fomit-frame-pointer2018082520180818
489324refgcc -m32 -march=barcelona -O -fomit-frame-pointer2018082520180818
489602refgcc -m32 -march=pentium4 -O -fomit-frame-pointer2018082520180818
489703refgcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer2018082520180818
490798refgcc -m32 -O -fomit-frame-pointer2018082520180818
528357refgcc -m32 -march=pentium-m -O2 -fomit-frame-pointer2018082520180818
529352refgcc -m32 -march=pentium3 -O2 -fomit-frame-pointer2018082520180818
529453refgcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer2018082520180818
529556refgcc -m32 -march=pentium2 -O2 -fomit-frame-pointer2018082520180818
545139refgcc -m32 -march=pentium-m -O -fomit-frame-pointer2018082520180818
547482refgcc -m32 -march=pentium2 -O -fomit-frame-pointer2018082520180818
547909refgcc -m32 -march=pentium3 -O -fomit-frame-pointer2018082520180818
548441refgcc -m32 -march=pentiumpro -O -fomit-frame-pointer2018082520180818
582349refgcc -m32 -march=i386 -O3 -fomit-frame-pointer2018082520180818
588637refgcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer2018082520180818
589919refgcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer2018082520180818
590596refgcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer2018082520180818
591147refgcc -m32 -march=k6-2 -O3 -fomit-frame-pointer2018082520180818
591905refgcc -m32 -march=k6-3 -O3 -fomit-frame-pointer2018082520180818
592061refgcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer2018082520180818
592236refgcc -m32 -march=pentium2 -Os -fomit-frame-pointer2018082520180818
592291refgcc -m32 -march=pentiumpro -Os -fomit-frame-pointer2018082520180818
592375refgcc -m32 -march=pentium3 -Os -fomit-frame-pointer2018082520180818
592510refgcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2018082520180818
592647refgcc -m32 -march=k6 -O3 -fomit-frame-pointer2018082520180818
592659refgcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer2018082520180818
593488refgcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer2018082520180818
593667refgcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer2018082520180818
595057refgcc -m32 -march=pentium-m -Os -fomit-frame-pointer2018082520180818
596268refgcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer2018082520180818
598159refgcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer2018082520180818
598407refgcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2018082520180818
601359refgcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer2018082520180818
601750refgcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer2018082520180818
603186refgcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer2018082520180818
603715refgcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer2018082520180818
604842refgcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer2018082520180818
604951refgcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer2018082520180818
612129refgcc -m32 -march=pentium -O3 -fomit-frame-pointer2018082520180818
614389refgcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2018082520180818
653080refgcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer2018082520180818
656957refgcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer2018082520180818
657046refgcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer2018082520180818
657064refgcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer2018082520180818
662798refgcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer2018082520180818
666659refgcc -m32 -march=i486 -O3 -fomit-frame-pointer2018082520180818
738072refgcc -m32 -march=k6-3 -O -fomit-frame-pointer2018082520180818
738561refgcc -m32 -march=k6-2 -O -fomit-frame-pointer2018082520180818
740457refgcc -m32 -march=k6 -O -fomit-frame-pointer2018082520180818
748423refgcc -m32 -march=pentium-mmx -O -fomit-frame-pointer2018082520180818
749006refgcc -m32 -march=pentium -O -fomit-frame-pointer2018082520180818
751348refgcc -m32 -march=i486 -O -fomit-frame-pointer2018082520180818
755231refgcc -m32 -march=i386 -O -fomit-frame-pointer2018082520180818
766808refgcc -m32 -march=i486 -O2 -fomit-frame-pointer2018082520180818
768316refgcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer2018082520180818
769185refgcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer2018082520180818
770446refgcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer2018082520180818
778206refgcc -m32 -march=i386 -O2 -fomit-frame-pointer2018082520180818
787008refgcc -m32 -march=pentium -O2 -fomit-frame-pointer2018082520180818
787637refgcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2018082520180818
816441refgcc -m32 -march=k6-3 -O2 -fomit-frame-pointer2018082520180818
817934refgcc -m32 -march=k6-2 -O2 -fomit-frame-pointer2018082520180818
818287refgcc -m32 -march=k6 -O2 -fomit-frame-pointer2018082520180818
851318refgcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer2018082520180818
853669refgcc -m32 -march=core-avx-i -Os -fomit-frame-pointer2018082520180818
853730refgcc -m32 -march=pentium -Os -fomit-frame-pointer2018082520180818
857139refgcc -m32 -march=athlon -Os -fomit-frame-pointer2018082520180818
857371refgcc -m32 -march=k6 -Os -fomit-frame-pointer2018082520180818
857585refgcc -m32 -march=core2 -Os -fomit-frame-pointer2018082520180818
857607refgcc -m32 -march=k6-3 -Os -fomit-frame-pointer2018082520180818
857793refgcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer2018082520180818
858107refgcc -m32 -march=barcelona -Os -fomit-frame-pointer2018082520180818
858115refgcc -m32 -march=k6-2 -Os -fomit-frame-pointer2018082520180818
858357refgcc -m32 -march=corei7-avx -Os -fomit-frame-pointer2018082520180818
859330refgcc -m32 -Os -fomit-frame-pointer2018082520180818
859506refgcc -m32 -march=k8 -Os -fomit-frame-pointer2018082520180818
859529refgcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer2018082520180818
859585refgcc -m32 -march=corei7 -Os -fomit-frame-pointer2018082520180818
862242refgcc -m32 -march=i386 -Os -fomit-frame-pointer2018082520180818
864514refgcc -m32 -march=nocona -Os -fomit-frame-pointer2018082520180818
866814refgcc -m32 -march=prescott -Os -fomit-frame-pointer2018082520180818
867748refgcc -m32 -march=i486 -Os -fomit-frame-pointer2018082520180818
868484refgcc -m32 -march=pentium4 -Os -fomit-frame-pointer2018082520180818
896081refgcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer2018082520180818
913220refgcc -m32 -march=core-avx2 -Os -fomit-frame-pointer2018082520180818
958361refgcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer2018082520180818
959065refgcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer2018082520180818
965572refgcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer2018082520180818
968885refgcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer2018082520180818
975476refgcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer2018082520180818
976250refgcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer2018082520180818
977252refgcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer2018082520180818
979427refgcc -funroll-loops -m32 -Os -fomit-frame-pointer2018082520180818
980046refgcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer2018082520180818
983867refgcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer2018082520180818
985998refgcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer2018082520180818
986414refgcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer2018082520180818
987284refgcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer2018082520180818
987752refgcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer2018082520180818

Test failure

Implementation: crypto_aead/scream10v1/sse
Compiler: gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 32, namely:
CompilerImplementations
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer sse
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer sse
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer sse
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer sse
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer sse
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer sse
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer sse
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer sse
gcc -m32 -march=core2 -O2 -fomit-frame-pointer sse
gcc -m32 -march=core2 -O3 -fomit-frame-pointer sse
gcc -m32 -march=core2 -O -fomit-frame-pointer sse
gcc -m32 -march=core2 -Os -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer sse
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer sse
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer sse
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer sse
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer sse
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer sse
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer sse
gcc -m32 -march=corei7 -O -fomit-frame-pointer sse
gcc -m32 -march=corei7 -Os -fomit-frame-pointer sse
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer sse
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer sse
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer sse
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer sse

Compiler output

Implementation: crypto_aead/scream10v1/sse
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
scream.c: scream.c: In function 'LBox16P':
scream.c: scream.c:16:32: warning: implicit declaration of function '__builtin_ia32_psrldi128'; did you mean '__builtin_ia32_bsrsi'? [-Wimplicit-function-declaration]
scream.c: #define shift_right(x) ((v16qi)__builtin_ia32_psrldi128((v4si)x, 4))
scream.c: ^
scream.c: scream.c:182:10: note: in expansion of macro 'shift_right'
scream.c: t0 = shift_right(in[0]) & V(0xf);
scream.c: ^~~~~~~~~~~
scream.c: scream.c:182:5: error: can't convert a value of type 'int' to vector type '__vector(16) char' which has different size
scream.c: t0 = shift_right(in[0]) & V(0xf);
scream.c: ^~
scream.c: scream.c:183:5: error: can't convert a value of type 'int' to vector type '__vector(16) char' which has different size
scream.c: t1 = shift_right(in[2]) & V(0xf);
scream.c: ^~
scream.c: scream.c:185:10: warning: implicit declaration of function '__builtin_ia32_pshufb128'; did you mean '__builtin_ia32_pause'? [-Wimplicit-function-declaration]
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^~~~~~~~~~~~~~~~~~~~~~~~
scream.c: __builtin_ia32_pause
scream.c: scream.c:185:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:186:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:190:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ...

Number of similar (compiler,implementation) pairs: 40, namely:
CompilerImplementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer sse
gcc -m32 -O2 -fomit-frame-pointer sse
gcc -m32 -O3 -fomit-frame-pointer sse
gcc -m32 -O -fomit-frame-pointer sse
gcc -m32 -Os -fomit-frame-pointer sse
gcc -m32 -march=i386 -O2 -fomit-frame-pointer sse
gcc -m32 -march=i386 -O3 -fomit-frame-pointer sse
gcc -m32 -march=i386 -O -fomit-frame-pointer sse
gcc -m32 -march=i386 -Os -fomit-frame-pointer sse
gcc -m32 -march=i486 -O2 -fomit-frame-pointer sse
gcc -m32 -march=i486 -O3 -fomit-frame-pointer sse
gcc -m32 -march=i486 -O -fomit-frame-pointer sse
gcc -m32 -march=i486 -Os -fomit-frame-pointer sse
gcc -m32 -march=pentium -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentium -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentium -O -fomit-frame-pointer sse
gcc -m32 -march=pentium -Os -fomit-frame-pointer sse
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer sse
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer sse

Compiler output

Implementation: crypto_aead/scream10v1/sse
Compiler: gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer
scream.c: scream.c: In function 'LBox16P':
scream.c: scream.c:16:32: warning: implicit declaration of function '__builtin_ia32_psrldi128'; did you mean '__builtin_ia32_psrldi'? [-Wimplicit-function-declaration]
scream.c: #define shift_right(x) ((v16qi)__builtin_ia32_psrldi128((v4si)x, 4))
scream.c: ^
scream.c: scream.c:182:10: note: in expansion of macro 'shift_right'
scream.c: t0 = shift_right(in[0]) & V(0xf);
scream.c: ^~~~~~~~~~~
scream.c: scream.c:182:5: error: can't convert a value of type 'int' to vector type '__vector(16) char' which has different size
scream.c: t0 = shift_right(in[0]) & V(0xf);
scream.c: ^~
scream.c: scream.c:183:5: error: can't convert a value of type 'int' to vector type '__vector(16) char' which has different size
scream.c: t1 = shift_right(in[2]) & V(0xf);
scream.c: ^~
scream.c: scream.c:185:10: warning: implicit declaration of function '__builtin_ia32_pshufb128'; did you mean '__builtin_ia32_pshufw'? [-Wimplicit-function-declaration]
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^~~~~~~~~~~~~~~~~~~~~~~~
scream.c: __builtin_ia32_pshufw
scream.c: scream.c:185:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:186:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:190:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ...

Number of similar (compiler,implementation) pairs: 16, namely:
CompilerImplementations
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer sse
gcc -m32 -march=athlon -O2 -fomit-frame-pointer sse
gcc -m32 -march=athlon -O3 -fomit-frame-pointer sse
gcc -m32 -march=athlon -O -fomit-frame-pointer sse
gcc -m32 -march=athlon -Os -fomit-frame-pointer sse
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentium3 -O -fomit-frame-pointer sse
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer sse

Compiler output

Implementation: crypto_aead/scream10v1/sse
Compiler: gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer
scream.c: scream.c: In function 'LBox16P':
scream.c: scream.c:185:10: warning: implicit declaration of function '__builtin_ia32_pshufb128'; did you mean '__builtin_ia32_psubb128'? [-Wimplicit-function-declaration]
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^~~~~~~~~~~~~~~~~~~~~~~~
scream.c: __builtin_ia32_psubb128
scream.c: scream.c:185:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:186:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:190:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:191:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: D = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:198:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: A ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^~
scream.c: scream.c:199:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: C ^= __builtin_ia32_pshufb128(table, in[2]);
scream.c: ^~
scream.c: scream.c:203:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: B ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ...

Number of similar (compiler,implementation) pairs: 44, namely:
CompilerImplementations
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer sse
gcc -m32 -march=k8 -O2 -fomit-frame-pointer sse
gcc -m32 -march=k8 -O3 -fomit-frame-pointer sse
gcc -m32 -march=k8 -O -fomit-frame-pointer sse
gcc -m32 -march=k8 -Os -fomit-frame-pointer sse
gcc -m32 -march=nocona -O2 -fomit-frame-pointer sse
gcc -m32 -march=nocona -O3 -fomit-frame-pointer sse
gcc -m32 -march=nocona -O -fomit-frame-pointer sse
gcc -m32 -march=nocona -Os -fomit-frame-pointer sse
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentium-m -O -fomit-frame-pointer sse
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer sse
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentium4 -O -fomit-frame-pointer sse
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer sse
gcc -m32 -march=prescott -O2 -fomit-frame-pointer sse
gcc -m32 -march=prescott -O3 -fomit-frame-pointer sse
gcc -m32 -march=prescott -O -fomit-frame-pointer sse
gcc -m32 -march=prescott -Os -fomit-frame-pointer sse

Compiler output

Implementation: crypto_aead/scream10v1/sse
Compiler: gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer
scream.c: scream.c: In function 'LBox16P':
scream.c: scream.c:16:32: warning: implicit declaration of function '__builtin_ia32_psrldi128'; did you mean '__builtin_ia32_psrldi'? [-Wimplicit-function-declaration]
scream.c: #define shift_right(x) ((v16qi)__builtin_ia32_psrldi128((v4si)x, 4))
scream.c: ^
scream.c: scream.c:182:10: note: in expansion of macro 'shift_right'
scream.c: t0 = shift_right(in[0]) & V(0xf);
scream.c: ^~~~~~~~~~~
scream.c: scream.c:182:5: error: can't convert a value of type 'int' to vector type '__vector(16) char' which has different size
scream.c: t0 = shift_right(in[0]) & V(0xf);
scream.c: ^~
scream.c: scream.c:183:5: error: can't convert a value of type 'int' to vector type '__vector(16) char' which has different size
scream.c: t1 = shift_right(in[2]) & V(0xf);
scream.c: ^~
scream.c: scream.c:185:10: warning: implicit declaration of function '__builtin_ia32_pshufb128'; did you mean '__builtin_ia32_psubb'? [-Wimplicit-function-declaration]
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^~~~~~~~~~~~~~~~~~~~~~~~
scream.c: __builtin_ia32_psubb
scream.c: scream.c:185:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:186:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:190:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ...

Number of similar (compiler,implementation) pairs: 40, namely:
CompilerImplementations
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer sse
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer sse
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer sse
gcc -m32 -march=k6-2 -O -fomit-frame-pointer sse
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer sse
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer sse
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer sse
gcc -m32 -march=k6-3 -O -fomit-frame-pointer sse
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer sse
gcc -m32 -march=k6 -O2 -fomit-frame-pointer sse
gcc -m32 -march=k6 -O3 -fomit-frame-pointer sse
gcc -m32 -march=k6 -O -fomit-frame-pointer sse
gcc -m32 -march=k6 -Os -fomit-frame-pointer sse
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer sse
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer sse
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentium2 -O -fomit-frame-pointer sse
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer sse

Compiler output

Implementation: crypto_aead/scream10v1/sse
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
scream.c: scream.c: In function 'LBox16P':
scream.c: scream.c:185:10: warning: implicit declaration of function '__builtin_ia32_pshufb128'; did you mean '__builtin_ia32_psubb128'? [-Wimplicit-function-declaration]
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^~~~~~~~~~~~~~~~~~~~~~~~
scream.c: __builtin_ia32_psubb128
scream.c: scream.c:185:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:186:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:190:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:191:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: D = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:198:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: A ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^~
scream.c: scream.c:199:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: C ^= __builtin_ia32_pshufb128(table, in[2]);
scream.c: ^~
scream.c: scream.c:203:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: B ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ...
scream.c: scream.c: In function 'LBox16P':
scream.c: scream.c:185:10: warning: implicit declaration of function '__builtin_ia32_pshufb128'; did you mean '__builtin_ia32_psubb128'? [-Wimplicit-function-declaration]
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^~~~~~~~~~~~~~~~~~~~~~~~
scream.c: __builtin_ia32_psubb128
scream.c: scream.c:185:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:186:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:190:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:191:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: D = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:198:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: A ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^~
scream.c: scream.c:199:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: C ^= __builtin_ia32_pshufb128(table, in[2]);
scream.c: ^~
scream.c: scream.c:203:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: B ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
CompilerImplementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer sse
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer sse
gcc -m32 -march=barcelona -O -fomit-frame-pointer sse
gcc -m32 -march=barcelona -Os -fomit-frame-pointer sse