Implementation notes: x86, rumba7, crypto_aead/scream10v3

Computer: rumba7
Architecture: x86
CPU ID: AuthenticAMD-00800f11-178bfbff
SUPERCOP version: 20171218
Operation: crypto_aead
Primitive: scream10v3
Time | Implementation | Compiler | Benchmark date | SUPERCOP version
443850refgcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer2018052920171218
450420refgcc -m32 -march=pentium3 -O3 -fomit-frame-pointer2018052920171218
450960refgcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer2018052920171218
451680refgcc -funroll-loops -m32 -O2 -fomit-frame-pointer2018052920171218
456900refgcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer2018052920171218
457020refgcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer2018052920171218
461940refgcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer2018052920171218
462150refgcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer2018052920171218
462210refgcc -m32 -march=pentium2 -O3 -fomit-frame-pointer2018052920171218
462450refgcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer2018052920171218
462750refgcc -m32 -march=corei7 -O3 -fomit-frame-pointer2018052920171218
463200refgcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer2018052920171218
463230refgcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer2018052920171218
463440refgcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer2018052920171218
463770refgcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer2018052920171218
463800refgcc -m32 -march=core2 -O3 -fomit-frame-pointer2018052920171218
464460refgcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer2018052920171218
464460refgcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer2018052920171218
464550refgcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer2018052920171218
464610refgcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer2018052920171218
464670refgcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer2018052920171218
465120refgcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer2018052920171218
465810refgcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer2018052920171218
465810refgcc -m32 -march=pentium-m -O3 -fomit-frame-pointer2018052920171218
466080refgcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer2018052920171218
466140refgcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer2018052920171218
466650refgcc -funroll-loops -m32 -O3 -fomit-frame-pointer2018052920171218
468150refgcc -m32 -O3 -fomit-frame-pointer2018052920171218
468240refgcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer2018052920171218
470010refgcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer2018052920171218
471210refgcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer2018052920171218
471240refgcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer2018052920171218
471360refgcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer2018052920171218
471990refgcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer2018052920171218
472350refgcc -m32 -march=nocona -O3 -fomit-frame-pointer2018052920171218
473160refgcc -m32 -march=barcelona -O3 -fomit-frame-pointer2018052920171218
473700refgcc -m32 -march=k8 -O3 -fomit-frame-pointer2018052920171218
473880refgcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer2018052920171218
473880refgcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer2018052920171218
474870refgcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer2018052920171218
475650refgcc -m32 -march=pentium4 -O3 -fomit-frame-pointer2018052920171218
477450refgcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer2018052920171218
479190refgcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer2018052920171218
480270refgcc -m32 -march=prescott -O3 -fomit-frame-pointer2018052920171218
482190refgcc -m32 -march=athlon -O3 -fomit-frame-pointer2018052920171218
483240refgcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer2018052920171218
485820refgcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer2018052920171218
488970refgcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer2018052920171218
492090refgcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer2018052920171218
493140refgcc -funroll-loops -m32 -O -fomit-frame-pointer2018052920171218
500130refgcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer2018052920171218
500760refgcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer2018052920171218
584370refgcc -m32 -march=core2 -O2 -fomit-frame-pointer2018052920171218
584670refgcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer2018052920171218
584940refgcc -m32 -march=corei7 -O2 -fomit-frame-pointer2018052920171218
584970refgcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer2018052920171218
585030refgcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer2018052920171218
585180refgcc -m32 -march=prescott -O2 -fomit-frame-pointer2018052920171218
585690refgcc -m32 -march=nocona -O2 -fomit-frame-pointer2018052920171218
585750refgcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer2018052920171218
585780refgcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer2018052920171218
585960refgcc -m32 -march=athlon -O2 -fomit-frame-pointer2018052920171218
586800refgcc -m32 -march=barcelona -O2 -fomit-frame-pointer2018052920171218
588660refgcc -m32 -march=core-avx-i -O -fomit-frame-pointer2018052920171218
588780refgcc -m32 -march=corei7-avx -O -fomit-frame-pointer2018052920171218
588780refgcc -m32 -march=k8 -O2 -fomit-frame-pointer2018052920171218
589800refgcc -m32 -march=prescott -O -fomit-frame-pointer2018052920171218
589890refgcc -m32 -O2 -fomit-frame-pointer2018052920171218
590760refgcc -m32 -march=nocona -O -fomit-frame-pointer2018052920171218
591180refgcc -m32 -march=athlon -O -fomit-frame-pointer2018052920171218
591420refgcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer2018052920171218
592260refgcc -m32 -O -fomit-frame-pointer2018052920171218
593220refgcc -m32 -march=barcelona -O -fomit-frame-pointer2018052920171218
593580refgcc -m32 -march=k8 -O -fomit-frame-pointer2018052920171218
594120refgcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer2018052920171218
595590refgcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer2018052920171218
595650refgcc -m32 -march=core2 -O -fomit-frame-pointer2018052920171218
595680refgcc -m32 -march=corei7 -O -fomit-frame-pointer2018052920171218
595950refgcc -m32 -march=core-avx2 -O -fomit-frame-pointer2018052920171218
598950refgcc -m32 -march=native -mtune=native -O -fomit-frame-pointer2018052920171218
598980refgcc -m32 -march=pentium4 -O2 -fomit-frame-pointer2018052920171218
607770refgcc -m32 -march=pentium4 -O -fomit-frame-pointer2018052920171218
634800refgcc -m32 -march=pentium-m -O -fomit-frame-pointer2018052920171218
637500refgcc -m32 -march=pentium-m -O2 -fomit-frame-pointer2018052920171218
637560refgcc -m32 -march=pentium3 -O -fomit-frame-pointer2018052920171218
638820refgcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer2018052920171218
638850refgcc -m32 -march=pentium2 -O2 -fomit-frame-pointer2018052920171218
639750refgcc -m32 -march=pentium3 -O2 -fomit-frame-pointer2018052920171218
642720refgcc -m32 -march=pentiumpro -O -fomit-frame-pointer2018052920171218
642840refgcc -m32 -march=pentium2 -O -fomit-frame-pointer2018052920171218
643440refgcc -m32 -march=pentium3 -Os -fomit-frame-pointer2018052920171218
644130refgcc -m32 -march=pentium-m -Os -fomit-frame-pointer2018052920171218
644640refgcc -m32 -march=pentium2 -Os -fomit-frame-pointer2018052920171218
645510refgcc -m32 -march=pentiumpro -Os -fomit-frame-pointer2018052920171218
651510refgcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer2018052920171218
651750refgcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer2018052920171218
659580refgcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer2018052920171218
660360refgcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer2018052920171218
736650refgcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer2018052920171218
745680refgcc -m32 -march=i386 -O3 -fomit-frame-pointer2018052920171218
763020refgcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer2018052920171218
763800refgcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2018052920171218
820860refgcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2018052920171218
821040refgcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer2018052920171218
824280refgcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer2018052920171218
825750refgcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer2018052920171218
825960refgcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer2018052920171218
826140refgcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer2018052920171218
827430refgcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer2018052920171218
829350refgcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer2018052920171218
832530refgcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer2018052920171218
839580refgcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer2018052920171218
845040refgcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer2018052920171218
846150refgcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer2018052920171218
848580refgcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer2018052920171218
850380refgcc -m32 -march=i386 -O2 -fomit-frame-pointer2018052920171218
850620refgcc -m32 -march=i486 -O2 -fomit-frame-pointer2018052920171218
865860refgcc -m32 -march=pentium -O2 -fomit-frame-pointer2018052920171218
870330refgcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer2018052920171218
870630refgcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer2018052920171218
870870refgcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer2018052920171218
871560refgcc -m32 -march=k6-2 -O3 -fomit-frame-pointer2018052920171218
872370refgcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer2018052920171218
874380refgcc -m32 -march=k6 -O3 -fomit-frame-pointer2018052920171218
874950refgcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer2018052920171218
875130refgcc -m32 -march=pentium -O3 -fomit-frame-pointer2018052920171218
875220refgcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer2018052920171218
876330refgcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer2018052920171218
876420refgcc -m32 -march=k6-3 -O3 -fomit-frame-pointer2018052920171218
877230refgcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer2018052920171218
884010refgcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer2018052920171218
884700refgcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer2018052920171218
884760refgcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer2018052920171218
885300refgcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer2018052920171218
885450refgcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer2018052920171218
885720refgcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer2018052920171218
902190refgcc -m32 -march=i386 -O -fomit-frame-pointer2018052920171218
902670refgcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer2018052920171218
904170refgcc -m32 -march=pentium -Os -fomit-frame-pointer2018052920171218
904410refgcc -m32 -march=i486 -O3 -fomit-frame-pointer2018052920171218
905880refgcc -m32 -march=prescott -Os -fomit-frame-pointer2018052920171218
906750refgcc -m32 -march=pentium4 -Os -fomit-frame-pointer2018052920171218
906840refgcc -m32 -march=i486 -Os -fomit-frame-pointer2018052920171218
906900refgcc -m32 -march=i386 -Os -fomit-frame-pointer2018052920171218
906990refgcc -m32 -march=nocona -Os -fomit-frame-pointer2018052920171218
908220refgcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer2018052920171218
908520refgcc -m32 -march=i486 -O -fomit-frame-pointer2018052920171218
908700refgcc -m32 -march=pentium-mmx -O -fomit-frame-pointer2018052920171218
908820refgcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer2018052920171218
909480refgcc -m32 -march=pentium -O -fomit-frame-pointer2018052920171218
912990refgcc -m32 -march=barcelona -Os -fomit-frame-pointer2018052920171218
913950refgcc -funroll-loops -m32 -Os -fomit-frame-pointer2018052920171218
914580refgcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer2018052920171218
914820refgcc -m32 -march=k8 -Os -fomit-frame-pointer2018052920171218
914940refgcc -m32 -march=core2 -Os -fomit-frame-pointer2018052920171218
915300refgcc -m32 -march=corei7 -Os -fomit-frame-pointer2018052920171218
915810refgcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer2018052920171218
916050refgcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer2018052920171218
916620refgcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer2018052920171218
917340refgcc -m32 -march=core-avx-i -Os -fomit-frame-pointer2018052920171218
917700refgcc -m32 -march=athlon -Os -fomit-frame-pointer2018052920171218
918210refgcc -m32 -march=core-avx2 -Os -fomit-frame-pointer2018052920171218
919140refgcc -m32 -Os -fomit-frame-pointer2018052920171218
919470refgcc -m32 -march=corei7-avx -Os -fomit-frame-pointer2018052920171218
948840refgcc -m32 -march=k6-3 -Os -fomit-frame-pointer2018052920171218
950160refgcc -m32 -march=k6-2 -Os -fomit-frame-pointer2018052920171218
950430refgcc -m32 -march=k6 -Os -fomit-frame-pointer2018052920171218
964080refgcc -m32 -march=k6-2 -O -fomit-frame-pointer2018052920171218
964680refgcc -m32 -march=k6-3 -O -fomit-frame-pointer2018052920171218
965940refgcc -m32 -march=k6 -O -fomit-frame-pointer2018052920171218
1020780refgcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer2018052920171218
1020840refgcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer2018052920171218
1021770refgcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer2018052920171218
1021980refgcc -m32 -march=k6-3 -O2 -fomit-frame-pointer2018052920171218
1022490refgcc -m32 -march=k6 -O2 -fomit-frame-pointer2018052920171218
1023000refgcc -m32 -march=k6-2 -O2 -fomit-frame-pointer2018052920171218

Test failure

Implementation: crypto_aead/scream10v3/sse
Compiler: gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 32, namely:
Compiler Implementations
gcc -m32 -march=core-avx-i -O2 -fomit-frame-pointer sse
gcc -m32 -march=core-avx-i -O3 -fomit-frame-pointer sse
gcc -m32 -march=core-avx-i -O -fomit-frame-pointer sse
gcc -m32 -march=core-avx-i -Os -fomit-frame-pointer sse
gcc -m32 -march=core-avx2 -O2 -fomit-frame-pointer sse
gcc -m32 -march=core-avx2 -O3 -fomit-frame-pointer sse
gcc -m32 -march=core-avx2 -O -fomit-frame-pointer sse
gcc -m32 -march=core-avx2 -Os -fomit-frame-pointer sse
gcc -m32 -march=core2 -O2 -fomit-frame-pointer sse
gcc -m32 -march=core2 -O3 -fomit-frame-pointer sse
gcc -m32 -march=core2 -O -fomit-frame-pointer sse
gcc -m32 -march=core2 -Os -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4.1 -O2 -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4.1 -O3 -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4.1 -O -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4.1 -Os -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4 -O2 -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4 -O3 -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4 -O -fomit-frame-pointer sse
gcc -m32 -march=core2 -msse4 -Os -fomit-frame-pointer sse
gcc -m32 -march=corei7-avx -O2 -fomit-frame-pointer sse
gcc -m32 -march=corei7-avx -O3 -fomit-frame-pointer sse
gcc -m32 -march=corei7-avx -O -fomit-frame-pointer sse
gcc -m32 -march=corei7-avx -Os -fomit-frame-pointer sse
gcc -m32 -march=corei7 -O2 -fomit-frame-pointer sse
gcc -m32 -march=corei7 -O3 -fomit-frame-pointer sse
gcc -m32 -march=corei7 -O -fomit-frame-pointer sse
gcc -m32 -march=corei7 -Os -fomit-frame-pointer sse
gcc -m32 -march=native -mtune=native -O2 -fomit-frame-pointer sse
gcc -m32 -march=native -mtune=native -O3 -fomit-frame-pointer sse
gcc -m32 -march=native -mtune=native -O -fomit-frame-pointer sse
gcc -m32 -march=native -mtune=native -Os -fomit-frame-pointer sse

Compiler output

Implementation: crypto_aead/scream10v3/sse
Compiler: gcc -funroll-loops -m32 -O2 -fomit-frame-pointer
scream.c: scream.c: In function 'LBox16P':
scream.c: scream.c:16:32: warning: implicit declaration of function '__builtin_ia32_psrldi128' [-Wimplicit-function-declaration]
scream.c: #define shift_right(x) ((v16qi)__builtin_ia32_psrldi128((v4si)x, 4))
scream.c: ^
scream.c: scream.c:199:10: note: in expansion of macro 'shift_right'
scream.c: t0 = shift_right(in[0]) & V(0xf);
scream.c: ^
scream.c: scream.c:199:5: error: can't convert between vector values of different size
scream.c: t0 = shift_right(in[0]) & V(0xf);
scream.c: ^
scream.c: scream.c:200:5: error: can't convert between vector values of different size
scream.c: t1 = shift_right(in[2]) & V(0xf);
scream.c: ^
scream.c: scream.c:202:10: warning: implicit declaration of function '__builtin_ia32_pshufb128' [-Wimplicit-function-declaration]
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:202:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:203:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:207:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: ...

Number of similar (compiler,implementation) pairs: 96, namely:
Compiler Implementations
gcc -funroll-loops -m32 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=athlon -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=athlon -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=athlon -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=athlon -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i386 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i386 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i386 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i386 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i486 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i486 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i486 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=i486 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-2 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-2 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-2 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-2 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-3 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-3 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-3 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6-3 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k6 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-mmx -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-mmx -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-mmx -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-mmx -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium2 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium2 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium2 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium2 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium3 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium3 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium3 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium3 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentiumpro -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentiumpro -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentiumpro -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentiumpro -Os -fomit-frame-pointer sse
gcc -m32 -O2 -fomit-frame-pointer sse
gcc -m32 -O3 -fomit-frame-pointer sse
gcc -m32 -O -fomit-frame-pointer sse
gcc -m32 -Os -fomit-frame-pointer sse
gcc -m32 -march=athlon -O2 -fomit-frame-pointer sse
gcc -m32 -march=athlon -O3 -fomit-frame-pointer sse
gcc -m32 -march=athlon -O -fomit-frame-pointer sse
gcc -m32 -march=athlon -Os -fomit-frame-pointer sse
gcc -m32 -march=i386 -O2 -fomit-frame-pointer sse
gcc -m32 -march=i386 -O3 -fomit-frame-pointer sse
gcc -m32 -march=i386 -O -fomit-frame-pointer sse
gcc -m32 -march=i386 -Os -fomit-frame-pointer sse
gcc -m32 -march=i486 -O2 -fomit-frame-pointer sse
gcc -m32 -march=i486 -O3 -fomit-frame-pointer sse
gcc -m32 -march=i486 -O -fomit-frame-pointer sse
gcc -m32 -march=i486 -Os -fomit-frame-pointer sse
gcc -m32 -march=k6-2 -O2 -fomit-frame-pointer sse
gcc -m32 -march=k6-2 -O3 -fomit-frame-pointer sse
gcc -m32 -march=k6-2 -O -fomit-frame-pointer sse
gcc -m32 -march=k6-2 -Os -fomit-frame-pointer sse
gcc -m32 -march=k6-3 -O2 -fomit-frame-pointer sse
gcc -m32 -march=k6-3 -O3 -fomit-frame-pointer sse
gcc -m32 -march=k6-3 -O -fomit-frame-pointer sse
gcc -m32 -march=k6-3 -Os -fomit-frame-pointer sse
gcc -m32 -march=k6 -O2 -fomit-frame-pointer sse
gcc -m32 -march=k6 -O3 -fomit-frame-pointer sse
gcc -m32 -march=k6 -O -fomit-frame-pointer sse
gcc -m32 -march=k6 -Os -fomit-frame-pointer sse
gcc -m32 -march=pentium-mmx -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentium-mmx -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentium-mmx -O -fomit-frame-pointer sse
gcc -m32 -march=pentium-mmx -Os -fomit-frame-pointer sse
gcc -m32 -march=pentium2 -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentium2 -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentium2 -O -fomit-frame-pointer sse
gcc -m32 -march=pentium2 -Os -fomit-frame-pointer sse
gcc -m32 -march=pentium3 -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentium3 -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentium3 -O -fomit-frame-pointer sse
gcc -m32 -march=pentium3 -Os -fomit-frame-pointer sse
gcc -m32 -march=pentium -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentium -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentium -O -fomit-frame-pointer sse
gcc -m32 -march=pentium -Os -fomit-frame-pointer sse
gcc -m32 -march=pentiumpro -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentiumpro -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentiumpro -O -fomit-frame-pointer sse
gcc -m32 -march=pentiumpro -Os -fomit-frame-pointer sse

Compiler output

Implementation: crypto_aead/scream10v3/sse
Compiler: gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer
scream.c: scream.c: In function 'LBox16P':
scream.c: scream.c:202:10: warning: implicit declaration of function '__builtin_ia32_pshufb128' [-Wimplicit-function-declaration]
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:202:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:203:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:207:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:208:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: D = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:215:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: A ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: scream.c:216:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: C ^= __builtin_ia32_pshufb128(table, in[2]);
scream.c: ^
scream.c: scream.c:220:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: B ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: ...

Number of similar (compiler,implementation) pairs: 44, namely:
Compiler Implementations
gcc -funroll-loops -m32 -march=barcelona -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=barcelona -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=barcelona -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=barcelona -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k8 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k8 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k8 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=k8 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=nocona -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=nocona -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=nocona -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=nocona -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-m -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-m -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-m -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium-m -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium4 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium4 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium4 -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=pentium4 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=prescott -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=prescott -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=prescott -O -fomit-frame-pointer sse
gcc -funroll-loops -m32 -march=prescott -Os -fomit-frame-pointer sse
gcc -m32 -march=k8 -O2 -fomit-frame-pointer sse
gcc -m32 -march=k8 -O3 -fomit-frame-pointer sse
gcc -m32 -march=k8 -O -fomit-frame-pointer sse
gcc -m32 -march=k8 -Os -fomit-frame-pointer sse
gcc -m32 -march=nocona -O2 -fomit-frame-pointer sse
gcc -m32 -march=nocona -O3 -fomit-frame-pointer sse
gcc -m32 -march=nocona -O -fomit-frame-pointer sse
gcc -m32 -march=nocona -Os -fomit-frame-pointer sse
gcc -m32 -march=pentium-m -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentium-m -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentium-m -O -fomit-frame-pointer sse
gcc -m32 -march=pentium-m -Os -fomit-frame-pointer sse
gcc -m32 -march=pentium4 -O2 -fomit-frame-pointer sse
gcc -m32 -march=pentium4 -O3 -fomit-frame-pointer sse
gcc -m32 -march=pentium4 -O -fomit-frame-pointer sse
gcc -m32 -march=pentium4 -Os -fomit-frame-pointer sse
gcc -m32 -march=prescott -O2 -fomit-frame-pointer sse
gcc -m32 -march=prescott -O3 -fomit-frame-pointer sse
gcc -m32 -march=prescott -O -fomit-frame-pointer sse
gcc -m32 -march=prescott -Os -fomit-frame-pointer sse

Compiler output

Implementation: crypto_aead/scream10v3/sse
Compiler: gcc -m32 -march=barcelona -O2 -fomit-frame-pointer
scream.c: scream.c: In function 'LBox16P':
scream.c: scream.c:202:10: warning: implicit declaration of function '__builtin_ia32_pshufb128' [-Wimplicit-function-declaration]
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:202:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:203:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:207:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:208:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: D = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:215:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: A ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: scream.c:216:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: C ^= __builtin_ia32_pshufb128(table, in[2]);
scream.c: ^
scream.c: scream.c:220:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: B ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: ...
scream.c: scream.c: In function 'LBox16P':
scream.c: scream.c:202:10: warning: implicit declaration of function '__builtin_ia32_pshufb128' [-Wimplicit-function-declaration]
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:202:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:203:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:207:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:208:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: D = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:215:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: A ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: scream.c:216:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: C ^= __builtin_ia32_pshufb128(table, in[2]);
scream.c: ^
scream.c: scream.c:220:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: B ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
gcc -m32 -march=barcelona -O2 -fomit-frame-pointer sse
gcc -m32 -march=barcelona -O3 -fomit-frame-pointer sse
gcc -m32 -march=barcelona -O -fomit-frame-pointer sse
gcc -m32 -march=barcelona -Os -fomit-frame-pointer sse