Implementation notes: amd64, calvin, crypto_aead/scream12v1

Computer: calvin
Architecture: amd64
CPU ID: AuthenticAMD-00600f20-178bfbff
SUPERCOP version: 20171218
Operation: crypto_aead
Primitive: scream12v1
Time | Object size | Test size | Implementation | Compiler | Benchmark date | SUPERCOP version
97902? ? ?? ? ?ssegcc_-m64_-march=corei7-avx_-O3_-fomit-frame-pointer2017082420170725
98336? ? ?? ? ?ssegcc_-m64_-march=native_-mtune=native_-O3_-fomit-frame-pointer2017082420170725
99334? ? ?? ? ?ssegcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2017082420170725
99668? ? ?? ? ?ssegcc_-m64_-march=core-avx-i_-O3_-fomit-frame-pointer2017082420170725
102649? ? ?? ? ?ssegcc_-m64_-march=core2_-O3_-fomit-frame-pointer2017082420170725
102778? ? ?? ? ?ssegcc_-m64_-march=core2_-msse4_-O3_-fomit-frame-pointer2017082420170725
102925? ? ?? ? ?ssegcc_-m64_-march=corei7_-O3_-fomit-frame-pointer2017082420170725
102954? ? ?? ? ?ssegcc_-m64_-march=core2_-msse4.1_-O3_-fomit-frame-pointer2017082420170725
109179? ? ?? ? ?ssegcc_-m64_-march=native_-mtune=native_-O2_-fomit-frame-pointer2017082420170725
109412? ? ?? ? ?ssegcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2017082420170725
110277? ? ?? ? ?ssegcc_-m64_-march=core-avx-i_-O2_-fomit-frame-pointer2017082420170725
111091? ? ?? ? ?ssegcc_-m64_-march=corei7-avx_-O2_-fomit-frame-pointer2017082420170725
113711? ? ?? ? ?ssegcc_-m64_-march=core2_-O2_-fomit-frame-pointer2017082420170725
113876? ? ?? ? ?ssegcc_-m64_-march=core2_-msse4_-O2_-fomit-frame-pointer2017082420170725
114083? ? ?? ? ?sseclang_-O3_-fwrapv_-march=native_-fomit-frame-pointer_-Qunused-arguments2017082420170725
114084? ? ?? ? ?sseclang_-march=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2017082420170725
114111? ? ?? ? ?ssegcc_-m64_-march=corei7_-O2_-fomit-frame-pointer2017082420170725
114126? ? ?? ? ?ssegcc_-m64_-march=core2_-msse4.1_-O2_-fomit-frame-pointer2017082420170725
114308? ? ?? ? ?sseclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2017082420170725
114339? ? ?? ? ?sseclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2017082420170725
114558? ? ?? ? ?ssegcc_-m64_-march=core-avx-i_-O_-fomit-frame-pointer2017082420170725
115047? ? ?? ? ?ssegcc_-m64_-march=corei7-avx_-O_-fomit-frame-pointer2017082420170725
117379? ? ?? ? ?ssegcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2017082420170725
117701? ? ?? ? ?ssegcc_-m64_-march=native_-mtune=native_-O_-fomit-frame-pointer2017082420170725
117833? ? ?? ? ?ssegcc_-m64_-march=corei7_-O_-fomit-frame-pointer2017082420170725
117991? ? ?? ? ?ssegcc_-m64_-march=core2_-O_-fomit-frame-pointer2017082420170725
118055? ? ?? ? ?ssegcc_-m64_-march=core2_-msse4.1_-O_-fomit-frame-pointer2017082420170725
118177? ? ?? ? ?ssegcc_-m64_-march=core2_-msse4_-O_-fomit-frame-pointer2017082420170725
488380? ? ?? ? ?refgcc_-funroll-loops_-march=k8_-O2_-fomit-frame-pointer2017082420170725
488534? ? ?? ? ?refgcc_-funroll-loops_-march=barcelona_-O2_-fomit-frame-pointer2017082420170725
488693? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=barcelona_-O2_-fomit-frame-pointer2017082420170725
488917? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=k8_-O2_-fomit-frame-pointer2017082420170725
495827? ? ?? ? ?refgcc_-funroll-loops_-m64_-O2_-fomit-frame-pointer2017082420170725
496180? ? ?? ? ?refgcc_-funroll-loops_-O2_-fomit-frame-pointer2017082420170725
496225? ? ?? ? ?refgcc_-funroll-loops_-fno-schedule-insns_-O2_-fomit-frame-pointer2017082420170725
503658? ? ?? ? ?refgcc_-m64_-march=core-avx-i_-O3_-fomit-frame-pointer2017082420170725
503846? ? ?? ? ?refgcc_-m64_-march=corei7_-O3_-fomit-frame-pointer2017082420170725
504347? ? ?? ? ?refgcc_-m64_-march=core2_-msse4_-O3_-fomit-frame-pointer2017082420170725
504375? ? ?? ? ?refgcc_-m64_-march=core2_-msse4.1_-O3_-fomit-frame-pointer2017082420170725
504579? ? ?? ? ?refgcc_-m64_-march=core2_-O3_-fomit-frame-pointer2017082420170725
505176? ? ?? ? ?refgcc_-m64_-march=corei7-avx_-O3_-fomit-frame-pointer2017082420170725
505334? ? ?? ? ?refgcc_-march=barcelona_-O3_-fomit-frame-pointer2017082420170725
505653? ? ?? ? ?refgcc_-m64_-march=barcelona_-O3_-fomit-frame-pointer2017082420170725
506480? ? ?? ? ?refgcc_-m64_-march=k8_-O3_-fomit-frame-pointer2017082420170725
506685? ? ?? ? ?refgcc_-funroll-loops_-march=barcelona_-O3_-fomit-frame-pointer2017082420170725
507130? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=barcelona_-O3_-fomit-frame-pointer2017082420170725
508082? ? ?? ? ?refgcc_-funroll-loops_-march=k8_-O3_-fomit-frame-pointer2017082420170725
508310? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=k8_-O3_-fomit-frame-pointer2017082420170725
508557? ? ?? ? ?refgcc_-march=k8_-O3_-fomit-frame-pointer2017082420170725
511471? ? ?? ? ?refgcc_-O3_-fomit-frame-pointer2017082420170725
511655? ? ?? ? ?refgcc_-fno-schedule-insns_-O3_-fomit-frame-pointer2017082420170725
511914? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=nocona_-O2_-fomit-frame-pointer2017082420170725
512001? ? ?? ? ?refgcc_-m64_-O3_-fomit-frame-pointer2017082420170725
512176? ? ?? ? ?refgcc_-funroll-loops_-march=nocona_-O2_-fomit-frame-pointer2017082420170725
515087? ? ?? ? ?refgcc_-funroll-loops_-fno-schedule-insns_-O3_-fomit-frame-pointer2017082420170725
515201? ? ?? ? ?refgcc_-funroll-loops_-m64_-O3_-fomit-frame-pointer2017082420170725
516114? ? ?? ? ?refgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv2017082420170725
516282? ? ?? ? ?refgcc_-funroll-loops_-O3_-fomit-frame-pointer2017082420170725
516656? ? ?? ? ?refgcc_-m64_-march=native_-mtune=native_-O3_-fomit-frame-pointer2017082420170725
525124? ? ?? ? ?refgcc_-funroll-loops_-march=nocona_-O3_-fomit-frame-pointer2017082420170725
525890? ? ?? ? ?refgcc_-m64_-march=nocona_-O3_-fomit-frame-pointer2017082420170725
526175? ? ?? ? ?refgcc_-march=nocona_-O3_-fomit-frame-pointer2017082420170725
528700? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=nocona_-O3_-fomit-frame-pointer2017082420170725
536826? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=nocona_-O_-fomit-frame-pointer2017082420170725
540598? ? ?? ? ?refgcc_-funroll-loops_-march=nocona_-O_-fomit-frame-pointer2017082420170725
543999? ? ?? ? ?refgcc_-funroll-loops_-O_-fomit-frame-pointer2017082420170725
544048? ? ?? ? ?refgcc_-funroll-loops_-fno-schedule-insns_-O_-fomit-frame-pointer2017082420170725
544390? ? ?? ? ?refgcc_-funroll-loops_-march=k8_-O_-fomit-frame-pointer2017082420170725
544419? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=barcelona_-O_-fomit-frame-pointer2017082420170725
544522? ? ?? ? ?refgcc_-funroll-loops_-march=barcelona_-O_-fomit-frame-pointer2017082420170725
544869? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=k8_-O_-fomit-frame-pointer2017082420170725
545169? ? ?? ? ?refgcc_-funroll-loops_-m64_-O_-fomit-frame-pointer2017082420170725
728618? ? ?? ? ?refclang_-march=native_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2017082420170725
729558? ? ?? ? ?refclang_-O3_-fwrapv_-march=native_-fomit-frame-pointer_-Qunused-arguments2017082420170725
739061? ? ?? ? ?refclang_-O3_-fwrapv_-mavx_-maes_-mpclmul_-fomit-frame-pointer_-Qunused-arguments2017082420170725
739291? ? ?? ? ?refclang_-O3_-fwrapv_-mavx_-fomit-frame-pointer_-Qunused-arguments2017082420170725
774896? ? ?? ? ?refclang_-O3_-fomit-frame-pointer_-Qunused-arguments2017082420170725
780782? ? ?? ? ?refclang_-mcpu=cortex-a9_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2017082420170725
781784? ? ?? ? ?refclang_-mcpu=native_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2017082420170725
782056? ? ?? ? ?refclang_-mcpu=cortex-a8_-mfpu=neon_-O3_-fomit-frame-pointer_-fwrapv_-Qunused-arguments2017082420170725
915664? ? ?? ? ?refgcc_-march=k8_-O2_-fomit-frame-pointer2017082420170725
918746? ? ?? ? ?refgcc_-m64_-march=barcelona_-O2_-fomit-frame-pointer2017082420170725
920532? ? ?? ? ?refgcc_-march=barcelona_-O2_-fomit-frame-pointer2017082420170725
920743? ? ?? ? ?refgcc_-m64_-march=k8_-O2_-fomit-frame-pointer2017082420170725
924837? ? ?? ? ?refgcc_-m64_-march=nocona_-O2_-fomit-frame-pointer2017082420170725
926100? ? ?? ? ?refgcc_-march=nocona_-O2_-fomit-frame-pointer2017082420170725
926162? ? ?? ? ?refgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv2017082420170725
926237? ? ?? ? ?refgcc_-m64_-march=corei7_-O2_-fomit-frame-pointer2017082420170725
927947? ? ?? ? ?refgcc_-m64_-march=corei7-avx_-O2_-fomit-frame-pointer2017082420170725
928192? ? ?? ? ?refgcc_-O2_-fomit-frame-pointer2017082420170725
929592? ? ?? ? ?refgcc_-m64_-march=core2_-msse4_-O2_-fomit-frame-pointer2017082420170725
931252? ? ?? ? ?refgcc_-m64_-march=native_-mtune=native_-O2_-fomit-frame-pointer2017082420170725
931283? ? ?? ? ?refgcc_-m64_-march=core2_-O2_-fomit-frame-pointer2017082420170725
931867? ? ?? ? ?refgcc_-m64_-O2_-fomit-frame-pointer2017082420170725
932238? ? ?? ? ?refgcc_-O_-fomit-frame-pointer2017082420170725
932318? ? ?? ? ?refgcc_-m64_-march=core-avx-i_-O2_-fomit-frame-pointer2017082420170725
933456? ? ?? ? ?refgcc_-m64_-O_-fomit-frame-pointer2017082420170725
934189? ? ?? ? ?refgcc_-fno-schedule-insns_-O_-fomit-frame-pointer2017082420170725
939112? ? ?? ? ?refgcc_-fno-schedule-insns_-O2_-fomit-frame-pointer2017082420170725
940903? ? ?? ? ?refgcc_-m64_-march=core2_-msse4.1_-O2_-fomit-frame-pointer2017082420170725
942613? ? ?? ? ?refgcc_-m64_-march=nocona_-O_-fomit-frame-pointer2017082420170725
943643? ? ?? ? ?refgcc_-m64_-march=k8_-O_-fomit-frame-pointer2017082420170725
944840? ? ?? ? ?refgcc_-march=nocona_-O_-fomit-frame-pointer2017082420170725
950745? ? ?? ? ?refgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv2017082420170725
958972? ? ?? ? ?refgcc_-march=k8_-O_-fomit-frame-pointer2017082420170725
959164? ? ?? ? ?refgcc_-m64_-march=native_-mtune=native_-O_-fomit-frame-pointer2017082420170725
966939? ? ?? ? ?refgcc_-m64_-march=corei7_-O_-fomit-frame-pointer2017082420170725
967137? ? ?? ? ?refgcc_-m64_-march=barcelona_-O_-fomit-frame-pointer2017082420170725
967503? ? ?? ? ?refgcc_-m64_-march=core2_-msse4_-O_-fomit-frame-pointer2017082420170725
967928? ? ?? ? ?refgcc_-march=barcelona_-O_-fomit-frame-pointer2017082420170725
967946? ? ?? ? ?refgcc_-m64_-march=core2_-msse4.1_-O_-fomit-frame-pointer2017082420170725
968124? ? ?? ? ?refgcc_-m64_-march=core-avx-i_-O_-fomit-frame-pointer2017082420170725
968345? ? ?? ? ?refgcc_-m64_-march=core2_-O_-fomit-frame-pointer2017082420170725
969752? ? ?? ? ?refgcc_-m64_-march=corei7-avx_-O_-fomit-frame-pointer2017082420170725
1234601? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=nocona_-Os_-fomit-frame-pointer2017082420170725
1235353? ? ?? ? ?refgcc_-funroll-loops_-march=nocona_-Os_-fomit-frame-pointer2017082420170725
1266175? ? ?? ? ?refgcc_-march=nocona_-Os_-fomit-frame-pointer2017082420170725
1269011? ? ?? ? ?refgcc_-m64_-march=nocona_-Os_-fomit-frame-pointer2017082420170725
1278475? ? ?? ? ?refgcc_-march=barcelona_-Os_-fomit-frame-pointer2017082420170725
1278985? ? ?? ? ?refgcc_-funroll-loops_-fno-schedule-insns_-Os_-fomit-frame-pointer2017082420170725
1279138? ? ?? ? ?refgcc_-m64_-march=k8_-Os_-fomit-frame-pointer2017082420170725
1280617? ? ?? ? ?refgcc_-m64_-march=native_-mtune=native_-Os_-fomit-frame-pointer2017082420170725
1281580? ? ?? ? ?refgcc_-m64_-march=corei7_-Os_-fomit-frame-pointer2017082420170725
1281688? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=k8_-Os_-fomit-frame-pointer2017082420170725
1281692? ? ?? ? ?refgcc_-m64_-march=barcelona_-Os_-fomit-frame-pointer2017082420170725
1282114? ? ?? ? ?refgcc_-funroll-loops_-march=k8_-Os_-fomit-frame-pointer2017082420170725
1282617? ? ?? ? ?refgcc_-funroll-loops_-Os_-fomit-frame-pointer2017082420170725
1282803? ? ?? ? ?refgcc_-funroll-loops_-m64_-Os_-fomit-frame-pointer2017082420170725
1283144? ? ?? ? ?refgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv2017082420170725
1283182? ? ?? ? ?refgcc_-m64_-Os_-fomit-frame-pointer2017082420170725
1283361? ? ?? ? ?refgcc_-m64_-march=core-avx-i_-Os_-fomit-frame-pointer2017082420170725
1283395? ? ?? ? ?refgcc_-Os_-fomit-frame-pointer2017082420170725
1283868? ? ?? ? ?refgcc_-m64_-march=core2_-msse4_-Os_-fomit-frame-pointer2017082420170725
1285908? ? ?? ? ?refgcc_-m64_-march=core2_-msse4.1_-Os_-fomit-frame-pointer2017082420170725
1286211? ? ?? ? ?refgcc_-funroll-loops_-march=barcelona_-Os_-fomit-frame-pointer2017082420170725
1286722? ? ?? ? ?refgcc_-funroll-loops_-m64_-march=barcelona_-Os_-fomit-frame-pointer2017082420170725
1287289? ? ?? ? ?refgcc_-fno-schedule-insns_-Os_-fomit-frame-pointer2017082420170725
1287557? ? ?? ? ?refgcc_-m64_-march=corei7-avx_-Os_-fomit-frame-pointer2017082420170725
1290223? ? ?? ? ?refgcc_-m64_-march=core2_-Os_-fomit-frame-pointer2017082420170725
1292958? ? ?? ? ?refgcc_-march=k8_-Os_-fomit-frame-pointer2017082420170725
2988230? ? ?? ? ?refcc2017082420170725
2997121? ? ?? ? ?refgcc2017082420170725
2999114? ? ?? ? ?refgcc_-funroll-loops2017082420170725

Test failure

Implementation: crypto_aead/scream12v1/sse
Compiler: gcc -m64 -march=core-avx-i -Os -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 14, namely:
Compiler | Implementations
gcc -m64 -march=core-avx-i -Os -fomit-frame-pointer sse
gcc -m64 -march=core-avx2 -O2 -fomit-frame-pointer ref sse
gcc -m64 -march=core-avx2 -O -fomit-frame-pointer ref sse
gcc -m64 -march=core-avx2 -Os -fomit-frame-pointer ref sse
gcc -m64 -march=core2 -Os -fomit-frame-pointer sse
gcc -m64 -march=core2 -msse4.1 -Os -fomit-frame-pointer sse
gcc -m64 -march=core2 -msse4 -Os -fomit-frame-pointer sse
gcc -m64 -march=corei7-avx -Os -fomit-frame-pointer sse
gcc -m64 -march=corei7 -Os -fomit-frame-pointer sse
gcc -m64 -march=native -mtune=native -Os -fomit-frame-pointer sse
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv sse

Compiler output

Implementation: crypto_aead/scream12v1/sse
Compiler: cc
scream.c: scream.c: In function 'LBox16P':
scream.c: scream.c:185:10: warning: implicit declaration of function '__builtin_ia32_pshufb128' [-Wimplicit-function-declaration]
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:185:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:186:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:190:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:191:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: D = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:198:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: A ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: scream.c:199:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: C ^= __builtin_ia32_pshufb128(table, in[2]);
scream.c: ^
scream.c: scream.c:203:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: B ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: ...

Number of similar (compiler,implementation) pairs: 71, namely:
Compiler | Implementations
cc sse
gcc sse
gcc -O2 -fomit-frame-pointer sse
gcc -O3 -fomit-frame-pointer sse
gcc -O -fomit-frame-pointer sse
gcc -Os -fomit-frame-pointer sse
gcc -fno-schedule-insns -O2 -fomit-frame-pointer sse
gcc -fno-schedule-insns -O3 -fomit-frame-pointer sse
gcc -fno-schedule-insns -O -fomit-frame-pointer sse
gcc -fno-schedule-insns -Os -fomit-frame-pointer sse
gcc -funroll-loops sse
gcc -funroll-loops -O2 -fomit-frame-pointer sse
gcc -funroll-loops -O3 -fomit-frame-pointer sse
gcc -funroll-loops -O -fomit-frame-pointer sse
gcc -funroll-loops -Os -fomit-frame-pointer sse
gcc -funroll-loops -fno-schedule-insns -O2 -fomit-frame-pointer sse
gcc -funroll-loops -fno-schedule-insns -O3 -fomit-frame-pointer sse
gcc -funroll-loops -fno-schedule-insns -O -fomit-frame-pointer sse
gcc -funroll-loops -fno-schedule-insns -Os -fomit-frame-pointer sse
gcc -funroll-loops -m64 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m64 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m64 -O -fomit-frame-pointer sse
gcc -funroll-loops -m64 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m64 -march=barcelona -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m64 -march=barcelona -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m64 -march=barcelona -O -fomit-frame-pointer sse
gcc -funroll-loops -m64 -march=barcelona -Os -fomit-frame-pointer sse
gcc -funroll-loops -m64 -march=k8 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m64 -march=k8 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m64 -march=k8 -O -fomit-frame-pointer sse
gcc -funroll-loops -m64 -march=k8 -Os -fomit-frame-pointer sse
gcc -funroll-loops -m64 -march=nocona -O2 -fomit-frame-pointer sse
gcc -funroll-loops -m64 -march=nocona -O3 -fomit-frame-pointer sse
gcc -funroll-loops -m64 -march=nocona -O -fomit-frame-pointer sse
gcc -funroll-loops -m64 -march=nocona -Os -fomit-frame-pointer sse
gcc -funroll-loops -march=barcelona -O2 -fomit-frame-pointer sse
gcc -funroll-loops -march=barcelona -O3 -fomit-frame-pointer sse
gcc -funroll-loops -march=barcelona -O -fomit-frame-pointer sse
gcc -funroll-loops -march=barcelona -Os -fomit-frame-pointer sse
gcc -funroll-loops -march=k8 -O2 -fomit-frame-pointer sse
gcc -funroll-loops -march=k8 -O3 -fomit-frame-pointer sse
gcc -funroll-loops -march=k8 -O -fomit-frame-pointer sse
gcc -funroll-loops -march=k8 -Os -fomit-frame-pointer sse
gcc -funroll-loops -march=nocona -O2 -fomit-frame-pointer sse
gcc -funroll-loops -march=nocona -O3 -fomit-frame-pointer sse
gcc -funroll-loops -march=nocona -O -fomit-frame-pointer sse
gcc -funroll-loops -march=nocona -Os -fomit-frame-pointer sse
gcc -m64 -O2 -fomit-frame-pointer sse
gcc -m64 -O3 -fomit-frame-pointer sse
gcc -m64 -O -fomit-frame-pointer sse
gcc -m64 -Os -fomit-frame-pointer sse
gcc -m64 -march=k8 -O2 -fomit-frame-pointer sse
gcc -m64 -march=k8 -O3 -fomit-frame-pointer sse
gcc -m64 -march=k8 -O -fomit-frame-pointer sse
gcc -m64 -march=k8 -Os -fomit-frame-pointer sse
gcc -m64 -march=nocona -O2 -fomit-frame-pointer sse
gcc -m64 -march=nocona -O3 -fomit-frame-pointer sse
gcc -m64 -march=nocona -O -fomit-frame-pointer sse
gcc -m64 -march=nocona -Os -fomit-frame-pointer sse
gcc -march=barcelona -O2 -fomit-frame-pointer sse
gcc -march=barcelona -O3 -fomit-frame-pointer sse
gcc -march=barcelona -O -fomit-frame-pointer sse
gcc -march=barcelona -Os -fomit-frame-pointer sse
gcc -march=k8 -O2 -fomit-frame-pointer sse
gcc -march=k8 -O3 -fomit-frame-pointer sse
gcc -march=k8 -O -fomit-frame-pointer sse
gcc -march=k8 -Os -fomit-frame-pointer sse
gcc -march=nocona -O2 -fomit-frame-pointer sse
gcc -march=nocona -O3 -fomit-frame-pointer sse
gcc -march=nocona -O -fomit-frame-pointer sse
gcc -march=nocona -Os -fomit-frame-pointer sse

Compiler output

Implementation: crypto_aead/scream12v1/sse
Compiler: clang -O3 -fomit-frame-pointer -Qunused-arguments
scream.c: scream.c:185:10: error: '__builtin_ia32_pshufb128' needs target feature ssse3
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:186:10: error: '__builtin_ia32_pshufb128' needs target feature ssse3
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:190:10: error: '__builtin_ia32_pshufb128' needs target feature ssse3
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:191:10: error: '__builtin_ia32_pshufb128' needs target feature ssse3
scream.c: D = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:198:10: error: '__builtin_ia32_pshufb128' needs target feature ssse3
scream.c: A ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: scream.c:199:10: error: '__builtin_ia32_pshufb128' needs target feature ssse3
scream.c: C ^= __builtin_ia32_pshufb128(table, in[2]);
scream.c: ^
scream.c: scream.c:203:10: error: '__builtin_ia32_pshufb128' needs target feature ssse3
scream.c: B ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: scream.c:204:10: error: '__builtin_ia32_pshufb128' needs target feature ssse3
scream.c: D ^= __builtin_ia32_pshufb128(table, in[2]);
scream.c: ^
scream.c: scream.c:211:10: error: '__builtin_ia32_pshufb128' needs target feature ssse3
scream.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
clang -O3 -fomit-frame-pointer -Qunused-arguments sse
clang -mcpu=cortex-a8 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments sse
clang -mcpu=cortex-a9 -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments sse
clang -mcpu=native -mfpu=neon -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments sse

Compiler output

Implementation: crypto_aead/scream12v1/sse
Compiler: gcc -m64 -march=barcelona -O2 -fomit-frame-pointer
scream.c: scream.c: In function 'LBox16P':
scream.c: scream.c:185:10: warning: implicit declaration of function '__builtin_ia32_pshufb128' [-Wimplicit-function-declaration]
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:185:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:186:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:190:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:191:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: D = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:198:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: A ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: scream.c:199:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: C ^= __builtin_ia32_pshufb128(table, in[2]);
scream.c: ^
scream.c: scream.c:203:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: B ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: ...
scream.c: scream.c: In function 'LBox16P':
scream.c: scream.c:185:10: warning: implicit declaration of function '__builtin_ia32_pshufb128' [-Wimplicit-function-declaration]
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:185:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: A = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:186:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: C = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:190:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: B = __builtin_ia32_pshufb128(table, t0);
scream.c: ^
scream.c: scream.c:191:8: error: incompatible types when assigning to type 'v16qi {aka __vector(16) char}' from type 'int'
scream.c: D = __builtin_ia32_pshufb128(table, t1);
scream.c: ^
scream.c: scream.c:198:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: A ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: scream.c:199:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: C ^= __builtin_ia32_pshufb128(table, in[2]);
scream.c: ^
scream.c: scream.c:203:7: error: conversion of scalar 'int' to vector 'v16qi {aka __vector(16) char}' involves truncation
scream.c: B ^= __builtin_ia32_pshufb128(table, in[0]);
scream.c: ^
scream.c: ...

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler | Implementations
gcc -m64 -march=barcelona -O2 -fomit-frame-pointer sse
gcc -m64 -march=barcelona -O3 -fomit-frame-pointer sse
gcc -m64 -march=barcelona -O -fomit-frame-pointer sse
gcc -m64 -march=barcelona -Os -fomit-frame-pointer sse