Implementation notes: amd64, genji262, crypto_stream/nlsv2

Computer: genji262
Architecture: amd64
CPU ID: AuthenticAMD-00800f12-178bfbff
SUPERCOP version: 20191017
Operation: crypto_stream
Primitive: nlsv2
TimeObject sizeTest sizeImplementationCompilerBenchmark dateSUPERCOP version
497237152 4096 454543 4952 832e/v2/sync/2icc_-march=broadwell_-mtune=broadwell_-O2_-fomit-frame-pointer2019102420191017
501645400 4096 461167 4952 832e/v2/sync/2icc_-march=corei7_-mtune=corei7_-O3_-fomit-frame-pointer2019102420191017
501646136 4096 463127 4952 832e/v2/sync/2icc_-march=skylake_-mtune=skylake_-O3_-fomit-frame-pointer2019102420191017
503846136 4096 463127 4952 832e/v2/sync/2icc_-march=broadwell_-mtune=broadwell_-O3_-fomit-frame-pointer2019102420191017
503837152 4096 454543 4952 832e/v2/sync/2icc_-march=core-avx2_-mtune=core-avx2_-O2_-fomit-frame-pointer2019102420191017
503837152 4096 454543 4952 832e/v2/sync/2icc_-march=haswell_-mtune=haswell_-O2_-fomit-frame-pointer2019102420191017
503846136 4096 463127 4952 832e/v2/sync/2icc_-march=haswell_-mtune=haswell_-O3_-fomit-frame-pointer2019102420191017
506046136 4096 463127 4952 832e/v2/sync/2icc_-march=core-avx2_-mtune=core-avx2_-O3_-fomit-frame-pointer2019102420191017
506037152 4096 454543 4952 832e/v2/sync/2icc_-march=skylake_-mtune=skylake_-O2_-fomit-frame-pointer2019102420191017
512637096 4096 452807 4952 832e/v2/sync/2icc_-march=corei7_-mtune=corei7_-O2_-fomit-frame-pointer2019102420191017
534622992 4096 436527 4912 864e/v2/sync/2gcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102420191017
545621000 4096 432999 4912 864e/v2/sync/2gcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102420191017
556622751 4096 434535 4912 864e/v2/sync/2gcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102420191017
587418154 4096 428778 4888 832e/v2/sync/2gcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102420191017
589648512 4096 465551 4952 832e/v2/sync/2icc_-march=corei7-avx_-mtune=corei7-avx_-O3_-fomit-frame-pointer2019102420191017
591848512 4096 465551 4952 832e/v2/sync/2icc_-march=core-avx-i_-mtune=core-avx-i_-O3_-fomit-frame-pointer2019102420191017
591839480 4096 456487 4952 832e/v2/sync/2icc_-march=corei7-avx_-mtune=corei7-avx_-O2_-fomit-frame-pointer2019102420191017
591839480 4096 456487 4952 832e/v2/sync/2icc_-march=ivybridge_-mtune=ivybridge_-O2_-fomit-frame-pointer2019102420191017
591848512 4096 465551 4952 832e/v2/sync/2icc_-march=ivybridge_-mtune=ivybridge_-O3_-fomit-frame-pointer2019102420191017
594039480 4096 456487 4952 832e/v2/sync/2icc_-march=sandybridge_-mtune=sandybridge_-O2_-fomit-frame-pointer2019102420191017
594048512 4096 465551 4952 832e/v2/sync/2icc_-march=sandybridge_-mtune=sandybridge_-O3_-fomit-frame-pointer2019102420191017
596239480 4096 456487 4952 832e/v2/sync/2icc_-march=core-avx-i_-mtune=core-avx-i_-O2_-fomit-frame-pointer2019102420191017
1067021848 4096 437559 4952 832e/v2/sync/1icc_-march=corei7_-mtune=corei7_-O2_-fomit-frame-pointer2019102420191017
1089027440 4096 443207 4952 832e/v2/sync/1icc_-march=corei7_-mtune=corei7_-O3_-fomit-frame-pointer2019102420191017
1111022584 4096 439975 4952 832e/v2/sync/1icc_-march=core-avx2_-mtune=core-avx2_-O2_-fomit-frame-pointer2019102420191017
1115422584 4096 439975 4952 832e/v2/sync/1icc_-march=skylake_-mtune=skylake_-O2_-fomit-frame-pointer2019102420191017
1126422584 4096 439975 4952 832e/v2/sync/1icc_-march=haswell_-mtune=haswell_-O2_-fomit-frame-pointer2019102420191017
1128622584 4096 439975 4952 832e/v2/sync/1icc_-march=broadwell_-mtune=broadwell_-O2_-fomit-frame-pointer2019102420191017
1146228008 4096 444999 4952 832e/v2/sync/1icc_-march=broadwell_-mtune=broadwell_-O3_-fomit-frame-pointer2019102420191017
1152828008 4096 444999 4952 832e/v2/sync/1icc_-march=skylake_-mtune=skylake_-O3_-fomit-frame-pointer2019102420191017
1155024560 4096 441567 4952 832e/v2/sync/1icc_-march=ivybridge_-mtune=ivybridge_-O2_-fomit-frame-pointer2019102420191017
1155024560 4096 441567 4952 832e/v2/sync/1icc_-march=sandybridge_-mtune=sandybridge_-O2_-fomit-frame-pointer2019102420191017
1157228008 4096 444999 4952 832e/v2/sync/1icc_-march=haswell_-mtune=haswell_-O3_-fomit-frame-pointer2019102420191017
1161628008 4096 444999 4952 832e/v2/sync/1icc_-march=core-avx2_-mtune=core-avx2_-O3_-fomit-frame-pointer2019102420191017
1161624560 4096 441567 4952 832e/v2/sync/1icc_-march=corei7-avx_-mtune=corei7-avx_-O2_-fomit-frame-pointer2019102420191017
1168224560 4096 441567 4952 832e/v2/sync/1icc_-march=core-avx-i_-mtune=core-avx-i_-O2_-fomit-frame-pointer2019102420191017
1177030712 4096 447751 4952 832e/v2/sync/1icc_-march=ivybridge_-mtune=ivybridge_-O3_-fomit-frame-pointer2019102420191017
1181430712 4096 447751 4952 832e/v2/sync/1icc_-march=core-avx-i_-mtune=core-avx-i_-O3_-fomit-frame-pointer2019102420191017
1181430712 4096 447751 4952 832e/v2/sync/1icc_-march=corei7-avx_-mtune=corei7-avx_-O3_-fomit-frame-pointer2019102420191017
1181430712 4096 447751 4952 832e/v2/sync/1icc_-march=sandybridge_-mtune=sandybridge_-O3_-fomit-frame-pointer2019102420191017
136845248 4096 417247 4912 864e/v2/sync/1gcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102420191017
145864948 4096 416727 4912 864e/v2/sync/1gcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102420191017
147843849 4096 414482 4888 832e/v2/sync/1gcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102420191017
179308400 4096 421927 4912 864e/v2/sync/1gcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019102420191017

Test failure

Implementation: e/v2/sync/1
Security model: unknown
Compiler: icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 12, namely:
CompilerImplementations
icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer e/v2/sync/1
icc -march=cannonlake -mtune=cannonlake -O3 -fomit-frame-pointer e/v2/sync/1
icc -march=icelake-client -mtune=icelake-client -O2 -fomit-frame-pointer e/v2/sync/1
icc -march=icelake-client -mtune=icelake-client -O3 -fomit-frame-pointer e/v2/sync/1
icc -march=skylake-avx512 -mtune=skylake-avx512 -O2 -fomit-frame-pointer e/v2/sync/1
icc -march=skylake-avx512 -mtune=skylake-avx512 -O3 -fomit-frame-pointer e/v2/sync/1
icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer e/v2/sync/2
icc -march=cannonlake -mtune=cannonlake -O3 -fomit-frame-pointer e/v2/sync/2
icc -march=icelake-client -mtune=icelake-client -O2 -fomit-frame-pointer e/v2/sync/2
icc -march=icelake-client -mtune=icelake-client -O3 -fomit-frame-pointer e/v2/sync/2
icc -march=skylake-avx512 -mtune=skylake-avx512 -O2 -fomit-frame-pointer e/v2/sync/2
icc -march=skylake-avx512 -mtune=skylake-avx512 -O3 -fomit-frame-pointer e/v2/sync/2

Compiler output

Implementation: e/v2/sync/1
Security model: unknown
Compiler: clang -march=native -O2 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE
api.c: In file included from api.c:2:
api.c: In file included from /scratch_gpfs_na2700_60/bdolbeaur/SC/supercop-20191017/supercop-data/genji262/amd64/include/estream-convert-api.h:7:
api.c: In file included from ./e/ecrypt-sync.h:15:
api.c: In file included from /scratch_gpfs_na2700_60/bdolbeaur/SC/supercop-20191017/supercop-data/genji262/amd64/include/ecrypt-portable.h:23:
api.c: In file included from /scratch_gpfs_na2700_60/bdolbeaur/SC/supercop-20191017/supercop-data/genji262/amd64/include/ecrypt-config.h:302:
api.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/xmmintrin.h:52:1: error: conflicting types for '_mm_prefetch'
api.c: _mm_prefetch (const void *__P, enum _mm_hint __I)
api.c: ^
api.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/xmmintrin.h:52:1: note: '_mm_prefetch' is a builtin with type 'void (const char *, int)'
api.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/xmmintrin.h:52:1: error: definition of builtin function '_mm_prefetch'
api.c: _mm_prefetch (const void *__P, enum _mm_hint __I)
api.c: ^
api.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/xmmintrin.h:54:3: error: argument to '__builtin_prefetch' must be a constant integer
api.c: __builtin_prefetch (__P, (__I & 0x4) >> 2, __I & 0x3);
api.c: ^ ~~~~~~~~~~~~~~~~
api.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/xmmintrin.h:130:10: error: invalid conversion between vector type '__m128' (vector of 4 'float' values) and integer type 'int' of different size
api.c: return (__m128) __builtin_ia32_addss ((__v4sf)__A, (__v4sf)__B);
api.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
api.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/xmmintrin.h:136:10: error: invalid conversion between vector type '__m128' (vector of 4 'float' values) and integer type 'int' of different size
api.c: return (__m128) __builtin_ia32_subss ((__v4sf)__A, (__v4sf)__B);
api.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
api.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/xmmintrin.h:142:10: error: invalid conversion between vector type '__m128' (vector of 4 'float' values) and integer type 'int' of different size
api.c: return (__m128) __builtin_ia32_mulss ((__v4sf)__A, (__v4sf)__B);
api.c: ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
api.c: /software/compilers/gcc/gcc-9.2.0-full+isl+binutils/lib/gcc/x86_64-pc-linux-gnu/9.2.0/include/xmmintrin.h:148:10: error: invalid conversion between vector type '__m128' (vector of 4 'float' values) and integer type 'int' of different size
api.c: ...

Number of similar (compiler,implementation) pairs: 10, namely:
CompilerImplementations
clang -march=native -O2 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE e/v2/sync/1
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE e/v2/sync/1
clang -march=native -O -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE e/v2/sync/1
clang -march=native -Os -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE e/v2/sync/1
clang -mcpu=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE e/v2/sync/1
clang -march=native -O2 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE e/v2/sync/2
clang -march=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE e/v2/sync/2
clang -march=native -O -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE e/v2/sync/2
clang -march=native -Os -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE e/v2/sync/2
clang -mcpu=native -O3 -fomit-frame-pointer -fwrapv -Qunused-arguments -fPIC -fPIE e/v2/sync/2