Implementation notes: amd64, genji548, crypto_hash/nasha512

Computer: genji548
Architecture: amd64
CPU ID: GenuineIntel-00050654-bfebfbff
SUPERCOP version: 20191017
Operation: crypto_hash
Primitive: nasha512
Time | Object size | Test size | Implementation | Compiler | Benchmark date | SUPERCOP version
283928532 0 018500 808 776optgcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019101920191017
2862010043 0 020156 808 776optgcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019101920191017
2877420614 0 033537 816 776optgcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019101920191017
3412243853 0 456777 816 131872opt_v4gcc_-march=native_-mtune=native_-O3_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019101920191017
3429631940 0 442060 808 131872opt_v4gcc_-march=native_-mtune=native_-O2_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019101920191017
3434430713 0 440692 808 131872opt_v4gcc_-march=native_-mtune=native_-O_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019101920191017
358387936 0 017060 792 776optgcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019101920191017
3762028880 0 438004 792 131872opt_v4gcc_-march=native_-mtune=native_-Os_-fomit-frame-pointer_-fwrapv_-fPIC_-fPIE2019101920191017
4080854616 0 470349 856 131840opt_v4icc_-march=broadwell_-mtune=broadwell_-O2_-fomit-frame-pointer2019101920191017
4083254616 0 470349 856 131840opt_v4icc_-march=core-avx2_-mtune=core-avx2_-O2_-fomit-frame-pointer2019101920191017
4084054616 0 470349 856 131840opt_v4icc_-march=haswell_-mtune=haswell_-O2_-fomit-frame-pointer2019101920191017
4089253624 0 468957 856 131840opt_v4icc_-march=skylake_-mtune=skylake_-O3_-fomit-frame-pointer2019101920191017
4089453208 0 469109 856 131872opt_v4icc_-march=skylake-avx512_-mtune=skylake-avx512_-O3_-fomit-frame-pointer2019101920191017
4091254680 0 470413 856 131840opt_v4icc_-march=skylake_-mtune=skylake_-O2_-fomit-frame-pointer2019101920191017
4097054264 0 470277 856 131872opt_v4icc_-march=skylake-avx512_-mtune=skylake-avx512_-O2_-fomit-frame-pointer2019101920191017
4101253960 0 469341 856 131840opt_v4icc_-march=ivybridge_-mtune=ivybridge_-O2_-fomit-frame-pointer2019101920191017
4102255000 0 471541 856 131872opt_v4icc_-march=icelake-client_-mtune=icelake-client_-O2_-fomit-frame-pointer2019101920191017
4107853960 0 469341 856 131840opt_v4icc_-march=core-avx-i_-mtune=core-avx-i_-O2_-fomit-frame-pointer2019101920191017
4111053960 0 469341 856 131840opt_v4icc_-march=sandybridge_-mtune=sandybridge_-O2_-fomit-frame-pointer2019101920191017
4111853688 0 469021 856 131840opt_v4icc_-march=haswell_-mtune=haswell_-O3_-fomit-frame-pointer2019101920191017
4113253960 0 469341 856 131840opt_v4icc_-march=corei7-avx_-mtune=corei7-avx_-O2_-fomit-frame-pointer2019101920191017
4116253688 0 469021 856 131840opt_v4icc_-march=broadwell_-mtune=broadwell_-O3_-fomit-frame-pointer2019101920191017
4120253688 0 469021 856 131840opt_v4icc_-march=core-avx2_-mtune=core-avx2_-O3_-fomit-frame-pointer2019101920191017
4131053000 0 468413 856 131840opt_v4icc_-march=ivybridge_-mtune=ivybridge_-O3_-fomit-frame-pointer2019101920191017
4144253000 0 468413 856 131840opt_v4icc_-march=core-avx-i_-mtune=core-avx-i_-O3_-fomit-frame-pointer2019101920191017
4149453000 0 468413 856 131840opt_v4icc_-march=sandybridge_-mtune=sandybridge_-O3_-fomit-frame-pointer2019101920191017
4150853000 0 468413 856 131840opt_v4icc_-march=corei7-avx_-mtune=corei7-avx_-O3_-fomit-frame-pointer2019101920191017
4171254072 0 470261 856 131872opt_v4icc_-march=icelake-client_-mtune=icelake-client_-O3_-fomit-frame-pointer2019101920191017
4182453200 0 467285 856 131840opt_v4icc_-march=corei7_-mtune=corei7_-O2_-fomit-frame-pointer2019101920191017
4216052320 0 466461 856 131840opt_v4icc_-march=corei7_-mtune=corei7_-O3_-fomit-frame-pointer2019101920191017
4219235472 0 050805 856 744opticc_-march=skylake_-mtune=skylake_-O3_-fomit-frame-pointer2019101920191017
4226634528 0 048669 856 744opticc_-march=corei7_-mtune=corei7_-O3_-fomit-frame-pointer2019101920191017
4228435504 0 050837 856 744opticc_-march=core-avx2_-mtune=core-avx2_-O3_-fomit-frame-pointer2019101920191017
4232035504 0 050837 856 744opticc_-march=broadwell_-mtune=broadwell_-O3_-fomit-frame-pointer2019101920191017
4233434816 0 050229 856 744opticc_-march=core-avx-i_-mtune=core-avx-i_-O3_-fomit-frame-pointer2019101920191017
4235234816 0 050229 856 744opticc_-march=ivybridge_-mtune=ivybridge_-O3_-fomit-frame-pointer2019101920191017
4235234816 0 050229 856 744opticc_-march=sandybridge_-mtune=sandybridge_-O3_-fomit-frame-pointer2019101920191017
4236036368 0 052557 856 776opticc_-march=icelake-client_-mtune=icelake-client_-O3_-fomit-frame-pointer2019101920191017
4250836864 0 052597 856 744opticc_-march=skylake_-mtune=skylake_-O2_-fomit-frame-pointer2019101920191017
4278037392 0 053405 856 776opticc_-march=skylake-avx512_-mtune=skylake-avx512_-O2_-fomit-frame-pointer2019101920191017
4286035504 0 050837 856 744opticc_-march=haswell_-mtune=haswell_-O3_-fomit-frame-pointer2019101920191017
4288235456 0 049541 856 744opticc_-march=corei7_-mtune=corei7_-O2_-fomit-frame-pointer2019101920191017
4288236048 0 051949 856 776opticc_-march=skylake-avx512_-mtune=skylake-avx512_-O3_-fomit-frame-pointer2019101920191017
4292036848 0 052581 856 744opticc_-march=broadwell_-mtune=broadwell_-O2_-fomit-frame-pointer2019101920191017
4293236848 0 052581 856 744opticc_-march=core-avx2_-mtune=core-avx2_-O2_-fomit-frame-pointer2019101920191017
4296236848 0 052581 856 744opticc_-march=haswell_-mtune=haswell_-O2_-fomit-frame-pointer2019101920191017
4298837480 0 054021 856 776opticc_-march=icelake-client_-mtune=icelake-client_-O2_-fomit-frame-pointer2019101920191017
4344435600 0 050981 856 744opticc_-march=ivybridge_-mtune=ivybridge_-O2_-fomit-frame-pointer2019101920191017
4345835600 0 050981 856 744opticc_-march=corei7-avx_-mtune=corei7-avx_-O2_-fomit-frame-pointer2019101920191017
4347035600 0 050981 856 744opticc_-march=sandybridge_-mtune=sandybridge_-O2_-fomit-frame-pointer2019101920191017
4347235600 0 050981 856 744opticc_-march=core-avx-i_-mtune=core-avx-i_-O2_-fomit-frame-pointer2019101920191017
4914034816 0 050229 856 744opticc_-march=corei7-avx_-mtune=corei7-avx_-O3_-fomit-frame-pointer2019101920191017

Test failure

Implementation: opt
Security model: unknown
Compiler: icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer
error 111

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer opt
icc -march=cannonlake -mtune=cannonlake -O3 -fomit-frame-pointer opt
icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer opt_v4
icc -march=cannonlake -mtune=cannonlake -O3 -fomit-frame-pointer opt_v4

Compiler output

Implementation: opt_v4
Security model: unknown
Compiler: gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv -fPIC -fPIE
Nasha.c: Nasha.c: In function 'Init':
Nasha.c: Nasha.c:815:29: warning: assignment to 'uint_16t' {aka 'short unsigned int'} from 'uint_16t *' {aka 'short unsigned int *'} makes integer from pointer without a cast [-Wint-conversion]
Nasha.c: 815 | ssbox[i][j] = ssbox[i^j];
Nasha.c: | ^

Number of similar (compiler,implementation) pairs: 4, namely:
Compiler Implementations
gcc -march=native -mtune=native -O2 -fomit-frame-pointer -fwrapv -fPIC -fPIE opt_v4
gcc -march=native -mtune=native -O3 -fomit-frame-pointer -fwrapv -fPIC -fPIE opt_v4
gcc -march=native -mtune=native -O -fomit-frame-pointer -fwrapv -fPIC -fPIE opt_v4
gcc -march=native -mtune=native -Os -fomit-frame-pointer -fwrapv -fPIC -fPIE opt_v4

Compiler output

Implementation: opt_v4
Security model: unknown
Compiler: icc -march=broadwell -mtune=broadwell -O2 -fomit-frame-pointer
Nasha.c: Nasha.c(815): warning #810: conversion from "uint_16t={crypto_uint16={unsigned short}} *" to "uint_16t={crypto_uint16={unsigned short}}" may lose significant bits
Nasha.c: ssbox[i][j] = ssbox[i^j];
Nasha.c: ^
Nasha.c:

Number of similar (compiler,implementation) pairs: 24, namely:
Compiler Implementations
icc -march=broadwell -mtune=broadwell -O2 -fomit-frame-pointer opt_v4
icc -march=broadwell -mtune=broadwell -O3 -fomit-frame-pointer opt_v4
icc -march=cannonlake -mtune=cannonlake -O2 -fomit-frame-pointer opt_v4
icc -march=cannonlake -mtune=cannonlake -O3 -fomit-frame-pointer opt_v4
icc -march=core-avx-i -mtune=core-avx-i -O2 -fomit-frame-pointer opt_v4
icc -march=core-avx-i -mtune=core-avx-i -O3 -fomit-frame-pointer opt_v4
icc -march=core-avx2 -mtune=core-avx2 -O2 -fomit-frame-pointer opt_v4
icc -march=core-avx2 -mtune=core-avx2 -O3 -fomit-frame-pointer opt_v4
icc -march=corei7-avx -mtune=corei7-avx -O2 -fomit-frame-pointer opt_v4
icc -march=corei7-avx -mtune=corei7-avx -O3 -fomit-frame-pointer opt_v4
icc -march=corei7 -mtune=corei7 -O2 -fomit-frame-pointer opt_v4
icc -march=corei7 -mtune=corei7 -O3 -fomit-frame-pointer opt_v4
icc -march=haswell -mtune=haswell -O2 -fomit-frame-pointer opt_v4
icc -march=haswell -mtune=haswell -O3 -fomit-frame-pointer opt_v4
icc -march=icelake-client -mtune=icelake-client -O2 -fomit-frame-pointer opt_v4
icc -march=icelake-client -mtune=icelake-client -O3 -fomit-frame-pointer opt_v4
icc -march=ivybridge -mtune=ivybridge -O2 -fomit-frame-pointer opt_v4
icc -march=ivybridge -mtune=ivybridge -O3 -fomit-frame-pointer opt_v4
icc -march=sandybridge -mtune=sandybridge -O2 -fomit-frame-pointer opt_v4
icc -march=sandybridge -mtune=sandybridge -O3 -fomit-frame-pointer opt_v4
icc -march=skylake-avx512 -mtune=skylake-avx512 -O2 -fomit-frame-pointer opt_v4
icc -march=skylake-avx512 -mtune=skylake-avx512 -O3 -fomit-frame-pointer opt_v4
icc -march=skylake -mtune=skylake -O2 -fomit-frame-pointer opt_v4
icc -march=skylake -mtune=skylake -O3 -fomit-frame-pointer opt_v4