| Time | Implementation | Compiler | Benchmark date | SUPERCOP version |
| 10422 | armneon3 | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 10425 | armneon3 | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 10430 | armneon3 | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |
| 10431 | armneon3 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |
| 10434 | armneon3 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 10441 | armneon3 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 11265 | armneon2 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 11370 | armneon2 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 11394 | armneon2 | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 11823 | armneon2 | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 11851 | armneon2 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |
| 12029 | armneon2 | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |
| 14910 | armneon | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 14916 | armneon | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 15045 | armneon | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 15217 | armneon | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |
| 15267 | armneon | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 15300 | armneon | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |
| 16185 | ref | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 16191 | ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 16677 | e/merged | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 16686 | e/merged | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 16774 | e/merged | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 16800 | e/merged | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 18087 | e/ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 18120 | e/ref | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 18255 | e/regs | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 18279 | e/regs | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161216 | 20161026 |
| 18291 | e/merged | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |
| 21882 | ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 22245 | e/merged | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |
| 24027 | e/regs | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 24102 | e/ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 24519 | ref | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 26418 | e/regs | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 28317 | ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |
| 28726 | ref | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |
| 29511 | e/ref | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161216 | 20161026 |
| 31644 | e/regs | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |
| 37041 | e/ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |
| 38436 | e/regs | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |
| 44169 | e/ref | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161216 | 20161026 |