| Time | Implementation | Compiler | Benchmark date | SUPERCOP version |
| 6009 | armneon3 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 6009 | armneon3 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 6012 | armneon3 | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 6012 | armneon3 | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 6015 | armneon3 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 6023 | armneon3 | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 6772 | armneon2 | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 6841 | armneon2 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 7052 | armneon2 | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 7056 | armneon2 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 7081 | armneon2 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 7167 | armneon2 | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 8801 | e/ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 8909 | e/regs | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 8912 | e/regs | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 8918 | e/ref | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 9136 | e/merged | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 9244 | e/merged | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 9302 | e/merged | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 9316 | ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 9353 | e/merged | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 9408 | ref | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 9778 | e/merged | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 9936 | e/merged | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 10846 | armneon | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 10868 | armneon | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 11264 | armneon | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 11278 | armneon | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 11329 | armneon | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 11337 | armneon | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 11598 | e/ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 11768 | e/regs | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 12464 | ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 13729 | e/regs | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 13879 | ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 14177 | ref | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 14684 | ref | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 17668 | e/ref | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 18120 | e/regs | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 19713 | e/regs | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 23073 | e/ref | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 23155 | e/ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |