| Time | Implementation | Compiler | Benchmark date | SUPERCOP version |
| 8505 | armneon3 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 8505 | armneon3 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 8508 | armneon3 | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 8512 | armneon3 | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 8538 | armneon3 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 8551 | armneon3 | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 9602 | armneon2 | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 9649 | armneon2 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 10080 | armneon2 | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 10084 | armneon2 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 10109 | armneon2 | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 10195 | armneon2 | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 11373 | e/ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 11761 | e/ref | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 11792 | ref | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 11854 | ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 11890 | e/merged | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 12006 | e/merged | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 12081 | e/merged | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 12174 | e/regs | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 12284 | e/merged | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 12416 | e/regs | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 12997 | e/merged | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 13127 | e/merged | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 14543 | e/ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 14578 | e/regs | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 14762 | ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 15963 | armneon | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 15975 | armneon | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 16214 | ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 16287 | ref | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 16530 | armneon | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 16544 | armneon | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 16580 | armneon | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 16616 | armneon | gcc -mcpu=native -mfpu=neon-vfpv4 -O3 | 20161215 | 20161026 |
| 16938 | e/regs | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 17203 | ref | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 20937 | e/ref | gcc -mcpu=native -mfpu=neon-vfpv4 -O2 | 20161215 | 20161026 |
| 20952 | e/regs | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 22737 | e/regs | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 25953 | e/ref | gcc -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |
| 26155 | e/ref | gcc -funroll-loops -mcpu=native -mfpu=neon-vfpv4 -Os | 20161215 | 20161026 |