| Time | Implementation | Compiler | Benchmark date | SUPERCOP version |
| 561 | ref | gcc -m64 -march=k8 -Os -fomit-frame-pointer | 20100904 | 20100903 |
| 572 | ref | gcc -funroll-loops -m64 -Os -fomit-frame-pointer | 20100904 | 20100903 |
| 583 | ref | gcc -funroll-loops -m64 -march=k8 -O3 -fomit-frame-pointer | 20100904 | 20100903 |
| 594 | ref | gcc -m64 -O3 -fomit-frame-pointer | 20100904 | 20100903 |
| 594 | ref | gcc -m64 -march=nocona -Os -fomit-frame-pointer | 20100904 | 20100903 |
| 605 | ref | gcc -funroll-loops -m64 -O3 -fomit-frame-pointer | 20100904 | 20100903 |
| 605 | ref | gcc -funroll-loops -m64 -march=k8 -Os -fomit-frame-pointer | 20100904 | 20100903 |
| 605 | ref | gcc -funroll-loops -m64 -march=nocona -O3 -fomit-frame-pointer | 20100904 | 20100903 |
| 605 | ref | gcc -m64 -Os -fomit-frame-pointer | 20100904 | 20100903 |
| 605 | ref | gcc -m64 -march=k8 -O3 -fomit-frame-pointer | 20100904 | 20100903 |
| 616 | ref | gcc -funroll-loops -m64 -mcpu=G5 -Os -fomit-frame-pointer | 20100904 | 20100903 |
| 616 | ref | gcc -m64 -mcpu=G4 -Os -fomit-frame-pointer | 20100904 | 20100903 |
| 616 | ref | gcc -m64 -mcpu=G5 -Os -fomit-frame-pointer | 20100904 | 20100903 |
| 627 | ref | gcc -funroll-loops -m64 -mcpu=G4 -Os -fomit-frame-pointer | 20100904 | 20100903 |
| 627 | ref | gcc -m64 -mcpu=G4 -O3 -fomit-frame-pointer | 20100904 | 20100903 |
| 627 | ref | gcc -m64 -mcpu=G5 -O3 -fomit-frame-pointer | 20100904 | 20100903 |
| 638 | ref | gcc -funroll-loops -m64 -march=nocona -Os -fomit-frame-pointer | 20100904 | 20100903 |
| 638 | ref | gcc -m64 -march=nocona -O3 -fomit-frame-pointer | 20100904 | 20100903 |
| 660 | ref | gcc -funroll-loops -m64 -mcpu=G4 -O3 -fomit-frame-pointer | 20100904 | 20100903 |
| 660 | ref | gcc -funroll-loops -m64 -mcpu=G5 -O3 -fomit-frame-pointer | 20100904 | 20100903 |
| 1243 | ref | gcc -m64 -march=nocona -O2 -fomit-frame-pointer | 20100904 | 20100903 |
| 1254 | ref | gcc -funroll-loops -m64 -O2 -fomit-frame-pointer | 20100904 | 20100903 |
| 1254 | ref | gcc -funroll-loops -m64 -mcpu=G4 -O2 -fomit-frame-pointer | 20100904 | 20100903 |
| 1254 | ref | gcc -funroll-loops -m64 -mcpu=G5 -O2 -fomit-frame-pointer | 20100904 | 20100903 |
| 1254 | ref | gcc -m64 -march=k8 -O2 -fomit-frame-pointer | 20100904 | 20100903 |
| 1254 | ref | gcc -m64 -mcpu=G4 -O2 -fomit-frame-pointer | 20100904 | 20100903 |
| 1254 | ref | gcc -m64 -mcpu=G5 -O2 -fomit-frame-pointer | 20100904 | 20100903 |
| 1265 | ref | gcc -funroll-loops -m64 -march=nocona -O2 -fomit-frame-pointer | 20100904 | 20100903 |
| 1276 | ref | gcc -funroll-loops -m64 -O -fomit-frame-pointer | 20100904 | 20100903 |
| 1276 | ref | gcc -funroll-loops -m64 -march=k8 -O -fomit-frame-pointer | 20100904 | 20100903 |
| 1276 | ref | gcc -m64 -O2 -fomit-frame-pointer | 20100904 | 20100903 |
| 1287 | ref | gcc -funroll-loops -m64 -march=k8 -O2 -fomit-frame-pointer | 20100904 | 20100903 |
| 1287 | ref | gcc -funroll-loops -m64 -march=nocona -O -fomit-frame-pointer | 20100904 | 20100903 |
| 1287 | ref | gcc -m64 -march=k8 -O -fomit-frame-pointer | 20100904 | 20100903 |
| 1287 | ref | gcc -m64 -march=nocona -O -fomit-frame-pointer | 20100904 | 20100903 |
| 1298 | ref | gcc -m64 -O -fomit-frame-pointer | 20100904 | 20100903 |
| 1463 | ref | gcc -funroll-loops -m64 -mcpu=G4 -O -fomit-frame-pointer | 20100904 | 20100903 |
| 1463 | ref | gcc -funroll-loops -m64 -mcpu=G5 -O -fomit-frame-pointer | 20100904 | 20100903 |
| 1463 | ref | gcc -m64 -mcpu=G4 -O -fomit-frame-pointer | 20100904 | 20100903 |
| 1463 | ref | gcc -m64 -mcpu=G5 -O -fomit-frame-pointer | 20100904 | 20100903 |