Full logs at http://log.ouroborus.net/limitingfactor/dph
Environment
Platform
host: limitingfactor.cse.unsw.EDU.AU
arch: i386
processor: i386
system: Darwin 10.7.0
Versions
GHC The Glorious Glasgow Haskell Compilation System, version 7.0.1
GCC i686-apple-darwin10-gcc-4.2.1 (GCC) 4.2.1 (Apple Inc. build 5666) (dot 3)
Total tests = 708
-- WINNERS (had a swing of < -10%)
dph.evens.vectorised.par.N1
runtime (wall clock) : 500.7ms (----) / 500.9ms (----) /
501.1ms (----)
kernel runtime (wall clock) : 181.0ms ( -11) / 181.7ms ( -12) /
182.0ms ( -12)
dph.quicksort.vectorised.par.N1
runtime (wall clock) : 700.9ms (----) / 701.1ms (----) /
701.3ms (----)
kernel runtime (wall clock) : 384.0ms ( -6) / 384.4ms ( -9) /
385.0ms ( -10)
dph.quicksort.vectorised.par.N8
runtime (wall clock) : 801.3ms (----) / 801.4ms ( -1) /
801.5ms ( -11)
kernel runtime (wall clock) : 465.0ms ( -1) / 473.9ms ( -2) /
484.0ms ( -4)
dph.quickhull.vector-immutable.seq.N4
runtime (wall clock) : 400.7ms (----) / 400.9ms (----) /
401.0ms (----)
kernel runtime (wall clock) : 115.0ms ( -15) / 129.1ms ( -7) /
133.0ms ( -6)
repa.laplace.par.N1
runtime (wall clock) : 6.705s ( -28) / 6.794s ( -28) /
6.806s ( -29)
kernel runtime (wall clock) : 6.137s ( -11) / 6.146s ( -11) /
6.153s ( -12)
repa.laplace.par.N2
runtime (wall clock) : 4.004s ( -23) / 4.084s ( -23) /
4.104s ( -24)
kernel runtime (wall clock) : 3.542s ( -9) / 3.577s ( -9) /
3.595s ( -9)
repa.fft2d.par.N2
runtime (wall clock) : 4.804s ( -13) / 4.994s ( -10) /
5.104s ( -11)
kernel runtime (wall clock) : 4.235s ( -14) / 4.402s ( -12) /
4.534s ( -12)
noslow.dph-prim.seq.Double.filterin_r
kernel runtime (wall clock) : 36.77us ( -14) / 36.78us ( -14) /
36.80us ( -14)
-- LOSERS (had a swing of > +10%)
dph.dotp.vectorised.par.N1
runtime (wall clock) : 1.901s ( +6) / 1.902s ( +4) /
1.903s (----)
kernel runtime (wall clock) : 99.00ms (+106) / 99.00ms (+106) /
99.00ms (+102)
dph.dotp.vectorised.par.N2
runtime (wall clock) : 1.901s ( +6) / 1.902s ( +6) /
1.902s ( +5)
kernel runtime (wall clock) : 49.00ms (+104) / 50.20ms ( +54) /
51.00ms ( +24)
dph.dotp.vectorised.par.N4
runtime (wall clock) : 1.801s ( -31) / 1.802s ( -31) /
1.802s ( -33)
kernel runtime (wall clock) : 27.00ms ( +29) / 30.50ms ( +12) /
32.00ms ( +3)
dph.dotp.vectorised.seq.N4
runtime (wall clock) : 1.901s ( +6) / 1.902s ( +6) /
1.902s ( +6)
kernel runtime (wall clock) : 102.0ms ( +92) / 102.0ms ( +92) /
102.0ms ( +85)
dph.dotp.vector.seq.N4
runtime (wall clock) : 1.901s ( +6) / 1.962s ( +9) /
2.002s ( +11)
kernel runtime (wall clock) : 53.00ms (----) / 82.60ms ( +54) /
103.0ms ( +81)
dph.sumsq.vectorised.par.N2
runtime (wall clock) : 500.5ms (+150) / 500.7ms (+150) /
501.1ms (+150)
kernel runtime (wall clock) : 418.0ms (+127) / 418.0ms (+127) /
418.0ms (+127)
dph.sumsq.vectorised.par.N4
runtime (wall clock) : 300.5ms (+199) / 300.6ms (+199) /
300.9ms (+199)
kernel runtime (wall clock) : 209.0ms (+127) / 209.0ms (+127) /
209.0ms (+127)
dph.sumsq.vectorised.par.N8
runtime (wall clock) : 200.5ms (+100) / 200.6ms (+100) /
200.7ms ( +99)
kernel runtime (wall clock) : 104.0ms (+126) / 104.9ms (+126) /
105.0ms (+110)
dph.sumsq.vectorised.seq.N4
runtime (wall clock) : 1.201s (+200) / 1.201s (+200) /
1.201s (+200)
kernel runtime (wall clock) : 1.103s (+201) / 1.103s (+200) /
1.105s (+200)
dph.sumsq.vector.seq.N4
runtime (wall clock) : 1.201s (+200) / 1.201s (+200) /
1.201s (+200)
kernel runtime (wall clock) : 1.103s (+201) / 1.103s (+200) /
1.105s (+200)
dph.evens.vectorised.par.N8
runtime (wall clock) : 400.6ms (----) / 480.9ms ( +17) /
501.1ms (----)
kernel runtime (wall clock) : 69.00ms ( +1) / 75.20ms ( +5) /
80.00ms ( -7)
dph.evens.vectorised.seq.N4
runtime (wall clock) : 500.8ms (----) / 570.9ms ( +14) /
601.1ms ( +20)
kernel runtime (wall clock) : 199.0ms ( +5) / 199.6ms ( +5) /
200.0ms ( +5)
dph.quicksort.vectorised.par.N2
runtime (wall clock) : 600.9ms ( +20) / 611.1ms ( -8) /
701.2ms (----)
kernel runtime (wall clock) : 346.0ms ( +14) / 356.0ms ( -4) /
367.0ms ( -6)
dph.quicksort.vectorised.par.N4
runtime (wall clock) : 601.0ms ( +20) / 631.2ms (----) /
701.3ms (----)
kernel runtime (wall clock) : 351.0ms ( +14) / 360.3ms ( +1) /
371.0ms ( -2)
dph.smvm.vectorised.par.N2
runtime (wall clock) : 100.5ms (----) / 100.6ms (----) /
100.9ms (----)
kernel runtime (wall clock) : 19.00ms ( +12) / 20.00ms ( +5) /
21.00ms (----)
dph.smvm.vectorised.par.N4
runtime (wall clock) : 100.5ms (----) / 100.6ms (----) /
100.8ms (----)
kernel runtime (wall clock) : 10.00ms ( +11) / 11.80ms ( -22) /
18.00ms (----)
dph.smvm.vectorised.seq.N4
runtime (wall clock) : 100.4ms (----) / 100.5ms (----) /
100.9ms (----)
kernel runtime (wall clock) : 23.00ms ( +35) / 23.00ms ( +35) /
23.00ms ( +35)
dph.quickhull.vectorised.par.N2
runtime (wall clock) : 800.9ms ( +14) / 811.2ms ( +3) /
901.5ms ( +12)
kernel runtime (wall clock) : 479.0ms ( +9) / 510.1ms ( +8) /
547.0ms ( +10)
dph.quickhull.vectorised.seq.N4
runtime (wall clock) : 900.9ms ( +13) / 901.1ms ( +6) /
901.4ms (----)
kernel runtime (wall clock) : 558.0ms ( +9) / 567.9ms ( +9) /
573.0ms ( +9)
dph.quickhull.vector-mutable.seq.N4
runtime (wall clock) : 300.7ms (----) / 390.8ms ( +26) /
401.0ms (----)
kernel runtime (wall clock) : 54.00ms ( +2) / 60.00ms ( +12) /
62.00ms ( +11)
dph.quickhull.vector-forkIO.par.N4
runtime (wall clock) : 300.6ms (----) / 300.8ms (----) /
301.0ms (----)
kernel runtime (wall clock) : 31.00ms (----) / 35.80ms ( +6) /
46.00ms ( +12)
dph.quickhull.vector-forkIO.par.N8
runtime (wall clock) : 300.8ms ( -25) / 300.8ms ( -25) /
301.0ms ( -25)
kernel runtime (wall clock) : 41.00ms ( +8) / 44.70ms ( +13) /
47.00ms ( +15)
repa.mmult.par.N1
runtime (wall clock) : 21.91s (+155) / 21.92s (+154) /
22.01s (+150)
kernel runtime (wall clock) : 21.61s (+155) / 21.65s (+155) /
21.70s (+155)
repa.mmult.par.N2
runtime (wall clock) : 11.11s (+158) / 11.13s (+155) /
11.21s (+154)
kernel runtime (wall clock) : 10.86s (+156) / 10.88s (+156) /
10.92s (+156)
repa.mmult.par.N4
runtime (wall clock) : 5.704s (+200) / 5.706s (+200) /
5.706s (+200)
kernel runtime (wall clock) : 5.442s (+204) / 5.460s (+204) /
5.475s (+205)
repa.mmult.par.N8
runtime (wall clock) : 2.936s (+144) / 3.016s (+146) /
3.151s (+139)
kernel runtime (wall clock) : 2.727s (+152) / 2.753s (+151) /
2.884s (+145)
repa.laplace.par.N4
runtime (wall clock) : 3.003s (----) / 3.423s ( +14) /
3.804s ( +27)
kernel runtime (wall clock) : 2.603s ( +29) / 3.003s ( +49) /
3.402s ( +68)
repa.laplace.par.N6
runtime (wall clock) : 2.903s ( +4) / 2.973s ( +6) /
3.003s ( +7)
kernel runtime (wall clock) : 2.525s ( +18) / 2.561s ( +19) /
2.604s ( +18)
repa.blur.par.N1
runtime (wall clock) : 6.303s (+425) / 6.303s (+425) /
6.304s (+425)
kernel runtime (wall clock) : 5.909s (+632) / 5.915s (+632) /
5.930s (+632)
repa.blur.par.N2
runtime (wall clock) : 3.602s (+414) / 3.823s (+438) /
4.403s (+450)
kernel runtime (wall clock) : 3.319s (+651) / 3.533s (+688) /
4.084s (+763)
repa.blur.par.N4
runtime (wall clock) : 2.502s (+400) / 2.572s (+414) /
2.602s (+420)
kernel runtime (wall clock) : 2.276s (+725) / 2.334s (+725) /
2.386s (+720)
repa.blur.par.N6
runtime (wall clock) : 2.002s (+400) / 2.002s (+400) /
2.002s (+399)
kernel runtime (wall clock) : 1.735s (+763) / 1.747s (+752) /
1.763s (+732)
repa.blur.par.N8
runtime (wall clock) : 1.702s (+325) / 1.723s (+330) /
1.903s (+374)
kernel runtime (wall clock) : 1.465s (+737) / 1.499s (+724) /
1.694s (+801)
repa.canny.par.N1
runtime (wall clock) : 2.101s (+425) / 2.101s (+424) /
2.102s (+424)
kernel runtime (wall clock) : 1.674s (+6875) / 1.677s (+6889) /
1.692s (+6950)
repa.canny.par.N2
runtime (wall clock) : 1.201s (+300) / 1.211s (+303) /
1.301s (+333)
kernel runtime (wall clock) : 931.0ms (+5376) / 946.1ms (+4959) /
1.000s (+4900)
repa.canny.par.N4
runtime (wall clock) : 900.9ms (+200) / 901.0ms (+200) /
901.4ms (+200)
kernel runtime (wall clock) : 598.0ms (+4500) / 616.6ms (+4501) /
635.0ms (+4133)
repa.canny.par.N6
runtime (wall clock) : 700.8ms (+250) / 700.9ms (+249) /
701.1ms (+249)
kernel runtime (wall clock) : 447.0ms (+3625) / 453.3ms (+3498) /
459.0ms (+3431)
repa.canny.par.N8
runtime (wall clock) : 600.8ms (+200) / 601.1ms (+200) /
601.3ms (+199)
kernel runtime (wall clock) : 367.0ms (+2723) / 374.5ms (+2759) /
379.0ms (+2607)
repa.fft3d.par.N1
runtime (wall clock) : 33.02s ( +11) / 33.10s ( +11) /
33.22s ( +11)
kernel runtime (wall clock) : 27.39s ( +11) / 27.45s ( +11) /
27.48s ( +11)
repa.fft3d.par.N2
runtime (wall clock) : 18.51s ( +9) / 19.51s ( +12) /
20.22s ( +15)
kernel runtime (wall clock) : 15.28s ( +10) / 16.23s ( +13) /
16.85s ( +15)
repa.fft3d.par.N4
runtime (wall clock) : 11.21s ( +40) / 11.40s ( +42) /
11.61s ( +45)
kernel runtime (wall clock) : 9.325s ( +50) / 9.519s ( +53) /
9.646s ( +56)
noslow.list.*Double.find_indices
kernel runtime (wall clock) : 437.4us ( +13) / 439.0us ( +13) /
440.1us ( +13)
noslow.vector.Primitive.*Double.filterin_r
kernel runtime (wall clock) : 408.5us ( +13) / 410.2us ( +13) /
411.3us ( +13)
noslow.vector-unsafe.Primitive.*Double.filterin_r
kernel runtime (wall clock) : 410.6us ( +13) / 412.1us ( +13) /
413.1us ( +14)
noslow.dph-prim.seq.Double.scale_r
kernel runtime (wall clock) : 69.05us ( +10) / 69.06us ( +10) /
69.08us ( +10)
noslow.dph-prim.seq.Double.axpy
kernel runtime (wall clock) : 91.63us ( +11) / 91.67us ( +11) /
91.71us ( +11)
noslow.vector.Primitive.Double.scale_r
kernel runtime (wall clock) : 69.17us ( +12) / 69.18us ( +12) /
69.19us ( +12)
noslow.vector.Primitive.Double.axpy
kernel runtime (wall clock) : 90.98us ( +11) / 91.00us ( +11) /
91.01us ( +11)
noslow.vector.Unboxed.Double.scale_r
kernel runtime (wall clock) : 69.12us ( +11) / 69.16us ( +11) /
69.19us ( +11)
noslow.vector.Unboxed.Double.axpy
kernel runtime (wall clock) : 91.25us ( +10) / 91.27us ( +10) /
91.30us ( +10)
noslow.vector-unsafe.Primitive.Double.scale_r
kernel runtime (wall clock) : 65.70us ( +11) / 65.71us ( +11) /
65.72us ( +11)
noslow.vector-unsafe.Unboxed.Double.scale_r
kernel runtime (wall clock) : 70.16us ( +12) / 70.18us ( +12) /
70.19us ( +12)
_______________________________________________
Cvs-ghc mailing list
cvs-ghc@haskell.org
http://www.haskell.org/mailman/listinfo/cvs-ghc