Full logs at http://log.ouroborus.net/limitingfactor/dph

Environment
 Platform
   host:      limitingfactor.cse.unsw.EDU.AU
   arch:      i386
   processor: i386
   system:    Darwin 10.6.0
 Versions
   GHC The Glorious Glasgow Haskell Compilation System, version 7.1.20110215
   GCC i686-apple-darwin10-gcc-4.2.1 (GCC) 4.2.1 (Apple Inc. build 5659)

Total tests = 702

-- WINNERS (had a swing of < -10%)
dph.dotp.vectorised.seq.N4
      runtime        (wall clock)    : 2.502s  (  +9) / 2.502s  (  +9) / 2.503s  (  +9)
      kernel runtime (wall clock)    : 53.00ms (  -7) / 53.00ms (  -9) / 53.00ms ( -15)

dph.sumsq.vectorised.par.N1
      runtime        (wall clock)    : 400.6ms ( -20) / 400.7ms ( -20) / 400.9ms ( -20)
      kernel runtime (wall clock)    : 368.0ms ( -17) / 368.0ms ( -17) / 368.0ms ( -17)

dph.sumsq.vectorised.par.N2
      runtime        (wall clock)    : 200.5ms ( -33) / 200.6ms ( -33) / 201.0ms ( -33)
      kernel runtime (wall clock)    : 184.0ms ( -17) / 184.0ms ( -17) / 184.0ms ( -17)

dph.sumsq.vectorised.par.N4
      runtime        (wall clock)    : 200.4ms (----) / 200.6ms (----) / 200.6ms (----)
      kernel runtime (wall clock)    : 92.00ms ( -16) / 92.00ms ( -17) / 92.00ms ( -17)

dph.sumsq.vectorised.par.N8
      runtime        (wall clock)    : 100.4ms (----) / 100.5ms (----) / 100.6ms (----)
      kernel runtime (wall clock)    : 48.00ms ( -20) / 52.50ms ( -18) / 56.00ms ( -15)

dph.sumsq.vectorised.seq.N4
      runtime        (wall clock)    : 400.6ms ( -20) / 400.7ms ( -20) / 400.9ms ( -20)
      kernel runtime (wall clock)    : 368.0ms ( -15) / 368.0ms ( -15) / 368.0ms ( -15)

dph.sumsq.vector.seq.N4
      runtime        (wall clock)    : 400.6ms ( -20) / 400.7ms ( -20) / 400.9ms ( -20)
      kernel runtime (wall clock)    : 368.0ms ( -10) / 368.0ms ( -11) / 368.0ms ( -11)

dph.evens.vectorised.par.N8
      runtime        (wall clock)    : 500.8ms (----) / 500.9ms (----) / 501.1ms (----)
      kernel runtime (wall clock)    : 67.00ms ( -11) / 73.90ms (  -5) / 83.00ms ( -10)

dph.quicksort.vectorised.par.N2
      runtime        (wall clock)    : 601.0ms ( -14) / 601.2ms ( -14) / 601.4ms ( -14)
      kernel runtime (wall clock)    : 323.0ms ( -15) / 360.8ms ( -10) / 376.0ms (  -8)

dph.quicksort.vectorised.par.N4
      runtime        (wall clock)    : 601.1ms ( -14) / 601.2ms ( -14) / 601.5ms ( -14)
      kernel runtime (wall clock)    : 333.0ms ( -14) / 353.7ms ( -13) / 366.0ms ( -14)

dph.quicksort.vectorised.par.N8
      runtime        (wall clock)    : 801.4ms ( -11) / 801.5ms ( -12) / 801.7ms ( -20)
      kernel runtime (wall clock)    : 468.0ms ( -11) / 478.3ms ( -12) / 484.0ms ( -22)

dph.quickhull.vectorised.par.N1
      runtime        (wall clock)    : 1.201s  ( -20) / 1.201s  ( -20) / 1.202s  ( -20)
      kernel runtime (wall clock)    : 723.0ms ( -33) / 724.4ms ( -33) / 727.0ms ( -32)

dph.quickhull.vectorised.par.N2
      runtime        (wall clock)    : 901.2ms ( -10) / 901.3ms ( -13) / 901.6ms ( -18)
      kernel runtime (wall clock)    : 473.0ms ( -27) / 515.8ms ( -25) / 546.0ms ( -25)

dph.quickhull.vectorised.par.N4
      runtime        (wall clock)    : 801.2ms (----) / 801.4ms ( -10) / 801.6ms ( -11)
      kernel runtime (wall clock)    : 378.0ms ( -28) / 397.3ms ( -30) / 424.0ms ( -31)

dph.quickhull.vectorised.par.N8
      runtime        (wall clock)    : 801.2ms ( -11) / 802.0ms ( -11) / 805.0ms ( -12)
      kernel runtime (wall clock)    : 377.0ms ( -31) / 387.7ms ( -33) / 396.0ms ( -35)

dph.quickhull.vectorised.seq.N4
      runtime        (wall clock)    : 1.001s  (  -9) / 1.001s  (  -9) / 1.001s  (  -9)
      kernel runtime (wall clock)    : 577.0ms ( -16) / 583.4ms ( -16) / 587.0ms ( -16)

dph.quickhull.vector-mutable.seq.N4
      runtime        (wall clock)    : 400.7ms ( -20) / 400.8ms ( -20) / 400.9ms ( -20)
      kernel runtime (wall clock)    : 50.00ms ( -41) / 54.20ms ( -37) / 58.00ms ( -33)

dph.quickhull.vector-forkIO.par.N4
      runtime        (wall clock)    : 400.8ms (----) / 400.9ms (----) / 401.1ms (----)
      kernel runtime (wall clock)    : 30.00ms ( -46) / 39.30ms ( -34) / 47.00ms ( -24)

dph.quickhull.vector-forkIO.par.N8
      runtime        (wall clock)    : 400.8ms (----) / 400.9ms (----) / 400.9ms (----)
      kernel runtime (wall clock)    : 37.00ms ( -34) / 39.20ms ( -38) / 42.00ms ( -42)

repa.laplace.par.N1
      runtime        (wall clock)    : 5.803s  ( -38) / 5.804s  ( -38) / 5.805s  ( -40)
      kernel runtime (wall clock)    : 3.349s  ( -51) / 3.373s  ( -51) / 3.381s  ( -51)

repa.laplace.par.N2
      runtime        (wall clock)    : 3.303s  ( -37) / 3.483s  ( -34) / 3.504s  ( -35)
      kernel runtime (wall clock)    : 2.018s  ( -48) / 2.090s  ( -47) / 2.100s  ( -47)

repa.laplace.par.N4
      runtime        (wall clock)    : 2.502s  ( -17) / 2.743s  (  -9) / 3.003s  (----)
      kernel runtime (wall clock)    : 1.668s  ( -17) / 1.935s  (  -4) / 2.167s  (  +7)

repa.laplace.par.N6
      runtime        (wall clock)    : 2.303s  ( -18) / 2.413s  ( -14) / 2.503s  ( -11)
      kernel runtime (wall clock)    : 1.741s  ( -19) / 1.800s  ( -17) / 1.858s  ( -16)

repa.laplace.par.N8
      runtime        (wall clock)    : 2.103s  ( -19) / 2.104s  ( -21) / 2.105s  ( -22)
      kernel runtime (wall clock)    : 1.546s  ( -27) / 1.564s  ( -26) / 1.584s  ( -28)

repa.blur.par.N1
      runtime        (wall clock)    : 900.8ms ( -69) / 930.9ms ( -68) / 1.001s  ( -68)
      kernel runtime (wall clock)    : 619.0ms ( -76) / 621.4ms ( -76) / 626.0ms ( -76)

repa.blur.par.N2
      runtime        (wall clock)    : 600.7ms ( -62) / 600.8ms ( -62) / 600.9ms ( -62)
      kernel runtime (wall clock)    : 360.0ms ( -74) / 362.4ms ( -74) / 363.0ms ( -74)

repa.blur.par.N4
      runtime        (wall clock)    : 400.6ms ( -56) / 400.7ms ( -56) / 400.8ms ( -56)
      kernel runtime (wall clock)    : 191.0ms ( -73) / 205.3ms ( -71) / 221.0ms ( -69)

repa.blur.par.N6
      runtime        (wall clock)    : 400.6ms ( -43) / 400.7ms ( -43) / 400.8ms ( -43)
      kernel runtime (wall clock)    : 161.0ms ( -67) / 163.6ms ( -67) / 168.0ms ( -66)

repa.blur.par.N8
      runtime        (wall clock)    : 300.6ms ( -50) / 330.7ms ( -45) / 401.0ms ( -34)
      kernel runtime (wall clock)    : 132.0ms ( -67) / 137.4ms ( -67) / 144.0ms ( -66)

repa.edgedetect.par.N1
      runtime        (wall clock)    : 400.6ms ( -20) / 400.7ms ( -20) / 400.8ms ( -20)
      kernel runtime (wall clock)    : 48.00ms ( -76) / 48.30ms ( -77) / 49.00ms ( -76)

repa.edgedetect.par.N2
      runtime        (wall clock)    : 300.5ms (----) / 300.6ms ( -23) / 300.8ms ( -25)
      kernel runtime (wall clock)    : 29.00ms ( -77) / 29.60ms ( -77) / 30.00ms ( -78)

repa.edgedetect.par.N4
      runtime        (wall clock)    : 300.6ms (----) / 300.7ms (----) / 300.9ms (----)
      kernel runtime (wall clock)    : 19.00ms ( -74) / 20.30ms ( -76) / 23.00ms ( -74)

repa.edgedetect.par.N6
      runtime        (wall clock)    : 300.5ms (----) / 300.6ms (----) / 300.6ms (----)
      kernel runtime (wall clock)    : 19.00ms ( -65) / 19.00ms ( -68) / 19.00ms ( -71)

repa.edgedetect.par.N8
      runtime        (wall clock)    : 200.4ms ( -33) / 200.5ms ( -33) / 200.6ms ( -33)
      kernel runtime (wall clock)    : 16.00ms ( -68) / 16.60ms ( -70) / 17.00ms ( -73)

repa.fft2d.par.N2
      runtime        (wall clock)    : 4.504s  ( -18) / 4.794s  ( -14) / 5.006s  ( -12)
      kernel runtime (wall clock)    : 4.017s  ( -18) / 4.298s  ( -14) / 4.511s  ( -13)

repa.fft2d.par.N4
      runtime        (wall clock)    : 3.003s  ( -19) / 3.063s  ( -17) / 3.104s  ( -16)
      kernel runtime (wall clock)    : 2.670s  ( -19) / 2.717s  ( -18) / 2.752s  ( -17)

repa.fft2d.par.N6
      runtime        (wall clock)    : 2.503s  ( -36) / 2.593s  ( -34) / 2.603s  ( -35)
      kernel runtime (wall clock)    : 2.254s  ( -38) / 2.271s  ( -38) / 2.291s  ( -37)

repa.fft2d.par.N8
      runtime        (wall clock)    : 2.404s  ( -43) / 2.475s  ( -42) / 2.605s  ( -40)
      kernel runtime (wall clock)    : 2.165s  ( -45) / 2.207s  ( -44) / 2.305s  ( -42)

repa.fft3d.par.N8
      runtime        (wall clock)    : 6.517s  ( -12) / 6.637s  ( -11) / 6.819s  (  -9)
      kernel runtime (wall clock)    : 5.581s  (  -9) / 5.680s  (  -9) / 5.881s  (  -7)

noslow.dph-prim.seq.Double.axpy
      kernel runtime (wall clock)    : 82.32us ( -10) / 82.34us ( -10) / 82.35us ( -10)

noslow.vector.Primitive.Double.scale_r
      kernel runtime (wall clock)    : 61.43us ( -11) / 61.44us ( -11) / 61.45us ( -11)

noslow.vector.Primitive.Double.axpy
      kernel runtime (wall clock)    : 82.09us ( -10) / 82.11us ( -10) / 82.13us ( -10)

-- LOSERS  (had a swing of > +10%)
dph.dotp.vectorised.par.N1
      runtime        (wall clock)    : 2.502s  ( +14) / 2.502s  ( +14) / 2.502s  ( +14)
      kernel runtime (wall clock)    : 48.00ms ( -13) / 48.00ms ( -14) / 48.00ms ( -14)

dph.dotp.vectorised.par.N2
      runtime        (wall clock)    : 2.501s  ( +14) / 2.502s  ( +14) / 2.503s  ( +14)
      kernel runtime (wall clock)    : 24.00ms ( -11) / 34.40ms (----) / 43.00ms (  -2)

dph.dotp.vectorised.par.N4
      runtime        (wall clock)    : 2.502s  (  +9) / 2.562s  ( +11) / 2.603s  ( +13)
      kernel runtime (wall clock)    : 22.00ms (----) / 27.50ms (----) / 41.00ms ( +32)

dph.dotp.vector.seq.N4
      runtime        (wall clock)    : 2.502s  (  +9) / 2.512s  (  +9) / 2.602s  ( +13)
      kernel runtime (wall clock)    : 53.00ms (  -9) / 53.50ms ( -10) / 55.00ms ( -14)

dph.evens.vectorised.par.N1
      runtime        (wall clock)    : 600.8ms ( +20) / 600.9ms ( +20) / 601.0ms ( +20)
      kernel runtime (wall clock)    : 205.0ms ( +13) / 205.2ms ( +12) / 207.0ms ( +12)

dph.evens.vectorised.par.N2
      runtime        (wall clock)    : 500.8ms ( +25) / 500.9ms ( +25) / 501.0ms ( +25)
      kernel runtime (wall clock)    : 114.0ms ( +13) / 118.3ms ( +11) / 124.0ms ( +12)

dph.evens.vectorised.par.N4
      runtime        (wall clock)    : 400.8ms (----) / 420.9ms (  +5) / 501.0ms ( +25)
      kernel runtime (wall clock)    : 81.00ms ( +13) / 87.90ms ( +10) / 94.00ms ( +11)

dph.evens.vectorised.seq.N4
      runtime        (wall clock)    : 500.7ms (----) / 520.9ms (  +4) / 601.1ms ( +20)
      kernel runtime (wall clock)    : 191.0ms ( +19) / 191.8ms ( +10) / 194.0ms (  +2)

repa.mmult.par.N1
      runtime        (wall clock)    : 16.51s  ( +92) / 16.52s  ( +92) / 16.62s  ( +89)
      kernel runtime (wall clock)    : 16.22s  ( +92) / 16.26s  ( +92) / 16.32s  ( +92)

repa.mmult.par.N2
      runtime        (wall clock)    : 8.304s  ( +93) / 8.468s  ( +94) / 8.710s  ( +98)
      kernel runtime (wall clock)    : 8.080s  ( +91) / 8.219s  ( +93) / 8.425s  ( +98)

repa.mmult.par.N4
      runtime        (wall clock)    : 4.303s  (+126) / 4.305s  (+126) / 4.305s  (+126)
      kernel runtime (wall clock)    : 4.046s  (+126) / 4.060s  (+126) / 4.066s  (+127)

repa.mmult.par.N8
      runtime        (wall clock)    : 2.303s  ( +91) / 2.342s  ( +91) / 2.429s  ( +84)
      kernel runtime (wall clock)    : 2.033s  ( +88) / 2.074s  ( +89) / 2.177s  ( +85)

repa.fft3d.par.N4
      runtime        (wall clock)    : 10.11s  ( +26) / 10.14s  ( +27) / 10.31s  ( +29)
      kernel runtime (wall clock)    : 8.560s  ( +38) / 8.609s  ( +39) / 8.687s  ( +40)

noslow.list.*Double.count_filter
      kernel runtime (wall clock)    : 241.5us ( +11) / 242.4us ( +11) / 243.1us ( +11)

noslow.dph-prim.seq.Double.filterin_r
      kernel runtime (wall clock)    : 48.33us ( +31) / 48.43us ( +32) / 48.52us ( +32)

noslow.vector.Unboxed.Double.filterin_r
      kernel runtime (wall clock)    : 46.75us ( +35) / 46.78us ( +35) / 46.81us ( +35)




_______________________________________________
Cvs-ghc mailing list
cvs-ghc@haskell.org
http://www.haskell.org/mailman/listinfo/cvs-ghc

Reply via email to