Other pages


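mflop6.f Benchmark Results, Summary

(All runs except the first were compiled with -mips4; the flag is omitted from the table below for brevity.)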

options                                                         Mfl/s
---------------------------------------------------------------------
-O2 -mips2                                                       26.4
-O2                                                              31.7
-O3 -lfastm                                                      78.6
-O3 -OPT:round=3 -lfastm                                        104.2
-O3 -OPT:round=3:IEEE_ar=3 -lfastm                              131.2
-O3 -OPT:round=3:IEEE_ar=3:fast_sq=ON -lfastm                   146.1
-O3 -OPT:round=3:IEEE_ar=3:fast_sq=ON -GCM:array_sp=ON -lfastm  146.4

Detailed results

corona:mflop/mflop6> f77 -O2 -mips2 mflop6.f
corona:mflop/mflop6> a.out

  112 Mflops, vector length   10000:   4.27 sec  26.25 Mfl
  131 Mflops, vector length     100:   5.18 sec  25.34 Mfl
  131 Mflops, vector length    1000:   4.98 sec  26.36 Mfl
  131 Mflops, vector length   10000:   4.97 sec  26.42 Mfl
  131 Mflops, vector length  100000:   4.95 sec  26.49 Mfl
  131 Mflops, vector length 1000000:   9.37 sec  14.02 Mfl
                  OP/LEN:     100    1000   10000  100000 1000000
                      a=b   44.89   48.84   48.64   42.98    7.48
                   a=a*cc   36.09   37.02   37.19   36.93   18.65
                    a=a*d   29.07   29.62   29.73   29.50    9.43
                    a=b+c   24.48   24.74   24.78   24.02    6.44
                 a=a+b*cc   37.10   37.19   37.23   37.81   18.31
              am=am+bm*cc   30.88   37.13   37.21   36.77   18.35
                  a=a+b*c   32.91   33.03   33.03   32.83   13.46
                sm=sm+b*c    8.13    8.92    8.96    9.10    8.02
              a=(a+b*c)/d   19.00   19.13   19.15   18.44   10.77
        a=(a+b*c)/(b+a*c)   30.16   30.36   30.44   30.98   34.73
   a=(aa+b*(bb+b*(cc+b)))   44.33   45.01   45.16   46.66   52.15
 a=(aa+b1*(bb+b1*(cc+b1))   44.29   45.02   45.10   46.20   62.99
 a=(aa+sqrt(amax1(0.,b)))   27.98   28.01   28.04   29.41   26.57
      a=(aa+sqrt(b)) [if]   20.87   20.88   20.91   22.21   20.92


corona:mflop/mflop6> f77 -O2 -mips4 mflop6.f
corona:mflop/mflop6> a.out

  112 Mflops, vector length   10000:   3.54 sec  31.61 Mfl
  158 Mflops, vector length     100:   5.29 sec  29.88 Mfl
  158 Mflops, vector length    1000:   5.01 sec  31.55 Mfl
  158 Mflops, vector length   10000:   4.99 sec  31.67 Mfl
  158 Mflops, vector length  100000:   5.03 sec  31.40 Mfl
  158 Mflops, vector length 1000000:  10.63 sec  14.86 Mfl
                  OP/LEN:     100    1000   10000  100000 1000000
                      a=b   33.81   36.75   36.72   34.60    7.63
                   a=a*cc   24.22   24.15   24.15   24.29   14.77
                    a=a*d   21.21   21.25   21.25   21.26    8.53
                    a=b+c   21.05   21.24   21.27   20.96    6.31
                 a=a+b*cc   42.38   42.51   42.53   42.78   18.76
              am=am+bm*cc   29.47   42.20   42.51   41.61   18.75
                  a=a+b*c   34.98   36.87   37.17   36.23   12.95
                sm=sm+b*c   26.38   35.72   37.10   36.97   18.91
              a=(a+b*c)/d   20.28   20.27   20.32   19.53   13.37
        a=(a+b*c)/(b+a*c)   33.83   33.86   33.97   34.58   22.54
   a=(aa+b*(bb+b*(cc+b)))   52.88   53.17   53.26   54.28   33.72
 a=(aa+b1*(bb+b1*(cc+b1))   52.89   53.18   53.19   54.00   38.73
 a=(aa+sqrt(amax1(0.,b)))   49.55   49.64   49.60   49.63   48.77
      a=(aa+sqrt(b)) [if]   23.75   23.80   23.78   23.98   28.23


corona:mflop/mflop6> f77 -O3 -mips4 mflop6.f -lfastm
corona:mflop/mflop6> a.out

  112 Mflops, vector length   10000:   1.46 sec  76.63 Mfl
  383 Mflops, vector length     100:   5.96 sec  64.33 Mfl
  383 Mflops, vector length    1000:   4.93 sec  77.67 Mfl
  383 Mflops, vector length   10000:   4.87 sec  78.62 Mfl
  383 Mflops, vector length  100000:   5.27 sec  72.75 Mfl
  383 Mflops, vector length 1000000:  11.95 sec  32.06 Mfl
                  OP/LEN:     100    1000   10000  100000 1000000
                      a=b   71.08   85.57   84.19   77.61   32.59
                   a=a*cc  132.00  132.04  130.40  108.18   33.74
                    a=a*d  132.00  132.10  130.32  106.18   30.15
                    a=b+c   71.48   84.43   84.71   79.77   40.81
                 a=a+b*cc  137.07  136.89  133.93  110.41   26.44
              am=am+bm*cc   37.18   69.93   78.30   78.54   65.49
                  a=a+b*c  185.80  183.41  166.00   83.63   23.58
                sm=sm+b*c   39.53  116.01  144.28  146.50   24.50
              a=(a+b*c)/d   37.24   37.20   36.95   34.09   18.10
        a=(a+b*c)/(b+a*c)   20.71   20.71   20.66   20.79   17.36
   a=(aa+b*(bb+b*(cc+b)))  183.83  239.31  246.05  249.17   54.06
 a=(aa+b1*(bb+b1*(cc+b1))  178.00  238.72  246.41  247.08   58.70
 a=(aa+sqrt(amax1(0.,b)))   88.65   91.34   91.65   91.72   60.62
      a=(aa+sqrt(b)) [if]   82.89   87.59   88.14   87.90   57.38


corona:mflop/mflop6> f77 -O3 -mips4 -OPT:roundoff=3 mflop6.f -lfastm
corona:mflop/mflop6> a.out

  112 Mflops, vector length   10000:   1.09 sec 103.08 Mfl
  515 Mflops, vector length     100:   6.08 sec  84.74 Mfl
  515 Mflops, vector length    1000:   5.05 sec 102.16 Mfl
  515 Mflops, vector length   10000:   4.95 sec 104.20 Mfl
  515 Mflops, vector length  100000:   5.01 sec 102.78 Mfl
  515 Mflops, vector length 1000000:  14.01 sec  36.78 Mfl
                  OP/LEN:     100    1000   10000  100000 1000000
                      a=b  168.70  194.09  195.44  180.10   31.70
                   a=a*cc  126.51  145.82  148.21  148.63   68.99
                    a=a*d   88.20   93.75   94.08   93.79   34.59
                    a=b+c  133.88  147.14  148.24  144.71   27.03
                 a=a+b*cc  175.13  188.08  189.17  189.25   54.40
              am=am+bm*cc   49.13   88.60   97.26   96.60   22.69
                  a=a+b*c  162.83  183.62  185.35  181.63   39.32
                sm=sm+b*c   55.15  127.12  145.51  145.53   23.97
              a=(a+b*c)/d   33.82   34.32   34.30   33.33   25.31
        a=(a+b*c)/(b+a*c)   55.22   56.34   56.47   56.58   35.08
   a=(aa+b*(bb+b*(cc+b)))  184.96  239.70  246.79  248.02   51.79
 a=(aa+b1*(bb+b1*(cc+b1))  172.08  237.26  245.99  244.43   55.16
 a=(aa+sqrt(amax1(0.,b)))   88.51   91.22   91.44   89.97   61.15
      a=(aa+sqrt(b)) [if]   83.06   87.60   88.00   87.55   57.79


corona:mflop/mflop6> f77 -O3 -mips4 \
    -OPT:roundoff=3:IEEE_arithm=3 mflop6.f -lfastm
corona:mflop/mflop6> a.out

  112 Mflops, vector length   10000:   0.87 sec 129.39 Mfl
  646 Mflops, vector length     100:   6.37 sec 101.55 Mfl
  646 Mflops, vector length    1000:   5.06 sec 127.77 Mfl
  646 Mflops, vector length   10000:   4.93 sec 131.20 Mfl
  646 Mflops, vector length  100000:   5.03 sec 128.63 Mfl
  646 Mflops, vector length 1000000:  17.41 sec  37.15 Mfl
                  OP/LEN:     100    1000   10000  100000 1000000
                      a=b  169.14  194.56  195.50  181.51   29.71
                   a=a*cc  126.57  146.22  148.36  147.51   63.26
                    a=a*d   88.24   93.98   94.49   92.70   30.74
                    a=b+c  121.81  133.24  134.04  125.39   23.58
                 a=a+b*cc  175.08  188.11  189.05  183.46   51.59
              am=am+bm*cc   49.11   88.64   97.31   96.17   22.52
                  a=a+b*c  162.85  183.71  185.83  175.49   37.16
                sm=sm+b*c   55.19  127.08  145.67  145.39   23.80
              a=(a+b*c)/d  118.30  126.43  127.27  118.62   33.66
        a=(a+b*c)/(b+a*c)   90.42   92.76   93.04   92.97   56.01
   a=(aa+b*(bb+b*(cc+b)))  181.01  238.58  246.45  247.57   50.64
 a=(aa+b1*(bb+b1*(cc+b1))  171.96  236.86  245.91  244.70   53.16
 a=(aa+sqrt(amax1(0.,b)))   88.60   91.10   91.67   92.32   61.23
      a=(aa+sqrt(b)) [if]   83.11   87.29   88.06   89.17   58.04

corona:mflop/mflop6> f77 -O3 -mips4 \
    -OPT:roundoff=3:IEEE_arithm=3:FAST_sq=ON mflop6.f -lfastm
corona:mflop/mflop6> a.out

  112 Mflops, vector length   10000:   0.78 sec 144.00 Mfl
  720 Mflops, vector length     100:   6.53 sec 110.33 Mfl
  720 Mflops, vector length    1000:   5.06 sec 142.20 Mfl
  720 Mflops, vector length   10000:   4.93 sec 146.13 Mfl
  720 Mflops, vector length  100000:   5.01 sec 143.84 Mfl
  720 Mflops, vector length 1000000:  18.54 sec  38.83 Mfl
                  OP/LEN:     100    1000   10000  100000 1000000
                      a=b  169.21  194.66  195.02  183.89   29.32
                   a=a*cc  124.79  145.79  147.78  147.79   61.58
                    a=a*d   87.72   93.89   94.28   93.31   29.83
                    a=b+c  133.31  147.12  147.85  138.99   22.83
                 a=a+b*cc  175.87  187.89  188.12  186.75   63.36
              am=am+bm*cc   49.56   88.65   97.28   96.52   22.92
                  a=a+b*c  162.39  183.69  185.07  180.44   46.51
                sm=sm+b*c   55.38  127.13  145.74  146.00   24.13
              a=(a+b*c)/d  118.61  126.44  126.83  120.42   42.17
        a=(a+b*c)/(b+a*c)   90.61   92.78   92.95   93.73   51.66
   a=(aa+b*(bb+b*(cc+b)))  179.04  237.42  245.40  248.46   50.64
 a=(aa+b1*(bb+b1*(cc+b1))  171.80  236.40  245.58  246.85   52.80
 a=(aa+sqrt(amax1(0.,b)))  157.95  167.70  167.60  161.44   70.29
      a=(aa+sqrt(b)) [if]  147.25  166.59  168.88  170.48   68.93


corona:mflop/mflop6> f77 -O3 -mips4 \
    -OPT:roundoff=3:IEEE_arithm=3:FAST_sq=ON \
    -GCM:array_speculation=ON mflop6.f -lfastm
corona:mflop/mflop6> a.out

  112 Mflops, vector length   10000:   0.78 sec 144.36 Mfl
  721 Mflops, vector length     100:   6.55 sec 110.18 Mfl
  721 Mflops, vector length    1000:   5.07 sec 142.29 Mfl
  721 Mflops, vector length   10000:   4.93 sec 146.45 Mfl
  721 Mflops, vector length  100000:   5.01 sec 144.08 Mfl
  721 Mflops, vector length 1000000:  18.51 sec  39.00 Mfl
                  OP/LEN:     100    1000   10000  100000 1000000
                      a=b  168.27  194.51  195.98  181.40   29.39
                   a=a*cc  124.96  146.01  148.34  147.12   60.53
                    a=a*d   88.15   93.89   94.46   92.90   29.91
                    a=b+c  132.17  147.25  148.11  141.99   22.86
                 a=a+b*cc  176.67  188.10  189.22  188.60   63.69
              am=am+bm*cc   49.61   88.70   97.27   96.98   23.13
                  a=a+b*c  161.97  183.72  185.81  181.10   46.64
                sm=sm+b*c   54.87  127.10  145.64  146.54   24.48
              a=(a+b*c)/d  118.61  126.28  127.09  121.07   42.22
        a=(a+b*c)/(b+a*c)   90.68   92.57   93.00   92.98   51.83
   a=(aa+b*(bb+b*(cc+b)))  179.01  237.58  246.12  245.99   50.79
 a=(aa+b1*(bb+b1*(cc+b1))  171.19  236.87  246.47  244.19   53.20
 a=(aa+sqrt(amax1(0.,b)))  157.73  168.45  167.68  164.69   70.61
      a=(aa+sqrt(b)) [if]  147.84  167.46  169.75  170.98   69.47