#!RS6000-590 Workstation ##Parkbench (LOWLEV_1.0), ##07/SEP/1994, ##at Old Dominion University, Norfolk, Virginia, USA #*name: Roger Hockney #*establishment: University of Southampton #*email: rwh@pac.soton.ac.uk #telephone: 0635 578679 #date sent: 01/11/94 #*date benchmarked: 07/SEP/1994 #*benchmark suite and revision: Parkbench (LOWLEV_1.0) #*message passing library and revision: N/A #*benchmark: RINF1 #*problem size (if applicable): N/A #*number of nodes: 1 #*file number if one of a group: 1 of 1 #*manufacturer: IBM #*model number: RS6000-590 Workstation #cpu: Power-2 #cpu speed (MHz): 66MHz #fpu: integrated #primary cache: #secondary cache: #other cache: #memory: #disk and connection: #interconnect type: #switching: #other hardware: #operating system and version: AIX 3.2.5 #compilers, libraries and versions: f77 #compiler switches: -O2 #additional tuning parameters: none #other software: #additional comments: Benchmarks performed on a workstation # at Old Dominion University, Norfolk, Virginia, USA # in the Center for Coastal Physical Oceanography (CCPO). # There were no other users during the measurements. # ================================================= # === === # === PARKBENCH Parallel Benchmarks === # === === # === RINF1 === # === === # === Program: R-infinity and N-half === # === Version: Standard Fortran 77 === # === Author: Roger Hockney === # === Update: November 1993; Release: 1.0 === # === === # ================================================= # This run started Wed Sep 7 09:39:04 1994 # # Run on single IBM RS/6000 Model 590 # at Old Dominion University, VA, USA (CCPO) # Software levels are AIX 3.2.5 # # Contact: Roger Hockney, rwh@pac.soton.ac.uk # # # # (1) CONTIGUOUS DYADS: A(I)=B(I)*C(I) # # ICASE= 1 NCASE= 17 NMAX=100000 NTIMES= 100000 # # # SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) # vlen sec Mflop/s vlen % sec Mflop/s 1 1 4.448767E-08 .000000 .000 .000 100000 .444877E-02 22.478136 2 2 9.008127E-08 21.932903 -.024 .000 50000 .450406E-02 22.202173 3 3 1.366439E-07 21.702271 -.038 .167 33333 .455475E-02 21.954872 4 4 1.624064E-07 24.980089 .208 3.401 25000 .406016E-02 24.629572 5 5 2.115584E-07 24.602268 .175 2.371 20000 .423117E-02 23.634136 6 6 2.527435E-07 24.450335 .159 1.822 16666 .421222E-02 23.739479 7 7 3.140995E-07 23.158207 .010 2.316 14285 .448691E-02 22.285929 8 8 3.774054E-07 21.829712 -.163 2.888 12500 .471757E-02 21.197363 9 9 4.385247E-07 20.808990 -.311 3.094 11111 .487245E-02 20.523357 10 10 4.980992E-07 20.068892 -.430 3.076 10000 .498099E-02 20.076323 11 20 1.101414E-06 17.885092 -.920 2.244 5000 .550707E-02 18.158470 12 30 1.693993E-06 17.300961 -1.078 1.547 3333 .564608E-02 17.709633 13 40 2.308198E-06 17.003366 -1.175 1.183 2500 .577050E-02 17.329533 14 50 2.910464E-06 16.872023 -1.226 .939 2000 .582093E-02 17.179392 15 60 3.493647E-06 16.847479 -1.238 .758 1666 .582042E-02 17.174030 16 70 4.117333E-06 16.781881 -1.274 .646 1428 .587955E-02 17.001295 17 80 4.720230E-06 16.740236 -1.302 .560 1250 .590029E-02 16.948326 18 90 5.292587E-06 16.747078 -1.296 .486 1111 .588006E-02 17.004917 19 100 5.928192E-06 16.714243 -1.325 .437 1000 .592819E-02 16.868549 20 200 1.196339E-05 16.641666 -1.428 222.200 500 .598170E-02 16.717667 24 600 3.593407E-05 .000000 .000 .000 166 .596506E-02 16.697247 25 700 4.213904E-05 16.116116 -20.882 .000 142 .598374E-02 16.611673 26 800 4.788633E-05 16.733232 2.570 .225 125 .598579E-02 16.706228 27 900 5.421204E-05 16.506773 -6.488 .221 111 .601754E-02 16.601479 28 1000 6.023936E-05 16.478924 -7.658 .179 100 .602394E-02 16.600443 29 2000 1.204992E-04 16.563593 -3.672 .089 50 .602496E-02 16.597620 30 3000 1.819462E-04 16.460030 -9.224 .119 33 .600422E-02 16.488392 31 4000 2.444698E-04 16.344690 -16.425 .196 25 .611174E-02 16.361942 32 5000 3.076608E-04 16.241646 -23.957 .251 20 .615322E-02 16.251663 33 6000 3.902560E-04 15.669094 -72.759 1.338 16 .624410E-02 15.374523 34 7000 5.691977E-04 13.606360 -276.958 5.248 14 .796877E-02 12.298012 35 8000 6.708267E-04 12.553591 -399.009 5.538 12 .804992E-02 11.925584 36 9000 7.406778E-04 12.145282 -454.240 5.109 11 .814746E-02 12.151032 37 10000 8.260352E-04 11.914273 -490.298 4.545 10 .826035E-02 12.106022 38 20000 1.648077E-03 11.856379 -504.829 2.203 5 .824038E-02 12.135357 39 30000 2.451883E-03 11.979824 -466.627 1.451 3 .735565E-02 12.235496 40 40000 3.250048E-03 12.093115 -424.242 1.091 2 .650010E-02 12.307510 41 50000 4.048512E-03 12.174232 -387.790 .878 2 .809702E-02 12.350217 42 60000 4.915968E-03 12.151614 -399.903 .707 1 .491597E-02 12.205124 43 70000 5.666560E-03 12.206128 -365.403 .628 1 .566656E-02 12.353173 44 80000 6.532096E-03 12.200510 -369.560 .532 1 .653210E-02 12.247218 45 90000 7.348224E-03 12.199494 -370.430 .462 1 .734822E-02 12.247857 46 100000 8.162560E-03 12.201455 -368.505 .407 1 .816256E-02 12.251059 (2) DYADS, STRIDE=8: A(I)=B(I)*C(I) ICASE= 2 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 1.107610E-07 .000000 .000 .000 100000 .110761E-01 9.028452 2 2 8.929791E-08 -46.591698 -6.161 111.100 50000 .446490E-02 22.396942 3 3 1.367975E-07 .000000 .000 .000 33333 .455987E-02 21.930222 4 4 1.662567E-07 33.945332 1.644 .000 25000 .415642E-02 24.059187 5 5 2.093312E-07 27.573402 .709 1.533 20000 .418662E-02 23.885595 6 6 2.569370E-07 24.783585 .267 1.809 16666 .428211E-02 23.352030 7 7 3.171819E-07 22.150890 -.187 2.508 14285 .453094E-02 22.069353 8 8 3.775488E-07 20.538244 -.488 2.670 12500 .471936E-02 21.189314 9 9 4.378105E-07 19.532969 -.693 2.594 11111 .486451E-02 20.556841 10 10 4.981760E-07 18.866585 -.840 2.435 10000 .498176E-02 20.073227 11 20 1.102182E-06 17.211866 -1.302 222.200 5000 .551091E-02 18.145817 15 60 3.506093E-06 .000000 .000 .000 1666 .584115E-02 17.113064 16 70 4.120381E-06 16.279016 -2.924 .000 1428 .588390E-02 16.988720 17 80 4.723507E-06 16.428270 -2.370 .056 1250 .590438E-02 16.936567 18 90 5.296504E-06 16.738203 -1.157 .199 1111 .588442E-02 16.992342 19 100 5.995776E-06 16.245667 -3.183 .455 1000 .599578E-02 16.678408 20 200 1.206118E-05 16.355740 -2.674 .212 500 .603059E-02 16.582121 21 300 1.804915E-05 16.482347 -2.004 .186 333 .601037E-02 16.621279 22 400 2.423603E-05 16.430975 -2.321 .152 250 .605901E-02 16.504351 23 500 3.085568E-05 16.218304 -3.859 .433 200 .617114E-02 16.204472 24 600 3.939162E-05 15.548429 -9.516 1.583 166 .653901E-02 15.231668 25 700 1.273402E-04 7.846605 -85.242 15.100 142 .180823E-01 5.497087 26 800 3.837256E-04 3.309307 -143.181 18.161 125 .479657E-01 2.084823 27 900 5.295671E-04 2.235820 -164.762 18.042 111 .587820E-01 1.699501 28 1000 6.184141E-04 1.835502 -177.338 17.306 100 .618414E-01 1.617040 29 2000 1.235169E-03 1.565664 -202.436 8.904 50 .617585E-01 1.619211 30 3000 1.847808E-03 1.530215 -207.303 5.785 33 .609777E-01 1.623545 31 4000 2.464338E-03 1.535439 -206.321 4.209 25 .616084E-01 1.623154 32 5000 3.079795E-03 1.546273 -203.644 3.281 20 .615959E-01 1.623484 33 6000 3.701216E-03 1.555263 -200.811 2.667 16 .592195E-01 1.621089 34 7000 4.312247E-03 1.563968 -197.407 2.245 14 .603715E-01 1.623284 35 8000 4.934229E-03 1.570350 -194.378 1.924 12 .592108E-01 1.621327 36 9000 5.578985E-03 1.573052 -192.851 1.665 11 .613688E-01 1.613197 37 10000 6.180070E-03 1.577351 -190.004 1.479 10 .618007E-01 1.618105 (3) CONTIGUOUS TRIADS: A(I)=B(I)*C(I)+D(I) ICASE= 3 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 3.000192E-08 .000000 .000 .000 100000 .600038E-02 33.331203 2 2 6.011648E-08 33.206520 -.004 .000 50000 .601165E-02 33.268745 3 3 8.296787E-08 37.760109 .179 2.063 33333 .553114E-02 36.158577 4 4 1.045862E-07 40.550785 .315 2.131 25000 .522931E-02 38.245949 5 5 1.132736E-07 47.390419 .705 4.779 20000 .453094E-02 44.140911 6 6 1.284224E-07 51.991096 1.000 4.799 16666 .428058E-02 46.720818 7 7 1.435553E-07 55.163952 1.224 4.445 14285 .410138E-02 48.761684 8 8 1.587098E-07 57.408413 1.396 4.030 12500 .396774E-02 50.406479 9 9 1.738616E-07 59.041779 1.531 3.636 11111 .386355E-02 51.765320 10 10 1.890048E-07 60.262806 1.638 3.286 10000 .378010E-02 52.908707 11 20 3.372544E-07 64.335930 2.082 2.031 5000 .337254E-02 59.302414 12 30 4.920300E-07 65.106781 2.176 1.351 3333 .327987E-02 60.971893 13 40 6.370304E-07 65.905807 2.285 1.048 2500 .318515E-02 62.791348 14 50 7.968640E-07 65.725784 2.257 .812 2000 .318746E-02 62.745968 15 60 9.367203E-07 66.114540 2.325 .702 1666 .312115E-02 64.053268 16 70 1.086745E-06 66.318329 2.365 .600 1428 .310374E-02 64.412529 17 80 1.250099E-06 66.136658 2.325 .522 1250 .312525E-02 63.994919 18 90 1.386225E-06 66.312698 2.368 .478 1111 .308019E-02 64.924522 19 100 1.536384E-06 66.422821 2.399 .429 1000 .307277E-02 65.087891 20 200 3.040256E-06 66.525887 2.441 .214 500 .304026E-02 65.783936 21 300 4.543423E-06 66.553329 2.455 .140 333 .302592E-02 66.029510 22 400 6.044672E-06 66.569061 2.464 .103 250 .302234E-02 66.173981 23 500 7.550080E-06 66.559723 2.458 .081 200 .302003E-02 66.224464 24 600 9.052531E-06 66.555923 2.454 .066 166 .300544E-02 66.279808 25 700 1.055369E-05 66.557587 2.456 .055 142 .299725E-02 66.327515 26 800 1.191834E-05 66.835060 2.767 .193 125 .297958E-02 67.123466 27 900 1.357146E-05 66.730545 2.632 .183 111 .301286E-02 66.315643 28 1000 1.505664E-05 66.688026 2.569 .165 100 .301133E-02 66.415886 29 2000 3.108608E-05 65.289375 -.887 222.200 50 .310861E-02 64.337479 33 6000 2.980240E-04 .000000 .000 .000 16 .953677E-02 20.132607 34 7000 3.486354E-04 19.758389 -111.526 .000 14 .976179E-02 20.078281 35 8000 3.853227E-04 22.909853 880.853 .852 12 .924774E-02 20.761818 36 9000 4.390167E-04 21.754953 500.378 .807 11 .965837E-02 20.500357 37 10000 4.950528E-04 20.642441 116.821 .954 10 .990106E-02 20.199867 38 20000 9.597951E-04 21.137224 307.380 .477 5 .959795E-02 20.837780 39 30000 1.471957E-03 20.537327 45.592 .555 3 .883174E-02 20.381025 40 40000 1.921536E-03 20.794706 176.103 .509 2 .768614E-02 20.816679 41 50000 2.395200E-03 20.903233 240.229 .420 2 .958080E-02 20.875082 42 60000 2.890112E-03 20.866943 215.363 .337 1 .578022E-02 20.760441 43 70000 3.345792E-03 20.930500 265.480 .308 1 .669158E-02 20.921803 44 80000 3.858560E-03 20.868681 209.925 .292 1 .771712E-02 20.733124 45 90000 4.365312E-03 20.779663 119.576 .332 1 .873062E-02 20.617083 46 100000 4.855168E-03 20.716179 47.415 .334 1 .971034E-02 20.596609 (4) TRIADS, STRIDE=8: A(I)=B(I)*C(I)+D(I) ICASE= 4 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 3.052032E-08 .000000 .000 .000 100000 .610406E-02 32.765057 2 2 5.987840E-08 34.062168 .040 .000 50000 .598784E-02 33.401024 3 3 8.094417E-08 39.663769 .265 2.415 33333 .539622E-02 37.062584 4 4 1.110886E-07 38.055988 .187 1.757 25000 .555443E-02 36.007282 5 5 1.127680E-07 46.359486 .664 6.102 20000 .451072E-02 44.338821 6 6 1.284915E-07 51.571503 1.001 5.924 16666 .428288E-02 46.695679 7 7 1.435643E-07 55.098362 1.252 5.392 14285 .410163E-02 48.758636 8 8 1.587302E-07 57.525558 1.439 4.823 12500 .396826E-02 50.399971 9 9 1.723294E-07 59.616367 1.613 4.414 11111 .382950E-02 52.225567 10 10 1.873664E-07 61.091820 1.744 3.983 10000 .374733E-02 53.371365 11 20 3.412480E-07 63.847923 2.045 2.193 5000 .341248E-02 58.608398 12 30 4.878824E-07 65.471848 2.243 1.543 3333 .325222E-02 61.490227 13 40 6.449664E-07 65.489571 2.245 1.121 2500 .322483E-02 62.018734 14 50 7.882240E-07 65.974037 2.320 .914 2000 .315290E-02 63.433746 15 60 9.491669E-07 65.805672 2.291 .739 1666 .316262E-02 63.213329 16 70 1.089076E-06 66.071968 2.343 .646 1428 .311040E-02 64.274696 17 80 1.238938E-06 66.235107 2.379 .563 1250 .309734E-02 64.571457 18 90 1.404889E-06 66.051727 2.334 .503 1111 .312166E-02 64.061989 19 100 1.539072E-06 66.204094 2.376 .465 1000 .307814E-02 64.974213 20 200 3.109120E-06 65.434967 2.057 .328 500 .310912E-02 64.326881 21 300 4.708709E-06 64.567093 1.623 .345 333 .313600E-02 63.711735 22 400 6.201856E-06 64.679321 1.690 .259 250 .310093E-02 64.496826 23 500 9.343360E-06 58.557983 -2.639 222.200 200 .373734E-02 53.513939 27 900 3.430031E-04 .000000 .000 .000 111 .761467E-01 2.623883 28 1000 3.828185E-04 2.511587 -38.518 .000 100 .765637E-01 2.612204 29 2000 7.634662E-04 2.620586 .936 .089 50 .763466E-01 2.619631 30 3000 1.145309E-03 2.620075 .710 .051 33 .755904E-01 2.619380 31 4000 1.527997E-03 2.618210 -.290 .039 25 .763999E-01 2.617805 32 5000 1.907898E-03 2.620206 .990 .037 20 .763159E-01 2.620686 33 6000 2.291864E-03 2.618861 -.021 .034 16 .733396E-01 2.617956 34 7000 2.672283E-03 2.619261 .325 .028 14 .748239E-01 2.619483 35 8000 3.057120E-03 2.617912 -1.002 .032 12 .733709E-01 2.616842 36 9000 3.466554E-03 2.606264 -13.839 .214 11 .762642E-01 2.596238 37 10000 3.861069E-03 2.596623 -25.630 .263 10 .772214E-01 2.589956 (5) RANDOM SCATTER/GATHER: ICASE= 5 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 1.053850E-07 .000000 .000 .000 100000 .210770E-01 9.489019 2 2 1.500774E-07 22.375130 1.358 .000 50000 .150077E-01 13.326453 3 3 2.026926E-07 20.553377 1.139 .921 33333 .135127E-01 14.800739 4 4 2.552371E-07 19.913511 1.052 .845 25000 .127619E-01 15.671701 5 5 3.089088E-07 19.523344 .992 .775 20000 .123564E-01 16.186007 6 6 3.616964E-07 19.330654 .959 .665 16666 .120561E-01 16.588499 7 7 4.136591E-07 19.253559 .944 .554 14285 .118182E-01 16.922146 8 8 4.645273E-07 19.254625 .945 .461 12500 .116132E-01 17.221806 9 9 5.200295E-07 19.167368 .925 .428 11111 .115561E-01 17.306709 10 10 5.738496E-07 19.090431 .907 .406 10000 .114770E-01 17.426168 11 20 1.100698E-06 18.993513 .877 .217 5000 .110070E-01 18.170294 12 30 1.624982E-06 19.000427 .880 .141 3333 .108321E-01 18.461746 13 40 2.151680E-06 18.999376 .879 .102 2500 .107584E-01 18.590124 14 50 2.678144E-06 18.998518 .879 .079 2000 .107126E-01 18.669645 15 60 3.204994E-06 18.996689 .878 .064 1666 .106790E-01 18.720783 16 70 3.739697E-06 18.976562 .866 .070 1428 .106806E-01 18.718092 17 80 4.258201E-06 18.982323 .870 .061 1250 .106455E-01 18.787275 18 90 4.784734E-06 18.985785 .872 .054 1111 .106317E-01 18.809822 19 100 5.315072E-06 18.983295 .870 .048 1000 .106301E-01 18.814421 20 200 1.058176E-05 18.982876 .870 .023 500 .105818E-01 18.900448 21 300 1.584778E-05 18.984270 .872 .015 333 .105546E-01 18.930092 22 400 2.116198E-05 18.960081 .824 .034 250 .105810E-01 18.901819 23 500 2.638144E-05 18.972246 .853 .033 200 .105526E-01 18.952719 24 600 3.165301E-05 18.976839 .866 .028 166 .105088E-01 18.955542 25 700 3.691809E-05 18.979843 .875 .024 142 .104847E-01 18.960897 26 800 4.218470E-05 18.981695 .883 .021 125 .105462E-01 18.964220 27 900 4.763791E-05 18.958355 .779 .063 111 .105756E-01 18.892517 28 1000 5.297152E-05 18.938431 .677 .079 100 .105943E-01 18.878069 29 2000 1.056640E-04 18.935934 .655 .039 50 .105664E-01 18.927921 30 3000 1.596082E-04 18.852180 -.249 222.200 33 .105341E-01 18.796022 34 7000 3.988389E-04 .000000 .000 .000 14 .111675E-01 17.550947 35 8000 4.758507E-04 12.985024 -1821.068 .000 12 .114204E-01 16.811998 36 9000 5.817600E-04 10.933673 -2691.886 1.171 11 .127987E-01 15.470297 37 10000 6.809088E-04 10.502887 -2887.892 1.002 10 .136182E-01 14.686255 38 20000 1.534387E-03 11.450423 -2391.392 .659 5 .153439E-01 13.034519 39 30000 2.343808E-03 11.798630 -2170.784 .677 3 .140628E-01 12.799683 40 40000 3.232512E-03 11.717471 -2233.723 .491 2 .129300E-01 12.374278 41 50000 4.003264E-03 11.868147 -2091.409 .573 2 .160131E-01 12.489808 42 60000 4.722688E-03 12.106533 -1821.884 .925 1 .944538E-02 12.704630 43 70000 5.503488E-03 12.258460 -1620.193 .940 1 .110070E-01 12.719207 44 80000 6.311936E-03 12.336239 -1500.941 .840 1 .126239E-01 12.674400 45 90000 7.084288E-03 12.405704 -1379.619 .776 1 .141686E-01 12.704170 46 100000 7.930112E-03 12.418263 -1354.931 .668 1 .158602E-01 12.610162 (6) CONTIGUOUS 4-OP: A(I)=B(I)*C(I)+D(I)*E(I)+F(I) ICASE= 6 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 1.875456E-08 .000000 .000 .000 100000 .750182E-02 53.320370 2 2 4.505728E-08 38.018879 -.287 .000 50000 .901146E-02 44.387943 3 3 5.666745E-08 52.752510 .119 6.111 33333 .755558E-02 52.940449 4 4 7.181312E-08 58.552860 .315 4.810 25000 .718131E-02 55.700130 5 5 9.413439E-08 56.333107 .227 3.434 20000 .753075E-02 53.115551 6 6 1.160533E-07 53.939877 .118 2.874 16666 .773658E-02 51.700390 7 7 1.393036E-07 51.745861 .005 2.652 14285 .795981E-02 50.249954 8 8 1.618842E-07 50.190678 -.085 2.449 12500 .809421E-02 49.418053 9 9 1.861535E-07 48.796791 -.176 2.342 11111 .827341E-02 48.347187 10 10 2.070720E-07 48.062851 -.228 2.119 10000 .828288E-02 48.292381 11 20 4.403712E-07 45.039383 -.524 1.408 5000 .880742E-02 45.416229 12 30 6.533838E-07 45.099579 -.517 .909 3333 .871091E-02 45.914822 13 40 8.776960E-07 45.021233 -.528 .652 2500 .877696E-02 45.573868 14 50 1.101664E-06 44.954700 -.538 .503 2000 .881331E-02 45.385887 15 60 1.325945E-06 44.898914 -.549 .406 1666 .883610E-02 45.250751 16 70 1.562129E-06 44.700306 -.594 .385 1428 .892288E-02 44.810646 17 80 1.787750E-06 44.585281 -.624 .350 1250 .893875E-02 44.748974 18 90 2.013782E-06 44.510303 -.646 .314 1111 .894925E-02 44.692020 19 100 2.239744E-06 44.459072 -.664 .283 1000 .895898E-02 44.647961 20 200 4.500736E-06 44.344238 -.727 222.200 500 .900147E-02 44.437176 24 600 1.358034E-05 .000000 .000 .000 166 .901734E-02 44.181526 25 700 1.594817E-05 42.232708 -26.466 .000 142 .905856E-02 43.892185 26 800 1.806234E-05 44.622948 7.881 .331 125 .903117E-02 44.291061 27 900 2.032663E-05 44.736622 9.600 .256 111 .902502E-02 44.276890 28 1000 2.258368E-05 44.672470 8.582 .207 100 .903347E-02 44.279762 29 2000 4.569472E-05 43.575905 -10.857 .190 50 .913894E-02 43.768738 30 3000 9.096146E-05 32.199169 -240.817 4.512 33 .120069E-01 32.980999 31 4000 1.662694E-04 24.049194 -442.300 6.811 25 .166269E-01 24.057337 32 5000 2.149824E-04 22.139423 -503.352 5.651 20 .171986E-01 23.257717 33 6000 2.485320E-04 22.126690 -503.873 4.637 16 .159060E-01 24.141762 34 7000 2.895086E-04 22.279768 -496.124 3.810 14 .162125E-01 24.178904 35 8000 3.307094E-04 22.461836 -485.025 3.221 12 .158740E-01 24.190426 36 9000 3.786938E-04 22.471390 -484.339 2.703 11 .166625E-01 23.765900 37 10000 4.162304E-04 22.617716 -472.190 2.401 10 .166492E-01 24.025154 38 20000 8.250368E-04 23.404844 -367.492 1.374 5 .165007E-01 24.241343 39 30000 1.247808E-03 23.650290 -327.575 .907 3 .149737E-01 24.042160 40 40000 1.665824E-03 23.752632 -307.577 .669 2 .133266E-01 24.012140 41 50000 2.111136E-03 23.637032 -334.593 .536 2 .168891E-01 23.683931 42 60000 2.544832E-03 23.546585 -359.745 .455 1 .101793E-01 23.577196 43 70000 2.975616E-03 23.486477 -379.479 .394 1 .119025E-01 23.524542 44 80000 3.424064E-03 23.397772 -413.536 .378 1 .136963E-01 23.364050 45 90000 3.859648E-03 23.333094 -442.298 .357 1 .154386E-01 23.318188 46 100000 4.278400E-03 23.313005 -452.546 .319 1 .171136E-01 23.373224 (7) INNER PRODUCT: S=S+B(I)*C(I) ICASE= 7 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 2.226688E-08 .000000 .000 .000 100000 .445338E-02 44.909748 2 2 2.986496E-08 131.612244 1.931 .000 50000 .298650E-02 66.968117 3 3 4.540077E-08 86.453232 .811 4.121 33333 .302669E-02 66.078171 4 4 5.974528E-08 78.142700 .573 3.300 25000 .298726E-02 66.950897 5 5 7.573760E-08 73.087784 .406 2.855 20000 .302950E-02 66.017403 6 6 9.091180E-08 70.680359 .316 2.395 16666 .303027E-02 65.998032 7 7 1.060827E-07 69.327843 .259 2.016 14285 .303078E-02 65.986229 8 8 1.212416E-07 68.491066 .219 1.716 12500 .303104E-02 65.983955 9 9 1.348199E-07 68.424995 .216 1.455 11111 .299597E-02 66.755714 10 10 1.481344E-07 68.724709 .233 1.272 10000 .296269E-02 67.506264 11 20 3.031296E-07 66.795876 .088 .747 5000 .303130E-02 65.978386 12 30 4.603852E-07 65.588623 -.017 .591 3333 .306893E-02 65.162819 13 40 5.993472E-07 66.360359 .061 .534 2500 .299674E-02 66.739281 14 50 7.489920E-07 66.640785 .095 .434 2000 .299597E-02 66.756386 15 60 8.990732E-07 66.743027 .109 .354 1666 .299571E-02 66.735390 16 70 1.081636E-06 65.856087 -.034 .634 1428 .308915E-02 64.716789 17 80 1.231565E-06 65.476173 -.104 .606 1250 .307891E-02 64.958015 18 90 1.439568E-06 64.320473 -.350 1.035 1111 .319872E-02 62.518757 19 100 1.521152E-06 64.719467 -.254 1.019 1000 .304230E-02 65.739655 20 200 2.999040E-06 65.985687 .231 .652 500 .299904E-02 66.688004 21 300 4.554570E-06 65.940994 .210 .419 333 .303334E-02 65.867905 22 400 5.997568E-06 66.399475 .468 .357 250 .299878E-02 66.693703 23 500 7.498240E-06 66.575005 .585 .290 200 .299930E-02 66.682312 24 600 9.102650E-06 66.306267 .372 .273 166 .302208E-02 65.914871 25 700 1.049600E-05 66.474182 .529 .253 142 .298086E-02 66.692070 26 800 1.199616E-05 66.567123 .631 .226 125 .299904E-02 66.688004 27 900 1.365564E-05 66.363564 .373 .245 111 .303155E-02 65.906837 28 1000 1.634432E-05 64.711708 -2.030 222.200 100 .326886E-02 61.183334 32 5000 7.777920E-05 .000000 .000 .000 20 .311117E-02 64.284538 33 6000 9.242400E-05 68.283623 311.046 .000 16 .295757E-02 64.918205 34 7000 1.077486E-04 66.734802 183.019 .149 14 .301696E-02 64.966057 35 8000 1.239360E-04 65.021637 32.850 .312 12 .297446E-02 64.549446 36 9000 1.860771E-04 40.305065 -2260.407 7.170 11 .409370E-02 48.367050 37 10000 2.669184E-04 28.161249 -3487.570 9.127 10 .533837E-02 37.464634 38 20000 5.631744E-04 29.524828 -3304.584 4.035 5 .563174E-02 35.512981 39 30000 8.557227E-04 31.052794 -3049.096 2.679 3 .513434E-02 35.058086 40 40000 1.130560E-03 32.261864 -2796.626 2.196 2 .452224E-02 35.380699 41 50000 1.424704E-03 32.811218 -2655.318 1.754 2 .569882E-02 35.095009 42 60000 1.697024E-03 33.348030 -2488.043 1.554 1 .339405E-02 35.356010 43 70000 2.002176E-03 33.530186 -2420.532 1.285 1 .400435E-02 34.961964 44 80000 2.261888E-03 33.867680 -2274.096 1.205 1 .452378E-02 35.368683 45 90000 2.568064E-03 33.985966 -2214.913 1.040 1 .513613E-02 35.045856 46 100000 2.828160E-03 34.204212 -2090.563 .986 1 .565632E-02 35.358677 (8) FIRST ORDER RECURRENCE: A(I)=B(I)*A(I-1)+D(I) ICASE= 8 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 7.486725E-09 .000000 .000 .000 100000 .149734E-02 133.569748 2 2 3.844608E-08 32.300415 -.758 .000 50000 .384461E-02 52.020912 3 3 4.477869E-08 53.630856 -.378 12.963 33333 .298522E-02 66.996155 4 4 6.812160E-08 53.124451 -.391 7.383 25000 .340608E-02 58.718525 5 5 9.701120E-08 47.910053 -.548 5.516 20000 .388045E-02 51.540443 6 6 1.209264E-07 45.677780 -.632 4.368 16666 .403072E-02 49.616940 7 7 1.308494E-07 47.677322 -.543 4.154 14285 .373837E-02 53.496609 8 8 1.662259E-07 45.888504 -.635 3.449 12500 .415565E-02 48.127274 9 9 1.888723E-07 44.983307 -.688 3.005 11111 .419712E-02 47.651245 10 10 2.173056E-07 43.874947 -.761 2.758 10000 .434611E-02 46.018139 11 20 5.137408E-07 37.854084 -1.334 2.566 5000 .513741E-02 38.930138 12 30 8.221110E-07 35.442196 -1.615 2.013 3333 .548019E-02 36.491421 13 40 1.123635E-06 34.581581 -1.738 1.558 2500 .561818E-02 35.598740 14 50 1.416640E-06 34.288200 -1.790 1.224 2000 .566656E-02 35.294781 15 60 1.726694E-06 34.000027 -1.852 1.024 1666 .575334E-02 34.748486 16 70 2.028280E-06 33.822033 -1.898 .875 1428 .579277E-02 34.511997 17 80 2.316288E-06 33.780796 -1.911 .746 1250 .579072E-02 34.538017 18 90 2.631892E-06 33.667309 -1.952 .663 1111 .584806E-02 34.195930 19 100 2.932992E-06 33.587460 -1.985 .595 1000 .586598E-02 34.094875 20 200 5.916160E-06 33.508553 -2.039 222.200 500 .591616E-02 33.805710 24 600 1.803875E-05 .000000 .000 .000 166 .598886E-02 33.261734 25 700 2.091358E-05 34.784653 27.472 .000 142 .593946E-02 33.471077 26 800 2.392474E-05 33.978992 12.166 .134 125 .598118E-02 33.438194 27 900 2.710717E-05 33.094578 -5.502 .284 111 .601779E-02 33.201546 28 1000 2.990976E-05 33.405022 1.012 .266 100 .598195E-02 33.433903 29 2000 6.049024E-05 32.907227 -10.676 .157 50 .604902E-02 33.063187 30 3000 9.237334E-05 32.316437 -26.493 .319 33 .609664E-02 32.476902 31 4000 1.203149E-04 32.913528 -7.825 .525 25 .601574E-02 33.246098 32 5000 1.558016E-04 32.295788 -30.409 .714 20 .623206E-02 32.092094 33 6000 2.195760E-04 29.013712 -170.441 3.697 16 .702643E-02 27.325390 34 7000 2.692754E-04 26.993610 -271.640 4.095 14 .753971E-02 25.995689 35 8000 3.311147E-04 25.175264 -378.257 4.453 12 .794675E-02 24.160814 36 9000 3.726778E-04 24.284664 -439.063 4.221 11 .819891E-02 24.149544 37 10000 4.310912E-04 23.436859 -505.776 4.013 10 .862182E-02 23.196947 38 20000 8.305920E-04 23.462109 -502.571 2.012 5 .830592E-02 24.079210 39 30000 1.234389E-03 23.771269 -454.194 1.341 3 .740634E-02 24.303516 40 40000 1.656704E-03 23.832405 -442.634 .972 2 .662682E-02 24.144325 41 50000 2.042304E-03 24.062340 -390.382 .826 2 .816922E-02 24.482153 42 60000 2.466176E-03 24.113258 -376.590 .671 1 .493235E-02 24.329165 43 70000 2.844160E-03 24.265314 -327.949 .627 1 .568832E-02 24.611837 44 80000 3.405184E-03 23.929565 -453.430 .817 1 .681037E-02 23.493591 45 90000 3.799424E-03 23.803953 -507.838 .764 1 .759885E-02 23.687801 46 100000 4.120448E-03 23.911249 -454.478 .734 1 .824090E-02 24.269205 (9) CHARGE ASSIGNMENT: A(J(I))=A(J(I))+S ICASE= 9 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 4.133377E-08 .000000 .000 .000 100000 .413338E-02 24.193295 2 2 1.202227E-07 12.676045 -.476 .000 50000 .601114E-02 16.635790 3 3 1.946131E-07 13.048070 -.451 .545 33333 .648704E-02 15.415197 4 4 2.695066E-07 13.176812 -.439 .425 25000 .673766E-02 14.841938 5 5 4.077440E-07 11.336527 -.657 4.280 20000 .815488E-02 12.262596 6 6 4.669166E-07 11.417866 -.645 3.422 16666 .778163E-02 12.850260 7 7 5.597234E-07 11.374311 -.653 2.648 14285 .799565E-02 12.506177 8 8 6.326682E-07 11.519486 -.623 2.263 12500 .790835E-02 12.644859 9 9 7.078419E-07 11.693628 -.582 2.039 11111 .786483E-02 12.714703 10 10 8.431873E-07 11.418595 -.654 1.987 10000 .843187E-02 11.859762 11 20 1.708032E-06 11.332584 -.686 .944 5000 .854016E-02 11.709383 12 30 2.592720E-06 11.311047 -.696 .597 3333 .864154E-02 11.570859 13 40 3.463782E-06 11.335545 -.683 .433 2500 .865946E-02 11.548070 14 50 4.336640E-06 11.356740 -.670 .339 2000 .867328E-02 11.529664 15 60 5.210353E-06 11.372015 -.658 .277 1666 .868045E-02 11.515535 16 70 6.084302E-06 11.383132 -.648 .234 1428 .868838E-02 11.505017 17 80 6.958285E-06 11.391510 -.640 .202 1250 .869786E-02 11.497087 18 90 7.831158E-06 11.398620 -.632 .177 1111 .870042E-02 11.492554 19 100 8.705279E-06 11.404073 -.624 .158 1000 .870528E-02 11.487282 20 200 1.750630E-05 11.393725 -.646 222.200 500 .875315E-02 11.424457 24 600 5.234275E-05 .000000 .000 .000 166 .868890E-02 11.462906 25 700 6.134625E-05 11.106784 -18.640 .000 142 .871117E-02 11.410640 26 800 7.007027E-05 11.281891 -8.949 .094 125 .875878E-02 11.417109 27 900 7.886414E-05 11.326542 -6.346 .083 111 .875392E-02 11.412031 28 1000 8.765695E-05 11.344776 -5.230 .071 100 .876570E-02 11.408108 29 2000 1.754317E-04 11.384510 -2.504 .040 50 .877158E-02 11.400449 30 3000 2.649212E-04 11.308653 -8.429 .115 33 .874240E-02 11.324121 31 4000 3.509453E-04 11.363845 -3.410 .148 25 .877363E-02 11.397788 32 5000 4.424320E-04 11.314224 -8.683 .179 20 .884864E-02 11.301171 33 6000 5.244800E-04 11.379901 -.559 .266 16 .839168E-02 11.439902 34 7000 6.147291E-04 11.383267 -.078 .216 14 .860621E-02 11.387129 35 8000 7.020800E-04 11.388679 .803 .183 12 .842496E-02 11.394712 36 9000 7.897833E-04 11.392093 1.432 .157 11 .868762E-02 11.395531 37 10000 8.773889E-04 11.394878 2.007 .137 10 .877389E-02 11.397455 38 20000 1.765223E-03 11.345394 -13.117 .109 5 .882611E-02 11.330016 39 30000 2.675798E-03 11.244159 -50.244 .199 3 .802739E-02 11.211611 40 40000 3.633408E-03 11.087090 -118.669 .388 2 .726682E-02 11.008947 41 50000 4.611712E-03 10.939436 -195.112 .512 2 .922342E-02 10.841961 42 60000 5.557504E-03 10.854564 -247.191 .502 1 .555750E-02 10.796213 43 70000 6.474496E-03 10.820382 -271.890 .440 1 .647450E-02 10.811652 44 80000 7.348224E-03 10.831566 -262.458 .382 1 .734822E-02 10.886984 45 90000 8.311808E-03 10.819400 -274.314 .335 1 .831181E-02 10.827969 46 100000 9.227776E-03 10.815497 -278.668 .296 1 .922778E-02 10.836847 (10) TRANSPOSITION: B(I,J)=A(J,I) ICASE= 10 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 6.002432E-08 .000000 .000 .000 100000 .600243E-02 16.659914 2 2 9.055232E-08 32.756813 .966 .000 25000 .452762E-02 22.086679 3 3 1.209382E-07 32.833256 .972 .028 11111 .403123E-02 24.806065 4 4 1.513062E-07 32.869694 .974 .028 6250 .378266E-02 26.436451 5 5 1.798656E-07 33.284908 1.012 .299 4000 .359731E-02 27.798534 6 6 2.118891E-07 33.092804 .993 .283 2777 .353050E-02 28.316702 7 7 2.398118E-07 33.295151 1.015 .304 2040 .342451E-02 29.189562 8 8 2.697874E-07 33.385647 1.026 .271 1562 .337126E-02 29.652973 9 9 2.967074E-07 33.655537 1.061 .395 1234 .329523E-02 30.332916 10 10 3.297536E-07 33.588230 1.052 .348 1000 .329754E-02 30.325674 11 20 6.390272E-07 32.934643 .935 .348 250 .319514E-02 31.297571 12 30 9.339003E-07 33.097794 .969 .247 111 .310989E-02 32.123344 13 40 1.238297E-06 33.088425 .966 .179 62 .307098E-02 32.302437 14 50 1.560064E-06 32.836124 .899 .277 40 .312013E-02 32.049969 15 60 1.850153E-06 32.877346 .912 .230 27 .299725E-02 32.429749 16 70 2.160640E-06 32.850925 .902 .194 20 .302490E-02 32.397808 17 80 2.627627E-06 31.969353 .549 1.242 15 .315315E-02 30.445723 18 90 4.250785E-06 26.937605 -1.743 222.200 12 .459085E-02 21.172560 (11) MATRIX MULT BY INNER PRODUCT ICASE= 11 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 7.532160E-08 .000000 .000 .000 100000 .150643E-01 13.276403 2 2 7.532032E-08 -781874.937500 -58893.070 111.100 12500 .753203E-02 26.553259 3 3 8.629352E-08 .000000 .000 .000 3703 .575181E-02 34.765068 4 4 9.908322E-08 78.187881 3.747 .000 1562 .495258E-02 40.370102 5 5 1.118144E-07 78.367195 3.763 .012 800 .447258E-02 44.716957 6 6 1.267686E-07 74.539787 3.400 .472 462 .421683E-02 47.330318 7 7 1.399302E-07 74.096748 3.356 .391 291 .399053E-02 50.024960 8 8 1.543487E-07 73.256851 3.269 .379 195 .385254E-02 51.830688 9 9 1.703783E-07 71.629379 3.093 .567 137 .378138E-02 52.823627 10 10 1.834368E-07 71.353165 3.062 .502 100 .366874E-02 54.514690 11 20 3.407733E-07 66.453392 2.432 .778 12 .327142E-02 58.690037 12 30 4.832712E-07 67.111771 2.525 .547 3 .260966E-02 62.076950 13 40 6.583200E-07 65.093529 2.207 .812 1 .210662E-02 60.760723 14 50 7.926785E-07 65.594818 2.296 .688 1 .396339E-02 63.077278 15 60 9.362844E-07 66.120926 2.402 .634 1 .674125E-02 64.083092 16 70 1.117153E-06 65.464935 2.253 .658 1 .109481E-01 62.659294 17 80 1.248300E-06 65.652992 2.301 .585 1 .159782E-01 64.087158 18 90 1.402611E-06 65.714439 2.319 .506 1 .227223E-01 64.166031 19 100 1.563584E-06 65.612839 2.286 .449 1 .312717E-01 63.955627 20 200 4.268560E-06 51.412125 -4.345 222.200 1 .341485E+00 46.854206 (12) MATRIX MULT BY MIDDLE PRODUCT ICASE= 12 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 8.261120E-08 .000000 .000 .000 100000 .165222E-01 12.104896 2 2 8.237824E-08 -4292.478516 -355.607 111.100 12500 .823782E-02 24.278257 3 3 9.129798E-08 .000000 .000 .000 3703 .608538E-02 32.859432 4 4 9.276312E-08 682.529053 59.314 .000 1562 .463667E-02 43.120583 5 5 1.066944E-07 129.900360 8.590 2.754 800 .426778E-02 46.862816 6 6 1.194728E-07 101.568451 5.917 2.689 462 .397414E-02 50.220631 7 7 1.335207E-07 89.964317 4.784 2.538 291 .380774E-02 52.426315 8 8 1.491282E-07 82.507805 4.028 2.463 195 .372224E-02 53.645119 9 9 1.621772E-07 79.501640 3.711 2.220 137 .359936E-02 55.494869 10 10 1.787264E-07 76.334602 3.364 2.109 100 .357453E-02 55.951443 11 20 3.252533E-07 70.282349 2.613 1.379 12 .312243E-02 61.490532 12 30 4.754489E-07 68.578117 2.381 .983 3 .256742E-02 63.098267 13 40 6.274400E-07 67.755905 2.255 .766 1 .200781E-02 63.751110 14 50 7.839232E-07 67.032127 2.131 .672 1 .391962E-02 63.781761 15 60 9.343289E-07 66.731422 2.073 .566 1 .672717E-02 64.217216 16 70 1.085727E-06 66.558891 2.035 .482 1 .106401E-01 64.472916 17 80 1.248080E-06 66.190765 1.944 .481 1 .159754E-01 64.098457 18 90 1.403986E-06 65.908546 1.866 .468 1 .227446E-01 64.103195 19 100 1.562048E-06 65.652725 1.788 .462 1 .312410E-01 64.018517 20 200 4.133050E-06 52.648624 -4.183 222.200 1 .330644E+00 48.390415 (13) MATRIX MULT BY OUTER PRODUCT ICASE= 13 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 1.356826E-07 .000000 .000 .000 100000 .271365E-01 7.370144 2 4 2.561741E-07 24.898018 2.378 .000 12500 .128087E-01 15.614383 3 9 4.415303E-07 26.238026 2.622 .613 3703 .980992E-02 20.383654 4 16 6.889629E-07 27.215569 2.858 .740 1562 .860928E-02 23.223312 5 25 9.984959E-07 27.929930 3.081 .747 800 .798797E-02 25.037659 6 36 1.365980E-06 28.547844 3.327 .770 462 .757299E-02 26.354710 7 49 1.817072E-06 28.749279 3.426 .576 291 .740275E-02 26.966457 8 64 2.285456E-06 29.292923 3.754 .760 195 .713062E-02 28.003160 9 81 2.821398E-06 29.783693 4.109 .837 137 .695757E-02 28.709169 10 100 3.446272E-06 30.041502 4.330 .730 100 .689254E-02 29.016861 11 400 1.291147E-05 31.352253 6.072 .394 12 .619750E-02 30.980215 12 900 2.833636E-05 31.916647 7.211 .285 3 .510054E-02 31.761318 13 1600 5.047040E-05 31.859390 7.024 .157 1 .403763E-02 31.701750 14 2500 7.768576E-05 32.148941 8.536 .224 1 .776858E-02 32.180927 15 3600 1.128469E-04 32.039654 7.667 .173 1 .135416E-01 31.901619 16 4900 1.682633E-04 30.313587 -12.257 222.200 1 .235569E-01 29.121023 20 40000 3.130582E-03 .000000 .000 .000 1 .125223E+01 12.777176 21 90000 7.026359E-03 12.834409 179.173 .000 1 .421582E+01 12.808909 (14) DYADS, STRIDE=128: A(I)=B(I)*C(I) ICASE= 14 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 4.502528E-08 .000000 .000 .000 100000 .450253E-02 22.209745 2 2 9.012737E-08 22.171923 -.002 222.200 50000 .450637E-02 22.190819 6 6 2.570753E-07 .000000 .000 .000 16666 .428442E-02 23.339468 7 7 3.172178E-07 16.627171 -1.726 .000 14285 .453146E-02 22.066858 8 8 3.775898E-07 16.595514 -1.734 .014 12500 .471987E-02 21.187014 9 9 4.442156E-07 16.082521 -1.887 .395 11111 .493568E-02 20.260431 10 10 4.982784E-07 16.409473 -1.783 .472 10000 .498278E-02 20.069103 11 20 1.103462E-06 16.549391 -1.731 .204 5000 .551731E-02 18.124767 12 30 1.707588E-06 16.554905 -1.729 .122 3333 .569139E-02 17.568638 13 40 2.297856E-06 16.636347 -1.686 .156 2500 .574464E-02 17.407530 14 50 2.917120E-06 16.585751 -1.718 .154 2000 .583424E-02 17.140194 15 60 3.521460E-06 16.565016 -1.734 .131 1666 .586675E-02 17.038389 16 70 4.101199E-06 16.606737 -1.697 .155 1428 .585651E-02 17.068180 17 80 4.730880E-06 16.580851 -1.723 .150 1250 .591360E-02 16.910173 18 90 5.334524E-06 16.566933 -1.739 .135 1111 .592666E-02 16.871233 19 100 5.904128E-06 16.596510 -1.701 .156 1000 .590413E-02 16.937304 20 200 2.254612E-04 1.125965 -32.560 14.660 500 .112731E+00 .887070 21 300 3.390047E-04 .881566 -34.553 10.490 333 .112889E+00 .884943 22 400 4.521114E-04 .838109 -35.289 7.750 250 .113028E+00 .884738 23 500 5.653197E-04 .829958 -35.515 6.032 200 .113064E+00 .884455 24 600 6.837452E-04 .828002 -35.595 4.855 166 .113502E+00 .877520 25 700 8.018948E-04 .828219 -35.583 4.035 142 .113869E+00 .872932 (15) DYADS, STRIDE=1024: A(I)=B(I)*C(I) ICASE= 15 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 4.562433E-08 .000000 .000 .000 100000 .456243E-02 21.918131 2 2 9.111040E-08 21.984753 .003 .000 50000 .455552E-02 21.951391 3 3 1.346317E-07 22.470037 .033 .344 33333 .448768E-02 22.283005 4 4 1.645363E-07 24.983929 .223 2.496 25000 .411341E-02 24.310741 5 5 2.115584E-07 24.673443 .195 1.769 20000 .423117E-02 23.634136 6 6 2.569063E-07 24.176975 .144 1.475 16666 .428160E-02 23.354820 7 7 3.172178E-07 22.888929 -.006 222.200 14285 .453146E-02 22.066858 11 20 2.260321E-05 .000000 .000 .000 5000 .113016E+00 .884830 12 30 3.387065E-05 .887513 .061 .000 3333 .112891E+00 .885723 13 40 4.519844E-05 .885143 -.002 .031 2500 .112996E+00 .884986 14 50 5.641664E-05 .886776 .047 .040 2000 .112833E+00 .886263 15 60 6.769786E-05 .887034 .056 .031 1666 .112785E+00 .886291 16 70 7.906492E-05 .886057 .019 .039 1428 .112905E+00 .885348 17 80 9.038746E-05 .885401 -.008 .040 1250 .112984E+00 .885078 18 90 1.016433E-04 .885380 -.009 .033 1111 .112926E+00 .885450 (16) CONTIGUOUS DAXPY: A(I)=S*B(I)+C(I) ICASE= 16 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 2.198400E-08 .000000 .000 .000 100000 .439680E-02 45.487633 2 2 4.511232E-08 43.237030 -.049 .000 50000 .451123E-02 44.333790 3 3 6.832581E-08 43.157570 -.052 .029 33333 .455501E-02 43.907272 4 4 8.312831E-08 48.391834 .144 2.752 25000 .415642E-02 48.118382 5 5 1.040576E-07 49.464985 .192 2.059 20000 .416230E-02 48.050308 6 6 1.271091E-07 48.796551 .157 1.597 16666 .423680E-02 47.203548 7 7 1.585641E-07 45.941887 -.008 2.389 14285 .453018E-02 44.146187 8 8 1.887437E-07 43.481506 -.168 2.827 12500 .471859E-02 42.385525 9 9 2.188937E-07 41.580322 -.306 2.979 11111 .486426E-02 41.115849 10 10 2.490496E-07 40.131256 -.424 2.974 10000 .498099E-02 40.152645 11 20 5.512448E-07 35.747475 -.916 2.223 5000 .551245E-02 36.281521 12 30 8.599388E-07 34.177364 -1.128 1.629 3333 .573235E-02 34.886204 13 40 1.147034E-06 33.983032 -1.160 1.183 2500 .573517E-02 34.872559 14 50 1.455104E-06 33.741673 -1.207 .929 2000 .582042E-02 34.361805 15 60 1.756965E-06 33.601421 -1.240 .760 1666 .585421E-02 34.149796 16 70 2.046566E-06 33.599709 -1.241 .632 1428 .584499E-02 34.203640 17 80 2.360115E-06 33.507603 -1.271 .548 1250 .590029E-02 33.896652 18 90 2.661617E-06 33.444855 -1.295 .483 1111 .591411E-02 33.814034 19 100 2.946048E-06 33.464806 -1.286 .426 1000 .589210E-02 33.943779 20 200 5.981696E-06 33.299404 -1.404 222.200 500 .598170E-02 33.435333 24 600 1.796318E-05 .000000 .000 .000 166 .596378E-02 33.401657 25 700 2.106862E-05 32.201550 -21.558 .000 142 .598349E-02 33.224766 26 800 2.407936E-05 32.700153 -12.085 .093 125 .601984E-02 33.223476 27 900 2.694458E-05 33.383495 1.594 .224 111 .598170E-02 33.401901 28 1000 3.011584E-05 33.133129 -3.668 .208 100 .602317E-02 33.205116 29 2000 6.049280E-05 32.930893 -8.427 .103 50 .604928E-02 33.061787 30 3000 9.032534E-05 33.136066 -2.924 .123 33 .596147E-02 33.213272 31 4000 1.212314E-04 32.995438 -7.312 .138 25 .606157E-02 32.994762 32 5000 1.569216E-04 32.157494 -37.883 .820 20 .627686E-02 31.863045 33 6000 2.000480E-04 30.699621 -100.013 1.803 16 .640154E-02 29.992802 34 7000 2.868297E-04 26.810616 -293.060 5.156 14 .803123E-02 24.404724 35 8000 3.305600E-04 25.080078 -393.838 5.227 12 .793344E-02 24.201355 36 9000 3.880611E-04 23.787952 -481.590 5.017 11 .853734E-02 23.192226 37 10000 4.128384E-04 23.504984 -503.816 4.596 10 .825677E-02 24.222553 38 20000 8.173312E-04 23.767469 -470.573 2.254 5 .817331E-02 24.469885 39 30000 1.224619E-03 24.014118 -432.141 1.474 3 .734771E-02 24.497423 40 40000 1.636288E-03 24.117519 -412.694 1.076 2 .654515E-02 24.445574 41 50000 2.036736E-03 24.239649 -385.116 .856 2 .814694E-02 24.549082 42 60000 2.423936E-03 24.405144 -340.583 .745 1 .484787E-02 24.753128 43 70000 2.900608E-03 24.240280 -392.933 .669 1 .580122E-02 24.132872 44 80000 3.286784E-03 24.232746 -395.732 .577 1 .657357E-02 24.339901 45 90000 3.644672E-03 24.353001 -344.011 .570 1 .728934E-02 24.693581 46 100000 4.183680E-03 24.181355 -428.602 .621 1 .836736E-02 23.902403 (17) INDIRECT DAXPY: A(J(I))=S*B(K(I))+C(L(I)) ICASE= 17 NCASE= 17 NMAX=100000 NTIMES= 100000 SI NI TI RINF N1/2 PCT ERROR REPEAT TOTAL TIME R(N) vlen sec Mflop/s vlen % sec Mflop/s 1 1 4.505728E-08 .000000 .000 .000 100000 .901146E-02 22.193972 2 2 9.011200E-08 22.195232 .000 .000 50000 .901120E-02 22.194601 3 3 1.288871E-07 23.857872 .100 1.148 33333 .859238E-02 23.276194 4 4 1.647565E-07 25.133673 .194 1.412 25000 .823782E-02 24.278257 5 5 2.038912E-07 25.489897 .226 1.091 20000 .815565E-02 24.522884 6 6 2.409696E-07 25.796585 .256 .925 16666 .803200E-02 24.899405 7 7 2.770750E-07 26.100595 .291 .856 14285 .791603E-02 25.263920 8 8 3.180237E-07 26.079165 .288 .698 12500 .795059E-02 25.155361 9 9 3.539325E-07 26.180010 .302 .614 11111 .786509E-02 25.428577 10 10 3.893888E-07 26.334925 .326 .594 10000 .778778E-02 25.681273 11 20 7.683840E-07 26.449850 .348 .296 5000 .768384E-02 26.028652 12 30 1.139749E-06 26.599060 .383 .221 3333 .759757E-02 26.321581 13 40 1.522125E-06 26.551186 .370 .165 2500 .761062E-02 26.279053 14 50 1.898624E-06 26.538511 .366 .129 2000 .759450E-02 26.334862 15 60 2.274881E-06 26.537201 .366 .104 1666 .757990E-02 26.375004 16 70 2.651698E-06 26.536697 .365 .086 1428 .757325E-02 26.398184 17 80 3.028787E-06 26.535545 .365 .073 1250 .757197E-02 26.413212 18 90 3.408994E-06 26.525211 .359 .066 1111 .757478E-02 26.400753 19 100 3.765120E-06 26.569469 .386 .111 1000 .753024E-02 26.559578 20 200 7.571712E-06 26.498377 .318 .078 500 .757171E-02 26.414104 21 300 1.135356E-05 26.467098 .282 .056 333 .756147E-02 26.423426 22 400 1.513370E-05 26.456923 .268 .042 250 .756685E-02 26.431086 23 500 1.881664E-05 26.522760 .378 .082 200 .752666E-02 26.572226 24 600 2.258121E-05 26.551769 .436 .077 166 .749696E-02 26.570768 25 700 2.647437E-05 26.513811 .347 .086 142 .751872E-02 26.440670 26 800 3.029094E-05 26.480570 .256 .092 125 .757274E-02 26.410534 27 900 3.454616E-05 26.340416 -.189 222.200 111 .766925E-02 26.052097 31 4000 7.334605E-04 .000000 .000 .000 25 .366730E-01 5.453600 32 5000 9.200512E-04 5.359322 -69.149 .000 20 .368020E-01 5.434480 33 6000 1.103208E-03 5.409096 -29.546 .073 16 .353027E-01 5.438684 34 7000 1.285641E-03 5.435672 -6.763 .084 14 .359980E-01 5.444754 35 8000 1.471659E-03 5.428922 -12.964 .069 12 .353198E-01 5.436043 36 9000 1.654819E-03 5.431368 -10.566 .057 11 .364060E-01 5.438661 37 10000 1.849062E-03 5.400410 -42.806 .155 10 .369812E-01 5.408146 38 20000 3.684019E-03 5.422146 -16.042 .084 5 .368402E-01 5.428854 39 30000 5.522688E-03 5.429082 -6.345 .057 3 .331361E-01 5.432137 40 40000 7.369792E-03 5.427225 -9.342 .042 2 .294792E-01 5.427561 41 50000 9.211200E-03 5.427183 -9.422 .032 2 .368448E-01 5.428174 42 60000 1.105050E-02 5.428071 -7.490 .026 1 .221010E-01 5.429620 43 70000 1.294746E-02 5.417093 -35.050 .091 1 .258949E-01 5.406467 44 80000 1.470310E-02 5.426616 -7.686 .115 1 .294062E-01 5.441028 45 90000 1.658074E-02 5.426980 -6.497 .098 1 .331615E-01 5.427986 46 100000 1.842701E-02 5.426790 -7.197 .086 1 .368540E-01 5.426817 # SUMMARY OF SELECTED VALUES # -------------------------- # # LENGTHS RMSERR/VALUE R-INFINITY N-HALF R(N) # vlen % Mflop/s vlen Mflop/s # # (1) CONTIGUOUS DYADS: A(I)=B(I)*C(I) # <= 80 .560 16.740 -1.302 | Min = 11.926 # >= 600 .407 12.201 -368.505 | Max = 24.630 # # (2) DYADS, STRIDE=8: A(I)=B(I)*C(I) # <= 8 2.670 20.538 -.488 | Min = 1.613 # >= 60 1.479 1.577 -190.004 | Max = 24.059 # # (3) CONTIGUOUS TRIADS: A(I)=B(I)*C(I)+D(I) # <= 800 .193 66.835 2.767 | Min = 20.078 # >= 6000 .334 20.716 47.415 | Max = 67.123 # # (4) TRIADS, STRIDE=8: A(I)=B(I)*C(I)+D(I) # <= 200 .328 65.435 2.057 | Min = 2.590 # >= 900 .263 2.597 -25.630 | Max = 64.974 # # (5) RANDOM SCATTER/GATHER: # <= 900 .063 18.958 .779 | Min = 9.489 # >= 7000 .668 12.418 -1354.931 | Max = 18.964 # # (6) CONTIGUOUS 4-OP: A(I)=B(I)*C(I)+D(I)*E(I)+F(I) # <= 80 .350 44.585 -.624 | Min = 23.258 # >= 600 .319 23.313 -452.546 | Max = 55.700 # # (7) INNER PRODUCT: S=S+B(I)*C(I) # <= 700 .253 66.474 .529 | Min = 34.962 # >= 5000 .986 34.204 -2090.563 | Max = 67.506 # # (8) FIRST ORDER RECURRENCE: A(I)=B(I)*A(I-1)+D(I) # <= 80 .746 33.781 -1.911 | Min = 23.197 # >= 600 .734 23.911 -454.478 | Max = 133.570 # # (9) CHARGE ASSIGNMENT: A(J(I))=A(J(I))+S # <= 80 .202 11.392 -.640 | Min = 10.796 # >= 600 .296 10.815 -278.668 | Max = 24.193 # # (10) TRANSPOSITION: B(I,J)=A(J,I) # <= 60 .230 32.877 .912 | Min = 16.660 # >= 400 .000 26.938 -1.743 | Max = 32.430 # # (11) MATRIX MULT BY INNER PRODUCT # <= 80 .585 65.653 2.301 | Min = 13.276 # >= 600 .000 51.412 -4.345 | Max = 64.166 # # (12) MATRIX MULT BY MIDDLE PRODUCT # <= 80 .481 66.191 1.944 | Min = 12.105 # >= 600 .000 52.649 -4.183 | Max = 64.473 # # (13) MATRIX MULT BY OUTER PRODUCT # <= 1600 .157 31.859 7.024 | Min = 7.370 # >= 200 .000 12.834 179.173 | Max = 32.181 # # (14) DYADS, STRIDE=128: A(I)=B(I)*C(I) # <= 0 .000 .000 .000 | Min = .873 # >= 6 4.035 .828 -35.583 | Max = 23.339 # # (15) DYADS, STRIDE=1024: A(I)=B(I)*C(I) # <= 4 2.496 24.984 .223 | Min = .885 # >= 20 .033 .885 -.009 | Max = 24.311 # # (16) CONTIGUOUS DAXPY: A(I)=S*B(I)+C(I) # <= 80 .548 33.508 -1.271 | Min = 23.192 # >= 600 .621 24.181 -428.602 | Max = 48.118 # # (17) INDIRECT DAXPY: A(J(I))=S*B(K(I))+C(L(I)) # <= 600 .077 26.552 .436 | Min = 5.406 # >= 4000 .086 5.427 -7.197 | Max = 26.572 # # # # TOTAL EXECUTION TIME IS 1.6083316803E+01 SECONDS.