Dr Patrick H. Worley Oak Ridge National Laboratory System Description ------------------ 11/15-16/95 NASA Ames NAS SP2 mpxlf IBM MPI xlf flags: -O3 -qstrict -NQ30000 CURRENT STATUS: 144 nodes available 11/13/95 Welcome Back. We are now running AIX 4.1.3, PSSP 2.1.0. Home filesystems have merged: /u/username works /home/ba /home/bb /home/bc are each 8 GB. /scratch is a PIOFS (parallel file system) and mounted on all the nodes. Babbage2 is up and ready for use. Babbage1 will be up in the near future. VERSION DIFFERENTIATION: AIX 3.2.5 --> 4.1.3 PSSP 1.2.0 --> 2.1.0 poe 1.2.1 --> 2.1.0.2 ESSL 2.2.1 --> 2.2.2.1 xlC 2.1.2 --> 3.1.3 xlf 3.1.2 --> 3.2.3 PBS 1.1.4 --> 1.1.4+ PVMe 1.3.1 --> 2.1.0 MP_EUILIB=us MP_EUIDEVICE=css MP_HOSTFILE=NULL MP_RESD=yes MP_RMPOOL=0 MP_CONTROL_WORKSTATION=engine.nas.nasa.gov MP_INFOLEVEL=1 MP_EUILIBPATH=/usr/lpp/ppe.poe/lib MP_PROCS=1 MP_LABELIO=yes MP_EUIDEVELOP=no MP_PGMMODEL=spmd MP_PULSE=600 SP_NAME=engine.nas.nasa.gov Timing Tables ------------- make MACH=sp COMM=mpif WORKSPACE=13000000 / 8500000 optimization level 0 optimization level 1 T42L16 1x1 - / 270.27 -procs 1 2x1 - / 253.34 -procs 2 1x2 - / 142.40 -procs 2 - / 253.32 2x2 - / 109.87 -procs 4 1x4 - / 78.10 -procs 4 4x2 - / 52.58 -procs 8 2x4 - / 50.87 -procs 8 4x4 - / 28.32 -procs 16 4x4 - / 28.15 -procs 16 8x4 - / 16.28 -procs 32 8x4 - / 15.41 -procs 32 8x8 - / 10.45 -procs 64 16x4 - / 9.65 -procs 64 16x8 9.14 / 7.98 -procs 128 16x8 - / 6.81 -procs 128 T170L32 4x4 1764.4 / - -procs 16 4x4 1758.2 / - -procs 16 8x4 - / 905.84 -procs 32 8x4 - / 900.88 -procs 32 8x8 - / 487.92 -procs 64 16x4 - / 455.09 -procs 64 - / 485.83 16x8 - / 218.13 -procs 128 16x8 - / 217.56 -procs 128 T340L64 16x8 -procs 128 (need 104+ MBytes) Note: 1) All timings are in seconds. 2) Using -qarch=pwr2 does not change the timings. Is this hardwired into the NASA Ames compilers? 3) Two different executable sizes were used (WORKSPACE=13000000 / 8500000), depending on problem size and number of processors; paired entries "a / b" follow that order, and "-" means no timing was recorded. 
Raw Timing Output Data ---------------------- small problem; level 0 optimization .27027E+03 .12422E+01 .12795E+01 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 1, 1) 1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 4691369 .25334E+03 .11636E+01 .12128E+01 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 2, 1) 1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 2412937 .10987E+03 .48971E+00 .18220E+01 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 2, 2) 1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 1206801 .52583E+02 .23875E+00 .31223E+00 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 4, 2) 1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 637193 .28319E+02 .12751E+00 .14497E+00 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 4, 4) 1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 318969 .16289E+02 .70707E-01 .86119E-01 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 8, 4) 1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 176549 .10452E+02 .45058E-01 .63277E-01 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 8, 8) 1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 88629 .79818E+01 .30583E-01 .19513E+00 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 16, 8) 1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 53015 .91425E+01 .30734E-01 .19008E+00 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 16, 8) 1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 53015 medium problem; level 0 optimization .17644E+04 .80712E+01 .10239E+02 .00000E+00 216 (170,170,170) ( 512, 256, 32) (2,T,F,F) ( 4, 4) 1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 10112721 .90584E+03 .41333E+01 .44161E+01 .00000E+00 216 (170,170,170) ( 512, 256, 32) (2,T,F,F) ( 8, 4) 1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 5608617 .48792E+03 .21781E+01 .50238E+01 .00000E+00 216 (170,170,170) ( 512, 256, 32) (2,T,F,F) ( 8, 8) 1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 2805673 .48583E+03 .21764E+01 .48410E+01 .00000E+00 216 (170,170,170) ( 512, 256, 32) (2,T,F,F) ( 8, 8) 
1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 2805673 .21813E+03 .96944E+00 .12676E+01 .00000E+00 216 (170,170,170) ( 512, 256, 32) (2,T,F,F) ( 16, 8) 1 (1,10,10, 2, 2,6,6) (0, 0, 0, 1, 2,6,6) 0 0 1679629 small problem; level 1 optimization .14240E+03 .65313E+00 .72640E+00 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 1, 2) 1 (1,10,10, 2, 2,5,5) (0, 2, 2, 1, 2,5,5) 0 0 2346017 .78099E+02 .35721E+00 .42947E+00 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 1, 4) 1 (1,10,10, 2, 2,5,5) (0, 2, 2, 1, 2,5,5) 0 0 1173489 .50865E+02 .23157E+00 .25490E+00 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 2, 4) 1 (1,10,10, 2, 2,5,5) (0, 2, 2, 1, 2,5,5) 0 0 603809 .28145E+02 .12728E+00 .14437E+00 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 4, 4) 1 (1,10,10, 2, 2,5,5) (0, 2, 2, 1, 2,5,5) 0 0 318969 .15412E+02 .68647E-01 .78276E-01 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 8, 4) 1 (1,10,10, 2, 2,5,5) (0, 2, 2, 1, 2,5,5) 0 0 176549 .96453E+01 .41431E-01 .58839E-01 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 16, 4) 1 (1,10,10, 2, 2,5,5) (0, 2, 2, 1, 2,5,5) 0 0 105339 .68057E+01 .29059E-01 .42498E-01 .00000E+00 216 ( 42, 42, 42) ( 128, 64, 16) (2,T,F,F) ( 16, 8) 1 (1,10,10, 2, 2,5,5) (0, 2, 2, 1, 2,5,5) 0 0 53015 medium problem; level 1 optimization .17582E+04 .80684E+01 .82376E+01 .00000E+00 216 (170,170,170) ( 512, 256, 32) (2,T,F,F) ( 4, 4) 1 (1,10,10, 2, 2,5,5) (0, 2, 2, 1, 2,5,5) 0 0 10112721 .90088E+03 .41305E+01 .42842E+01 .00000E+00 216 (170,170,170) ( 512, 256, 32) (2,T,F,F) ( 8, 4) 1 (1,10,10, 2, 2,5,5) (0, 2, 2, 1, 2,5,5) 0 0 5608617 .45509E+03 .19948E+01 .24105E+01 .00000E+00 216 (170,170,170) ( 512, 256, 32) (2,T,F,F) ( 16, 4) 1 (1,10,10, 2, 2,5,5) (0, 2, 2, 1, 2,5,5) 0 0 3356565 .21756E+03 .97148E+00 .12169E+01 .00000E+00 216 (170,170,170) ( 512, 256, 32) (2,T,F,F) ( 16, 8) 1 (1,10,10, 2, 2,5,5) (0, 2, 2, 1, 2,5,5) 0 0 1679629