# Invocation command line:
# /spec/cpu2000/bin/runspec -c cfp.SqH.cfg -r -u 128 --deletework
############################################################################
# Invocation command line:
# /spec/cpu2000/bin/runspec -c tuned.690.cfp.rate.006.cfg -r -u 128 --deletework
############################################################################
############################################################################
# Invocation command line:
#
#    /spec/cpu2000/bin/runspec -c tuned.690.cfp.001.cfg
#    /spec/cpu2000/bin/runspec -c tuned.690.cfp.001.cfg -r -u ...
#
############################################################################
#
# Config-file for 64-way 1.9 GHz Squadron-H publication measurements.
# Tuning-runs were performed Sept. 5-6 2004 and the results are accumulated
# in the directory
#
#    /gsa/ausgsa/projects/s/spec/Results/Squadron-H.32way/cpu.1way.compilers_08_08.runs_09_05.SMT
#
# The parameters are set up for a reportable run.
#
# Authors: Carl Ponder, Alan MacKay & Kaivalya M. Dixit at IBM
#
############################################################################

#
# General environment settings.
#
OS_LIBS = -L/usr/lib

#===============================================================================
# How the compilers are called
#===============================================================================
# To remove all the warning messages that are put out, you can append the
# following compile-time message suppression flags to the CC and FC lines:
#    -w -qinfo=noinl -qsuppress=1500-036
# Also needed on the FC line: "-qsuppress=cmpmsg"
# To reduce compile time, the following options can be used (also added here):
#    -qipa=noobject -qipa=threads
#===============================================================================
# C compiler, Fortran 90 compiler, Fortran 77 compiler (also xlf90), and the
# plain xlf driver that peak sections select via F77 = $(FXLF).
CC = /usr/vac/bin/xlc
FC = /usr/bin/xlf90
F77 = /usr/bin/xlf90
FXLF = /usr/bin/xlf

# The next line sets up parallel make; the value of j is the number of threads.
#makeflags = -j8
# galgel & facerec do not have dependency rules that allow parallel makes;
# they need "makeflags = -j1". The easiest way is to add it in the
# portability flags section.

#
# Commands for "rate" run execution. The "submit" command is used to bind the
# execution-thread to a CPU.
#
# On the Squadron, we still use this for 1-way runs so the thread will
# not "drift" between CPUs and lose locality.
#
# NOTE(review): use_submit_for_speed is left commented out, as it appears in
# the text; it presumably only matters for speed (1-way) runs, while this file
# sets rate=1 -- confirm before reusing this config for speed runs.
# use_submit_for_speed = 1
# submit = let "MYCPU=\$SPECUSERNUM"; bindprocessor \$\$ \$MYCPU; $command
# submit = schedule.16 \$SPECUSERNUM $command
# submit = schedule.32 \$SPECUSERNUM $command
# submit = schedule.64 \$SPECUSERNUM $command
# submit = schedule.128 \$SPECUSERNUM $command
submit = schedule.128 \$SPECUSERNUM $command

#
# Global options for reports
#
company_name = IBM
license_num = 11
tester_name = IBM
test_site = Austin, TX
test_date = Nov-2004

#
# 64-way Squadron-H
#
hw_avail = Nov-2004
hw_vendor = IBM Corporation
hw_model = IBM eServer p5 595 (1900 MHz, 64 CPU)
hw_cpu = POWER5
hw_cpu_mhz = 1900
hw_fpu = Integrated
hw_ncpu = 64 cores, 32 chips, 2 cores/chip (SMT on)
hw_ncpuorder = 16,24,32,40,48,56,64
hw_pcache = 64KBI+32KBD (on chip)/core
hw_scache = 1920KB unified (on chip)/chip
hw_tcache = 144MB unified (off-chip)/MCM, 8 MCM/SUT
hw_ocache = None
hw_memory = 256 GB DDR2
hw_disk = 3x36GB SCSI, 15K RPM
hw_other = None
# Alternatives tried for the hw_parallel field; only the last line is active.
# hw_parallel = No
# hw_parallel = SMT
hw_parallel = No

sw_avail = Dec-2004
# sw_parallel is intentionally present but empty.
sw_parallel =
sw_os = AIX 5L V5.3
sw_compiler0 = XL C/C++ Enterprise Edition V7.0 for AIX
sw_compiler1 = XL Fortran Enterprise Edition V9.1 for AIX
sw_compiler2 = Other Software: ESSL for AIX V4.2
sw_file = AIX/JFS2
sw_state = Multi-user

# Rate run with 128 concurrent copies.
users = 128
rate = 1

#
# Global options for runspec
#
runlist = fp
action = validate
iterations = 3
output_format = asc,config,pdf
ignore_errors = 0
reportable = 1
mean_anyway = 1
size = ref
tune = base,peak
ext = SqH.Pub.040907
env_vars = 1
deletework = 0

#
#
# FP "base" optimization flags.
# Base tuning for all floating-point benchmarks: two-pass profile-directed
# feedback (-qpdf1 / -qpdf2) at -O5, with cleanpdf run before the first pass.
fp=base=default=default:
fdo_pre0 = /usr/vacpp/bin/cleanpdf
PASS1_FFLAGS = -qpdf1 -O5 -blpdata -lmass
PASS1_LDFFLAGS = -qpdf1 -O5 -blpdata -lmass
PASS2_FFLAGS = -qpdf2 -O5 -blpdata -lmass
PASS2_LDFFLAGS = -qpdf2 -O5 -blpdata -lmass
# The C flags no longer carry -lmass; the earlier variants are kept for reference.
# PASS1_CFLAGS = -qpdf1 -O5 -blpdata -lmass -qalign=natural
PASS1_CFLAGS = -qpdf1 -O5 -blpdata -qalign=natural
PASS1_LDCFLAGS = -qpdf1 -O5 -blpdata -qalign=natural
# PASS2_CFLAGS = -qpdf2 -O5 -blpdata -lmass -qalign=natural
PASS2_CFLAGS = -qpdf2 -O5 -blpdata -qalign=natural
PASS2_LDCFLAGS = -qpdf2 -O5 -blpdata -qalign=natural

#
# Portability flags.
#
# If there aren't any flags for the benchmark, we leave an
# empty entry as a placeholder.
#
168.wupwise=default=default=default:
EXTRA_FFLAGS = -qfixed

171.swim=default=default=default:
EXTRA_FFLAGS = -qfixed

172.mgrid=default=default=default:
EXTRA_FFLAGS = -qfixed

173.applu=default=default=default:
EXTRA_FFLAGS = -qfixed

177.mesa=default=default=default:

178.galgel=default=default=default:
EXTRA_FFLAGS = -qfixed -qsuffix=f=f90

179.art=default=default=default:

183.equake=default=default=default:

187.facerec=default=default=default:
EXTRA_FFLAGS = -qsuffix=f=f90

188.ammp=default=default=default:

189.lucas=default=default=default:
EXTRA_FFLAGS = -qsuffix=f=f90

191.fma3d=default=default=default:
EXTRA_FFLAGS = -qsuffix=f=f90

200.sixtrack=default=default=default:
EXTRA_FFLAGS = -qfixed

301.apsi=default=default=default:
EXTRA_FFLAGS = -qfixed

# Report notes describing the portability and base flags set above.
# Keep these in step with the sections they summarize.
fp=default=default=default:
notes1000= Portability Flags:
notes1010= -qfixed used in: 168.wupwise, 171.swim, 172.mgrid, 173.applu,
notes1020= 178.galgel, 200.sixtrack, 301.apsi
notes1030= -qsuffix=f=f90 used in: 178.galgel, 187.facerec, 189.lucas, 191.fma3d
notes1040=
notes1050=
notes1060= Base Optimization Flags:
notes1070= C: -qpdf1/pdf2
notes1075= -O5 -blpdata -qalign=natural
notes1080= Fortran: -qpdf1/pdf2
notes1085= -O5 -blpdata -lmass
notes1090=

# Peak tuning, one section per benchmark.
168.wupwise=peak=default=default:
F77OPTIMIZE = -O5 -qarch=pwr3 -qtune=pwr3 -blpdata -lmass
EXTRA_F77FLAGS = -qfixed
# F77OPTIMIZE=-O5
# basepeak=1: the peak result for this benchmark reuses the base build.
171.swim=peak=default=default:
# F77 = $(FXLF)
basepeak=1

172.mgrid=peak=default=default:
EXTRA_F77FLAGS = -qfixed
fdo_pre0 = /usr/vacpp/bin/cleanpdf
PASS1_F77FLAGS = -qpdf1 -O5 -blpdata -lmass
PASS1_LDF77FLAGS = -qpdf1 -O5 -blpdata -lmass
PASS2_F77FLAGS = -qpdf2 -O5 -blpdata -lmass
PASS2_LDF77FLAGS = -qpdf2 -O5 -blpdata -lmass

173.applu=peak=default=default:
users = 64
F77 = $(FXLF)
F77OPTIMIZE = -O5 -blpdata -lmass
# F77OPTIMIZE = -O5 -qarch=pwr3 -qtune=pwr3 -blpdata -lmass

177.mesa=peak=default=default:
fdo_pre0 = /usr/vacpp/bin/cleanpdf
PASS1_CFLAGS = -qpdf1 -O5 -blpdata -lmass -qalign=natural
PASS1_LDCFLAGS = -qpdf1 -O5 -blpdata -lmass -qalign=natural
PASS2_CFLAGS = -qpdf2 -O5 -blpdata -lmass -qalign=natural
PASS2_LDCFLAGS = -qpdf2 -O5 -blpdata -lmass -qalign=natural

178.galgel=peak=default=default:
basepeak=1
# FOPTIMIZE = -O5 -blpdata -qessl -lessl

179.art=peak=default=default:
fdo_pre0 = /usr/vacpp/bin/cleanpdf
PASS1_CFLAGS = -qpdf1 -O5 -blpdata -lmass -qalign=natural
PASS1_LDCFLAGS = -qpdf1 -O5 -blpdata -lmass -qalign=natural
PASS2_CFLAGS = -qpdf2 -O5 -blpdata -lmass -qalign=natural
PASS2_LDCFLAGS = -qpdf2 -O5 -blpdata -lmass -qalign=natural

183.equake=peak=default=default:
fdo_pre0 = /usr/vacpp/bin/cleanpdf
PASS1_CFLAGS = -qpdf1 -O5 -blpdata -lmass -qalign=natural
PASS1_LDCFLAGS = -qpdf1 -O5 -blpdata -lmass -qalign=natural
PASS2_CFLAGS = -qpdf2 -O5 -blpdata -lmass -qalign=natural
PASS2_LDCFLAGS = -qpdf2 -O5 -blpdata -lmass -qalign=natural

187.facerec=peak=default=default:
basepeak=1

188.ammp=peak=default=default:
fdo_pre0 = /usr/vacpp/bin/cleanpdf
PASS1_CFLAGS = -qpdf1 -O5 -blpdata -qalign=natural -D_ILS_MACROS
PASS1_LDCFLAGS = -qpdf1 -O5 -blpdata -qalign=natural -D_ILS_MACROS
PASS2_CFLAGS = -qpdf2 -O5 -blpdata -qalign=natural -D_ILS_MACROS
PASS2_LDCFLAGS = -qpdf2 -O5 -blpdata -qalign=natural -D_ILS_MACROS

189.lucas=peak=default=default:
users = 64
FOPTIMIZE = -O5 -blpdata -lmass

191.fma3d=peak=default=default:
# NOTE(review): every other section uses /usr/vacpp/bin/cleanpdf; confirm
# that the /usr/vac/bin path here is intentional.
fdo_pre0 = /usr/vac/bin/cleanpdf
PASS1_FFLAGS = -qpdf1 -O5 -blpdata -qalign=natural -qhot=arraypad -Q
PASS1_LDFFLAGS = -qpdf1 -O5 -blpdata -qalign=natural -qhot=arraypad -Q
PASS2_FFLAGS = -qpdf2 -O5 -blpdata -qalign=natural -qhot=arraypad -Q
PASS2_LDFFLAGS = -qpdf2 -O5 -blpdata -qalign=natural -qhot=arraypad -Q

# Built with -qfdpr, then post-processed: fdo_run1 runs fdpr on the executable
# and fdo_post1 copies the resulting .fdpr file over the original executable.
200.sixtrack=peak=default=default:
EXTRA_F77FLAGS = -qfixed
F77OPTIMIZE = -O3 -qhot -qarch=pwr5 -qtune=pwr5 -qfdpr
fdo_run1 = fdpr -quiet -R3 -p $commandexe -x $command
fdo_post1 = cp ${baseexe}.fdpr $baseexe

301.apsi=peak=default=default:
EXTRA_F77FLAGS = -qfixed
F77OPTIMIZE = -O5 -lmass -qessl -lessl -blpdata -qsave

#
#
# Notes: summary of the peak flags set in the sections above.
# Keep each entry in step with its benchmark's peak section.
#
fp=default=default=default:
notes2000= Peak Optimization Flags:
notes2010= 168.wupwise: -O5 -qarch=pwr3 -qtune=pwr3 -blpdata -lmass
notes2020= 171.swim: basepeak=1
notes2040= 172.mgrid: -qpdf1/pdf2
notes2045= -O5 -blpdata -lmass
notes2050= 173.applu: -O5 -blpdata -lmass
notes2055= F77=xlf
notes2060= 177.mesa: -qpdf1/pdf2
notes2065= -O5 -blpdata -lmass -qalign=natural
notes2080= 178.galgel: basepeak=1
notes2090= 179.art: -qpdf1/pdf2
notes2095= -O5 -blpdata -lmass -qalign=natural
notes2100= 183.equake: -qpdf1/pdf2
notes2110= -O5 -blpdata -lmass -qalign=natural
notes2120= 187.facerec: basepeak=1
notes2150= 188.ammp: -qpdf1/pdf2
notes2160= -O5 -blpdata -qalign=natural -D_ILS_MACROS
notes2170= 189.lucas: -O5 -blpdata -lmass
notes2180= 191.fma3d: -qpdf1/pdf2
notes2190= -O5 -blpdata -qalign=natural -qhot=arraypad -Q
notes2200= 200.sixtrack: -O3 -qhot -qarch=pwr5 -qtune=pwr5 -qfdpr
notes2210= fdpr -R3
notes2220= 301.apsi: -O5 -lmass -qessl -lessl -blpdata -qsave
notes2300=
notes2310=
notes2320= MCM: Acronym for "Multi-Chip Module"
notes2330= SUT: Acronym for "System Under Test"
notes2340=
notes2350= C: IBM XL C for AIX invoked as xlc
notes2360= Fortran 90: IBM XL Fortran for AIX invoked as xlf90
notes2370=
notes2380= ulimits set to unlimited.
# Report notes recording the system tuning commands; one notes key per line
# so that each becomes its own line in the report.
notes2390= Large page mode and memory affinity were set as follows:
notes2400= vmo -r -o lgpg_regions=8192 -o lgpg_size=16777216 -o memory_affinity=1
notes2410= chuser capabilities=CAP_BYPASS_RAC_VMM,CAP_PROPAGATE $USER
notes2420= shutdown -r
notes2430= export MEMORY_AFFINITY=MCM
notes2440=