# Invocation command line:
# /benchmarks/cpu2000_1.2/bin/runspec -c Sep1-fp-retune -s -r -u 2 fp
############################################################################
# Invocation command line:
# /benchmarks/cpu2000_1.2/bin/runspec --config=config.1360.b --reportable fp
############################################################################
#####################################################################
# SUT/Experimenter Section
# If it affects performance, you need to describe it, either
# in the pre-defined fields or by adding it to the notes section.

# System Description - edit as needed
hw_avail = Aug-2002
hw_model = AlphaServer ES45 68/1250
machine_name = AlphaServer ES45 68/1250
hw_memory = 16GB
hw_disk = 9 GB SCSI
hw_other = None
hw_vendor = Compaq Computer Corporation
company_name = Compaq Computer Corporation

# CPU description - edit as needed
# Note ncpu = number enabled; ncpuorder = valid numbers of CPUs
# to order for this model
hw_cpu = Alpha 21264C
hw_cpu_mhz = 1250
hw_fpu = Integrated
hw_ncpu = 1
hw_ncpuorder = 1 to 4
hw_parallel = No
hw_pcache = 64KB(I)+64KB(D) on chip
hw_scache = 16MB off chip per CPU
hw_tcache = None
hw_ocache = None

# Tester description - edit the date, put your name here. Notice that
# "tester_name" is the company, but as it says in the documentation,
# "prepared_by" can be personal:
#
# prepared_by Is never output. If you wish, you could set this to
# your own name, so that the rawfile will be tagged with
# your name but not the formal reports.
test_date = Jul-2002
license_num = 2
prepared_by = Paula Smith
tester_name = HP NH

# Operating system, file system - edit at least the OS version
sw_os = Compaq Tru64 UNIX T5.1B-6 (Rev. 2510)
sw_file = ufs
sw_state = Multi-user

# Special notes
# If you have notes to add, put them here, starting with number 900.
#
#sw_os2 = +Patch Kit 2
#notes900 =
#notes901 = Information on UNIX V5.1 Patches can be found at
#notes902 = http://ftp1.service.digital.com/public/unix/v5.1/
#notes903 =

# OS Date
# Use the "sw_avail" line here only if the OS you are testing ships
# later than the compilers (and then comment out their availability
# dates, below!) Notice that the field "sw_avail" occurs multiple
# times in this file, but only one should be used on a given run:
#
# - the OS date (if later than the compilers), or
# - the last compiler date (may be different for FP vs. Int)
sw_avail = Oct-2002

# With luck, you shouldn't have to edit below this point
# (unless you are installing new compilers or re-tuning)
# End of SUT/Experimenter section
######################################################################

#SC#submit= echo "$command" > dobmk; prun -n 1 sh dobmk
#SC#command_add_redirect=1
#GS#submit = runon $SPECUSERNUM $command
#GS#notes906 = submit = runon $command

######################################################################
# The special "un-named" section of the config file. Must appear
# before any instances of "default="
ext = aug30A
output_format = asc
#reportable = 1
teeout = no
teerunout = yes
tune = all

######################################################################
# Compiler selection - See "OS Date" above! Remember, it's the
# LAST compiler in a set whose date should be listed. Remember that
# C is used on both suites. Remember KAP dates. Remember to include
# KAP C if "kcc" is ever used (it's probably not the default, so won't
# be listed here under "CC", but should be listed as a sw_compiler if it
# is used anywhere else in the file).
default=default=default=default:
sw_compiler = Compaq C V6.5-011-48C5K
sw_compiler2 = Spike V5.2 (506 48C5K)
#sw_avail = Oct-2001
CC = cc -v

int=default=default=default:
sw_compiler4 = Compaq C++ V6.5-028
CXX = cxx -v

fp=default=default=default:
sw_compiler4 = Compaq Fortran V5.5-1877-48BBF
sw_compiler5 = Compaq Fortran 77 V5.5-1877-48BBF
sw_compiler6 = KAP Fortran V4.4 k340504 20010517
sw_compiler7 = KAP Fortran 77 V4.1 k310440 980926
sw_compiler8 = KAP C V4.2 k010737S 010515
FC = f90 -v

# Notice that in the compiler selection above, we always ask for -v,
# verbose mode. SPEC has said that it would prefer that notes sections
# NOT document the use of "-v". OK, I've dropped it from the notes
# sections, but it's here in the config file and plain to see for anyone
# who really cares. The effect of -v is simply to cause the driver to use
# verbose mode, but it has no effect on the generated executable.

#########################################################################
#
# Feedback description. When using feedback for individual benchmarks,
# do it strictly as described here, so that this comment remains correct.
# (Unfortunately, there is no convenient macro mechanism to enforce this
# automatically, so just do it.)
#
# The PASS2_CFLAGS value quoted in notes716 must match the PASS2_CFLAGS
# settings used by the benchmark sections of this file
# (-prof_use_feedback -prof_dir <dir>).

default=default=default=default:
notes700 =
notes701 = Most benchmarks are built using one or more types of
notes702 = profile-driven feedback. The types used are designated
notes703 = by abbreviations in the notes:
notes704 =
notes705 = +CFB: Code generation is optimized by the compiler, using
notes706 = feedback from a training run. These commands are
notes707 = done before the first compile (in phase "fdo_pre0"):
notes708 =
notes710 = mkdir /tmp/pp
notes711 = rm -f /tmp/pp/${baseexe}*
notes712 =
notes713 = and these flags are added to the first and second compiles:
notes714 =
notes715 = PASS1_CFLAGS = -prof_gen_noopt -prof_dir /tmp/pp
notes716 = PASS2_CFLAGS = -prof_use_feedback -prof_dir /tmp/pp
notes717 =
notes718 = (Peak builds use /tmp/pp above; base builds use /tmp/pb.)
notes719 =
notes720 = +IFB: Icache usage is improved by the post-link-time optimizer
notes721 = Spike, using feedback from a training run. These commands
notes722 = are used (in phase "fdo_postN"):
notes723 =
notes724 = mv ${baseexe} oldexe
notes725 = spike oldexe -feedback oldexe -o ${baseexe}
notes726 =
notes727 = +PFB: Prefetches are improved by the post-link-time optimizer
notes728 = Spike, using feedback from a training run. These
notes729 = commands are used (in phase "fdo_post_makeN"):
notes730 =
notes731 = rm -f *Counts*
notes732 = mv ${baseexe} oldexe
notes733 = pixie -stats dstride oldexe 1>pixie.out 2>pixie.err
notes734 = mv oldexe.pixie ${baseexe}
notes735 =
notes736 = A training run is carried out (in phase "fdo_runN"), and
notes737 = then this command (in phase "fdo_postN"):
notes738 =
notes739 = spike oldexe -fb oldexe -stride_prefetch -o ${baseexe}
notes740 =
notes741 = When Spike is used for both Icache and Prefetch improvements,
notes742 = only one spike command is actually issued, with the Icache
notes743 = options followed by the Prefetch options.
notes744 =
# NOTE(review): notes750-765 list "vm:" and "proc:" parameter values with no
# introductory sentence; presumably these are kernel tunables of the system
# under test - confirm and consider adding a one-line lead-in note.
notes750 = vm:
notes751 = vm_bigpg_enabled = 1
notes752 = vm_bigpg_thresh=16
notes753 = vm_swap_eager = 0
notes754 =
notes755 = proc:
notes756 = max_per_proc_address_space = 0x40000000000
notes757 = max_per_proc_data_size = 0x40000000000
notes758 = max_per_proc_stack_size = 0x40000000000
notes759 = max_proc_per_user = 2048
notes760 = max_threads_per_user = 0
notes761 = maxusers = 16384
notes762 = per_proc_address_space = 0x40000000000
notes763 = per_proc_data_size = 0x40000000000
notes764 = per_proc_stack_size = 0x40000000000
notes765 =

#######################################################################
# Integer Baseline Optimization
# notes0xx are used for baseline tuning description

int=base=default=default:
notes000 = Baseline C : cc -arch ev6 -fast +CFB ONESTEP
notes001 = C++: cxx -arch ev6 -O2 ONESTEP
OPTIMIZE = -v -arch ev6
COPTIMIZE = -fast
CXXOPTIMIZE = -O2
ONESTEP = yes
# Compiler feedback (+CFB) for base builds uses the /tmp/pb profile directory.
fdo_pre0 = mkdir /tmp/pb; rm -f /tmp/pb/${baseexe}*
PASS1_CFLAGS = -prof_gen_noopt -prof_dir /tmp/pb
PASS2_CFLAGS = -prof_use_feedback -prof_dir /tmp/pb

252.eon=base=default=default:
# Turn feedback off for eon
fdo_pre0 =

#######################################################################
# Integer Peak
# notes10x are used for peak tuning description, followed by the
# actual benchmark numbers (e.g. notes253 and (if needed) notes253_1
# for perlbmk)

int=peak=default=default:
notes100 =
notes101 = Peak:
notes102 = All but 252.eon: cc -g3 -arch ev6 ONESTEP
OPTIMIZE = -v -g3 -arch ev6
ONESTEP = yes
# GEM Feedback - turn off in individual benchmark if not needed.
# Peak compiler-feedback (+CFB) defaults; peak builds use the /tmp/pp
# profile directory.
fdo_pre0 = mkdir /tmp/pp; rm -f /tmp/pp/${baseexe}*
PASS1_CFLAGS = -prof_gen_noopt -prof_dir /tmp/pp
PASS2_CFLAGS = -prof_use_feedback -prof_dir /tmp/pp

164.gzip=peak=default=default:
notes164 = 164.gzip: -fast -O4 -non_shared +CFB
COPTIMIZE = -fast -O4 -non_shared
feedback = 1

175.vpr=peak=default=default:
notes175 = 175.vpr: -fast -O4 -assume restricted_pointers +CFB
COPTIMIZE = -fast -O4 -assume restricted_pointers
feedback = 1

176.gcc=peak=default=default:
notes176 = 176.gcc: -fast -O4 -xtaso_short -all -ldensemalloc -none
notes176_1 = +CFB +IFB
COPTIMIZE = -fast -O4 -xtaso_short -all -ldensemalloc -none
feedback = 1
# NOTE(review): the text between this point and the 171.swim section is
# damaged. It contains here-document terminators ("EOT") with no opening
# "<<EOT", repeated fdo_run2/fdo_post2 assignments, and no section headers
# for any other benchmark, so the settings for 176.gcc's +IFB step and
# everything that originally followed it cannot be recovered from this file.
# The surviving fragments are kept below, commented out so they are not
# parsed as settings. Restore this region from the original config - TODO.
#fdo_post2 = <pixie.out 2>pixie.err
#mv oldexe.pixie ${baseexe}
#EOT
#fdo_run2 = $command
#fdo_post2 = <pixie.out 2>pixie.err
#mv oldexe.pixie ${baseexe}
#EOT
#fdo_run2 = $command
#fdo_post2 = <pixie.out 2>pixie.err
#mv oldexe.pixie ${baseexe}
#EOT
#fdo_post1 = spike oldexe -fb oldexe -stride_prefetch -o ${baseexe}

171.swim=peak=default=default:
notes171 = 171.swim: same as base
basepeak = 1
#notes171 = 171.swim: f90 -fast -O5
#F77OPTIMIZE = -fast -O5
#F77 = f90

172.mgrid=peak=default=default:
# notes172* must list every flag in F77OPTIMIZE below (including
# -transform_loops).
notes172 = 172.mgrid: kf90 -call_shared -arch generic -O5 -inline
notes172_1 = manual -nopipeline -transform_loops -unroll 9 -automatic
notes172_2 = -fkapargs='-aggressive=a -fuse -interleave
notes172_3 = -ur=2 -ur3=5 -cachesize=128,16000 ' +PFB
F77OPTIMIZE = -call_shared -arch generic -O5 -inline manual -nopipeline -transform_loops -unroll 9 -automatic -fkapargs='-aggressive=a -fuse -interleave -ur=2 -ur3=5 -cachesize=128,16000 '
F77 = kf90
# +PFB: the here-document body below is reconstructed from the commands
# published in notes731-734 (only its tail survived in this file).
# NOTE(review): confirm against the original config.
fdo_post_make1 = <<EOT
rm -f *Counts*
mv ${baseexe} oldexe
pixie -stats dstride oldexe 1>pixie.out 2>pixie.err
mv oldexe.pixie ${baseexe}
EOT
fdo_post1 = spike oldexe -fb oldexe -stride_prefetch -o ${baseexe}

173.applu=peak=default=default:
notes173 = 173.applu: kf90 -O5 -transform_loops
notes173_1 = -fkapargs=' -o=0 -nointerleave -ur=14
#notes173_2 = -ur2=260 -ur3=18' +CFB+IFB+PFB
notes173_2 = -ur2=260 -ur3=18' +PFB
OPTIMIZE = -O5 -transform_loops -fkapargs=' -o=0 -nointerleave -ur=14 -ur2=260 -ur3=18'
F77 = kf90
# (Continuation of the 173.applu peak section.)
# Disabled +CFB+IFB+PFB variant, kept for reference. The commented
# here-document body is reconstructed from notes731-734.
#feedback = 1
#fdo_pre0 = mkdir /tmp/pp; rm -f /tmp/pp/${baseexe}*
#PASS1_CFLAGS = -prof_gen_noopt -prof_dir /tmp/pp
#PASS2_CFLAGS = -prof_use_feedback -prof_dir /tmp/pp
#fdo_post_make2 = <<EOT
# rm -f *Counts*
# mv ${baseexe} oldexe
# pixie -stats dstride oldexe 1>pixie.out 2>pixie.err
# mv oldexe.pixie ${baseexe}
#EOT
#fdo_run2 = $command
#fdo_post2 = spike oldexe -feedback oldexe -o ${baseexe} -fb oldexe -stride_prefetch
#
# +PFB: every "fdo_post_make* = <<EOT" body in the sections below is
# reconstructed from the commands published in notes731-734, because only
# the tail of each here-document survived in this file.
# NOTE(review): confirm against the original config.
fdo_post_make1 = <<EOT
rm -f *Counts*
mv ${baseexe} oldexe
pixie -stats dstride oldexe 1>pixie.out 2>pixie.err
mv oldexe.pixie ${baseexe}
EOT
fdo_post1 = spike oldexe -fb oldexe -stride_prefetch -o ${baseexe}

177.mesa=peak=default=default:
notes177 = 177.mesa: kcc -fast -O4 +CFB +IFB
COPTIMIZE = -fast -O4
CC = kcc
# NOTE(review): the feedback settings for 177.mesa are damaged. What
# survives is an "fdo_pre0" whose value is the tail of a pixie here-document,
# followed by a +PFB spike command that does not match the "+CFB +IFB" in
# notes177; it looks like text from a following benchmark section was fused
# in. The fragments are kept below, commented out so they are not parsed as
# settings. Restore from the original config - TODO.
#fdo_pre0 = <pixie.out 2>pixie.err
#mv oldexe.pixie ${baseexe}
#EOT
#fdo_post1 = spike oldexe -fb oldexe -stride_prefetch -o ${baseexe}

183.equake=peak=default=default:
notes183 = 183.equake: cc -call_shared -arch generic -fast -O4
notes183_1 = -ldensemalloc -assume restricted_pointers
notes183_2 = -inline speed -unroll 13 -xtaso_short +PFB
COPTIMIZE = -call_shared -arch generic -fast -O4 -ldensemalloc -assume restricted_pointers -inline speed -unroll 13 -xtaso_short
CC = cc
fdo_post_make1 = <<EOT
rm -f *Counts*
mv ${baseexe} oldexe
pixie -stats dstride oldexe 1>pixie.out 2>pixie.err
mv oldexe.pixie ${baseexe}
EOT
fdo_post1 = spike oldexe -fb oldexe -stride_prefetch -o ${baseexe}

187.facerec=peak=default=default:
#notes187 = 187.facerec: f90 -O3 -inline all -speculate all -unroll 3
#notes187_1 = -automatic -assume noaccuracy_sensitive
#notes187_2 = -math_library accurate +IFB +PFB
#FOPTIMIZE = -O3 -inline all -speculate all -unroll 7 -automatic -assume noaccuracy_sensitive -math_library accurate
notes187 = 187.facerec: f90 -O4 -nopipeline -inline all
notes187_1 = -non_shared -speculate all -unroll 7
notes187_2 = -automatic -assume accuracy_sensitive
notes187_3 = -math_library fast +IFB
FOPTIMIZE = -O4 -nopipeline -inline all -non_shared -speculate all -unroll 7 -automatic -assume accuracy_sensitive -math_library fast
FC = f90
#fdo_post_make2 = <<EOT
# rm -f *Counts*
# mv ${baseexe} oldexe
# pixie -stats dstride oldexe 1>pixie.out 2>pixie.err
# mv oldexe.pixie ${baseexe}
#EOT
#fdo_run2 = $command
#fdo_post2 = spike oldexe -feedback oldexe -o ${baseexe} -fb oldexe -stride_prefetch
# +IFB only: save the executable, then let Spike rewrite it.
fdo_post1 = mv ${baseexe} oldexe
fdo_post2 = spike oldexe -feedback oldexe -o ${baseexe}

188.ammp=peak=default=default:
notes188 = 188.ammp: cc -arch host -O4 -ifo -assume nomath_errno
notes188_1 = -assume trusted_short_alignment -fp_reorder
notes188_2 = -readonly_strings -ldensemalloc -xtaso_short
notes188_3 = -assume restricted_pointers -unroll 9
notes188_4 = -inline speed +CFB +IFB +PFB
OPTIMIZE = -arch host -O4 -ifo -assume nomath_errno -assume trusted_short_alignment -fp_reorder -readonly_strings -ldensemalloc -xtaso_short -assume restricted_pointers -unroll 9 -inline speed
CC = cc
feedback = 1
fdo_pre0 = mkdir /tmp/pp; rm -f /tmp/pp/${baseexe}*
PASS1_CFLAGS = -prof_gen_noopt -prof_dir /tmp/pp
PASS2_CFLAGS = -prof_use_feedback -prof_dir /tmp/pp
fdo_post_make2 = <<EOT
rm -f *Counts*
mv ${baseexe} oldexe
pixie -stats dstride oldexe 1>pixie.out 2>pixie.err
mv oldexe.pixie ${baseexe}
EOT
fdo_run2 = $command
# Icache options followed by Prefetch options in a single spike command
# (see notes741-743).
fdo_post2 = spike oldexe -feedback oldexe -o ${baseexe} -fb oldexe -stride_prefetch

189.lucas=peak=default=default:
notes189 = 189.lucas: kf90 -O5 -fkapargs='-ur=1' +PFB
FOPTIMIZE = -O5 -fkapargs='-ur=1'
FC = kf90
fdo_post_make1 = <<EOT
rm -f *Counts*
mv ${baseexe} oldexe
pixie -stats dstride oldexe 1>pixie.out 2>pixie.err
mv oldexe.pixie ${baseexe}
EOT
fdo_post1 = spike oldexe -fb oldexe -stride_prefetch -o ${baseexe}

191.fma3d=peak=default=default:
# notes191* must list every flag in FOPTIMIZE below (including -fkapargs).
notes191 = 191.fma3d: kf90 -O4 -transform_loops
notes191_1 = -fkapargs='-cachesize=128,16000 ' +PFB
FOPTIMIZE = -O4 -transform_loops -fkapargs='-cachesize=128,16000 '
FC = kf90
fdo_post_make1 = <<EOT
rm -f *Counts*
mv ${baseexe} oldexe
pixie -stats dstride oldexe 1>pixie.out 2>pixie.err
mv oldexe.pixie ${baseexe}
EOT
fdo_post1 = spike oldexe -fb oldexe -stride_prefetch -o ${baseexe}

200.sixtrack=peak=default=default:
notes200 = 200.sixtrack: f90 -fast -O5 -assume accuracy_sensitive
notes200_1 = -notransform_loops +PFB
F77OPTIMIZE = -fast -O5 -assume accuracy_sensitive -notransform_loops
F77 = f90
fdo_post_make1 = <<EOT
rm -f *Counts*
mv ${baseexe} oldexe
pixie -stats dstride oldexe 1>pixie.out 2>pixie.err
mv oldexe.pixie ${baseexe}
EOT
fdo_post1 = spike oldexe -fb oldexe -stride_prefetch -o ${baseexe}

301.apsi=peak=default=default:
#notes301 = 301.apsi: kf90 -O5 -inline none -call_shared
#notes301_1 = -speculate by_routine -align commons
#notes301_2 = -fkapargs=' -aggressive=a -tune=ev5 -fuse
#notes301_3 = -ur=21 -ur3=19 -cachesize=128,16000' +IFB
notes301 = 301.apsi: kf90 -O5 -inline none -call_shared -speculate all
notes301_1 = -align commons -fkapargs=' -aggressive=ab
notes301_2 = -tune=ev5 -fuse -ur=1 -ur2=60 -ur3=20
notes301_3 = -cachesize=128,16000'
#F77OPTIMIZE = -O5 -inline none -call_shared -speculate by_routine -align commons -fkapargs=' -aggressive=a -tune=ev5 -fuse -ur=21 -ur3=19 -cachesize=64,8000'
F77OPTIMIZE = -O5 -inline none -call_shared -speculate all -align commons -fkapargs=' -aggressive=ab -tune=ev5 -fuse -ur=1 -ur2=60 -ur3=20 -cachesize=128,16000'
F77 = kf90
#fdo_post1 = mv ${baseexe} oldexe
#fdo_post2 = spike oldexe -feedback oldexe -o ${baseexe}

#######################################################################
# Integer Portability
# notes8xx are used for portability

int=default=default=default:
notes800 =
notes801 = Portability: gcc: -Dalloca=__builtin_alloca; crafty: -DALPHA
notes802 = perlbmk: -DSPEC_CPU2000_DUNIX; vortex: -DSPEC_CPU2000_LP64
notes803 = gap: -DSYS_HAS_CALLOC_PROTO -DSYS_IS_BSD -DSYS_HAS_IOCTL_PROTO
notes804 = -DSPEC_CPU2000_LP64

176.gcc=default=default=default:
EXTRA_CFLAGS = -Dalloca=__builtin_alloca

186.crafty=default=default=default:
EXTRA_CFLAGS = -DALPHA

252.eon=default=default=default:
CXXPORTABILITY = -lm

253.perlbmk=default=default=default:
EXTRA_CFLAGS = -DSPEC_CPU2000_DUNIX

254.gap=default=default=default:
EXTRA_CFLAGS = -DSYS_HAS_CALLOC_PROTO -DSYS_IS_BSD -DSYS_HAS_IOCTL_PROTO -DSPEC_CPU2000_LP64

255.vortex=default=default=default:
EXTRA_CFLAGS = -DSPEC_CPU2000_LP64

#######################################################################
# Floating point Portability
# notes8xx are used for portability

fp=default=default=default:
notes800 =
notes801 = Portability: galgel: -fixed

178.galgel=default=default=default:
EXTRA_FFLAGS = -fixed