# Invocation command line:
# /cpu2000/bin/runspec -a validate -c pathscale-2.4-v0.cfg -r -u 8 -T all all
############################################################################
# pathscale-amd64.cfg
#
# Copyright 2003, 2004, 2005, 2006 PathScale, Inc. All Rights Reserved.
#
# Configuration file for use with the PathScale compiler on x86-64
#
# Layout: one "key = value" setting per line; "#" starts a comment line.
# Several keys are assigned more than once (before the SUT.inc inclusion,
# inside it, and again after it). The assignments that follow the inclusion
# are evidently meant to replace the included values.
# NOTE(review): this relies on the later assignment taking effect -- confirm
# against the runspec config-file documentation.

# ---- Global run options ----
check_md5 = 1
ext=ps_amd64
teeout=yes
teerunout=yes
mean_anyway=yes
reportable=1

################################################################
# Machine-specific section
################################################################
#include: SUT.inc
# ---- Begin inclusion of '/cpu2000/config/SUT.inc'
################################################################
# Machine-specific section
################################################################

# Hardware description of the system under test.
hw_cpu = AMD Opteron 8214
hw_cpu_mhz = 2200
hw_disk = SAS, 72GB 15K RPM
hw_fpu = Integrated
hw_memory = 16x2GB, PC2-5300
hw_vendor = IBM
# NOTE(review): hw_model names "Opteron (TM) 2214" while hw_cpu above says
# "Opteron 8214" -- confirm which designation is correct.
hw_model = IBM System X 3755 (AMD Opteron (TM) 2214)
hw_avail = Oct-2006
# The core count has to equal chips x cores/chip (4 x 2 = 8); the invocation
# line at the top of this file also runs 8 users (-u 8).
# NOTE(review): confirm the chip count against the tested machine.
hw_ncpu = 8 cores, 4 chips, 2 cores/chip
hw_ncpuorder = 1,2,3,4
hw_ocache = N/A
hw_other = None
hw_parallel = No
hw_pcache = 64KBI + 64KBD on chip
hw_scache = 1024KB (I+D) on chip
hw_tcache = N/A

# Software description and tester identification as set by SUT.inc.
sw_file = Linux/reiserfs
sw_os = SuSE Linux 9.0 SP3 SLES 64 bit Kernel 2.6.5-7.244-smp
sw_state = Multi-user, run level 3
license_num = 11
sw_compiler = PathScale EKO Compiler Suite, Release 2.4
sw_avail = Apr-2005
test_date = May-2005
prepared_by = Matt Eckl
company_name = IBM Corporation
tester_name = IBM Corporation
VENDOR = IBM Corporation

# Run options as set by SUT.inc (these repeat keys assigned near the top).
output_format = asc
backup_config = NO
teeout = YES
teerunout = YES
feedback = YES
check_md5 = YES
notes99900=
# ---- End inclusion of '/cpu2000/config/SUT.inc'

# Assignments placed after the inclusion; each repeats a key (or, for
# sw_compiler010/020, adds numbered variants of a key) that SUT.inc set.
license_num = 2323
sw_compiler010 = PathScale EKOPath(TM) Compiler
sw_compiler020 = Suite, Release 2.4
sw_avail = Mar-2006
test_date = Mar-2006
prepared_by = PathScale, Inc.
company_name = PathScale, Inc.
tester_name = PathScale, Inc.
# ==============================================================
# Compiler selection (applies to every benchmark and tuning)
# ==============================================================
default=default=default=default:
# Directory referenced as $(ACML_PSC64_DIR) by link settings.
ACML_PSC64_DIR = /opt/acml3.0.0/pathscale64/lib
CC=pathcc
FC=pathf95
F77=pathf95
CXX=pathCC

# --------------------------------------------------------------
# Initial Notes
# --------------------------------------------------------------
# notes018 defines the "+FDO" shorthand used by the notes lines below.
notes016 =
notes018 = +FDO: PASS1= -fb_create fbdata PASS2= -fb_opt fbdata

# --------------------------------------------------------------
# Final Notes
# --------------------------------------------------------------
default=default=default=default:
notes5000 =

# ==============================================================
# SPECint Tuning & Notes
# ==============================================================

# Specify feedback-directed optimization for all SPECint runs:
# pass 1 writes profile data to "fbdata", pass 2 reads it back.
int=default=default=default:
PASS1_CFLAGS = -fb_create fbdata
PASS1_CXXFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata

# Baseline optimization for the integer suite, followed by the notes text
# that reports the baseline and portability flags.
int=base=default=default:
COPTIMIZE = -Ofast
CXXOPTIMIZE = -Ofast
notes021 =
notes022 = Baseline optimization flags:
notes023 = C programs: -Ofast +FDO
notes024 = C++ programs: -Ofast +FDO
notes100 =
notes101 = Portability Flags:
notes106 = 186.crafty: -DLINUX_i386
notes107 = 252.eon: -DHAS_ERRLIST
notes108 = 253.perlbmk: -DSPEC_CPU2000_LINUX_I386 -DSPEC_CPU2000_NEED_BOOL
notes109 = -DSPEC_CPU2000_GLIBC22 -DSPEC_CPU2000_LP64
notes112 = 254.gap: -DSYS_IS_USG -DSYS_HAS_IOCTL_PROTO -DSYS_HAS_TIME_PROTO
notes113 = -DSYS_HAS_CALLOC_PROTO -DSPEC_CPU2000_LP64
notes116 = 255.vortex: -DSPEC_CPU2000_LP64

# ==============================================================
# SPECint Portability flags
# ==============================================================
186.crafty=default=default=default:
CPORTABILITY = -DLINUX_i386

252.eon=default=default=default:
CXXPORTABILITY = -DHAS_ERRLIST

# NOTE(review): notes109 above lists -DSPEC_CPU2000_GLIBC22 for 253.perlbmk,
# but that define is not present in the CPORTABILITY value here -- confirm
# which of the two is correct.
253.perlbmk=default=default=default:
CPORTABILITY = -DSPEC_CPU2000_LINUX_I386 -DSPEC_CPU2000_NEED_BOOL -DSPEC_CPU2000_LP64

254.gap=default=default=default:
CPORTABILITY = -DSYS_IS_USG -DSYS_HAS_IOCTL_PROTO -DSYS_HAS_TIME_PROTO -DSYS_HAS_CALLOC_PROTO -DSPEC_CPU2000_LP64

255.vortex=default=default=default:
CPORTABILITY= -DSPEC_CPU2000_LP64
notes120 =
notes125 = Peak Tuning:

# ==============================================================
# SPECint peak tuning
# Each section sets the peak flags for one benchmark; the notes
# line(s) after it repeat those flags for the report.
# ==============================================================
164.gzip=peak=default=default:
OPTIMIZE = -O3 -ipa -WOPT:val=0 -OPT:unroll_size=0
notes205= 164.gzip: -O3 -ipa -WOPT:val=0 -OPT:unroll_size=0 +FDO

175.vpr=peak=default=default:
OPTIMIZE = -O3 -ipa -m32
notes208= 175.vpr: -O3 -ipa -m32 +FDO

176.gcc=peak=default=default:
OPTIMIZE = -O3 -IPA:plimit=10000 -LNO:opt=0 -OPT:goto=off
notes212= 176.gcc: -O3 -IPA:plimit=10000 -LNO:opt=0 -OPT:goto=off +FDO

181.mcf=peak=default=default:
OPTIMIZE = -O3 -ipa -IPA:field_reorder=on -m32
notes214= 181.mcf: -O3 -ipa -IPA:field_reorder=on -m32 +FDO

186.crafty=peak=default=default:
OPTIMIZE = -Ofast -CG:local_fwd_sched=on -LNO:opt=0 -WOPT:val=0
notes217= 186.crafty: -Ofast -CG:local_fwd_sched=on -LNO:opt=0 -WOPT:val=0 +FDO

197.parser=peak=default=default:
OPTIMIZE = -O3 -ipa -m32 -IPA:ctype=on
notes220= 197.parser: -O3 -ipa -m32 -IPA:ctype=on +FDO

252.eon=peak=default=default:
OPTIMIZE = -Ofast -CG:gcm=off:p2align_freq=1:prefetch=off -IPA:plimit=4000 -OPT:treeheight=on -TENV:X=4:frame_pointer=off -fno-exceptions -LNO:fu=10:full_unroll_outer=on -GRA:optimize_boundary=on
notes223= 252.eon: -Ofast -CG:gcm=off:p2align_freq=1:prefetch=off -IPA:plimit=4000
notes224= -OPT:treeheight=on -TENV:X=4:frame_pointer=off -fno-exceptions
notes225= -LNO:fu=10:full_unroll_outer=on -GRA:optimize_boundary=on +FDO

253.perlbmk=peak=default=default:
OPTIMIZE = -O2 -ipa -OPT:Ofast:transform_to_memlib=off -fno-math-errno -IPA:plimit=10000
notes227= 253.perlbmk: -O2 -ipa -OPT:Ofast:transform_to_memlib=off
notes228= -fno-math-errno -IPA:plimit=10000 +FDO

254.gap=peak=default=default:
basepeak = true
notes230= 254.gap: basepeak = true

255.vortex=peak=default=default:
OPTIMIZE = -Ofast -OPT:goto=off -CG:p2align=on -GRA:optimize_boundary=on -IPA:min_hotness=120
notes233= 255.vortex: -Ofast -OPT:goto=off -CG:p2align=on
notes234= -GRA:optimize_boundary=on -IPA:min_hotness=120 +FDO

256.bzip2=peak=default=default:
basepeak = true
notes240= 256.bzip2: basepeak = true

300.twolf=peak=default=default:
OPTIMIZE = -O2 -CG:gcm=off:p2align_freq=100000 -OPT:Ofast:unroll_times_max=8:unroll_size=256:alias=disjoint -WOPT:mem_opnds=on -m32
notes245= 300.twolf: -O2 -CG:gcm=off:p2align_freq=100000
notes246= -OPT:Ofast:unroll_times_max=8:unroll_size=256:alias=disjoint
notes247= -WOPT:mem_opnds=on -m32 +FDO

# ==============================================================
# SPECfp Tuning
# ==============================================================

# Specify feedback-directed optimization for all SPECfp codes, together
# with the default C / Fortran optimization flags for the suite.
fp=default=default=default:
COPTIMIZE = -Ofast -WOPT:mem_opnds=on
PASS1_CFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
FOPTIMIZE = -Ofast -LNO:fusion=2 -OPT:fast_complex=on
F77OPTIMIZE = -Ofast -LNO:fusion=2 -OPT:fast_complex=on
PASS1_FFLAGS = -fb_create fbdata
PASS2_FFLAGS = -fb_opt fbdata
PASS1_F77FLAGS = -fb_create fbdata
PASS2_F77FLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata
# Report text: the "+ACML" shorthand, then baseline and portability flags.
notes020 = +ACML means -L/pathscale64/lib -lacml,
notes021 = which causes linking with AMD Core Math Library V3.0.0
notes028 =
notes030 = Baseline optimization
notes032 = C programs: -Ofast -WOPT:mem_opnds=on +FDO
notes034 = Fortran programs: -Ofast -LNO:fusion=2 -OPT:fast_complex=on +FDO
notes101 = Portability Flags:
notes102 = 178.galgel: -fixedform

178.galgel=default=default=default:
FPORTABILITY=-fixedform
notes150 =
notes155 =Peak Tuning:

# ---- SPECfp peak tuning ----
# "feedback = 0" appears in this section, and its notes carry no "+FDO".
168.wupwise=peak=default=default:
F77OPTIMIZE = -Ofast -IPA:linear=on -LNO:prefetch_ahead=5:prefetch=3 -OPT:unroll_times_max=8:unroll_size=128:IEEE_NaN_Inf=off:ro=3
feedback = 0
notes204= 168.wupwise: -Ofast -IPA:linear=on -LNO:prefetch_ahead=5:prefetch=3
notes205= -OPT:unroll_times_max=8:unroll_size=128:IEEE_NaN_Inf=off:ro=3
# ==============================================================
# SPECfp peak tuning, 171.swim through 301.apsi
# Each section sets the peak flags for one benchmark; the notes
# line(s) after it repeat those flags for the report. Sections
# that set "feedback = 0" have notes without the "+FDO" suffix.
# ==============================================================
171.swim=peak=default=default:
F77OPTIMIZE = -Ofast -CG:local_fwd_sched=on -LNO:fusion=2 -m3dnow
feedback = 0
notes210= 171.swim: -Ofast -CG:local_fwd_sched=on -LNO:fusion=2 -m3dnow

172.mgrid=peak=default=default:
F77OPTIMIZE = -Ofast -CG:gcm=off -OPT:IEEE_arith=3:unroll_size=200 -LNO:fusion=2:fission=1:blocking=off:prefetch_ahead=2 -WOPT:mem_opnds=on:aggstr=0
feedback = 0
notes215= 172.mgrid: -Ofast -CG:gcm=off -OPT:IEEE_arith=3:unroll_size=200
notes216= -LNO:fusion=2:fission=1:blocking=off:prefetch_ahead=2
notes217= -WOPT:mem_opnds=on:aggstr=0

173.applu=peak=default=default:
F77OPTIMIZE = -Ofast -CG:local_fwd_sched=on -OPT:ro=3 -TENV:X=3 -LNO:fusion=2:fission=2:full_unroll_size=10000
notes220= 173.applu: -Ofast -CG:local_fwd_sched=on -OPT:ro=3 -TENV:X=3
notes221= -LNO:fusion=2:fission=2:full_unroll_size=10000 +FDO

177.mesa=peak=default=default:
COPTIMIZE = -O2 -ipa -OPT:Ofast -fno-math-errno -CG:local_fwd_sched=on -WOPT:mem_opnds=on
notes225= 177.mesa: -O2 -ipa -OPT:Ofast -fno-math-errno -CG:local_fwd_sched=on -WOPT:mem_opnds=on +FDO

# NOTE(review): notes230 advertises "+ACML" and notes232 advertises
# RM_SOURCES=lapak.f90, yet the RM_SOURCES and EXTRA_LIBS settings below are
# commented out, so neither is applied by this section as written. Confirm
# whether the settings should be re-enabled or the notes corrected.
178.galgel=peak=default=default:
FOPTIMIZE = -Ofast -OPT:fast_complex=on
#RM_SOURCES = lapak.f90
#EXTRA_LIBS = -L$(ACML_PSC64_DIR) -lacml
notes230= 178.galgel: -Ofast -OPT:fast_complex=on +ACML +FDO
notes232= RM_SOURCES=lapak.f90

179.art=peak=default=default:
COPTIMIZE= -O3 -OPT:Ofast -fno-math-errno -mno-sse2 -m32
feedback = 0
notes235= 179.art: -O3 -OPT:Ofast -fno-math-errno -mno-sse2 -m32

183.equake=peak=default=default:
COPTIMIZE = -Ofast -CG:load_exe=2 -WOPT:mem_opnds=on -m32
notes240= 183.equake: -Ofast -CG:load_exe=2 -WOPT:mem_opnds=on -m32 +FDO

187.facerec=peak=default=default:
FOPTIMIZE = -Ofast -IPA:plimit=1500 -LNO:fusion=2 -OPT:IEEE_NaN_Inf=off:ro=3:unroll_size=0
notes245= 187.facerec: -Ofast -IPA:plimit=1500 -LNO:fusion=2
notes246= -OPT:IEEE_NaN_Inf=off:ro=3:unroll_size=0 +FDO

188.ammp=peak=default=default:
COPTIMIZE = -O3 -OPT:alias=disjoint:unroll_times_max=8:Ofast:ro=3 -GRA:optimize_boundary=on -fno-math-errno -TENV:X=4
notes250= 188.ammp: -O3 -OPT:alias=disjoint:unroll_times_max=8:Ofast:ro=3
notes251= -GRA:optimize_boundary=on -fno-math-errno -TENV:X=4 +FDO

189.lucas=peak=default=default:
FOPTIMIZE = -Ofast -OPT:ro=3:fast_nint=off:unroll_size=256 -WOPT:mem_opnds=on
notes255= 189.lucas: -Ofast -OPT:ro=3:fast_nint=off:unroll_size=256 -WOPT:mem_opnds=on +FDO

191.fma3d=peak=default=default:
FOPTIMIZE = -O2 -ipa -CG:load_exe=1 -OPT:Ofast:IEEE_arith=3:ro=3 -WOPT:mem_opnds=on:retype_expr=on -IPA:pu_reorder=1
notes260= 191.fma3d: -O2 -ipa -CG:load_exe=1 -OPT:Ofast:IEEE_arith=3:ro=3
notes261= -WOPT:mem_opnds=on:retype_expr=on -IPA:pu_reorder=1 +FDO

200.sixtrack=peak=default=default:
F77OPTIMIZE = -O3 -OPT:Ofast:early_intrinsics=on -fno-math-errno -CG:load_exe=1
notes265= 200.sixtrack: -O3 -OPT:Ofast:early_intrinsics=on
notes266= -fno-math-errno -CG:load_exe=1 +FDO

301.apsi=peak=default=default:
F77OPTIMIZE = -Ofast -CG:load_exe=0 -LNO:prefetch=0:simd=2
feedback=0
notes270= 301.apsi: -Ofast -CG:load_exe=0 -LNO:prefetch=0:simd=2