# Invocation command line:
# /cpu2006/bin/runspec -c amd0905is.cfg --define NCPUS=6 --rate 24 -T all fp --nopreenv --note-preenv
# output_root was not used for this run
############################################################################
# AMD SPEC CPU2006 V1.1 Configuration File for 64-bit Linux (Hex-Core)
#
# CPU2006 Version 1.1
# Compiler name/version:       PGI 8.0, Open64 4.2.2
# Operating system version:    64-bit Linux
# Hardware:                    AMD Opteron (Istanbul)
# FP Base Pointer Size:        64-bit only
# FP Peak Pointer Size:        32/64-bit
# INT Base Pointer Size:       32/64-bit
# INT Peak Pointer Size:       32/64-bit
# Auto Parallelization:        Yes
#
# Important! Please run with your stack size set to 'unlimited'.
# Failure to do so may cause 483.xalancbmk to get a stack overflow during
# execution.
#     Using csh:  unlimit
#     Using bash: ulimit -s unlimited
#
# Your LD_LIBRARY_PATH must be set to the location of the dependent
# runtime libraries. (Though this should be taken care of by the
# preENV_LD_LIBRARY_PATH found in the AMD0905is-sut.inc file.)
#
# If building new binaries, please adjust the SMARTHEAP_DIR variable to
# the directory containing the Smartheap library.
#
#####################################################################
# Macro section
####################################################################
# Modify this section to use the appropriate architecture flags
# This should be shanghai-xx for either Shanghai or Istanbul systems
%define pgi_tp64 -tp shanghai-64
%define pgi_tp32 -tp shanghai-32

# Adjust the build jobs to the number of concurrent build processes.
# This macro feeds both makeflags (-j) and the PGI -Mipa=jobs: option.
%define build_jobs 4

#####################################################################
# Header Section
#####################################################################
ext = amd0905is
ignore_errors = no
tune = base,peak
output_format = asc,flags
flagsurl000 = http://www.spec.org/cpu2006/flags/pgi80_linux_flags.20090710.xml $[top]/x86-open64-422-flags.xml \
    $[top]/amd-platform.xml
size = test,train,ref
check_md5 = yes
reportable = yes
env_vars = no
teeout = yes
mean_anyway = yes
makeflags = -j %{build_jobs}

####################################################################
# Include file containing the SUT hardware information
# as well as the submit command, tester information and notes
####################################################################
#include: AMD0905is-sut.inc
# ----- Begin inclusion of 'AMD0905is-sut.inc'
############################################################################
#####################################################################
# Paths
#####################################################################
# Set location of run time libraries for runs.
preENV_LD_LIBRARY_PATH = $[top]/amd0905is-libs/64:$[top]/amd0905is-libs/32

# Set this path to your SmartHeap Library for builds.
SMARTHEAP_DIR = /root/work/libraries/SmartHeap-8.1/lib

#####################################################################
# Machine Specific Settings
#####################################################################
# How many sockets does your test system have?
%define num_sockets 4
# How many cores per socket does your system have (Istanbul = 6)
%define num_cores_per_socket 6
# What is vm/nr_hugepages set to in /etc/sysctl.conf?
# Recommended settings with 4x4GB DIMMs/socket: 1P: 2700, 2P: 5400, 4P: 10800
%define num_system_huge_pages 10800

# If --define NCPUS is set on the fp runspec command, use that setting.
# This setting tells PGI autopar binaries how many cores to parallelize
# across.
%ifdef %{NCPUS}
preENV_NCPUS=%{NCPUS}
%endif

# Huge pages per copy var for Open64
preENV_HUGETLB_LIMIT = 450
# Huge pages per copy var for PGI
preENV_PGI_HUGE_PAGES = 450

# Run the sync command after setup
post_setup=sync

#####################################################################
# Submit Section
#####################################################################
# This config file is set to run these binaries on up to a 4P, 24
# core system. If this does not match the description of your
# system, change this config file, specifically match the socket the
# memory is bound (-m) to the physical cpu number. Use "man numactl"
# and "numactl --hardware" to better understand how to use this
# command.
# Each copy first writes its benchmark command to run.sh (submit0); the one
# submitN line whose SPECCOPYNUM test matches then runs run.sh under numactl,
# bound to a single memory node (-m) and a single physical CPU.
# Copies 0-5 use node 0, 6-11 node 1, 12-17 node 2, 18-23 node 3.
submit0 = echo "$command" > run.sh
submit1 = if `test $SPECCOPYNUM -eq 0 `; then numactl -m 0 --physcpubind=0 sh run.sh; fi
submit2 = if `test $SPECCOPYNUM -eq 1 `; then numactl -m 0 --physcpubind=4 sh run.sh; fi
submit3 = if `test $SPECCOPYNUM -eq 2 `; then numactl -m 0 --physcpubind=8 sh run.sh; fi
submit4 = if `test $SPECCOPYNUM -eq 3 `; then numactl -m 0 --physcpubind=12 sh run.sh; fi
submit5 = if `test $SPECCOPYNUM -eq 4 `; then numactl -m 0 --physcpubind=16 sh run.sh; fi
submit6 = if `test $SPECCOPYNUM -eq 5 `; then numactl -m 0 --physcpubind=20 sh run.sh; fi
submit7 = if `test $SPECCOPYNUM -eq 6 `; then numactl -m 1 --physcpubind=1 sh run.sh; fi
submit8 = if `test $SPECCOPYNUM -eq 7 `; then numactl -m 1 --physcpubind=5 sh run.sh; fi
submit9 = if `test $SPECCOPYNUM -eq 8 `; then numactl -m 1 --physcpubind=9 sh run.sh; fi
submit10 = if `test $SPECCOPYNUM -eq 9 `; then numactl -m 1 --physcpubind=13 sh run.sh; fi
submit11 = if `test $SPECCOPYNUM -eq 10 `; then numactl -m 1 --physcpubind=17 sh run.sh; fi
submit12 = if `test $SPECCOPYNUM -eq 11 `; then numactl -m 1 --physcpubind=21 sh run.sh; fi
submit13 = if `test $SPECCOPYNUM -eq 12 `; then numactl -m 2 --physcpubind=2 sh run.sh; fi
submit14 = if `test $SPECCOPYNUM -eq 13 `; then numactl -m 2 --physcpubind=6 sh run.sh; fi
submit15 = if `test $SPECCOPYNUM -eq 14 `; then numactl -m 2 --physcpubind=10 sh run.sh; fi
submit16 = if `test $SPECCOPYNUM -eq 15 `; then numactl -m 2 --physcpubind=14 sh run.sh; fi
submit17 = if `test $SPECCOPYNUM -eq 16 `; then numactl -m 2 --physcpubind=18 sh run.sh; fi
submit18 = if `test $SPECCOPYNUM -eq 17 `; then numactl -m 2 --physcpubind=22 sh run.sh; fi
submit19 = if `test $SPECCOPYNUM -eq 18 `; then numactl -m 3 --physcpubind=3 sh run.sh; fi
submit20 = if `test $SPECCOPYNUM -eq 19 `; then numactl -m 3 --physcpubind=7 sh run.sh; fi
submit21 = if `test $SPECCOPYNUM -eq 20 `; then numactl -m 3 --physcpubind=11 sh run.sh; fi
submit22 = if `test $SPECCOPYNUM -eq 21 `; then numactl -m 3 --physcpubind=15 sh run.sh; fi
submit23 = if `test $SPECCOPYNUM -eq 22 `; then numactl -m 3 --physcpubind=19 sh run.sh; fi
submit24 = if `test $SPECCOPYNUM -eq 23 `; then numactl -m 3 --physcpubind=23 sh run.sh; fi

# SPEED
# For a speed run, the submit1 command above will be used.
use_submit_for_speed = 1

####################################################################
# Tester information
####################################################################
license_num = 11
prepared_by = IBM Corporation
tester = IBM Corporation
test_sponsor = IBM Corporation
hw_vendor = IBM Corporation
hw_model = IBM BladeCenter LS42 (AMD Opteron 8435)

####################################################################
# Hardware information
####################################################################
default=default=default=default:
hw_avail = Sep-2009
hw_cpu_name = AMD Opteron 8435
hw_cpu_mhz = 2600
hw_fpu = Integrated
hw_nchips = 4
hw_ncores = 24
hw_ncoresperchip = 6
hw_nthreadspercore = 1
hw_ncpuorder = 1,2,3,4 chips
hw_pcache = 64 KB I + 64 KB D on chip per core
hw_scache = 512 KB I+D on chip per core
hw_tcache = 6 MB I+D on chip per chip
hw_ocache = None
hw_disk = 1 x 73 GB SAS, 10000 RPM
hw_memory = 64 GB (16 x 4 GB, PC2-6400 ECC)
hw_other = None
sw_file = ext3
#sw_os000 = SuSE Linux Enterprise Server 10 (x86_64)
#sw_os001 = SP2, Kernel 2.6.16.60-0.21-smp
sw_os000 = Red Hat Enterprise Linux Server release 5.3,
sw_os001 = Kernel 2.6.18-128.el5 on an x86_64
sw_state = Run level 3 (Full multiuser with network)

#####################################################################
# Notes
#####################################################################
notes_030 =The x86 Open64 Compiler Suite is only available from (and supported by) AMD at
notes_035 =http://developer.amd.com/cpu/open64.
notes_submit_000 ='numactl' was used to bind copies to the cores.
notes_submit_005 =See the configuration file for details.
notes_os_000 ='ulimit -s unlimited' was used to set environment stack size
notes_os_005 ='ulimit -l 2097152' was used to set environment locked pages in memory limit
notes_os_010 =
notes_os_015 =Set vm/nr_hugepages=10800 in /etc/sysctl.conf
notes_os_020 =mount -t hugetlbfs nodev /mnt/hugepages
notes_os_025 =
notes_os_030 =Processor Performance States Disabled in BIOS
notes_os_035 =Memory ChipKill Disabled in BIOS
# Uncomment this if you used this for a speed run.
# NOTE(review): notes_os_025 is already defined above as an empty line;
# remove or renumber one of them before uncommenting to avoid a duplicate key.
#notes_os_025 =powersave -f was used to set the CPU frequency to its maximum.
# ---- End inclusion of '/cpu2006/config/AMD0905is-sut.inc'

############################ Software Info ############################
fp=default=default=default:
sw_base_ptrsize = 64-bit
sw_peak_ptrsize = 32/64-bit
sw_avail = Apr-2009
sw_compiler000 = PGI Server Complete Version 8.0
sw_compiler001 = x86 Open64 4.2.2 Compiler Suite (from AMD)
sw_other = binutils 2.18

int=default=default=default:
sw_base_ptrsize = 32/64-bit
sw_peak_ptrsize = 32/64-bit
sw_avail = Apr-2009
sw_compiler1 = PGI Server Complete Version 8.0
sw_compiler2 = x86 Open64 4.2.2 Compiler Suite (from AMD)
sw_other1 = binutils 2.18
sw_other2 = SmartHeap 8.1 32-bit Library for Linux

default=default=default=default:
#####################################################################
# Base compiler selection
#####################################################################
# INT base is built with Open64, FP base with PGI.
int=base=default=default:
CC = opencc -march=barcelona
CXX = openCC -march=barcelona
FC = openf95 -march=barcelona

fp=base=default=default:
CC = pgcc
CXX = pgcpp
FC = pgf95

#####################################################################
# Portability
#####################################################################
# Set for all base and peak benchmarks unless changed below
default=default=default=default:
PORTABILITY = -DSPEC_CPU_LP64

#####################################################################
# Int Base Portability (Open64)
#####################################################################
400.perlbench=base=default=default:
CPORTABILITY = -DSPEC_CPU_LINUX_X64

462.libquantum=base=default=default:
CPORTABILITY= -DSPEC_CPU_LINUX

471.omnetpp=base=default=default:
# Needed to avoid -DSPEC_CPU_LP64 on -m32 C++ base codes
PORTABILITY =

473.astar=base=default=default:
# Needed to avoid -DSPEC_CPU_LP64 on -m32 C++ base codes
PORTABILITY =

483.xalancbmk=base=default=default:
CXXPORTABILITY= -DSPEC_CPU_LINUX
# Needed to avoid -DSPEC_CPU_LP64 on -m32 C++ base codes
PORTABILITY =

#####################################################################
# INT Base Flags (Open64)
#####################################################################
int=base=default=default:
COPTIMIZE = -Ofast -CG:local_sched_alg=1 -HP:bdt=2m:heap=2m
CXXOPTIMIZE = -Ofast -m32 -INLINE:aggressive=on
EXTRA_CXXLIBS = -L$(SMARTHEAP_DIR) -lsmartheap

#####################################################################
# FP Base Portability (PGI)
#####################################################################
435.gromacs=base=default=default:
LDPORTABILITY = -Mnomain

436.cactusADM=base=default=default:
LDPORTABILITY = -Mnomain

454.calculix=base=default=default:
LDPORTABILITY = -Mnomain

481.wrf=base=default=default:
CPORTABILITY = -DSPEC_CPU_CASE_FLAG -DSPEC_CPU_LINUX

#####################################################################
# FP Base Flags (PGI)
#####################################################################
fp=base=default=default:
COPTIMIZE = -fastsse -Msmartalloc=huge -Mfprelaxed -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
FOPTIMIZE = -fastsse -Msmartalloc=huge -Mfprelaxed -Mvect=short -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
CXXOPTIMIZE = -fastsse -Msmartalloc=huge -Mfprelaxed --zc_eh -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
EXTRA_LDFLAGS = -Bstatic_pgi

#####################################################################
# INT Peak Portability
#####################################################################
# Open64
400.perlbench=peak=default=default:
CPORTABILITY = -DSPEC_CPU_LINUX_X64

# Open64
403.gcc=peak=default=default:
PORTABILITY =

# Open64
429.mcf=peak=default=default:
PORTABILITY =

# Open64
462.libquantum=peak=default=default:
CPORTABILITY = -DSPEC_CPU_LINUX

# Open64
471.omnetpp=peak=default=default:
# Needed to avoid -DSPEC_CPU_LP64 on -m32 C++ peak codes
PORTABILITY =

# PGI
473.astar=peak=default=default:
PORTABILITY =

# Open64
483.xalancbmk=peak=default=default:
CXXPORTABILITY = -DSPEC_CPU_LINUX
# Needed to avoid -DSPEC_CPU_LP64 on -m32 C++ peak codes
PORTABILITY =

#####################################################################
# INT Peak Flags
#####################################################################
# The Open64 sections below use two-pass feedback: PASS1 flags write
# profile data to "fbdata" (-fb_create), PASS2 flags consume it (-fb_opt).

# Open64
400.perlbench=peak=default=default:
CC = opencc -march=barcelona
COPTIMIZE = -Ofast -IPA:plimit=20000 -LNO:opt=0 -OPT:unroll_times_max=8:unroll_size=256:unroll_level=2:keep_ext=on -WOPT:if_conv=0 -CG:local_sched_alg=1:unroll_fb_req=on -HP:bdt=2m:heap=2m
PASS1_CFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata

# Open64
401.bzip2=peak=default=default:
CC = opencc -march=barcelona
COPTIMIZE = -O3 -OPT:alias=disjoint:unroll_size=0 -OPT:Ofast:goto=off -INLINE:aggressive=on -CG:local_sched_alg=1 -m3dnow -HP:bdt=2m:heap=2m
PASS1_CFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata

# Open64
403.gcc=peak=default=default:
CC = opencc -march=barcelona
COPTIMIZE = -Ofast -LNO:trip_count=256:prefetch_ahead=10 -CG:cmp_peep=on -m32 -HP:bdt=2m:heap=2m -GRA:unspill=on
PASS1_CFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata

# Open64
429.mcf=peak=default=default:
CC = opencc -march=barcelona
COPTIMIZE = -O3 -ipa -INLINE:aggressive=on -CG:gcm=off -GRA:prioritize_by_density=on -m32 -HP:bdt=2m:heap=2m
PASS1_CFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
feedback = 0

# Open64
445.gobmk=peak=default=default:
CC = opencc -march=barcelona
COPTIMIZE = -O3 -OPT:alias=restrict:unroll_times_max=8:unroll_size=256:unroll_level=2:keep_ext=on -ipa -IPA:plimit=750:min_hotness=300:pu_reorder=1 -LNO:prefetch=1:ignore_feedback=off -CG:p2align=on:unroll_fb_req=on -HP:bdt=2m:heap=2m
PASS1_CFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata

# PGI
456.hmmer=peak=default=default:
CC = pgcc
COPTIMIZE = -fastsse -Mvect=partial -Munroll=n:8 -Msmartalloc=huge -Msafeptr -Mprefetch=t0 -Mfprelaxed -Mipa=jobs:%{build_jobs},const,ptr,arg,inline %{pgi_tp64}
EXTRA_LDFLAGS = -Bstatic_pgi
feedback = 0
basepeak = 0

# Open64
458.sjeng=peak=default=default:
CC = opencc -march=barcelona
COPTIMIZE = -O3 -ipa -LNO:ignore_feedback=off:full_unroll=10:fusion=0:fission=2 -IPA:pu_reorder=2 -CG:ptr_load_use=0 -OPT:unroll_times_max=8 -INLINE:aggressive=on -HP:bdt=2m:heap=2m
PASS1_CFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata

# Open64
462.libquantum=peak=default=default:
CC = opencc -march=barcelona
COPTIMIZE = -Ofast -LNO:pf2=0 -CG:gcm=off:use_prefetchnta=on:cmp_peep=on -WOPT:aggstr=0 -HP:bdt=2m:heap=2m -OPT:alias=disjoint -INLINE:aggressive=on -IPA:space=1000:plimit=20000
feedback=0
PASS1_CFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata

# Open64
464.h264ref=peak=default=default:
CC = opencc -march=barcelona
COPTIMIZE = -O3 -IPA:plimit=20000 -OPT:alias=disjoint -LNO:prefetch=0 -CG:ptr_load_use=0:push_pop_int_saved_regs=off -HP:bdt=2m:heap=2m
PASS1_CFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata

# Open64
471.omnetpp=peak=default=default:
CXX = openCC -march=barcelona
CXXOPTIMIZE = -Ofast -CG:gcm=off -INLINE:aggressive=on -OPT:alias=disjoint -WOPT:if_conv=0 -m32
EXTRA_CXXLIBS = -L$(SMARTHEAP_DIR) -lsmartheap
PASS1_CXXFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
feedback = 0

# PGI
473.astar=peak=default=default:
CXX = pgcpp
CXXOPTIMIZE = -fastsse -O4 -Msmartalloc=huge -Msafeptr=global -Mfprelaxed --zc_eh %{pgi_tp32}
EXTRA_LDFLAGS = -Bstatic_pgi
PASS1_CXXFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CXXFLAGS = -Mpfo -Mipa=jobs:%{build_jobs},fast,inline:6
PASS2_LDFLAGS = -Mpfo -Mipa=jobs:%{build_jobs},fast,inline:6
feedback = 1
basepeak = 0

# Open64
483.xalancbmk=peak=default=default:
CXX = openCC -march=barcelona
CXXOPTIMIZE = -Ofast -INLINE:aggressive=on -m32 -CG:cmp_peep=on -GRA:unspill=on -TENV:frame_pointer=off
EXTRA_CXXLIBS = -L$(SMARTHEAP_DIR) -lsmartheap
PASS1_CXXFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
feedback = 0

#####################################################################
# FP Peak Portability
#####################################################################
# PGI
436.cactusADM=peak=default=default:
LDPORTABILITY = -Mnomain

# Open64
447.dealII=peak=default=default:
PORTABILITY =

# Open64
450.soplex=peak=default=default:
PORTABILITY =

# PGI
454.calculix=peak=default=default:
LDPORTABILITY = -Mnomain

# PGI
481.wrf=peak=default=default:
CPORTABILITY = -DSPEC_CPU_CASE_FLAG -DSPEC_CPU_LINUX

#####################################################################
# FP Peak Flags
#####################################################################
# PGI
410.bwaves=peak=default=default:
FC = pgf95
FOPTIMIZE = -fastsse -Msmartalloc -Mprefetch=nta -Mfprelaxed -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
EXTRA_LDFLAGS = -Bstatic_pgi
feedback = 0
basepeak = 0

# Open64
416.gamess=peak=default=default:
FC = openf95 -march=barcelona
FOPTIMIZE = -O2 -OPT:Ofast:ro=3:unroll_size=256 -HP:bdt=2m:heap=2m
PASS1_FFLAGS = -fb_create fbdata
PASS2_FFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata

# PGI
433.milc=peak=default=default:
CC = pgcc
EXTRA_LDFLAGS = -Bstatic_pgi
feedback = 0
basepeak = 1

# PGI
434.zeusmp=peak=default=default:
FC = pgf95
FOPTIMIZE = -fastsse -Mfprelaxed -Mprefetch=distance:8,t0 -Msmartalloc=huge,hugebss -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
EXTRA_LDFLAGS = -Bstatic_pgi
feedback = 0
basepeak = 0

# Open64
435.gromacs=peak=default=default:
CC = opencc -march=barcelona
FC = openf95 -march=barcelona
FOPTIMIZE = -Ofast -OPT:rsqrt=2 -HP:bdt=2m:heap=2m
COPTIMIZE = $(FOPTIMIZE)
PASS1_FFLAGS = -fb_create fbdata
PASS2_FFLAGS = -fb_opt fbdata
PASS1_CFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata
feedback = 0

# PGI
# 436.cactusADM is built with -Mconcur (auto-parallel), so this section
# overrides the copy count and the submit commands: each copy is bound to
# a set of cores rather than to a single core.
436.cactusADM=peak=default=default:
CC = pgcc
FC = pgf95
COPTIMIZE = -fastsse -Mconcur -Msmartalloc=huge -Mfprelaxed -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
FOPTIMIZE = -fastsse -Mconcur -Mfprelaxed -Msmartalloc=huge -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
EXTRA_LDFLAGS = -Bstatic_pgi
%if '%{NCPUS}' eq '6' && '%{num_sockets}' gt '1'
# 2P or 4P rate run uses submits below
copies = %{num_sockets}
%endif
# 2P speed run
%if '%{NCPUS}' eq '12'
copies = 1
CPULIST=0,1,2,3,4,5,6,7,8,9,10,11
%endif
# 4P speed run
%if '%{NCPUS}' eq '24'
copies = 1
CPULIST=0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23
%endif
# 1P runs (same for speed or rate)
%if '%{NCPUS}' eq '6' && '%{num_sockets}' eq '1'
copies = 1
CPULIST=0,1,2,3,4,5
%endif
submit0 = echo "$command" > run.sh
# Adjust submit1 based on number of copies: a single copy is bound to the
# whole CPULIST; otherwise copy N is bound to memory node N and its six cores.
submit1 = if `test $copies -eq 1 `; then numactl --physcpubind=$CPULIST sh run.sh \
    else if `test $SPECCOPYNUM -eq 0 `; then numactl -m 0 --physcpubind=0,4,8,12,16,20 sh run.sh; fi; fi
submit2 = if `test $SPECCOPYNUM -eq 1 `; then numactl -m 1 --physcpubind=1,5,9,13,17,21 sh run.sh; fi
submit3 = if `test $SPECCOPYNUM -eq 2 `; then numactl -m 2 --physcpubind=2,6,10,14,18,22 sh run.sh; fi
submit4 = if `test $SPECCOPYNUM -eq 3 `; then numactl -m 3 --physcpubind=3,7,11,15,19,23 sh run.sh; fi
feedback = 0
basepeak = 0

# PGI
437.leslie3d=peak=default=default:
FC = pgf95
FOPTIMIZE = -fastsse -Mvect=fuse -Msmartalloc=huge -Mprefetch=distance:8,t0 -Mfprelaxed %{pgi_tp64}
EXTRA_LDFLAGS = -Bstatic_pgi
PASS1_FFLAGS = -Mpfi=indirect
PASS1_LDFLAGS = -Mpfi=indirect
PASS2_FFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
PASS2_LDFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
feedback = 1
basepeak = 0

# PGI
444.namd=peak=default=default:
CXX = pgcpp
CXXOPTIMIZE = -fastsse -Munroll=n:4,m:8 -Msmartalloc=huge -Mnodepchk -Mfprelaxed --zc_eh %{pgi_tp64}
EXTRA_LDFLAGS = -Bstatic_pgi
PASS1_CXXFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CXXFLAGS = -Mpfo -Mipa=jobs:%{build_jobs},fast,inline
PASS2_LDFLAGS = -Mpfo -Mipa=jobs:%{build_jobs},fast,inline
feedback = 1
basepeak = 0

# Open64
447.dealII=peak=default=default:
CXX = openCC -march=barcelona
CXXOPTIMIZE = -Ofast -static -INLINE:aggressive=on -LNO:opt=0 -Wf,-fno-exceptions -m32 -OPT:unroll_times_max=8:unroll_size=256:unroll_level=2 -HP:bdt=2m:heap=2m -GRA:unspill=on -CG:cmp_peep=on -TENV:frame_pointer=off
PASS1_CXXFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata
feedback = 0

# Open64
450.soplex=peak=default=default:
CXX = openCC -march=barcelona
CXXOPTIMIZE = -O3 -INLINE:aggressive=on -OPT:IEEE_arith=3:IEEE_NaN_Inf=off:fold_unsigned_relops=on:malloc_alg=1 -CG:load_exe=0 -fno-exceptions -m32 -HP:bdt=2m
PASS1_CXXFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata

# Open64
453.povray=peak=default=default:
CXX = openCC -march=barcelona
CXXOPTIMIZE = -Ofast -INLINE:aggressive=on -HP:bdt=2m:heap=2m
PASS1_CXXFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata

# PGI
454.calculix=peak=default=default:
CC = pgcc
FC = pgf95
FOPTIMIZE = -fastsse -Mvect=short -Msmartalloc=huge -Mprefetch=t0 -Mpre -Mfprelaxed %{pgi_tp64}
COPTIMIZE = -fastsse -Mvect=short -Msmartalloc=huge -Mprefetch=t0 -Mpre -Mfprelaxed %{pgi_tp64}
EXTRA_LDFLAGS = -Bstatic_pgi
PASS1_FFLAGS = -Mpfi=indirect
PASS1_CFLAGS = -Mpfi=indirect
PASS1_LDFLAGS = -Mpfi=indirect
PASS2_FFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
PASS2_CFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
PASS2_LDFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
feedback = 1
basepeak = 0

# Open64
459.GemsFDTD=peak=default=default:
FC = openf95 -march=barcelona
FOPTIMIZE = -Ofast -LNO:fission=2:simd=2:prefetch_ahead=1 -CG:load_exe=0 -HP
PASS1_FFLAGS = -fb_create fbdata
PASS2_FFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata
feedback = 0

# Open64
465.tonto=peak=default=default:
FC = openf95 -march=barcelona
FOPTIMIZE = -Ofast -OPT:alias=no_f90_pointer_alias -LNO:blocking=off -CG:load_exe=1 -IPA:plimit=525 -HP
PASS1_FFLAGS = -fb_create fbdata
PASS2_FFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata
feedback = 0

# PGI
470.lbm=peak=default=default:
CC = pgcc
COPTIMIZE = -fastsse -Msmartalloc=huge -Mprefetch=t0 -Mloop32 -Mfprelaxed -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
EXTRA_LDFLAGS = -Bstatic_pgi
feedback = 0
basepeak = 0

# PGI
481.wrf=peak=default=default:
CC = pgcc
FC = pgf95
FOPTIMIZE = -fastsse -Mvect=noaltcode -Msmartalloc=huge -Mprefetch=distance:8 -Mfprelaxed %{pgi_tp64}
COPTIMIZE = -fastsse -Mvect=noaltcode -Msmartalloc=huge -Mprefetch=distance:8 -Mfprelaxed %{pgi_tp64}
EXTRA_LDFLAGS = -Bstatic_pgi
feedback = 0
basepeak = 0

# PGI
482.sphinx3=peak=default=default:
CC = pgcc
COPTIMIZE = -fastsse -Mfprelaxed -Msmartalloc %{pgi_tp64}
EXTRA_LDFLAGS = -Bstatic_pgi
PASS1_CFLAGS = -Mpfi=indirect
PASS1_LDFLAGS = -Mpfi=indirect
PASS2_CFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
PASS2_LDFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
feedback = 1
basepeak = 0

# The following section was added automatically, and contains settings that
# did not appear in the original configuration file, but were added to the
# raw file after the run.
default:
flagsurl001 = http://www.spec.org/cpu2006/flags/x86-open64-4.2.2-flags-revA.20090710.xml
flagsurl002 = http://www.spec.org/cpu2006/flags/amd-platform.20090728.xml
notes_000 =Environment variables set by runspec before the start of the run:
notes_005 =HUGETLB_LIMIT = "450"
notes_010 =LD_LIBRARY_PATH = "/cpu2006/amd0905is-libs/64:/cpu2006/amd0905is-libs/32"
notes_015 =NCPUS = "6"
notes_020 =PGI_HUGE_PAGES = "450"
notes_025 =