# Invocation command line:
# /root/work/cpu2006-amd814gh/bin/runspec -c amd814GH -F amd814GH-flags.xml -r -C 8 -T all int
# output_root was not used for this run
############################################################################
# AMD64 SPEC CPU2006 Serial Configuration File for 64-bit Linux (Quad-Core)
#
# Auto Parallelization: Not Used
#
# Important! Please run with your stack size set to 'unlimited'.
# Failure to do so may cause 483.xalancbmk to get a stack overflow during execution.
# Using csh: unlimit
# Using bash: ulimit -s unlimited
#
# Set your LD_LIBRARY_PATH to the location of the dependency runtime libraries
#
# Please adjust the SHL_DIR variable to the directory containing the Smartheap library.

#####################################################################
# Header Section
#####################################################################
ext = amd814GH
ignore_errors = no
tune = base,peak
output_format = asc,pdf,raw,flags,cfg,html
size = test,train,ref
check_md5 = yes
reportable = yes
mean_anyway = yes
env_vars = no
teeout = yes
teerunout = yes

# Adjust the make jobs flag for the number of cores.
makeflags = -j 4

#####################################################################
# Macro section
#####################################################################
# Modify this section to use the appropriate architecture flags
%define pgi_tp64 -tp barcelona-64
%define pgi_tp32 -tp barcelona

#####################################################################
# Include file containing the SUT hardware information
# as well as the submit command, tester information and notes
#####################################################################
#include: AMDsut.inc
# ----- Begin inclusion of 'AMDsut.inc'
############################################################################

#####################################################################
# Submit Section
#####################################################################
# RATE
# This config file is set to run these binaries on a 2P, 8 core system. If this
# does not match the description of your system, change this config file,
# specifically "bind0","bind1","bind2", etc. to match your system. Use
# "man numactl" and "numactl --hardware" to better understand how to use
# this command.
bind0 = numactl -m 0 --physcpubind=0
bind1 = numactl -m 0 --physcpubind=1
bind2 = numactl -m 0 --physcpubind=2
bind3 = numactl -m 0 --physcpubind=3
bind4 = numactl -m 1 --physcpubind=4
bind5 = numactl -m 1 --physcpubind=5
bind6 = numactl -m 1 --physcpubind=6
bind7 = numactl -m 1 --physcpubind=7

# SPEED
# Below is an example numactl command for a speed run using
# 4 threads on a single Quad-core chip.
# Please adjust as needed for your system
#
# bind0 = numactl -l --physcpubind=0,1,2,3
use_submit_for_speed = 1
submit = echo "$command" > run.sh ; $BIND bash run.sh

#####################################################################
# Tester information
#####################################################################
license_num = 49
prepared_by = AMD Performance Labs
tester = Advanced Micro Devices
test_date = Sep-2007
test_sponsor = Advanced Micro Devices

#####################################################################
# Hardware information
#####################################################################
default=default=default=default:
hw_avail = Dec-2007
hw_cpu_name = AMD Opteron 2356
hw_cpu_mhz = 2300
hw_fpu = Integrated
hw_nchips = 2
hw_ncores = 8
hw_ncoresperchip = 4
hw_nthreadspercore = 1
hw_ncpuorder = 1,2 chips
hw_pcache = 64 KB I + 64 KB D on chip per core
hw_scache = 512 KB I+D on chip per core
hw_tcache = 2 MB I+D on chip per chip
hw_ocache = None
hw_vendor = Supermicro
hw_model = Supermicro H8DMU+, AMD Opteron 2356
hw_disk = 1x400GB SATA, 7200 RPM
hw_memory = 16 GB (8x2GB, DDR2-667 CL5 Reg Dual Rank)
hw_other = None
sw_file = ReiserFS
sw_state = Multi-user, run level 3
sw_os = SuSE Linux Enterprise Server 10 SP1 64-bit kernel

#####################################################################
# Notes
#####################################################################
notes_os_000 = 'ulimit -s unlimited' used to set environment stack size
notes_os_005 = 'ulimit -l 2457600' was used to set environment lock pages quantity
notes_os_010 = 'numactl' was used to bind copies to the cores
notes_os_015 = Set vm/nr_hugepages=1200 in /etc/sysctl.conf
notes_os_020 = mount -t hugetlbfs nodev /mnt/hugepages
notes_os_025 = Environment variable PGI_HUGE_PAGES set to 150
# ---- End inclusion of '/root/work/cpu2006-amd814gh/config/AMDsut.inc'

############################ Software Info ############################
fp=default=default=default:
sw_peak_ptrsize = 32/64-bit
sw_base_ptrsize = 64-bit
sw_auto_parallel = No
sw_avail = Oct-2007
sw_compiler1 = The Portland Group (PGI)
sw_compiler2 = PGI pgf90 7.1-0 Fortran Compiler
sw_compiler3 = PGI pgcc 7.1-0 C Compiler
sw_compiler4 = PGI pgCC 7.1-0 C++ Compiler
sw_compiler5 = The PathScale Compiler v3.0
sw_compiler6 = PathScale pathf95 3.0 Fortran Compiler
sw_compiler7 = PathScale pathcc 3.0 C Compiler
sw_compiler8 = PathScale pathCC 3.0 C++ Compiler

int=default=default=default:
sw_peak_ptrsize = 32/64-bit
sw_base_ptrsize = 32/64-bit
sw_auto_parallel = No
sw_other = SmartHeap 8.0 32-bit Library for Linux
sw_avail = Oct-2007
sw_compiler000 = The Portland Group (PGI)
sw_compiler001 = PGI pgcc 7.1-0 C Compiler
sw_compiler002 = PGI pgCC 7.1-0 C++ Compiler
sw_compiler003 = The PathScale Compiler v3.0
sw_compiler004 = PathScale pathcc 3.0 C Compiler
sw_compiler005 = PathScale pathCC 3.0 C++ Compiler

default=default=default=default:
#####################################################################
# Compiler selection
#
#
CC = pgcc -w
CXX = pgcpp -w
FC = pgf95 -w
SHL_DIR = /cpu2006/work/cpu2006/SmartHeap

#####################################################################
# Optimization
#####################################################################
default=default=default=default:
EXTRA_LDFLAGS = -Bstatic_pgi

fp=base=default=default:
COPTIMIZE = -fast -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:448 %{pgi_tp64}
CXXOPTIMIZE = -fast -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:448 --zc_eh %{pgi_tp64}
FOPTIMIZE = -fast -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:448 %{pgi_tp64}

int=base=default=default:
COPTIMIZE = -fast -Mipa=fast,inline,noarg -Mfprelaxed -Msmartalloc=huge:840 %{pgi_tp64}
CXXOPTIMIZE = -fastsse -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:448 --zc_eh %{pgi_tp32}

#####################################################################
## FP Peak Flags
#####################################################################
fp=peak=default=default:
EXTRA_LIBS =
basepeak = 0

410.bwaves=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
COPTIMIZE = -Ofast
CXXOPTIMIZE = -Ofast
PASS1_CFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS1_CXXFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS1_FFLAGS = -fb_create fbdata
PASS2_FFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata
FOPTIMIZE = -O3 -OPT:Ofast:IEEE_arith=3 -LNO:blocking=off:ignore_feedback=off
feedback = 1
basepeak = 0

416.gamess=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
COPTIMIZE = -Ofast
CXXOPTIMIZE = -Ofast
PASS1_CFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS1_CXXFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS1_FFLAGS = -fb_create fbdata
PASS2_FFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata
FOPTIMIZE = -O2 -OPT:Ofast:ro=3:unroll_size=256
feedback = 1
basepeak = 0

433.milc=peak=default=default:
COPTIMIZE = -fast -O4 -Mdse -Mfprelaxed -Msmartalloc=huge:448 %{pgi_tp64}
PASS1_CFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CFLAGS = -Mipa=fast,inline,noarg -Mpfo
PASS2_LDFLAGS = -Mipa=fast,inline,noarg -Mpfo
feedback = 1
basepeak = 0

434.zeusmp=peak=default=default:
basepeak = 1
feedback = 0

435.gromacs=peak=default=default:
COPTIMIZE = -fast -Mfpapprox=rsqrt -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:448 %{pgi_tp64}
FOPTIMIZE = -fast -Mfpapprox=rsqrt -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:448 %{pgi_tp64}
feedback = 0
basepeak = 0

436.cactusADM=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
CXXOPTIMIZE = -Ofast
PASS1_CFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS1_CXXFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS1_FFLAGS = -fb_create fbdata
PASS2_FFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata
COPTIMIZE = -O3 -LNO:prefetch=3:prefetch_ahead=5:ou_prod_max=10:full_unroll=5 -ipa
FOPTIMIZE = -O3 -LNO:prefetch=3:prefetch_ahead=5:ou_prod_max=10:full_unroll=5 -ipa
feedback = 1
basepeak = 0

437.leslie3d=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
COPTIMIZE = -Ofast
CXXOPTIMIZE = -Ofast
FOPTIMIZE = -Ofast -OPT:malloc_alg=1
feedback = 0
basepeak = 0

444.namd=peak=default=default:
CXXOPTIMIZE = -fast -O4 -Mfprelaxed -Msmartalloc=huge:448 --zc_eh %{pgi_tp64} -Mnodepchk -Mprefetch -Msafe_lastval -Msafeptr=static -Mstride0 -Munroll=n:4 -Mvect=noidiom -Mvect=prefetch
feedback = 0
basepeak = 0

447.dealII=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
COPTIMIZE = -Ofast
FOPTIMIZE = -Ofast -OPT:malloc_alg=1
PASS1_CFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS1_CXXFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS1_FFLAGS = -fb_create fbdata
PASS2_FFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata
PORTABILITY =
CXXOPTIMIZE = -Ofast -static -INLINE:aggressive=on -OPT:malloc_alg=1 -m32 -fno-exceptions
feedback = 0
basepeak = 0

450.soplex=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
COPTIMIZE = -Ofast
FOPTIMIZE = -Ofast -OPT:malloc_alg=1
PASS1_CFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS1_CXXFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS1_FFLAGS = -fb_create fbdata
PASS2_FFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata
CXXOPTIMIZE = -m32 -O3 -OPT:IEEE_arith=3 -CG:load_exe=0:movnti=1 -LNO:minvariant=off:prefetch=1 -fno-exceptions
PORTABILITY =
feedback = 1
basepeak = 0

453.povray=peak=default=default:
feedback = 0
basepeak = 1

454.calculix=peak=default=default:
feedback = 0
basepeak = 1

459.GemsFDTD=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
COPTIMIZE = -Ofast
CXXOPTIMIZE = -Ofast
PASS1_CFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS1_CXXFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS1_FFLAGS = -fb_create fbdata
PASS2_FFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata
FOPTIMIZE = -Ofast -LNO:fission=2:prefetch=0
feedback = 0
basepeak = 0

465.tonto=peak=default=default:
FOPTIMIZE = -fast -O4 -Mfprelaxed -Msmartalloc=huge:448 -Mipa=fast,inline -Mvect=noaltcode %{pgi_tp64}
feedback = 0
basepeak = 0

470.lbm=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
COPTIMIZE = -Ofast
CXXOPTIMIZE = -Ofast
FOPTIMIZE = -Ofast -OPT:malloc_alg=1
feedback = 0
basepeak = 0

481.wrf=peak=default=default:
FOPTIMIZE = -fast -Mfprelaxed -Msmartalloc=huge:448 -Mvect=noaltcode %{pgi_tp64}
COPTIMIZE = -fast -Mfprelaxed -Msmartalloc=huge:448 -Mvect=noaltcode %{pgi_tp64}
feedback = 0
basepeak = 0

482.sphinx3=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
CXXOPTIMIZE = -Ofast
FOPTIMIZE = -Ofast -OPT:malloc_alg=1
PASS1_CFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS1_CXXFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS1_FFLAGS = -fb_create fbdata
PASS2_FFLAGS = -fb_opt fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_LDFLAGS = -fb_opt fbdata
# NOTE(review): COPTIMIZE adds -m32, but unlike the other -m32 peak sections
# in this file (447.dealII, 450.soplex, 403.gcc, 483.xalancbmk) PORTABILITY is
# not cleared here, so the fp-wide -DSPEC_CPU_LP64 presumably still applies.
# Left exactly as run; confirm whether that was intended.
COPTIMIZE = -O3 -OPT:Ofast -WOPT:aggstr=0 -m32
feedback = 1
basepeak = 0

#####################################################################
## INT Peak Flags
#####################################################################
int=peak=default=default:
EXTRA_LIBS =
basepeak = 1

400.perlbench=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
COPTIMIZE = -Ofast -LNO:opt=0
CXXOPTIMIZE = -Ofast -m32
EXTRA_CXXLIBS = -L$(SHL_DIR) -lsmartheap
PASS1_CFLAGS = -fb_create fbdata
PASS1_CXXFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
feedback = 1
basepeak = 0

401.bzip2=peak=default=default:
COPTIMIZE = -fast -O4 -Msmartalloc=huge:448 %{pgi_tp64}
PASS1_CFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CFLAGS = -Mpfo
PASS2_LDFLAGS = -Mpfo
feedback = 1
basepeak = 0

403.gcc=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
CXXOPTIMIZE = -Ofast -m32
EXTRA_CXXLIBS = -L$(SHL_DIR) -lsmartheap
PASS1_CFLAGS = -fb_create fbdata
PASS1_CXXFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
PORTABILITY =
CPORTABILITY =
COPTIMIZE = -m32 -O3 -OPT:Ofast
feedback = 1
basepeak = 0

429.mcf=peak=default=default:
COPTIMIZE = -fastsse -Mipa=fast,inline:1 -Msmartalloc=huge:420 %{pgi_tp32}
feedback = 0
basepeak = 0

445.gobmk=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
PORTABILITY = -DSPEC_CPU_LP64
CXXOPTIMIZE = -Ofast -m32
EXTRA_CXXLIBS = -L$(SHL_DIR) -lsmartheap
PASS1_CFLAGS = -fb_create fbdata
PASS1_CXXFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
COPTIMIZE = -O3 -OPT:alias=disjoint -LNO:simd=0:minvariant=off -WOPT:retype_expr=on
feedback = 1
basepeak = 0

456.hmmer=peak=default=default:
COPTIMIZE = -fast -Msmartalloc=huge:448 -Mfprelaxed -Msafeptr -Mipa=const,ptr,arg %{pgi_tp64}
feedback = 0
basepeak = 0

458.sjeng=peak=default=default:
COPTIMIZE = -fast -Msmartalloc=huge:448 -Mfprelaxed %{pgi_tp64}
PASS1_CFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CFLAGS = -Mipa=fast,inline:1,noarg -Mpfo
PASS2_LDFLAGS = -Mipa=fast,inline:1,noarg -Mpfo
feedback = 1
basepeak = 0

462.libquantum=peak=default=default:
# NOTE(review): every other PGI peak section in this file ends COPTIMIZE with
# a %{pgi_tp64} or %{pgi_tp32} macro; this one carries neither. Left exactly
# as run; confirm whether the omission was deliberate.
COPTIMIZE = -fast -Mfprelaxed -Msmartalloc=huge:448 -Munroll=m:4 -Mipa=fast,inline,noarg
feedback = 0
basepeak = 0

464.h264ref=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
COPTIMIZE = -O3 -IPA:plimit=20000 -OPT:alias=disjoint -LNO:prefetch=0
CXXOPTIMIZE = -Ofast -m32
EXTRA_CXXLIBS = -L$(SHL_DIR) -lsmartheap
PASS1_CFLAGS = -fb_create fbdata
PASS1_CXXFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
feedback = 1
basepeak = 0

471.omnetpp=peak=default=default:
feedback = 0
basepeak = 1

473.astar=peak=default=default:
# NOTE(review): this section sets CXXOPTIMIZE but only the C variants of the
# PASS flags (PASS1_CFLAGS / PASS2_CFLAGS), with feedback = 0 and
# basepeak = 1. The PASS settings look like leftovers; confirm before
# re-enabling feedback for this benchmark.
CXXOPTIMIZE = -fastsse -O4 -Msmartalloc=huge:160 -Mfprelaxed --zc_eh %{pgi_tp64}
PASS1_CFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CFLAGS = -Mipa=fast,inline -Mpfo
PASS2_LDFLAGS = -Mipa=fast,inline -Mpfo
feedback = 0
basepeak = 1

483.xalancbmk=peak=default=default:
CC = pathcc
CXX = pathCC
FC = pathf95
EXTRA_LDFLAGS =
PORTABILITY =
CXXOPTIMIZE = -Ofast -m32 -OPT:unroll_times_max=8
COPTIMIZE = -Ofast -OPT:malloc_alg=1
EXTRA_CXXLIBS = -L$(SHL_DIR) -lsmartheap
PASS1_CFLAGS = -fb_create fbdata
PASS1_CXXFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
feedback = 0
basepeak = 0

#####################################################################
# Portability
#####################################################################
fp=default=default=default:
PORTABILITY = -DSPEC_CPU_LP64

int=default=default=default:
CPORTABILITY = -DSPEC_CPU_LP64

400.perlbench=default=default=default:
CPORTABILITY = -DSPEC_CPU_LP64 -DSPEC_CPU_LINUX_X64

429.mcf=peak=default=default:
CPORTABILITY =

435.gromacs=default=default=default:
LDPORTABILITY = -Mnomain

436.cactusADM=base=default=default:
LDPORTABILITY = -Mnomain

436.cactusADM=peak=default=default:
FPORTABILITY = -fno-second-underscore

454.calculix=default=default=default:
LDPORTABILITY = -Mnomain

447.dealII=peak=default=default:
CXXPORTABILITY =

462.libquantum=default=default=default:
CPORTABILITY = -DSPEC_CPU_LP64 -DSPEC_CPU_LINUX

481.wrf=default=default=default:
CPORTABILITY = -DSPEC_CPU_CASE_FLAG -DSPEC_CPU_LINUX

483.xalancbmk=default=default=default:
CXXPORTABILITY = -DSPEC_CPU_LINUX

# The following section was added automatically, and contains settings that
# did not appear in the original configuration file, but were added to the
# raw file after the run.
default:
flagsurl000 = http://www.spec.org/cpu2006/flags/amd814GH-flags.20090714.xml
nc000 = SPEC has determined that this result was not in compliance with
nc001 = the SPEC CPU2006 run and reporting rules. Specifically, the
nc002 = submitter reported that the result would not meet the 3 month
nc003 = availability requirement in the SPEC CPU2006 run rules due to a
nc004 = change in the availability date of the processor.
notes_000 = The test system can be assembled using two
notes_005 = Ablecom PWS-702A-1R 700W 12V redundant power supplies.