# Invocation command line:
# /cpu2006/bin/runspec --verbose=6 -c hp-hybrid -F pgi710b_flags.xml -T all fp
# output_root was not used for this run
############################################################################
# PGI 7.1 CPU2006 Configuration File for 64-bit Linux (Dual-Core)
#
#   Compiler name/version:     PGI 7.1-0
#   Operating system version:  64-bit Linux
#   Hardware:                  AMD Opteron (Dual-core)
#   FP Base Pointer Size:      64-bit only
#   FP Peak Pointer Size:      64-bit only
#   INT Base Pointer Size:     32/64-bit
#   INT Peak Pointer Size:     32/64-bit
#   Auto Parallelization:      With FP/INT Peak
#
# NOTE(review): this summary does not match the software fields recorded
# further down in this file (compiler version 7.1-1, fp sw_peak_ptrsize =
# 32/64-bit, sw_auto_parallel = No for both fp and int). It looks like
# inherited template text -- confirm which values are correct.
#
# Important!  Run with the stack size set to 'unlimited'; otherwise
# 483.xalancbmk may hit a stack overflow during execution.
#     csh:   unlimit
#     bash:  ulimit -s unlimited
#
# LD_LIBRARY_PATH must include the directories holding the PGI and
# Smartheap runtime libraries.
#
# Adjust the submit command and makeflags to match the number of cores in
# use, and point SHL_DIR at the directory containing the Smartheap library.
#####################################################################
# Header Section
#####################################################################
ext           = pgi711_ps30_rate
ignore_errors = no
tune          = base,peak
output_format = all
size          = ref
check_md5     = yes
reportable    = yes
env_vars      = no
teeout        = no
teerunout     = no
verbose       = 6

# Adjust the make flag for the number of cores.
makeflags = -j 2

#####################################################################
# Macro section
#####################################################################
# Target-processor switches referenced as %{pgi_tp64} / %{pgi_tp32} by the
# PGI optimization lines; edit them to match the architecture under test.
%define pgi_tp64 -tp k8-64
%define pgi_tp32 -tp k8-32

####################################################################
# Include the SUT hardware and tester information
####################################################################
#include: pgi_sut.cfg
# ----- Begin inclusion of 'pgi_sut.cfg'
############################################################################
# One numactl prefix per copy: memory node (-m) and CPU (--physcpubind).
bind0  = numactl -m 0 --physcpubind=0
bind1  = numactl -m 0 --physcpubind=1
bind2  = numactl -m 1 --physcpubind=2
bind3  = numactl -m 1 --physcpubind=3
# The benchmark command is written to run.sh, which is then run under $BIND.
submit = echo "$command" > run.sh ; $BIND sh run.sh

################################################################
# Machine-specific section
################################################################
default=default=default=default:
# --- Hardware description -------------------------------------
hw_cpu_name        = AMD Opteron 2222
hw_cpu_mhz         = 3000
hw_disk            = 1x146 GB 10 K SAS
hw_fpu             = Integrated
hw_memory          = 32 GB (8x4 GB PC2-5300P CL5)
hw_vendor          = Hewlett-Packard Company
hw_model000        = ProLiant DL185 G5
hw_model001        = (3.0 GHz AMD Opteron 2222)
hw_avail           = Jan-2008
hw_nchips          = 2
hw_ncores          = 4
hw_ncoresperchip   = 2
hw_nthreadspercore = 1
hw_ncpuorder       = 1,2 chips
hw_pcache          = 64 KB I + 64 KB D on chip per core
hw_scache          = 1 MB I+D on chip per core
hw_tcache          = None
hw_ocache          = None
hw_other           = None
# --- Operating system -----------------------------------------
sw_file            = ext2
sw_os000           = SUSE Linux Enterprise Server 10 (x86_64) SP1
sw_os001           = Kernel 2.6.16.46-0.12-smp
sw_state           = Multi-user run level 3
# --- Tester / submission details ------------------------------
license_num        = 3
test_date          = Dec-2007
prepared_by        = ISS Performance Engineering
test_sponsor       = Hewlett-Packard Company
tester             = Hewlett-Packard Company
# ---- End inclusion of '/cpu2006/config/pgi_sut.cfg'

use_submit_for_speed = 1

############################ Software Info ############################
fp=default=default=default:
sw_avail = Nov-2007
# (continues the fp=default=default=default section opened just above)
sw_compiler000   = The Portland Group (PGI)
sw_compiler001   = PGI pgf90 7.1-1 Fortran Compiler
sw_compiler002   = PGI pgcc 7.1-1 C Compiler
sw_compiler003   = PGI pgCC 7.1-1 C++ Compiler
sw_compiler004   = QLogic PathScale Compiler Suite,
sw_compiler005   = Release 3.0
sw_other         = None
sw_base_ptrsize  = 64-bit
sw_peak_ptrsize  = 32/64-bit
sw_auto_parallel = No

int=default=default=default:
sw_avail         = Oct-2007
sw_compiler1     = The Portland Group (PGI)
sw_compiler3     = PGI pgcc 7.1-1 C Compiler
sw_compiler4     = PGI pgCC 7.1-1 C++ Compiler
sw_other         = SmartHeap 8.0 32-bit Library for Linux
sw_base_ptrsize  = 32/64-bit
sw_peak_ptrsize  = 32/64-bit
sw_auto_parallel = No

default=default=default=default:
#####################################################################
# Compiler selection
#####################################################################
# PGI drivers are the default toolchain; individual peak sections below
# switch to the PathScale drivers (pathcc / pathCC / pathf95).
CC      = pgcc -w
CXX     = pgcpp -w
FC      = pgf95 -w
# Smartheap library directory, used by the EXTRA_CXXLIBS lines below.
SHL_DIR = /cpu2006/SmartHeap_8.1/lib

#####################################################################
# Optimization
#####################################################################
default=default=default=default:
EXTRA_LDFLAGS = -Bstatic_pgi

fp=base=default=default:
COPTIMIZE   = -fast -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:8 %{pgi_tp64}
CXXOPTIMIZE = -fast -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:8 --zc_eh %{pgi_tp64}
FOPTIMIZE   = -fast -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:8 %{pgi_tp64}

int=base=default=default:
COPTIMIZE     = -fast -Mipa=fast,inline,noarg -Mfprelaxed -Msmartalloc=huge:840 %{pgi_tp64}
CXXOPTIMIZE   = -fastsse -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:448 --zc_eh %{pgi_tp32}
EXTRA_CXXLIBS = -L$(SHL_DIR) -lsmartheap

#####################################################################
## FP Peak Flags
#####################################################################
# Every section that selects a PathScale driver also assigns an empty
# EXTRA_LDFLAGS, replacing the -Bstatic_pgi value from the default section.
# The -fb_create / -fb_opt (PathScale) and -Mpfi / -Mpfo (PGI) pairs are the
# PASS1 / PASS2 feedback-directed build flags.
fp=peak=default=default:
EXTRA_LIBS =
basepeak   = 0

410.bwaves=peak=default=default:
FOPTIMIZE = -fast -Mipa=fast,inline -Mfprelaxed -Msmartalloc %{pgi_tp64}
feedback  = 0
basepeak  = 0

416.gamess=peak=default=default:
CC            = pathcc
CXX           = pathCC
FC            = pathf95
EXTRA_LDFLAGS =
FOPTIMIZE     = -O2 -OPT:Ofast:ro=3:unroll_size=256
PASS1_FFLAGS  = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_FFLAGS  = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata

433.milc=peak=default=default:
COPTIMIZE     = -fast -O4 -Mdse -Mfprelaxed -Msmartalloc=huge:448 %{pgi_tp64}
PASS1_CFLAGS  = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CFLAGS  = -Mipa=fast,inline,noarg -Mpfo
PASS2_LDFLAGS = -Mipa=fast,inline,noarg -Mpfo
feedback      = 1
basepeak      = 0

434.zeusmp=peak=default=default:
feedback = 0
basepeak = 1

435.gromacs=peak=default=default:
COPTIMIZE = -fast -O4 -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:448 %{pgi_tp64}
FOPTIMIZE = -fast -O4 -Mfpapprox=rsqrt -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:448 %{pgi_tp64}
feedback  = 0
basepeak  = 0

436.cactusADM=peak=default=default:
CC            = pathcc
CXX           = pathCC
FC            = pathf95
EXTRA_LDFLAGS =
COPTIMIZE     = -O3 -LNO:prefetch=3:prefetch_ahead=5:ou_prod_max=10:full_unroll=5 -ipa
FOPTIMIZE     = -O3 -LNO:prefetch=3:prefetch_ahead=5:ou_prod_max=10:full_unroll=5 -ipa

437.leslie3d=peak=default=default:
CC            = pathcc
CXX           = pathCC
FC            = pathf95
EXTRA_LDFLAGS =
COPTIMIZE     = -Ofast
CXXOPTIMIZE   = -Ofast
FOPTIMIZE     = -Ofast -OPT:malloc_alg=1
feedback      = 0
basepeak      = 0

444.namd=peak=default=default:
CXXOPTIMIZE = -fast -O4 -Mfprelaxed -Msmartalloc=huge:448 --zc_eh %{pgi_tp64} -Mnodepchk -Mprefetch -Msafe_lastval -Msafeptr=static -Mstride0 -Munroll=n:4 -Mvect=noidiom -Mvect=prefetch
feedback    = 0
basepeak    = 0

447.dealII=peak=default=default:
CXX           = pathCC
EXTRA_LDFLAGS =
CXXOPTIMIZE   = -Ofast -static -INLINE:aggressive=on -OPT:malloc_alg=1 -m32 -fno-exceptions
feedback      = 0

450.soplex=peak=default=default:
CXX            = pathCC
EXTRA_LDFLAGS  =
CXXOPTIMIZE    = -m32 -O3 -OPT:IEEE_arith=3 -CG:load_exe=0:movnti=1 -LNO:minvariant=off:prefetch=1 -fno-exceptions
PASS1_CXXFLAGS = -fb_create fbdata
PASS1_LDFLAGS  = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS2_LDFLAGS  = -fb_opt fbdata
feedback       = 1

453.povray=peak=default=default:
CXX            = pathCC
EXTRA_LDFLAGS  =
CXXOPTIMIZE    = -Ofast -fno-fast-math
PASS1_CXXFLAGS = -fb_create fbdata
PASS1_LDFLAGS  = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS2_LDFLAGS  = -fb_opt fbdata
feedback       = 1

454.calculix=peak=default=default:
feedback = 0
basepeak = 1

459.GemsFDTD=peak=default=default:
FC            = pathf95
EXTRA_LDFLAGS =
FOPTIMIZE     = -Ofast -LNO:fission=2:prefetch=0
feedback      = 0

465.tonto=peak=default=default:
FOPTIMIZE = -fast -O4 -Mfprelaxed -Msmartalloc=huge:448 -Mipa=fast,inline -Mvect=noaltcode %{pgi_tp64}
feedback  = 0
basepeak  = 0

470.lbm=peak=default=default:
CC            = pathcc
EXTRA_LDFLAGS =
COPTIMIZE     = -Ofast
feedback      = 0
basepeak      = 0

481.wrf=peak=default=default:
COPTIMIZE = -fast -Mfprelaxed -Msmartalloc=huge:448 -Mvect=noaltcode %{pgi_tp64}
FOPTIMIZE = -fast -Mfprelaxed -Msmartalloc=huge:448 -Mvect=noaltcode %{pgi_tp64}
feedback  = 0
basepeak  = 0

482.sphinx3=peak=default=default:
CC            = pathcc
EXTRA_LDFLAGS =
COPTIMIZE     = -O3 -OPT:Ofast -WOPT:aggstr=0 -m32
PASS1_CFLAGS  = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS  = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata

#####################################################################
## INT Peak Flags
#####################################################################
# basepeak = 1 is the suite-wide setting here; each benchmark that has its
# own peak tuning sets basepeak = 0 in its section.
int=peak=default=default:
EXTRA_LIBS =
basepeak   = 1

400.perlbench=peak=default=default:
CC            = pathcc
EXTRA_LDFLAGS =
COPTIMIZE     = -Ofast -LNO:opt=0
PASS1_CFLAGS  = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS  = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
basepeak      = 0

401.bzip2=peak=default=default:
COPTIMIZE     = -fast -O4 -Msmartalloc=huge:448 %{pgi_tp64}
PASS1_CFLAGS  = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CFLAGS  = -Mpfo
PASS2_LDFLAGS = -Mpfo
feedback      = 1
basepeak      = 0

403.gcc=peak=default=default:
CC            = pathcc
EXTRA_LDFLAGS =
COPTIMIZE     = -m32 -O3 -OPT:Ofast
PASS1_CFLAGS  = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS  = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
basepeak      = 0

429.mcf=peak=default=default:
COPTIMIZE = -fastsse -Mipa=fast,inline -Msmartalloc=huge:420 %{pgi_tp32}
feedback  = 0
basepeak  = 0

445.gobmk=peak=default=default:
CC            = pathcc
EXTRA_LDFLAGS =
COPTIMIZE     = -O3 -OPT:alias=disjoint -LNO:simd=0:minvariant=off -WOPT:retype_expr=on
PASS1_CFLAGS  = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS  = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
basepeak      = 0

456.hmmer=peak=default=default:
COPTIMIZE = -fast -Msmartalloc=huge:448 -Mfprelaxed -Msafeptr -Mipa=const,ptr,arg %{pgi_tp64}
feedback  = 0
basepeak  = 0

458.sjeng=peak=default=default:
COPTIMIZE     = -fast -Msmartalloc=huge:448 -Mfprelaxed %{pgi_tp64}
PASS1_CFLAGS  = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CFLAGS  = -Mipa=fast,inline,noarg -Mpfo
PASS2_LDFLAGS = -Mipa=fast,inline,noarg -Mpfo
feedback      = 1
basepeak      = 0

462.libquantum=peak=default=default:
COPTIMIZE = -fast -Mfprelaxed -Msmartalloc=huge:448 -Munroll=m:4 -Mipa=fast,inline,noarg
feedback  = 0
basepeak  = 0

464.h264ref=peak=default=default:
CC            = pathcc
CXX           = pathCC
EXTRA_LDFLAGS =
COPTIMIZE     = -O3 -IPA:plimit=20000 -OPT:alias=disjoint -LNO:prefetch=0
PASS1_CFLAGS  = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS  = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
basepeak      = 0

471.omnetpp=peak=default=default:
feedback = 0
basepeak = 1

473.astar=peak=default=default:
feedback = 0
basepeak = 1

483.xalancbmk=peak=default=default:
CXXOPTIMIZE   = -fastsse -O4 -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:420 --zc_eh %{pgi_tp32}
EXTRA_CXXLIBS = -L$(SHL_DIR) -lsmartheap
feedback      = 0
basepeak      = 0

#####################################################################
# Portability
#####################################################################
# -DSPEC_CPU_LP64 is the suite-wide setting; the peak sections built with
# -m32 or %{pgi_tp32} assign an empty value instead.
fp=default=default=default:
PORTABILITY = -DSPEC_CPU_LP64

int=default=default=default:
CPORTABILITY = -DSPEC_CPU_LP64

400.perlbench=default=default=default:
CPORTABILITY = -DSPEC_CPU_LP64 -DSPEC_CPU_LINUX_X64

403.gcc=peak=default=default:
CPORTABILITY =

429.mcf=peak=default=default:
CPORTABILITY =

435.gromacs=default=default=default:
LDPORTABILITY = -Mnomain
# Per-benchmark portability settings (continued).
436.cactusADM=base=default=default:
LDPORTABILITY = -Mnomain

436.cactusADM=peak=default=default:
FPORTABILITY = -fno-second-underscore

# The next two peak sections assign an empty PORTABILITY; their peak
# CXXOPTIMIZE lines earlier in this file build with -m32.
447.dealII=peak=default=default:
PORTABILITY =

450.soplex=peak=default=default:
PORTABILITY =

454.calculix=default=default=default:
LDPORTABILITY = -Mnomain

462.libquantum=default=default=default:
CPORTABILITY = -DSPEC_CPU_LP64 -DSPEC_CPU_LINUX

481.wrf=default=default=default:
CPORTABILITY = -DSPEC_CPU_CASE_FLAG -DSPEC_CPU_LINUX

# Peak COPTIMIZE for 482.sphinx3 also uses -m32, hence the empty value.
482.sphinx3=peak=default=default:
PORTABILITY =

483.xalancbmk=default=default=default:
CXXPORTABILITY = -DSPEC_CPU_LINUX

# The following section was added automatically, and contains settings that
# did not appear in the original configuration file, but were added to the
# raw file after the run.
default:
flagsurl000= http://www.spec.org/cpu2006/flags/hp-pgi710_ps30_flags.xml
notes_os_000=Environment stack size set to 'unlimited'
notes_os_005=ulimit -l set to 1048576
notes_os_010='numactl' was used to bind copies to the cores
notes_os_015=Set vm/nr_hugepages=1024 in /etc/sysctl.conf
notes_os_020=mount -t hugetlbfs nodev /mnt/hugepages