# Invocation command line:
# /home/HPC2021F1.0.1/bin/harness/runhpc --reportable --config=4Ns_AMD_I204_O410.cfg --tune=base --pmodel=OMP --define model=omp --threads=8 --rank=48 --size=ref --iterations=3 tiny
# output_root was not used for this run
############################################################################
#strict_rundir_verify=1

# The following setting was inserted automatically as a result of
# post-run basepeak application.
# With basepeak enabled, base results are reported for the peak metric as
# well (see the 'basepeak' entry in the SPEC config-file documentation).
basepeak = 1

%ifndef %{label}         # If label is not set, use I204_OMPI410_AMD
%   define label I204_OMPI410_AMD
%endif

%ifndef %{model}         # If model is not set, use mpi
%   define model mpi
# pmodel is set to MPI only in this fallback case (no model macro supplied).
pmodel=MPI
# NOTE(review): 'acctype' appears unused by the settings shown in this file;
# the two disabled defines below look like leftovers from a template.
#%   define acctype omp
#%   define acctype cuda
%endif

# Global harness settings
teeout = yes
makeflags = -j 32
tune = base
output_format = text
use_submit_for_speed = 1

# Flag description file referenced by the reports
flagsurl000 = http://www.spec.org/hpc2021/flags/Intel_compiler_flags.2021-10-20.xml

# Label is composed from the 'label' and 'model' macros: <label>_<model>
label = %{label}_%{model}

default:
# MPI compiler wrappers for C, C++ and Fortran
CC = mpicc
CXX = mpicxx
FC = mpifort

# Options passed to each compiler to make it report its version
CC_VERSION_OPTION = -V -c
CXX_VERSION_OPTION = -V -c
FC_VERSION_OPTION = -V -c

# Launch command, selected by the 'model' macro.
%if %{model} eq 'omp'
# OMP model: mapped as ppr:16:node with pe=8
submit = mpirun --allow-run-as-root --oversubscribe  -mca coll_hcoll_enable 1 -x HCOLL_ENABLE_NBC=1 -x HCOLL_MAIN_IB=mlx5_0:1 -mca pml ucx -hostfile /home/HPC2021F1.0.1/config/4nodes --map-by ppr:16:node:pe=8 -np $ranks $command
%else
# Any other model: bound and mapped by NUMA domain, 128 ranks per node
submit = mpirun --allow-run-as-root --oversubscribe --bind-to numa -map-by numa -mca coll_hcoll_enable 1 -x HCOLL_ENABLE_NBC=1 -x HCOLL_MAIN_IB=mlx5_0:1 -mca pml ucx -hostfile /home/HPC2021F1.0.1/config/4nodes -npernode 128 -np $ranks $command
%endif

default=base=default:
# Base-tuning optimization flags
OPTIMIZE = -Ofast -no-prec-div -march=core-avx2 -ipo
# Extra flag applied to C and C++ compiles only
COPTIMIZE = -ansi-alias
CXXOPTIMIZE = -ansi-alias
# Disabled portability settings, kept for reference
#PORTABILITY = -DSPEC_LP64
#PORTABILITY += -std=c99

# OpenMP builds: select the OMP parallel model and add the OpenMP compile flag
%if %{model} eq 'omp'
pmodel = OMP
OPTIMIZE += -qopenmp
%endif

# Both soma benchmarks get -DSPEC_NO_VAR_ARRAY_REDUCE when built for OMP.
513.soma_t=default=default:
%if %{model} eq 'omp'
PORTABILITY += -DSPEC_NO_VAR_ARRAY_REDUCE
%endif

613.soma_s=default=default:
%if %{model} eq 'omp'
PORTABILITY += -DSPEC_NO_VAR_ARRAY_REDUCE
%endif


# The following section was added automatically, and contains settings that
# did not appear in the original configuration file, but were added to the
# raw file after the run.
default:
# --- Result-level description: system, software stack, sponsor, availability ---
# NOTE(review): the default label macro in this file is I204_OMPI410_AMD,
# while the fields below state compiler 2021.5.0 and Open MPI 4.0.5 --
# confirm which versions were actually used.
system_class = Homogenous
sw_compiler = Intel C/C++/Fortran Compiler 2021.5.0
sw_mpi_library = Open MPI 4.0.5
test_sponsor = Lenovo Global Technology
license_num = 28
tester = Lenovo Global Technology
hw_avail = Jul-2022
sw_avail = Jul-2022
prepared_by = Lenovo Global Technology
system_vendor = Lenovo Global Technology
system_name = ThinkSystem SR665 (AMD EPYC 7773X)
# --- Compute node: software ---
node_compute_syslbl = ThinkSystem SR665
node_compute_sw_state = Multi-user, run level 3
node_compute_sw_sharedfile = NFS
node_compute_sw_other = None
node_compute_sw_localfile = xfs
node_compute_purpose = Compute
node_compute_order = 1
# --- Compute node: hardware (caches, CPU, memory, disk) ---
node_compute_hw_vendor = Lenovo Global Technology
node_compute_hw_scache = 512 KB I+D on chip per core
node_compute_hw_pcache = 32 KB I + 32 KB D on chip per core
node_compute_hw_other = None
node_compute_hw_ocache = None
node_compute_hw_nthreadspercore = 2
node_compute_hw_ncpuorder = 1,2 chips
node_compute_hw_ncoresperchip = 64
node_compute_hw_ncores = 128
node_compute_hw_nchips = 2
node_compute_hw_model = ThinkSystem SR665
node_compute_hw_memory = 1 TB (16 x 64 GB 2Rx4 PC4-3200A-R)
node_compute_hw_disk = 1x ThinkSystem 2.5" 5300 480GB SSD
node_compute_hw_cpu_name = AMD EPYC 7773X
node_compute_hw_cpu_mhz = 2200
node_compute_hw_cpu_char = Max Boost Clock up to 3.5 GHz
# --- Compute node: fabric adapter ---
node_compute_hw_adapter_fs_slot_type = PCI-Express 4.0 x16
node_compute_hw_adapter_fs_ports_used = 1
node_compute_hw_adapter_fs_model = Mellanox ConnectX-6 HDR
node_compute_hw_adapter_fs_interconnect = Nvidia Mellanox ConnectX-6 HDR
node_compute_hw_adapter_fs_firmware = 20.28.1002
node_compute_hw_adapter_fs_driver = 5.2-1.0.4
node_compute_hw_adapter_fs_data_rate = 200 Gbits/s
node_compute_hw_adapter_fs_count = 1
# NOTE(review): the hostfile used by 'submit' is named '4nodes'; a count of 3
# matches the recorded invocation (--rank=48) at 16 ranks per node -- confirm.
node_compute_count = 3
# --- Interconnect description (fabric and switch) ---
interconnect_fs_syslbl = Nvidia Mellanox ConnectX-6 HDR
interconnect_fs_purpose = MPI Traffic, NFS Access
interconnect_fs_order = 0
interconnect_fs_label = Nvidia Mellanox ConnectX-6 HDR
interconnect_fs_hw_vendor = Nvidia
interconnect_fs_hw_topo = Mesh
# Switch details
interconnect_fs_hw_switch_fs_ports = 40
interconnect_fs_hw_switch_fs_model = QM8700
interconnect_fs_hw_switch_fs_firmware = 3.9.0606
# NOTE(review): the adapter data rate in this file is written "200 Gbits/s";
# the unit spelling here differs ("Gb/s") -- consider making them consistent.
interconnect_fs_hw_switch_fs_data_rate = 200 Gb/s
interconnect_fs_hw_switch_fs_count = 1
interconnect_fs_hw_model = Nvidia Mellanox ConnectX-6 HDR
# Compute-node fields split across numbered lines (suffix 000, 001):
# L3 cache description and operating system / kernel.
node_compute_hw_tcache000 = 768 MB I+D on chip per chip
node_compute_hw_tcache001 = 96 MB shared / 8 cores
node_compute_sw_os000 = Red Hat Enterprise Linux Server release 8.5,
node_compute_sw_os001 = Kernel 4.18.0-348.el8.x86_64
# Record of the submit command used for this run. It mirrors the OMP
# 'submit' setting in this file: Open MPI takes the hcoll switch as an
# '-mca' parameter (not '-genv'), and the command ends with the rank count
# and the benchmark command.
notes_submit_000 =The config file option 'submit' was used.
notes_submit_005 =submit = mpirun --allow-run-as-root  --oversubscribe -mca coll_hcoll_enable 1
notes_submit_010 =-x HCOLL_ENABLE_NBC=1 -x HCOLL_MAIN_IB=mlx5_0:1 -mca pml ucx
notes_submit_015 =-hostfile /home/HPC2021F1.0.1/config/4nodes --map-by ppr:16:node:pe=8
notes_submit_020 =-np $ranks $command