# SPEC MPI2007 runspec configuration (Lenovo ThinkSystem SR665, AMD EPYC 7H12,
# Open MPI 4.0.2). One setting per line; section headers end with ':'.
#
# Invocation command line:
# /home/root/specmpi_local/bin/runspec --config=lenovoA21O402H47R81-2.cfg --size=mref --tune=base --reportable --rank=128 --iterations=3 medium
# output_root was not used for this run
############################################################################

%define ext A21_O402_H47_R81

################################################################################
# Compilers
################################################################################
default:
# Root of the MPI installation; the compiler wrappers and mpirun below are
# all taken from ${CPL}/bin.
CPL=/opt/OMPI/O402_A21_H47_R81
ext = A21O402H47R81
CC = ${CPL}/bin/mpicc
CXX = ${CPL}/bin/mpic++
FC = ${CPL}/bin/mpifort #mpif90
CC_VERSION_OPTION = --version
CXX_VERSION_OPTION = --version
FC_VERSION_OPTION = --version
submit = ${CPL}/bin/mpirun --allow-run-as-root -np $ranks $command

################################################################################
# Portability Flags
################################################################################
# data model applies to all benchmarks
default:
EXTRA_PORTABILITY = -DSPEC_LP64
#MATHLIBOPT = -lamdlibm -lm

################################################################################
# Tuning Flags
################################################################################
121.pop2=default=default=default:
CPORTABILITY = -DSPEC_MPI_CASE_FLAG

# TBD:flto is giving relocation error
126.lammps=default=default=default:
CXXPORTABILITY = -DMPICH_IGNORE_CXX_SEEK

127.wrf2=default=default=default:
CPORTABILITY = -DSPEC_MPI_CASE_FLAG -DSPEC_MPI_LINUX -Wno-return-type

147.l2wrf2=default=default=default:
CPORTABILITY = -Wno-return-type

#####################
# Base tuning flags #
#####################
default=base:
COPTIMIZE = -Ofast -flto -ffast-math -march=znver2 -mavx2 #-mno-avx2 O3
CXXOPTIMIZE = -Ofast -flto -ffast-math -march=znver2 -mavx2 #-mno-avx2 O3
# The duplicated -ffast-math that used to follow -funroll-loops was removed;
# the flag is still present once, so the effective options are unchanged.
FOPTIMIZE = -Ofast -flto -ffast-math -march=znver2 -funroll-loops -mavx2 #-mno-avx2 O3
##EXTRA_LIBS = -lamdlibm -ljemalloc
##EXTRA_FLIBS = -lamdlibm -lm
EXTRA_LIBS = -L/home/AMD_FFTW/amd-fftw/lib -lfftw3 -L/home/AMD_libm/amd-libm/lib -lamdlibm -lm -L/home/AMD_blis/amd-blis/lib
EXTRA_FLIBS = -L/home/AMD_FFTW/amd-fftw/lib -lfftw3 -L/home/AMD_libm/amd-libm/lib -lamdlibm -lm -L/home/AMD_blis/amd-blis/lib

#####################
# Peak tuning flags #
#####################
default=peak:
COPTIMIZE = -O3 -flto -ffast-math -march=znver1 -mno-avx2
CXXOPTIMIZE = -O3 -flto -ffast-math -march=znver1 -mno-avx2
FOPTIMIZE = -O3 -march=znver1 -mno-avx2 -funroll-loops -ffast-math
EXTRA_LIBS = -lamdlibm -ljemalloc
EXTRA_FLIBS = -lamdlibm -lm

# NOTE(review): MPIRUN_OPTS and the submit line below follow the default=peak:
# header, so they appear to apply to peak runs only, while the recorded
# invocation used --tune=base (which would pick up the submit line in the
# first default: section, without --map-by numa). Confirm this is intended.
#MPIRUN_OPTS=--allow-run-as-root -mca coll_hcoll_enable 1 -x HCOLL_MAIN_IB=mlx5_0:1 -mca pml ucx -x UCX_TLS=sm -x UCX_DC_MLX5_NUM_DCI=16 --map-by numa
MPIRUN_OPTS=--allow-run-as-root --map-by numa
#submit = mpiexec -hosts localhost -n $ranks $command

# 1N
#submit = /opt/OpenMPI/OMPI402_ICC20_HPCX47/bin/mpirun --allow-run-as-root --oversubscribe -x HCOLL_MAIN_IB=mlx5_0:1 -np $ranks $command
#submit = ${CPL}/bin/mpirun --allow-run-as-root -mca coll_hcoll_enable 1 -x HCOLL_MAIN_IB=mlx5_0:1 -mca pml ucx -x UCX_TLS=sm -x UCX_DC_MLX5_NUM_DCI=16 --map-by numa -np $ranks $command
submit = ${CPL}/bin/mpirun ${MPIRUN_OPTS} -np $ranks $command

# 2Ns
#submit = /opt/OpenMPI/OMPI402_ICC20_HPCX47/bin/mpirun --allow-run-as-root -host 192.168.99.161,192.168.99.185 --oversubscribe -mca coll_hcoll_enable 1 -x HCOLL_MAIN_IB=mlx5_0:1 -mca pml ucx -x UCX_TLS=sm,dc_x -x UCX_DC_MLX5_NUM_DCI=16 --map-by numa -np $ranks $command

# The following section was added automatically, and contains settings that
# did not appear in the original configuration file, but were added to the
# raw file after the run.
default:
sw_base_ptrsize = 64-bit
sw_peak_ptrsize = Not Applicable
sw_other = None
sw_mpi_other = None
sw_preprocessors = No
test_sponsor = Lenovo Global Technology
license_num = 28
tester = Lenovo Global Technology
hw_avail = Jun-2020
sw_avail = Jun-2020
prepared_by = Lenovo Global Technology
system_vendor = Lenovo Global Technology
node_fileserver_sw_state = Multi-User, run level 3
node_fileserver_sw_sharedfile = NFS
node_fileserver_sw_other = None
node_fileserver_sw_os = Red Hat Enterprise Linux Server release 8.1
node_fileserver_sw_localfile = None
node_fileserver_purpose = Fileserver
node_fileserver_order = 2
node_fileserver_label = NFS
node_fileserver_hw_vendor = Lenovo Global Technology
node_fileserver_hw_scache = 512 KB I+D on chip per core
node_fileserver_hw_pcache = 32 KB I + 32 KB D on chip per core
node_fileserver_hw_other = None
node_fileserver_hw_ocache = None
node_fileserver_hw_nthreadspercore = 1
node_fileserver_hw_ncpuorder = 1-2 chips
node_fileserver_hw_ncoresperchip = 64
node_fileserver_hw_ncores = 128
node_fileserver_hw_nchips = 2
node_fileserver_hw_model = ThinkSystem SR665
node_fileserver_hw_memory = 1 TB (16 x 64 GB 2Rx4 PC4-3200AA-R)
node_fileserver_hw_disk = 1 x 480 GB SATA 2.5" SSD
node_fileserver_hw_cpu_name = AMD EPYC 7H12 CPU
node_fileserver_hw_cpu_mhz = 2600
node_fileserver_hw_cpu_char = None
node_fileserver_hw_adapter_fs_slot_type = PCI-Express 4.0 x16
node_fileserver_hw_adapter_fs_ports_used = 1
node_fileserver_hw_adapter_fs_model = Mellanox ConnectX-6 HDR Infiniband
node_fileserver_hw_adapter_fs_interconnect = Mellanox ConnectX-6 HDR Infiniband
node_fileserver_hw_adapter_fs_firmware = 20.25.2006
node_fileserver_hw_adapter_fs_driver = 4.7-1.0.0.1.2
node_fileserver_hw_adapter_fs_data_rate = 200 Gb/s
node_fileserver_hw_adapter_fs_count = 1
node_fileserver_count = 1
node_compute_sw_state = Multi-user, run level 3
node_compute_sw_sharedfile = None
node_compute_sw_other = None
node_compute_sw_localfile = xfs
node_compute_purpose = compute
node_compute_order = 1
node_compute_label = ThinkSystem SR665
node_compute_hw_vendor = Lenovo Global Technology
node_compute_hw_scache = 512 KB I+D on chip per core
node_compute_hw_pcache = 32 KB I + 32 KB D on chip per core
node_compute_hw_other = None
node_compute_hw_ocache = None
node_compute_hw_nthreadspercore = 1
node_compute_hw_ncpuorder = 1-2 chips
node_compute_hw_ncoresperchip = 64
node_compute_hw_ncores = 128
node_compute_hw_nchips = 2
node_compute_hw_model = SR665
node_compute_hw_memory = 1 TB (16 x 64 GB 2Rx4 PC4-3200AA-R)
node_compute_hw_disk = 1 x 480 GB SATA 2.5" SSD
node_compute_hw_cpu_name = AMD EPYC 7H12
node_compute_hw_cpu_mhz = 2600
node_compute_hw_cpu_char = None
node_compute_hw_adapter_fs_slot_type = PCI-Express 4.0 x16
node_compute_hw_adapter_fs_ports_used = 1
node_compute_hw_adapter_fs_model = Mellanox ConnectX-6 HDR Infiniband
node_compute_hw_adapter_fs_interconnect = Mellanox ConnectX-6 HDR Infiniband Adapter
node_compute_hw_adapter_fs_firmware = 20.25.2006
node_compute_hw_adapter_fs_driver = 4.7-1.0.0.1.2
# Was "200 Gbs/s"; corrected to match the fileserver adapter entry.
node_compute_hw_adapter_fs_data_rate = 200 Gb/s
node_compute_hw_adapter_fs_count = 1
node_compute_count = 1
flagsurl000 = http://www.spec.org/mpi2007/flags/EM64T_Intel121_flags.20200506.01.xml
node_compute_hw_tcache000 = 256 MB I+D on chip per chip
node_compute_hw_tcache001 = 16 MB shared / 4 cores
node_compute_sw_os000 = Red Hat Enterprise Linux Server release 8.1,
node_compute_sw_os001 = 4.18.0-147.el8.x86_64
sw_c_compiler000 = AMD Optimizing C Compiler for Linux
sw_c_compiler001 = Version 2.1 Build 1030.2019_11_12
sw_cxx_compiler000 = AMD Optimizing C++ Compiler for Linux
sw_cxx_compiler001 = Version 2.1 Build 1030.2019_11_12
sw_f_compiler000 = AMD Optimizing Fortran Compiler for Linux
sw_f_compiler001 = Version 2.1 Build 1030.2019_11_12
sw_mpi_library000 = OpenMPI MPI Library
sw_mpi_library001 = Version 4.0.2
system_class = Homogeneous
system_name000 = ThinkSystem SR665
system_name001 = (AMD EPYC 7H12, 2.6 GHz)
notes_000 = MPI startup command:
# Was "mpiexec"; every active submit line in this file invokes mpirun.
notes_005 = mpirun command was used to start MPI jobs.
notes_010 = RAM configuration:
# Was "1 x 32 GB"; node_compute_hw_memory lists 16 x 64 GB DIMMs (1 TB).
# NOTE(review): confirm the DIMM size against the tested hardware.
notes_015 = Compute nodes have 1 x 64 GB RDIMM on each memory channel.
notes_020 = Add "idle=poll" into grub
notes_025 = BIOS settings:
notes_030 = Operating Mode : Maximum Performance Mode
notes_035 = Hyper-Threading Technology (SMT): Enabled
notes_040 = NPS4
notes_045 = Yes: The test sponsor attests, as of date of publication,
notes_050 = that CVE-2017-5754 (Meltdown) is mitigated in the system as tested and documented.
notes_055 = Yes: The test sponsor attests, as of date of publication,
notes_060 = that CVE-2017-5753 (Spectre variant 1) is mitigated in the system as tested and documented.
notes_065 = Yes: The test sponsor attests, as of date of publication,
notes_070 = that CVE-2017-5715 (Spectre variant 2) is mitigated in the system as tested and documented.
node_fileserver_hw_tcache001 = 256 MB I+D on chip per chip
node_fileserver_hw_tcache002 = 16 MB shared / 4 cores