# Invocation command line:
# /root/cpu2017/bin/harness/runcpu --configfile kachkin-xl-linux-ppc64le_numactl.cfg --tune base --iterations 2 --reportable --nopower --runmode rate --tune base --size refrate fprate
# output_root was not used for this run
############################################################################
#------------------------------------------------------------------------------
# SPEC CPU2017 config file for: XL / Linux / IBM POWER
#------------------------------------------------------------------------------
#
# Usage: (1) Copy this to a new name
#             cd $SPEC/config
#             cp Example-x.cfg myname.cfg
#        (2) Change items that are marked 'EDIT' (search for it)
#
# SPEC tested this config file with:
#    Compiler name/version:     XL C/C++: V13.1.5
#                               XL Fortran: V15.1.5
#    Operating system version:  Ubuntu 16.04.1 LTS, RHEL 7.1 and RHEL 7.2
#                               on PowerPC64 Little-Endian.
#    Hardware:                  POWER8
#
#
# If your system differs, this config file might not work.
# You might find a better config file at http://www.spec.org/cpu2017/results
#
# You may find that it is required to increase the process stack size to
# something greater than the default in order to build or run some benchmarks.
# This can be done with the command "ulimit -s N".  For example,
# to remove any limit, you can type the following command in your shell before
# invoking runcpu -
#      ulimit -s unlimited
#
# This config file is intended only for 64-bit compilation.
#
# Compiler issues: Contact your compiler vendor, not SPEC.
# For SPEC help:   http://www.spec.org/cpu2017/Docs/techsupport.html
#------------------------------------------------------------------------------


#--------- Label --------------------------------------------------------------
# Arbitrary string to tag binaries
#                  Two Suggestions: # (1) EDIT this label as you try new ideas.
%define label sk_reportable_test    # (2)      Use a label meaningful to *you*.
#--------- Preprocessor -------------------------------------------------------
%ifndef %{build_ncpus}         # EDIT to adjust number of simultaneous compiles.
%   define  build_ncpus 128    #      Or, you can set it on the command line:
%endif                         #      'runcpu --define build_ncpus=nn'

# Don't change this part.
%define  model  -m64
%ifdef %{bits}
%   if %{bits} == 64
%      info .
%      info Note: For this config file, you do not need '--define bits'
%      info .     because PowerPC64 Little-Endian ABI is always 64-bit.
%      info .
%   else
%      error This config file always uses 64 bits. Please remove your setting for 'bits'.
%   endif
%endif


#--------- Global Settings ----------------------------------------------------
# For info, see:
#            https://www.spec.org/cpu2017/Docs/config.html#fieldname
#   Example: https://www.spec.org/cpu2017/Docs/config.html#tune

flagsurl000          = http://www.spec.org/cpu2017/flags/vesnin_xl-V1.2.xml
flagsurl001          = http://www.spec.org/cpu2017/flags/vesnin_platform-V1.3.xml
ignore_errors        = 1
iterations           = 1
label                = %{label}-q64
makeflags            = --jobs=%{build_ncpus}
mean_anyway          = 1
output_format        = txt,html,cfg,pdf,csv
preenv               = 1
preENV_OMP_STACKSIZE = 192M
reportable           = 0
tune                 = base,peak


#--------- How Many CPUs? -----------------------------------------------------
# Both SPECrate and SPECspeed can test multiple chips / cores / hw threads
#    - For SPECrate,  you set the number of copies.
#    - For SPECspeed, you set the number of threads.
# See: https://www.spec.org/cpu2017/Docs/system-requirements.html#MultipleCPUs
#
#    q. How many should I set?
#    a. Unknown, you will have to try it and see!
#
# To get you started, some suggestions:
#
#     copies - This config file defaults to testing only 1 copy.   You might
#              try increasing it to match the number of logical processors,
#              if you have enough memory.  See:
#              https://www.spec.org/cpu2017/Docs/system-requirements.html#memory
#
#     threads - This config file sets a starting point.  You could try raising
#               it.  A higher thread count is much more likely to be useful for
#               fpspeed than for intspeed.
#
intrate,fprate:
   copies           = 160   # EDIT to change number of copies (see above)
intspeed,fpspeed:
   threads          = 40    # EDIT to change number of OpenMP threads (see above)
   # NOTE(review): the 'bind' value below looks truncated, no 'submit' line is
   # present although the notes refer to one, and the numactl command quoted in
   # notes_submit_020 has no CPU argument.  Restore these from the original
   # config file before reusing this one - TODO confirm.
   bind = </dev/null; $command
   notes_submit_000 = The config file option 'submit' was used
   notes_submit_010 = to assign benchmark copy to specific kernel thread using
   notes_submit_020 = the "numactl -l -C " command.


#--------- Compilers ----------------------------------------------------------
default:
   CC_PATH                 = /opt/ibm/xlC/13.1.5/bin
   CXX_PATH                = /opt/ibm/xlC/13.1.5/bin
   XLF_PATH                = /opt/ibm/xlf/15.1.5/bin
   # How to say "Show me your version, please"
   CC_VERSION_OPTION       = -qversion=verbose
   CXX_VERSION_OPTION      = -qversion=verbose
   FC_VERSION_OPTION       = -qversion=verbose

specrate:
   # 5xx.benchname is the 900 MB dataset
   CC                      = $(CC_PATH)/xlc -qlanglvl=extc99
   CXX                     = $(CXX_PATH)/xlC
   FC                      = $(XLF_PATH)/xlf95

specspeed:
   # 6xx.benchname is the up to 14 GB dataset
   CC                      = $(CC_PATH)/xlc_r -qlanglvl=extc99 # NOTE: _r here means re-entrant.
   CXX                     = $(CXX_PATH)/xlC_r                 #       Thus _r invocation of the
   FC                      = $(XLF_PATH)/xlf95_r               #       compilers are used for speed.

default:
   sw_base_ptrsize         = 64-bit
   sw_peak_ptrsize         = Not Applicable


#--------- Portability --------------------------------------------------------
default:   # data model applies to all benchmarks
   EXTRA_PORTABILITY = -DSPEC_LP64

500.perlbench_r,600.perlbench_s:
   CPORTABILITY = -DSPEC_LINUX_PPC_LE

503.bwaves_r,603.bwaves_s:
   FPORTABILITY = -qfixed

507.cactuBSSN_r,607.cactuBSSN_s:
   CPORTABILITY = -DSPEC_NO_UNDERSCORE

510.parest_r:
   CXXPORTABILITY = -qnoxlcompatmacros

521.wrf_r,621.wrf_s:
   CPORTABILITY = -DSPEC_NOUNDERSCORE
   FPPPORTABILITY = -DSPEC_IBMXL
   EXTRA_FPORTABILITY = -qufmt=be

523.xalancbmk_r,623.xalancbmk_s:
   CXXPORTABILITY = -DSPEC_LINUX

526.blender_r:
   PORTABILITY = -qchars=unsigned
   CXXPORTABILITY = -D__BOOL_DEFINED

527.cam4_r,627.cam4_s:
   CPORTABILITY = -DSPEC_NO_UNDERSCORE

628.pop2_s:
   CPORTABILITY = -DSPEC_NO_UNDERSCORE
   EXTRA_FPORTABILITY = -qufmt=be


#-------- Tuning Flags common to Base and Peak --------------------------------
default:   # default for all: int/fp, rate/speed, base, peak
   OPTIMIZE = -O5 -q64 -qinline=40 -qipa=threads -qsimd=noauto

specspeed:
   EXTRA_OPTIMIZE = -qsmp=omp
   EXTRA_COPTIMIZE = -DSPEC_OPENMP
   EXTRA_CXXOPTIMIZE = -DSPEC_OPENMP
   EXTRA_FPPOPTIMIZE = -DSPEC_OPENMP


#-------- Baseline Tuning Flags ----------------------------------------------
# 500.perlbench_r/600.perlbench_s needs -qalias=noansi
# 502.gcc_r/602.gcc_s needs -fgnu89-inline or -z muldefs
# For 'base', all benchmarks must use the same options, so we
# set those flags for all integer base benchmarks.
# See:
#   www.spec.org/cpu2017/Docs/runrules.html#BaseFlags
#   www.spec.org/cpu2017/Docs/benchmarks/500.perlbench_r.html
#   www.spec.org/cpu2017/Docs/benchmarks/502.gcc_r.html
#
intrate,intspeed=base:
   COPTIMIZE = -qalias=noansi
   LDCFLAGS = -Wl,-z,muldefs

fprate,fpspeed=base:
   FOPTIMIZE = -qsmallstack=dynlenonheap


#-------- Peak Tuning Flags ----------------------------------------------
default=peak:
   fdo_pre0 = $CC_PATH/cleanpdf
   PASS1_FLAGS = -qpdf1
   PASS2_FLAGS = -qpdf2
   PASS2_LDFLAGS = -qpdf2

500.perlbench_r,600.perlbench_s=peak:
   COPTIMIZE = -qalias=noansi -qstrict=nans

502.gcc_r,602.gcc_s=peak:
   LDCFLAGS = -Wl,-z,muldefs
   COPTIMIZE = -qalias=noansi

503.bwaves_r,603.bwaves_s=peak:
   FOPTIMIZE = -qsmallstack=dynlenonheap

521.wrf_r,621.wrf_s=peak:
   FOPTIMIZE = -qspill=4096 -qsmallstack=dynlenonheap

526.blender_r=peak:
   COPTIMIZE = -qalias=noansi

627.cam4_s=peak:
   ENV_OMP_STACKSIZE = 192M

628.pop2_s=peak:
   FOPTIMIZE = -qsmallstack=dynlenonheap

654.roms_s=peak:
   basepeak=yes


#------------------------------------------------------------------------------
# Tester and System Descriptions - EDIT all sections below this point
#------------------------------------------------------------------------------
# For info about any field, see
#             https://www.spec.org/cpu2017/Docs/config.html#fieldname
#   Example:  https://www.spec.org/cpu2017/Docs/config.html#hw_memory
#-------------------------------------------------------------------------------

#--------- EDIT to match your version -----------------------------------------
default:
   sw_compiler000 = C/C++: Version 13.1.5 of IBM XL C/C++;
   sw_compiler001 = Fortran: Version 15.1.5 of IBM XL Fortran

#--------- EDIT info about you ------------------------------------------------
# To understand the difference between hw_vendor/sponsor/tester, see:
#     https://www.spec.org/cpu2017/Docs/config.html#test_sponsor
intrate,intspeed,fprate,fpspeed: # Important: keep this line
   hw_vendor = Yadro
   tester = Yadro
   test_sponsor = Yadro
   license_num = 4813
#  prepared_by = # Ima Pseudonym # Whatever you like: is never output


#--------- EDIT system availability dates -------------------------------------
intrate,intspeed,fprate,fpspeed: # Important: keep this line
   # Example # Brief info about field
   hw_avail = Dec-2017 # Date of LAST hardware component to ship
   sw_avail = Dec-2016 # Date of LAST software component to ship

#--------- EDIT system information --------------------------------------------
intrate,intspeed,fprate,fpspeed: # Important: keep this line
   # Example # Brief info about field
   hw_cpu_name = IBM POWER8
   hw_cpu_nominal_mhz = 2926
   hw_cpu_max_mhz = 3491 # Max chip frequency, in MHz
   hw_disk = 1 x 7.3 TB 7200 RPM SATA
   hw_model = Yadro Vesnin (2.92 GHz, 40 cores, RHEL 7.4)
   hw_nchips = 4 # 99 # number chips enabled
   hw_ncores = 40 # 9999 # number cores enabled
   hw_ncpuorder = 1-4 chips# 1-9 chips # Ordering options
   hw_nthreadspercore = 4 # 9 # number threads enabled per core
   hw_other = None
   hw_memory000 = 4 TB (128 x 32 GB 2Rx4 PC4 - 2400T,
   hw_memory001 = running at 1600)
   hw_pcache = 32 KB I + 64 KB D on chip per core # 99 KB I + 99 KB D on chip per core # Primary cache size, type, location
   hw_scache = 512 KB I+D on chip per core
   hw_tcache = 8 MB I+D on chip per core# 9 MB I+D on chip per chip # Third cache or "None"
   hw_ocache = 16 MB I+D off chip per 8 DIMMs# 9 GB I+D off chip per system board # Other cache or "None"
   fw_bios = Version 1.19 of OpenPOWER Firmware. Released Nov-2017.
   sw_file = xfs # ext99 # File system
   # NOTE(review): hw_model above says RHEL 7.4 but sw_os000 says RHEL 7.2 -
   # confirm which release the system under test was actually running.
   sw_os000 = RHEL 7.2 #AIX 9.9.9.9. # Operating system
   sw_other = None
   sw_state = Run level 3 (multi-user) # Run level 99 # Software state.

# Note: Some commented-out fields above are automatically set to preliminary
# values by sysinfo
#       https://www.spec.org/cpu2017/Docs/config.html#sysinfo
# Uncomment lines for which you already know a better answer than sysinfo.

# The following settings were obtained by running the sysinfo_program
# 'specperl $[top]/bin/sysinfo' (sysinfo:SHA:ecd2bef08f316af97f5a7768b641e2a3307c1b4b68efb5a57fa76367d790d233)
default:
notes_plat_sysinfo_000 = Sysinfo program /root/cpu2017/bin/sysinfo
notes_plat_sysinfo_005 = Rev: r5797 of 2017-06-14 96c45e4568ad54c135fd618bcc091c0f
notes_plat_sysinfo_010 = running on localhost.localdomain Fri Dec 22 23:29:42 2017
notes_plat_sysinfo_015 =
notes_plat_sysinfo_020 = SUT (System Under Test) info as seen by some common utilities.
notes_plat_sysinfo_025 = For more information on this section, see
notes_plat_sysinfo_030 = https://www.spec.org/cpu2017/Docs/config.html\#sysinfo
notes_plat_sysinfo_035 =
notes_plat_sysinfo_040 = From /proc/cpuinfo
notes_plat_sysinfo_045 = 'clock : ' reported by /proc/cpuinfo may not be reliable. Use with caution.
notes_plat_sysinfo_050 = cpu : POWER8 (raw), altivec supported
notes_plat_sysinfo_055 = clock : 3491.000000MHz
notes_plat_sysinfo_060 = machine : PowerNV 0000000000000000
notes_plat_sysinfo_065 = model : 0000000000000000
notes_plat_sysinfo_070 = platform : PowerNV
notes_plat_sysinfo_075 = revision : 2.0 (pvr 004d 0200)
notes_plat_sysinfo_080 =
notes_plat_sysinfo_085 = Number of cores, from 'ppc64_cpu --cores-present' : 40
notes_plat_sysinfo_090 =
notes_plat_sysinfo_095 = WARNING regarding the output of 'lscfg': this utility reports resources for the system,
notes_plat_sysinfo_100 = not the current partition. Therefore, for a partition that has a subset of the full
notes_plat_sysinfo_105 = system resources:
notes_plat_sysinfo_110 = (1) The tester may need to adjust the sysinfo-supplied 'hw_ncores'.
notes_plat_sysinfo_115 = (2) The tester may need to adjust the sysinfo-supplied 'hw_nchips'.
notes_plat_sysinfo_120 =
notes_plat_sysinfo_125 = Processors, from lscfg -vp
notes_plat_sysinfo_130 = Node: processor@18
notes_plat_sysinfo_135 = Node: processor@10
notes_plat_sysinfo_140 = Node: processor@8
notes_plat_sysinfo_145 = Node: processor@0
notes_plat_sysinfo_150 = 160 "processors"
notes_plat_sysinfo_155 =
notes_plat_sysinfo_160 = From numactl --hardware WARNING: a numactl 'node' might or might not correspond to a
notes_plat_sysinfo_165 = physical chip.
notes_plat_sysinfo_170 = available: 4 nodes (0,8,16,24)
notes_plat_sysinfo_175 = node 0 cpus: 0 1 2 3 8 9 10 11 16 17 18 19 24 25 26 27 32 33 34 35 40 41 42 43 48 49 50
notes_plat_sysinfo_180 = 51 56 57 58 59 64 65 66 67 72 73 74 75
notes_plat_sysinfo_185 = node 0 size: 1048576 MB
notes_plat_sysinfo_190 = node 0 free: 972590 MB
notes_plat_sysinfo_195 = node 8 cpus: 80 81 82 83 88 89 90 91 96 97 98 99 104 105 106 107 112 113 114 115 120
notes_plat_sysinfo_200 = 121 122 123 128 129 130 131 136 137 138 139 144 145 146 147 152 153 154 155
notes_plat_sysinfo_205 = node 8 size: 1048576 MB
notes_plat_sysinfo_210 = node 8 free: 976361 MB
notes_plat_sysinfo_215 = node 16 cpus: 160 161 162 163 168 169 170 171 176 177 178 179 184 185 186 187 192 193
notes_plat_sysinfo_220 = 194 195 200 201 202 203 208 209 210 211 216 217 218 219 224 225 226 227 232 233 234 235
notes_plat_sysinfo_225 = node 16 size: 1048576 MB
notes_plat_sysinfo_230 = node 16 free: 976455 MB
notes_plat_sysinfo_235 = node 24 cpus: 240 241 242 243 248 249 250 251 256 257 258 259 264 265 266 267 272 273
notes_plat_sysinfo_240 = 274 275 280 281 282 283 288 289 290 291 296 297 298 299 304 305 306 307 312 313 314 315
notes_plat_sysinfo_245 = node 24 size: 1048576 MB
notes_plat_sysinfo_250 = node 24 free: 972943 MB
notes_plat_sysinfo_255 = node distances:
notes_plat_sysinfo_260 = node 0 8 16 24
notes_plat_sysinfo_265 = 0: 10 40 40 40
notes_plat_sysinfo_270 = 8: 40 10 40 40
notes_plat_sysinfo_275 = 16: 40 40 10 40
notes_plat_sysinfo_280 = 24: 40 40 40 10
notes_plat_sysinfo_285 =
notes_plat_sysinfo_290 = From /proc/meminfo
notes_plat_sysinfo_295 = MemTotal: 4282726848 kB
notes_plat_sysinfo_300 = HugePages_Total: 16000
notes_plat_sysinfo_305 = Hugepagesize: 16384 kB
notes_plat_sysinfo_310 =
notes_plat_sysinfo_315 = From /etc/*release* /etc/*version*
notes_plat_sysinfo_320 = os-release:
notes_plat_sysinfo_325 = NAME="Red Hat Enterprise Linux Server"
notes_plat_sysinfo_330 = VERSION="7.4 (Maipo)"
notes_plat_sysinfo_335 = ID="rhel"
notes_plat_sysinfo_340 = ID_LIKE="fedora"
notes_plat_sysinfo_345 = VARIANT="Server"
notes_plat_sysinfo_350 = VARIANT_ID="server"
notes_plat_sysinfo_355 = VERSION_ID="7.4"
notes_plat_sysinfo_360 = PRETTY_NAME="Red Hat Enterprise Linux"
notes_plat_sysinfo_365 = redhat-release: Red Hat Enterprise Linux Server release 7.4 (Maipo)
notes_plat_sysinfo_370 = system-release: Red Hat Enterprise Linux Server release 7.4 (Maipo)
notes_plat_sysinfo_375 = system-release-cpe: cpe:/o:redhat:enterprise_linux:7.4:ga:server
notes_plat_sysinfo_380 =
notes_plat_sysinfo_385 = uname -a:
notes_plat_sysinfo_390 = Linux localhost.localdomain 3.10.0-693.el7.ppc64le \#1 SMP Thu Jul 6 19:59:44 EDT 2017
notes_plat_sysinfo_395 = ppc64le ppc64le ppc64le GNU/Linux
notes_plat_sysinfo_400 =
notes_plat_sysinfo_405 = run-level 3 2017-12-22 23:04
notes_plat_sysinfo_410 =
notes_plat_sysinfo_415 = SPEC is set to: /root/cpu2017
notes_plat_sysinfo_420 = Filesystem Type Size Used Avail Use% Mounted on
notes_plat_sysinfo_425 = /dev/mapper/rhel-root xfs 110G 57G 53G 53% /
notes_plat_sysinfo_430 =
notes_plat_sysinfo_435 = (End of data from sysinfo program)
hw_cpu_name = POWER8 (raw), altivec supported
hw_disk = 110 GB add more disk info here
hw_memory001 = 4084.327 GB fixme: If using DDR3, format is:
hw_memory002 = 'N GB (M x N GB nRxn PCn-nnnnnR-n, ECC)'
hw_nchips = 4
hw_ncores = 40
hw_nthreadspercore = 4
prepared_by = root (is never output, only tags rawfile)
sw_file = xfs
sw_os001 = Red Hat Enterprise Linux Server release 7.4
sw_os002 = (Maipo)
sw_os003 = 3.10.0-693.el7.ppc64le
sw_state = Run level 3 (add definition here)
# End of settings added by sysinfo_program

# The following section was added automatically, and contains settings that
# did not appear in the original configuration file, but were added to the
# raw file after the run.
default:
notes_000 ="ppc64_cpu --smt=4" used to set SMT4 mode (see flags file for details).
notes_005 =
notes_010 =Binaries were compiled on a system with 4x POWER8 chips + 4 TB Memory using rhel 7.2
notes_015 =
notes_020 =No: The test sponsor attests, as of date of publication, that CVE-2017-5754 (Meltdown)
notes_025 =is mitigated in the system as tested and documented.
notes_030 =No: The test sponsor attests, as of date of publication, that CVE-2017-5753 (Spectre variant 1)
notes_035 =is mitigated in the system as tested and documented.
notes_040 =No: The test sponsor attests, as of date of publication, that CVE-2017-5715 (Spectre variant 2)
notes_045 =is mitigated in the system as tested and documented.
notes_050 =
notes_055 =This benchmark result is intended to provide perspective on past performance using
notes_060 =the historical hardware and/or software described on this result page.
notes_065 =
notes_070 =The system as described on this result page was formerly generally available. At the time of
notes_075 =this publication, it may not be shipping, and/or may not be supported, and/or may fail
notes_080 =to meet other tests of General Availability described in the SPEC OSG Policy document,
notes_085 =http://www.spec.org/osg/policy.html
notes_090 =
notes_095 =This measured result may not be representative of the result that would be measured were this
notes_100 =benchmark run with hardware and software available as of the publication date.