# Invocation command line:
# /autobench/sources/speccpu2006/bin/runspec --config XL-128c-kit12.cfg --action run --rate 1 --copies 512 --reportable --nobuild --tune all --iterations 3 --define numcores=128 --extension XL_1214-Sep_2012_PTF_RC2_120816_interin-rhel63-Saturn fp
# output_root was not used for this run
############################################################################
#######################################################################
#
# SPEC CPU2006 Benchmark Config file IBM eServer pSeries Linux
#
#######################################################################
# THIS CONFIG FILE IS FOR BUILDING on P7 (POWER7: see the P7 macro below,
# which selects -qarch=pwr7 -qtune=pwr7)
#
# --define (-S) options that are passed to the runspec command
# that dynamically affect this config file
#
# numcores=n   The number of cores in the system
#              to determine how many copies to run in rate
#
# mybaseopt=x  Allows override where x=3,4,5 (-O3, -O4, -O5) for base runs
#
# nolibhuge    Allows override to not use extra libraries on base runs
# nosmartheap
#
# debug        Adds debug ('-g') compiler option

# Preprocessor macros. Every '%' directive must start in column 0.
%define P7 -qarch=pwr7 -qtune=pwr7
%define LHBDT -B/usr/share/libhugetlbfs/ -tl -Wl,--hugetlbfs-align
%define LHLIB -lhugetlbfs
######################################
%define FDPROPTS -O4 -omullX
%define FDPRINT

# Parallel make width: one job per core when numcores is supplied, else 4.
%ifdef %{numcores}
%define make_j %{numcores}
%else
%define make_j 4
%endif

#======================================================================
# Global Options apply to all runs
#======================================================================
#
# For just a report generated without a raw file or any runs required
# Do a "runspec --reportonly" (also --action=report or --fakereport)
#
# Just set up the build or run directories, use --buildsetup or --setup
# on the runspec command
# Sets nobuild as the default - you will need -D to force a compile
#
# NOTE(review): read as an active setting because disabled settings in this
# file are written '#name' with no space after the '#' - confirm.
nobuild = 1 # -D forces a build (recompile)
# -N prohibits a build (recompile)
#action = validate # -a
#tune = base # -T
#iterations = 1 # -n
output_format = text,html,csv # -o
#basepeak = 0
#reportable = 0 # -l turns off
#ignore_errors = 1 # -I
mean_anyway = 1
allow_extension_override = 1
#ext = XL-ppc64 # -e
size = ref
post_setup = sync
parallel_test = 1
# Left empty on purpose: the system description comes from the SUT.inc
# content inlined below.
sysinfo_program =

# Include the run-time derived system information so that each
# system run has the correct information
#include: SUT.inc
# ----- Begin inclusion of 'SUT.inc'
############################################################################
#
company_name = IBM Corporation
hw_vendor = IBM Corporation
license_num = 11
sw_state = Run level 3 (multi-user)
hw_cpu_mhz = 3724
hw_cpu_name = POWER7+
hw_memory = 1 TB (64 x 16 GB) DDR3 1066 MHz
#
#
#
hw_disk = 12x146.8 GB SAS SFF 15K RPM
#
#
sw_os000 = Red Hat Enterprise Linux Server release 6.3
sw_os001 = (ppc64) kernel 2.6.32-279.el6.ppc64
sw_file = ext4
#
#
sw_avail = Dec-2012
#
# NOTE(review): the bare 'essl.rte-5.1.0-0.ppc64' lines in this section are
# not 'key = value' settings; they look like stray package-query output
# captured when SUT.inc was generated. Kept as found - confirm and remove.
essl.rte-5.1.0-0.ppc64
sw_compiler000 = C/C++: Version 12.1 of IBM XL C/C++ for Linux;
sw_compiler001 =Fortran: Version 14.1 of IBM XL Fortran for Linux
essl.rte-5.1.0-0.ppc64
sw_other000= -Post-Link Optimization for Linux on
sw_other001 = POWER, version 5.6.1-7
sw_other002= -MicroQuill SmartHeap 9
essl.rte-5.1.0-0.ppc64
sw_other003= -Apache C++ Standard Library V4.2.1
notes_000 = The following environment variables were set before the runspec command:
notes_005 = export HUGETLB_VERBOSE=0
#
hw_model = IBM Power 780 (3.7 GHz, 128 core, RHEL)
hw_avail =Oct-2012
#
hw_ncpuorder =32,64,96,128 cores
hw_nchips =16
hw_ncores = 128
hw_nthreadspercore = 4
hw_ncoresperchip =8
hw_pcache =32 KB I + 32 KB D on chip per core
hw_fpu = Integrated
hw_other =None
#
#
hw_scache =256 KB I+D on chip per core
hw_tcache =10 MB I+D on chip per core
hw_ocache =None
#
#
#
notes_010 = export HUGETLB_MORECORE=yes
notes_015 = export XLFRTEOPTS=intrinthds=1
notes_020 = export HUGETLB_ELFMAP=RW
#
#
#
# ppc64_cpu output
# ---- End inclusion of '/autobench/sources/speccpu2006/config/SUT.inc'

# This tells runspec to set environment variables of the form
# ENV_xxx if found in here. Forced to 0 for reportable runs
env_vars = 0

# Control if the embedded md5 string of compiler options is checked for
# recompile if the options have changed
check_md5 = 0

# Controls if the log file info is echoed to the screen
teeout = yes

# If 1, make copy of the config file before modifying with MD5
# signatures of the compile options.
backup_config = 0

# verbose -> -v
#verbose = 1 to 99, 5 is default, 91 is good for debugging
verbose = 1

%ifdef %{make_j}
makeflags = -j%{make_j}
%endif

# We always use submit to ensure there is a bindprocessor done.
# use_submit_for_speed If set, use submit commands for speed as well as rate
use_submit_for_speed = 1

# Default submit: each copy is bound to the CPU and memory node whose number
# equals its copy number. The hugectl variants are selected with
# --define hugectl_int / --define hugectl_fp.
submit = numactl --membind=\$SPECCOPYNUM --physcpubind=\$SPECCOPYNUM $command
%ifdef %{hugectl_int}
submit = hugectl --heap numactl --physcpubind=\$SPECCOPYNUM --membind=\$SPECCOPYNUM $command
%endif
%ifdef %{hugectl_fp}
submit = hugectl --heap --text --data --bss numactl --physcpubind=\$SPECCOPYNUM --membind=\$SPECCOPYNUM $command
%endif

# Logical CPU assigned to each copy, in copy order. The four rows list the
# CPU numbers congruent to 0, 1, 2 and 3 modulo 4 respectively.
bind = \
0 4 8 12 16 20 24 28 32 36 40 44 48 52 56 60 64 68 72 76 80 84 88 92 96 100 104 108 112 116 120 124 128 132 136 140 144 148 152 156 160 164 168 172 176 180 184 188 192 196 200 204 208 212 216 220 224 228 232 236 240 244 248 252 256 260 264 268 272 276 280 284 288 292 296 300 304 308 312 316 320 324 328 332 336 340 344 348 352 356 360 364 368 372 376 380 384 388 392 396 400 404 408 412 416 420 424 428 432 436 440 444 448 452 456 460 464 468 472 476 480 484 488 492 496 500 504 508 \
1 5 9 13 17 21 25 29 33 37 41 45 49 53 57 61 65 69 73 77 81 85 89 93 97 101 105 109 113 117 121 125 129 133 137 141 145 149 153 157 161 165 169 173 177 181 185 189 193 197 201 205 209 213 217 221 225 229 233 237 241 245 249 253 257 261 265 269 273 277 281 285 289 293 297 301 305 309 313 317 321 325 329 333 337 341 345 349 353 357 361 365 369 373 377 381 385 389 393 397 401 405 409 413 417 421 425 429 433 437 441 445 449 453 457 461 465 469 473 477 481 485 489 493 497 501 505 509 \
2 6 10 14 18 22 26 30 34 38 42 46 50 54 58 62 66 70 74 78 82 86 90 94 98 102 106 110 114 118 122 126 130 134 138 142 146 150 154 158 162 166 170 174 178 182 186 190 194 198 202 206 210 214 218 222 226 230 234 238 242 246 250 254 258 262 266 270 274 278 282 286 290 294 298 302 306 310 314 318 322 326 330 334 338 342 346 350 354 358 362 366 370 374 378 382 386 390 394 398 402 406 410 414 418 422 426 430 434 438 442 446 450 454 458 462 466 470 474 478 482 486 490 494 498 502 506 510 \
3 7 11 15 19 23 27 31 35 39 43 47 51 55 59 63 67 71 75 79 83 87 91 95 99 103 107 111 115 119 123 127 131 135 139 143 147 151 155 159 163 167 171 175 179 183 187 191 195 199 203 207 211 215 219 223 227 231 235 239 243 247 251 255 259 263 267 271 275 279 283 287 291 295 299 303 307 311 315 319 323 327 331 335 339 343 347 351 355 359 363 367 371 375 379 383 387 391 395 399 403 407 411 415 419 423 427 431 435 439 443 447 451 455 459 463 467 471 475 479 483 487 491 495 499 503 507 511

# 16 NUMA nodes, 8-core per NUMA node
# 128 cores, 4 threads per core (SMT4)
#
# Topology:
# - Processors 0-31: NUMA node 0,
# - Processors 32-63: NUMA node 1,
# - Processors 64-95: NUMA node 2,
# - Processors 96-127: NUMA node 3,
# - Processors 128-159: NUMA node 4,
# - Processors 160-191: NUMA node 5,
# - Processors 192-223: NUMA node 6,
# - Processors 224-255: NUMA node 7,
# - Processors 256-287: NUMA node 8,
# - Processors 288-319: NUMA node 9,
# - Processors 320-351: NUMA node 10,
# - Processors 352-383: NUMA node 11,
# - Processors 384-415: NUMA node 12,
# - Processors 416-447: NUMA node 13,
# - Processors 448-479: NUMA node 14,
# - Processors 480-511: NUMA node 15.
# 128-core layout: run 512 copies and derive each copy's memory node from
# its bound CPU (32 logical CPUs per NUMA node, hence MYCPU/32).
%if %{numcores} == 128
copies = 512
submit = let "MYCPU=\$BIND"; MYMEM=`printf '%d' \$((\$MYCPU/32))` ; numactl --physcpubind=\$MYCPU --membind=\$MYMEM $command
%ifdef %{hugectl_int}
submit = let "MYCPU=\$BIND"; MYMEM=`printf '%d' \$((\$MYCPU/32))` ; hugectl --heap numactl --physcpubind=\$MYCPU --membind=\$MYMEM $command
%endif
%ifdef %{hugectl_fp}
submit = let "MYCPU=\$BIND"; MYMEM=`printf '%d' \$((\$MYCPU/32))` ; hugectl --heap --text --data --bss numactl --physcpubind=\$MYCPU --membind=\$MYMEM $command
%endif
%endif

notes_submit_000= The config file option 'submit' was used
notes_submit_005= to assign benchmark copy to specific kernel thread using
notes_submit_010= the "numactl" command (see flags file for details).

#--prevent log file lines that are too long for vi
log_line_width = 130

# Point to where the usr/compiler/OS Flags file is
flagsurl000= http://www.spec.org/cpu2006/flags/IBM-Linux-XL.20121024.xml
flagsurl001= http://www.spec.org/cpu2006/flags/IBM-Power.xml

# IBM Compilers 12.1/14.1 updated to the Sep 2012 PTF
CC_PATH = /opt/ibmcmp/vac/12.1/bin
CXX_PATH = /opt/ibmcmp/vacpp/12.1/bin
XLF_PATH = /opt/ibmcmp/xlf/14.1/bin

#===============================================================================
# How the compilers are called
# The settings used here are for IBM C/C++ and xl Fortran compilers
#===============================================================================
default=default=default=default:
CC = $(CC_PATH)/xlc -qlanglvl=extc99
CXX = $(CXX_PATH)/xlC
FC = $(XLF_PATH)/xlf95

#======================================================================
# Base Level Optimizations
# No limit to number of flags, must be same for all of each Language.
#======================================================================
default=base=default=default:
%if %{mymode64}
sw_base_ptrsize = 64-bit
%else
sw_base_ptrsize = 32-bit
%endif

# DEBUG expands to '-g' only when --define debug is given.
%ifndef %{debug}
%define DEBUG
%else
%define DEBUG -g
%endif

%define BASEARCH %{P7}

# MODE selects the addressing model used for base: -q64 when mymode64 is
# set, otherwise -q32.
%if %{mymode64}
%define MODE -q64
%else
%define MODE -q32
%endif

%define BASEOPT -O5 %{BASEARCH} %{MODE} %{DEBUG} -qipa=threads
#Check for BASEOPT overrides
%if %{mybaseopt} == 3
%define BASEOPT -O3 %{BASEARCH} %{MODE} %{DEBUG}
%endif

#======================================================================
# INT and FP Portability Flags
# no optimizations allowed here
#======================================================================
default=default=default=default:
%if %{mymode64}
CPORTABILITY = -DSPEC_CPU_LP64
CXXPORTABILITY = -DSPEC_CPU_LP64
FPPPORTABILITY = -DSPEC_CPU_LP64

400.perlbench=default=default=default:
CPORTABILITY = -DSPEC_CPU_LINUX_PPC -DSPEC_CPU_LP64

403.gcc=peak=default=default:
CPORTABILITY = -DSPEC_CPU_LP64

410.bwaves=default=default=default:
FPORTABILITY = -qfixed

416.gamess=default=default=default:
FPORTABILITY = -qfixed

434.zeusmp=default=default=default:
FPORTABILITY = -qfixed

435.gromacs=default=default=default:
FPORTABILITY = -qfixed -qextname

436.cactusADM=default=default=default:
FPORTABILITY = -qfixed -qextname
CPORTABILITY = -DSPEC_CPU_LP64
FPPPORTABILITY = -DSPEC_CPU_LP64

437.leslie3d=default=default=default:
FPORTABILITY = -qfixed

453.povray=default=default=default:
CXXPORTABILITY = -DSPEC_CPU_LP64

454.calculix=default=default=default:
FPORTABILITY = -qfixed -qextname

462.libquantum=default=default=default:
CPORTABILITY = -DSPEC_CPU_LINUX -DSPEC_CPU_LP64

464.h264ref=default=default=default:
CPORTABILITY = -qchars=signed -DSPEC_CPU_LP64

481.wrf=default=default=default:
CPORTABILITY = -DNOUNDERSCORE -DSPEC_CPU_LP64

482.sphinx3=default=default=default:
CPORTABILITY = -qchars=signed -DSPEC_CPU_LP64

483.xalancbmk=default=default=default:
CXXPORTABILITY = -DSPEC_CPU_LINUX -DSPEC_CPU_LP64

%else

400.perlbench=default=default=default:
CPORTABILITY = -DSPEC_CPU_LINUX_PPC

462.libquantum=default=default=default:
CPORTABILITY = -DSPEC_CPU_LINUX

464.h264ref=default=default=default:
CPORTABILITY = -qchars=signed

483.xalancbmk=default=default=default:
CXXPORTABILITY = -DSPEC_CPU_LINUX

410.bwaves=default=default=default:
FPORTABILITY = -qfixed

416.gamess=default=default=default:
FPORTABILITY = -qfixed

434.zeusmp=default=default=default:
FPORTABILITY = -qfixed

435.gromacs=default=default=default:
FPORTABILITY = -qfixed -qextname

436.cactusADM=default=default=default:
FPORTABILITY = -qfixed -qextname

437.leslie3d=default=default=default:
FPORTABILITY = -qfixed

454.calculix=default=default=default:
FPORTABILITY = -qfixed -qextname

481.wrf=default=default=default:
CPORTABILITY = -DNOUNDERSCORE

482.sphinx3=default=default=default:
CPORTABILITY = -qchars=signed

%endif
# mymode64

#======================================================================
# INT and FP Base Flags
#======================================================================
int=base=default=default:
COPTIMIZE = %{BASEOPT} -qalias=noansi -qalloca
CXXOPTIMIZE = %{BASEOPT} -qrtti
EXTRA_CLIBS = %{LHLIB}
EXTRA_CXXLIBS = -lsmartheap
EXTRA_LDFLAGS = %{MODE}

fp=base=default=default:
COPTIMIZE = %{BASEOPT} %{LHBDT}
CXXOPTIMIZE = %{BASEOPT} -qrtti
EXTRA_CXXLIBS = %{LHBDT}
#FOPTIMIZE = %{BASEOPT} -qsmallstack=dynlenonheap -qalias=nostd %{LHBDT}
FOPTIMIZE = %{BASEOPT} -qalias=nostd %{LHBDT}
EXTRA_LDFLAGS = %{MODE}

#======================================================================
#
# Default peak flags.
#
#======================================================================
default=peak=default=default:
sw_peak_ptrsize = 32/64-bit

# Peak optimisation levels. Unlike BASEOPT these carry no -q32/-q64 mode
# flag; benchmarks that want 64-bit wrap their section in
# '%define 64' ... '%undef 64', which turns on the '%ifdef %{64}' branch.
%define O2 -O2 %{BASEARCH} %{DEBUG}
%define O3 -O3 %{BASEARCH} %{DEBUG}
%define O4 -O4 %{BASEARCH} %{DEBUG} -qipa=threads
%define O5 -O5 %{BASEARCH} %{DEBUG} -qipa=threads

#======================================================================
# INT peak Flags
#======================================================================
int=peak=default=default:

400.perlbench=peak=default=default:
# C only Benchmark
#
#fdpr 5503 failed with -O4 -vrox
OPTIMIZE = %{O4} -qalias=noansi -qipa=level=2
EXTRA_LIBS = -lsmartheap
LDCFLAGS = -Wl,-q
PASS1_CFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr -imullX ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O4 -omullX ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
CPORTABILITY = -DSPEC_CPU_LINUX_PPC -DSPEC_CPU_LP64
COPTIMIZE = -q64
%else
CPORTABILITY = -DSPEC_CPU_LINUX_PPC
%endif
notes_peak_fdpr_400_000= Post-Link optimization tool used for:
notes_peak_fdpr_400_005 = 400.perlbench
notes_peak_fdpr_400_010= with options -O4 -omullX for optimization phase,
notes_peak_fdpr_400_015= and -imullX for instrumentation phase

401.bzip2=peak=default=default:
# C only Benchmark
OPTIMIZE = %{O3}
EXTRA_LIBS = %{LHLIB}
LDCFLAGS = -Wl,-q
PASS1_CFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O4 -vrox ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
COPTIMIZE = -q64
%endif
notes_peak_fdpr_401_000= 401.bzip2
notes_peak_fdpr_401_005= with options -O4 -vrox

403.gcc=peak=default=default:
# C only Benchmark
OPTIMIZE = %{O4} -qalloca
EXTRA_LIBS = %{LHLIB}
LDCFLAGS = -Wl,-q
PASS1_CFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O4 -nodp -rtb ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
CPORTABILITY = -DSPEC_CPU_LP64
COPTIMIZE = -q64
%endif
notes_peak_fdpr_403_000= 403.gcc
notes_peak_fdpr_403_005= with options -O4 -nodp -rtb

429.mcf=peak=default=default:
# C only Benchmark
%if %{numcores} == 128
copies = 256
%endif
OPTIMIZE = %{O5}
EXTRA_LIBS = %{LHLIB}
LDCFLAGS = -Wl,-q
fdo_pre1 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run1 = $command
fdo_post1 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O3 ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
COPTIMIZE = -q64
%endif
notes_peak_fdpr_429_000= 429.mcf 445.gobmk 458.sjeng 473.astar
notes_peak_fdpr_429_005= with options -O3

445.gobmk=peak=default=default:
# C only Benchmark
OPTIMIZE = %{O4}
EXTRA_LIBS = %{LHLIB}
LDCFLAGS = -Wl,-q
PASS1_CFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O3 ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
COPTIMIZE = -q64
%endif

456.hmmer=peak=default=default:
# C only Benchmark
OPTIMIZE = %{O5} -qsimd -qassert=refalign -qipa=inline=threshold=2888 -qipa=inline=limit=11880
EXTRA_LIBS = %{LHLIB}
LDCFLAGS = -Wl,-q
fdo_pre1 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run1 = $command
fdo_post1 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O4 -nodp -m power7 ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
COPTIMIZE = -q64
%endif
notes_peak_fdpr_456_000= 456.hmmer
notes_peak_fdpr_456_005= with options -O4 -nodp -m power7

458.sjeng=peak=default=default:
# C only Benchmark
OPTIMIZE = %{O5}
EXTRA_LIBS = %{LHLIB}
LDCFLAGS = -Wl,-q
PASS1_CFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O3 ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
COPTIMIZE = -q64
%endif

462.libquantum=peak=default=default:
# C only Benchmark
%if %{numcores} == 128
copies = 256
%endif
%define 64
OPTIMIZE = %{O5}
EXTRA_LIBS = %{LHLIB}
LDCFLAGS = -Wl,-q
PASS1_CFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O4 -vrox -nodp ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
COPTIMIZE = -q64
%endif
%undef 64
notes_peak_fdpr_462_000= 462.libquantum
notes_peak_fdpr_462_005= with options -O4 -vrox -nodp

464.h264ref=peak=default=default:
# C only Benchmark
#%define 64
OPTIMIZE = %{O5}
EXTRA_LIBS = %{LHLIB}
LDCFLAGS = -Wl,-q
PASS1_CFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O4 -vrox -nodp -rtb ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
COPTIMIZE = -q64
%endif
#%undef 64
notes_peak_fdpr_464_000= 464.h264ref
notes_peak_fdpr_464_005= with options -O4 -vrox -nodp -rtb

471.omnetpp=peak=default=default:
# C++ Benchmark
#OPTIMIZE = %{O5} -qrtti
CXXOPTIMIZE = %{O4} -qrtti
EXTRA_LIBS = -lsmartheap
LDCXXFLAGS = -Wl,-q
PASS1_CXXFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CXXFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O3 -lu -1 -nodp -sdp 9 ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
CXXOPTIMIZE = -q64
%endif
notes_peak_fdpr_471_000= 471.omnetpp
notes_peak_fdpr_471_005= with options -O3 -lu -1 -nodp -sdp 9

473.astar=peak=default=default:
# C++ Benchmark
OPTIMIZE = %{O4}
EXTRA_LIBS = %{LHLIB} -lsmartheap
LDCXXFLAGS = -Wl,-q
PASS1_CXXFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CXXFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O3 ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
CXXOPTIMIZE = -q64
%endif

483.xalancbmk=peak=default=default:
# C++ Benchmark
OPTIMIZE = %{O4} -qipa=partition=large
EXTRA_LIBS = -lsmartheap
LDCXXFLAGS = -Wl,-q
fdo_pre1 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run1 = $command
fdo_post1 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O3 -m power7 ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
CXXOPTIMIZE = -q64
%endif
notes_peak_fdpr_483_000= 483.xalancbmk
notes_peak_fdpr_483_005= with options -O3 -m power7

999.specrand=peak=default=default:
# C only Benchmark - Must run, but not reported unless fails
OPTIMIZE = %{O5}
EXTRA_LIBS = %{LHLIB}
PASS1_CFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2

#======================================================================
# FP peak Flags
#======================================================================
fp=peak=default=default:

410.bwaves=peak=default=default:
# Fortran Benchmark
#got 3% gain with -qsmallstack in single-threaded.
%if %{numcores} == 128
copies = 128
#copies = 256
%endif
%define 64
OPTIMIZE = %{O4} -qsmallstack=dynlenonheap
EXTRA_LIBS = %{LHLIB}
PASS1_FFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_FFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
%ifdef %{64}
FOPTIMIZE = -q64
%endif
%undef 64

416.gamess=peak=default=default:
# Fortran Benchmark
OPTIMIZE = %{O5} -qalias=nostd
EXTRA_LIBS = %{LHLIB}
PASS1_FFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_FFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
%ifdef %{64}
FOPTIMIZE = -q64
%endif

433.milc=peak=default=default:
# C only Benchmark
%if %{numcores} == 128
copies = 128
#copies = 256
%endif
OPTIMIZE = %{O5}
EXTRA_LIBS = %{LHLIB}
LDCFLAGS = -Wl,-q
fdo_pre1 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run1 = $command
fdo_post1 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O4 -nodp ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
COPTIMIZE = -q64
%endif
notes_peak_fdpr_433_000= Post-Link optimization tool used for:
notes_peak_fdpr_433_005= 433.milc 435.gromacs 450.soplex 482.sphinx3
notes_peak_fdpr_433_010 = with options -O4 -nodp

434.zeusmp=peak=default=default:
# Fortran Benchmark
OPTIMIZE = %{O3} -qxlf90=nosignedzero
EXTRA_LIBS = %{LHBDT}
PASS1_FFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_FFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
LDFFLAGS = -Wl,-q
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O4 -vrox -nodp ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
FOPTIMIZE = -q64
%endif
notes_peak_fdpr_434_000= 434.zeusmp
notes_peak_fdpr_434_005 = with options -O4 -vrox -nodp

435.gromacs=peak=default=default:
# Fortran & C Benchmark
OPTIMIZE = %{O4} -qsimd
EXTRA_LIBS = %{LHLIB}
LDCFLAGS = -Wl,-q
LDFFLAGS = -Wl,-q
PASS1_FFLAGS = -qpdf1
PASS1_CFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_FFLAGS = -qpdf2
PASS2_CFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O4 -nodp ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
COPTIMIZE = -q64
FOPTIMIZE = -q64
%endif

436.cactusADM=peak=default=default:
# Fortran & C Benchmark
%if %{numcores} == 128
copies = 256
%endif
%define 64
OPTIMIZE = %{O4} -qsimd -qnostrict
FOPTIMIZE = -qsmallstack=dynlenonheap -qalias=nostd
EXTRA_LIBS = %{LHLIB}
%ifdef %{64}
FPORTABILITY = -qfixed -qextname
FPPPORTABILITY = -DSPEC_CPU_LP64
CPORTABILITY = -DSPEC_CPU_LP64
FOPTIMIZE = -q64
COPTIMIZE = -q64
%else
FPORTABILITY = -qfixed -qextname
%endif
%undef 64

437.leslie3d=peak=default=default:
# Fortran Benchmark
%if %{numcores} == 128
copies = 128
#copies = 256
%endif
%define 64
OPTIMIZE = %{O5}
EXTRA_LIBS = %{LHBDT}
LDFFLAGS = -Wl,-q
fdo_pre1 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run1 = $command
fdo_post1 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O3 -lu -1 -nodp -sdp 9 ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
FOPTIMIZE = -q64
%endif
%undef 64
notes_peak_fdpr_437_000 = 437.leslie3d
notes_peak_fdpr_437_005 = with options -O3 -lu -1 -nodp -sdp 9

444.namd=peak=default=default:
# C++ Benchmark
OPTIMIZE = %{O5}
EXTRA_LIBS = %{LHLIB}
LDCXXFLAGS = -Wl,-q
PASS1_CXXFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CXXFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O3 -lu -1 -nodp -sdp 9 ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
CXXOPTIMIZE = -q64
%endif
notes_peak_fdpr_444_000 = 444.namd
notes_peak_fdpr_444_005 = with options -O3 -lu -1 -nodp -sdp 9

447.dealII=peak=default=default:
# C++ Benchmark
OPTIMIZE = %{O4} -qrtti
EXTRA_CXXFLAGS = -qcpp_stdinc=/autobench/sources/speccpu2006/stdcxx421/include/ansi:/autobench/sources/speccpu2006/stdcxx421/include:/opt/ibmcmp/vacpp/12.1/include
EXTRA_CXXLIBS = -L/autobench/sources/speccpu2006/stdcxx421/lib -R/autobench/sources/speccpu2006/stdcxx421/lib -lstd8d
EXTRA_LIBS = -lsmartheap
%ifdef %{64}
CXXOPTIMIZE = -q64
%endif

450.soplex=peak=default=default:
# C++ Benchmark
%if %{numcores} == 128
copies = 256
%endif
%define 64
OPTIMIZE = %{O3}
EXTRA_LIBS = %{LHLIB}
LDCXXFLAGS = -Wl,-q
PASS1_CXXFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CXXFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O4 -nodp ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
CXXOPTIMIZE = -q64
%endif
%undef 64
notes_peak_fdpr_450_000 = 450.soplex
notes_peak_fdpr_450_005 = with options -O4 -nodp

453.povray=peak=default=default:
# C++ Benchmark
%define 64
OPTIMIZE = %{O4} -qsimd
EXTRA_LIBS = -lsmartheap64
LDCXXFLAGS = -Wl,-q
PASS1_CXXFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CXXFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
#FDPR XL11 + 5.5.0.2 broke it
#FDPR XL11 + 5.5.0.3 looping with ref input
#fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
#fdo_run2 = $command
#fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O3 ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
CXXPORTABILITY = -DSPEC_CPU_LP64
CXXOPTIMIZE = -q64
%endif
%undef 64

454.calculix=peak=default=default:
# Fortran & C Benchmark
OPTIMIZE = %{O5}
EXTRA_LIBS = %{LHBDT}
## fdpr 5503 failed when using with LHBDT
#LDCFLAGS = -Wl,-q
#LDFFLAGS = -Wl,-q
PASS1_FFLAGS = -qpdf1
PASS1_CFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_FFLAGS = -qpdf2
PASS2_CFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
#fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr ${baseexe}; cp ${baseexe}.instr ${baseexe}
#fdo_run2 = $command
#fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O3 ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
FOPTIMIZE = -q64
COPTIMIZE = -q64
%endif

459.GemsFDTD=peak=default=default:
# Fortran Benchmark
%if %{numcores} == 128
copies = 128
#copies = 256
%endif
OPTIMIZE = %{O4} -qsimd
EXTRA_LIBS = %{LHBDT}
%ifdef %{64}
FOPTIMIZE = -q64
%endif

465.tonto=peak=default=default:
# Fortran Benchmark
OPTIMIZE = %{O5} -qsimd
# SmartHeap version 9 is not supported with XL11
EXTRA_LIBS = %{LHLIB}
PASS1_FFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_FFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
LDFFLAGS = -Wl,-q
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O4 ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
FOPTIMIZE = -q64
%endif
notes_peak_fdpr_465_000 = 465.tonto
notes_peak_fdpr_465_005 = with options -O4

470.lbm=peak=default=default:
# C Benchmark
OPTIMIZE = %{O5}
EXTRA_LIBS = %{LHBDT}
PASS1_CFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
%ifdef %{64}
COPTIMIZE = -q64
%endif

481.wrf=peak=default=default:
# Fortran & C-for netCDF Benchmark
#with or w/o smallstack make no diff
# -O3 is better than O5
%define 64
OPTIMIZE = %{O3}
EXTRA_LIBS = %{LHLIB}
%ifdef %{64}
COPTIMIZE = -q64
FOPTIMIZE = -q64
%endif
%undef 64

482.sphinx3=peak=default=default:
# C only Benchmark
%if %{numcores} == 128
copies = 128
#copies = 256
%endif
OPTIMIZE = %{O4}
EXTRA_LIBS = %{LHLIB}
LDCFLAGS = -Wl,-q
PASS1_CFLAGS = -qpdf1
PASS1_LDFLAGS = -qpdf1
PASS2_CFLAGS = -qpdf2
PASS2_LDFLAGS = -qpdf2
fdo_pre2 = cp ${baseexe} ${baseexe}.orig ; /opt/bin/fdprpro -a instr %{FDPRINT} ${baseexe}; cp ${baseexe}.instr ${baseexe}
fdo_run2 = $command
fdo_post2 = cp ${baseexe}.orig ${baseexe} ; /opt/bin/fdprpro -a opt -f ${baseexe}.nprof -O4 -nodp ${baseexe} ; cp ${baseexe}.fdpr ${baseexe}
%ifdef %{64}
COPTIMIZE = -q64
%endif
notes_peak_fdpr_482_000 = 482.sphinx3
notes_peak_fdpr_482_005 = with options -O4 -nodp

998.specrand=peak=default=default:
# C only Benchmark - Must run, but not reported unless fails
OPTIMIZE = %{O5}

# The following section was added automatically, and contains settings that
# did not appear in the original configuration file, but were added to the
# raw file after the run.
434.zeusmp:
# The following setting was inserted automatically as a result of
# post-run basepeak application.
basepeak = 1

default:
test_sponsor = IBM Corporation
tester = IBM Corporation
hw_cpu_char000 = Intelligent Energy Optimization enabled,
hw_cpu_char001 = up to 4.144 GHz
notes_plat_000 = Service processor memory mirroring property disabled.
notes_plat_005 = Hardware Page Table (HPT) ratio changed as follows by root user on Hardware Management Console (HMC):
notes_plat_010 = chsyscfg -m -r prof -i "name=,lpar_name=,hpt_ratio=1:512"
notes_os_000 = ulimit -s (stack) set to 1048576.
notes_os_005 = ulimit -n (open files) set to 500000.
# Operating-system tuning and compiler-level notes printed in the report.
# One note per line; the numeric suffix fixes the order within each group.
notes_os_010 = Filesystem cache changed as follows by root user:
notes_os_015 = echo 150 > /proc/sys/vm/vfs_cache_pressure
notes_os_020 = Large pages reserved as follows by root user:
notes_os_025 = echo 6000 > /proc/sys/vm/nr_hugepages
notes_os_030 = echo 30000 > /proc/sys/vm/nr_overcommit_hugepages
notes_os_035 = The Apache C++ Standard Library V4.2.1 was installed from
notes_os_040 = http://stdcxx.apache.org/download.html using:
notes_os_045 = gmake BUILDTYPE=8d CONFIG=gcc.config
notes_comp_iler_000= C/C++ compiler updated to December 2012 PTF
notes_comp_iler_005= Version: 12.01.0000.0002
notes_comp_iler_010= Fortran compiler updated to December 2012 PTF
notes_comp_iler_015= Version: 14.01.0000.0002