# Invocation command line:
# /mnt/store/cpu2006/bin/runspec --define best_ratio --rate 32 --define cores=16 --define invoke_with_interleave -c ic121u2_avx_mix_hp_bl420c_gen8_intel_way.cfg -T all -o all fp
# output_root was not used for this run
############################################################################
############################################################################
############################################################################
# This is a sample config file. It was tested with:
#
#      Compiler name/version:       Intel Compiler 12.1 U3
#      Operating system version:    64-Bit RedHat Enterprise Linux64 6.2
#      Hardware:                    Intel processors supporting AVX
#
############################################################################
# SPEC CPU2006 Intel Linux64 config file
# Mar 2011 IC 12.1 U3 Linux64
############################################################################

# Settings that appear before any section header.
action = validate
tune = base,peak
# The version macro is substituted into ext below.
%define version 28jun2012
ext = ic121u2.avx_mix.rate.%{version}
# fail_build = 1
PATHSEP = /
check_md5=1
reportable=1
bench_post_setup=sync
parallel_test=0
mean_anyway=1
#bind = 0 8 1 9 2 10 3 11 4 12 5 13 6 14 7 15 16 24 17 25 18 26 19 27 20 28 21 29 22 30 23 31

# Set some environment variables
#preENV_LD_LIBRARY_PATH = /opt/smartheap/
#
# These are listed as benchmark-tuning-extension-machine
#

# Integer suite: compilers invoked with -m32.
int=default=default=default:
CC= icc -m32
CXX= icpc -m32
OBJ = .o
SMARTHEAP32_DIR = /opt/smartheap/
SMARTHEAP64_DIR = /opt/smartheap/

# Floating-point suite: compilers invoked with -m64.
fp=default=default=default:
CC= icc -m64
CXX= icpc -m64
FC= ifort -m64
OBJ = .o

# For UP systems, we need to know if the processors are ordered across cores first or in order
# If across cores, processors 0, 1, 2 and 3 are on distinct physical cores
# Otherwise, processors 0, 2, 4 and 6 are on distinct physical cores
default:
# Default submit command: numactl with --localalloc and --physcpubind=$SPECCOPYNUM.
submit = numactl --localalloc --physcpubind=$SPECCOPYNUM $command
# When the no-numa macro is defined, submit is reassigned to a taskset-based command.
%ifdef %{no-numa}
submit = taskset -c $SPECCOPYNUM $command
%endif
####################################################################
# Compiler options
# for Nehalem use -xSSE4.2
# for processors prior to dunnington, replace -xSSE4.1 with -xSSSE3
####################################################################
default:
# SSE is referenced by FASTNOSTATIC and FAST; FAST differs only by the trailing -static.
SSE = -xAVX
FASTNOSTATIC = $(SSE) -ipo -O3 -no-prec-div
FAST = $(SSE) -ipo -O3 -no-prec-div -static

################################################################
#
# portability & libraries
#
#################### Portability Flags and Notes ############################
400.perlbench=default:
CPORTABILITY= -DSPEC_CPU_LINUX_IA32

403.gcc=default:
EXTRA_CFLAGS= -Dalloca=_alloca

462.libquantum=default:
CPORTABILITY= -DSPEC_CPU_LINUX

483.xalancbmk=default:
CXXPORTABILITY= -DSPEC_CPU_LINUX

fp=default:
PORTABILITY = -DSPEC_CPU_LP64

435.gromacs=default=default=default:
LDPORTABILITY = -nofor_main

436.cactusADM=default=default=default:
LDPORTABILITY = -nofor_main

454.calculix=default=default=default:
LDPORTABILITY = -nofor_main

481.wrf=default=default=default:
CPORTABILITY = -DSPEC_CPU_CASE_FLAG -DSPEC_CPU_LINUX

################################################################
# Tuning Flags
################################################################
#
# Base tuning default optimization
# Feedback directed optimization not allowed in baseline for CPU2006
# However there is no limit on the number of flags as long as the same
# flags are used in the same order for all benchmarks of a given language

# These three benchmarks link against the library under SMARTHEAP32_DIR.
471.omnetpp,473.astar,483.xalancbmk=default:
EXTRA_LIBS= -L$(SMARTHEAP32_DIR) -lsmartheap
EXTRA_LDFLAGS= -Wl,-z,muldefs

int=base=default=default:
COPTIMIZE= $(FASTNOSTATIC) -opt-prefetch -opt-mem-layout-trans=3
CXXOPTIMIZE= $(FASTNOSTATIC) -opt-prefetch -opt-mem-layout-trans=3

fp=base=default=default:
OPTIMIZE= $(FAST) -opt-prefetch
COPTIMIZE= -auto-p32 -ansi-alias -opt-mem-layout-trans=3
CXXOPTIMIZE= -auto-p32 -ansi-alias -opt-mem-layout-trans=3

################################################################
# Peak Tuning Flags int 2006 fast
################################################################
# Integer peak defaults: PASS1 flags use -prof-gen, PASS2 flags use -prof-use.
int=peak=default:
COPTIMIZE= -ansi-alias -opt-mem-layout-trans=3
CXXOPTIMIZE= -ansi-alias -opt-mem-layout-trans=3
PASS1_CFLAGS = -prof-gen
PASS2_CFLAGS = $(FASTNOSTATIC) -prof-use
PASS1_CXXFLAGS = -prof-gen
PASS2_CXXFLAGS = $(FASTNOSTATIC) -prof-use
PASS1_LDCFLAGS = -prof-gen
PASS2_LDCFLAGS = $(FASTNOSTATIC) -prof-use
PASS1_LDCXXFLAGS = -prof-gen
PASS2_LDCXXFLAGS = $(FASTNOSTATIC) -prof-use

400.perlbench=peak=default:
CC= icc -m64
CPORTABILITY= -DSPEC_CPU_LP64 -DSPEC_CPU_LINUX_X64
COPTIMIZE= -auto-ilp32

401.bzip2=peak=default:
CC= icc -m64
CPORTABILITY= -DSPEC_CPU_LP64
COPTIMIZE= -opt-prefetch -auto-ilp32 -ansi-alias

403.gcc=peak=default:
COPTIMIZE = $(FASTNOSTATIC)
feedback=0

429.mcf=peak=default:
basepeak=yes

# gobmk overrides the C PASS flags so that PASS2 uses $(SSE) rather than $(FASTNOSTATIC).
445.gobmk=peak=default:
PASS1_CFLAGS = -prof-gen
PASS2_CFLAGS = $(SSE) -prof-use
PASS1_LDCFLAGS = -prof-gen
PASS2_LDCFLAGS = $(SSE) -prof-use

456.hmmer=peak=default:
CC= icc -m64
CPORTABILITY= -DSPEC_CPU_LP64
COPTIMIZE= $(FASTNOSTATIC) -unroll2 -auto-ilp32
feedback=no

458.sjeng=peak=default:
CC= icc -m64
CPORTABILITY= -DSPEC_CPU_LP64
COPTIMIZE= -unroll4 -auto-ilp32

462.libquantum=peak=default:
basepeak=yes

464.h264ref=peak=default:
COPTIMIZE= -unroll2 -ansi-alias

471.omnetpp=peak=default:
CXXOPTIMIZE= -ansi-alias -opt-ra-region-strategy=block

473.astar=peak=default:
basepeak=yes

483.xalancbmk=peak=default:
basepeak=yes

################################################################
# Peak Tuning Flags for FP
################################################################
# FP peak defaults: PASS1 flags use -prof-gen, PASS2 flags use -prof-use.
fp=peak=default:
COPTIMIZE= -auto-ilp32 -opt-mem-layout-trans=3
CXXOPTIMIZE= -auto-ilp32 -opt-mem-layout-trans=3
PASS1_CFLAGS = -prof-gen
PASS2_CFLAGS = $(FASTNOSTATIC) -prof-use
PASS1_CXXFLAGS = -prof-gen
PASS2_CXXFLAGS = $(FASTNOSTATIC) -prof-use
PASS1_FFLAGS = -prof-gen
PASS2_FFLAGS = $(FASTNOSTATIC) -prof-use
PASS1_LDFLAGS = -prof-gen
PASS2_LDFLAGS = $(FASTNOSTATIC) -prof-use
# Per-benchmark FP peak sections.
# In several sections below, copies is set from the cores macro when the
# best_ratio macro is defined.
410.bwaves=peak=default:
OPTIMIZE= -static
%ifdef %{best_ratio}
copies=%{cores}
%endif

416.gamess=peak=default:
OPTIMIZE= -unroll2 -inline-level=0 -scalar-rep- -static

433.milc=peak=default:
OPTIMIZE= -static
%ifdef %{best_ratio}
copies=%{cores}
%endif

434.zeusmp=peak=default:
basepeak=yes
feedback=0

435.gromacs=peak=default:
OPTIMIZE= -xSSE4.2 -ipo -O3 -no-prec-div -opt-prefetch -static
COPTIMIZE= -auto-p32 -ansi-alias -opt-mem-layout-trans=3
feedback=0

436.cactusADM=peak=default:
OPTIMIZE= $(FAST) -opt-prefetch
COPTIMIZE= -auto-p32 -ansi-alias -opt-mem-layout-trans=3
%ifdef %{best_ratio}
copies=%{cores}
%endif
feedback=0
#basepeak=yes

437.leslie3d=peak=default:
OPTIMIZE= $(FAST) -opt-prefetch
feedback=no
%ifdef %{best_ratio}
copies=%{cores}
%endif

444.namd=peak=default:
CXXOPTIMIZE= -fno-alias -auto-ilp32

447.dealII=peak=default:
#basepeak=yes
OPTIMIZE= $(FAST) -opt-prefetch
CXXOPTIMIZE= -auto-p32 -ansi-alias -opt-mem-layout-trans=3
feedback=no
# This section sets its own submit command, with no --physcpubind option.
submit = numactl --localalloc $command

450.soplex=peak=default:
# PORTABILITY and CXXOPTIMIZE are assigned empty values in this section.
PORTABILITY =
CXX= icpc -m32
OPTIMIZE= -opt-malloc-options=3
CXXOPTIMIZE=
%ifdef %{best_ratio}
copies=%{cores}
%endif

453.povray=peak=default:
CXXOPTIMIZE= -unroll4 -ansi-alias

454.calculix=peak=default:
OPTIMIZE= $(FAST)
feedback=0

459.GemsFDTD=peak=default:
CXX= icpc -m32
OPTIMIZE= -opt-malloc-options=3
#OPTIMIZE= $(FAST) -opt-prefetch
#CXXOPTIMIZE= -auto-p32 -ansi-alias -opt-mem-layout-trans=3
#feedback=0
%ifdef %{best_ratio}
copies=%{cores}
%endif

465.tonto=peak=default:
OPTIMIZE= -unroll4 -auto -inline-calloc -opt-malloc-options=3

470.lbm=peak=default:
basepeak=yes

481.wrf=peak=default:
OPTIMIZE= $(FAST)
feedback=0
%ifdef %{best_ratio}
copies=%{cores}
%endif

482.sphinx3=peak=default:
# PORTABILITY is assigned an empty value in this section.
PORTABILITY=
CC= icc -m32
OPTIMIZE= -xSSE4.2 -ipo -O3 -no-prec-div -opt-mem-layout-trans=3
COPTIMIZE= -unroll2
feedback=no

############################################################################
# Tester, hardware and software description fields.
default=default=default=default:
license_num = 3
test_sponsor = Hewlett-Packard Company
hw_avail = Jun-2012
sw_avail = Feb-2012
tester = Hewlett-Packard Company
hw_memory000 = 96 GB (12 x 8 GB 2Rx4 PC3-12800R-11, ECC)
hw_disk = 1 x 250 GB 7200 RPM SATA
hw_fpu = Integrated
hw_ncpuorder = 1,2 chips
hw_vendor = Hewlett-Packard Company
sw_file = ext4
hw_pcache = 32 KB I + 32 KB D on chip per core
hw_scache = 256 KB I+D on chip per core
hw_tcache = 20 MB I+D on chip per chip
hw_ocache = None
hw_other = None
hw_nthreadspercore = 2
prepared_by = Hewlett-Packard Company
sw_os000 = Red Hat Enterprise Linux Server release 6.2
sw_os001 = 2.6.32-220.el6.x86_64
sw_state = Run level 3 (multi-user)
hw_cpu_name = Intel Xeon E5-2450
hw_cpu_char = Intel Turbo Boost Technology up to 2.90 GHz
hw_cpu_mhz = 2100
hw_model000 = ProLiant BL420c Gen8
hw_model001 = (2.10 GHz, Intel Xeon E5-2450)
hw_ncores = 16
hw_nchips = 2
hw_ncoresperchip = 8
notes_submit_000 = The numactl mechanism was used to bind copies to processors. The config file option 'submit'
notes_submit_005 = was used to generate numactl commands to bind each copy to a specific processor.
notes_submit_010 = For details, please see the config file.
# Free-form notes: build environment, OS settings and platform (BIOS) settings.
notes_010 = Binaries compiled on a system with 2x E5-2470 CPU + 192 GB
notes_015 = memory using RHEL 6.2
notes_020 = glibc-static-2.12-1.47.el6.x86_64.rpm and glibc-static-2.12-1.47.el6.i686.rpm
notes_025 = are added to enable static linking
notes_os_000 = Stack size set to unlimited using "ulimit -s unlimited"
notes_os_005 = runspec command invoked through numactl i.e.:
notes_os_010 = numactl --interleave=all runspec
notes_os_015 = Transparent Huge Pages enabled with:
notes_os_020 = echo always > /sys/kernel/mm/transparent_hugepage/enabled
notes_plat_000 = BIOS configuration:
notes_plat_005 = HP Power Profile set to Maximum Performance

int=default=default=default:
sw_compiler001 = C/C++: Version 12.1.2.273 of Intel C++ Studio XE for Linux
sw_base_ptrsize = 32-bit
sw_peak_ptrsize = 32/64-bit
sw_other001 = Microquill SmartHeap V9.01

# Optional notes, each group emitted only when the corresponding macro is defined.
default:
%ifdef %{THP_enabled}
notes_035 = Transparent Huge Pages enabled with:
notes_040 = echo always > /sys/kernel/mm/redhat_transparent_hugepage/enabled
%endif
%ifdef %{THP_disabled}
notes_200 = Transparent Huge Pages disabled with:
notes_201 = echo never > /sys/kernel/mm/redhat_transparent_hugepage/enabled
%endif
%ifdef %{drop_caches}
notes_202 = Filesystem page cache cleared with:
# A space is required before '>': written as "echo 1>", the shell treats the 1
# as a file-descriptor number and writes only an empty line, so the documented
# command would not clear the cache.
notes_203 = echo 1 > /proc/sys/vm/drop_caches
%endif
# This conditional has no body; it is kept as found.
%ifdef %{invoke_with_interleave}
%endif

fp=default=default=default:
sw_compiler000 = C/C++: Version 12.1.2.273 of Intel C++ Studio XE
sw_compiler001 = for Linux;
sw_compiler002 = Fortran: Version 12.1.2.273 of Intel Fortran
sw_compiler003 = Studio XE for Linux
sw_base_ptrsize = 64-bit
sw_peak_ptrsize = 32/64-bit
sw_other = None

default:
flagsurl000 = http://www.spec.org/cpu2006/flags/HP-Platform-Flags-Intel-V1.2-A.20120605.xml
flagsurl001 = http://www.spec.org/cpu2006/flags/Intel-ic12.1-official-linux64.20120425.xml
notes_000 =Environment variables set by runspec before the start of the run:
notes_005 =LD_LIBRARY_PATH = "/opt/smartheap/"

# The following settings were obtained by running 'specperl $[top]/Docs/sysinfo'
default:
notes_plat_sysinfo_000 = Sysinfo program /mnt/store/cpu2006/Docs/sysinfo
notes_plat_sysinfo_005 = $Rev: 6775 $ $Date:: 2011-08-16 #$ 8787f7622badcf24e01c368b1db4377c
notes_plat_sysinfo_010 = running on bl420c-cpu Thu Jul 5 14:35:18 2012
notes_plat_sysinfo_015 =
notes_plat_sysinfo_020 = This section contains SUT (System Under Test) info as seen by
notes_plat_sysinfo_025 = some common utilities. To remove or add to this section, see:
notes_plat_sysinfo_030 = http://www.spec.org/cpu2006/Docs/config.html#sysinfo
notes_plat_sysinfo_035 =
notes_plat_sysinfo_040 = From /proc/cpuinfo
notes_plat_sysinfo_045 = model name : Intel(R) Xeon(R) CPU E5-2450 0 @ 2.10GHz
notes_plat_sysinfo_050 = 2 "physical id"s (chips)
notes_plat_sysinfo_055 = 32 "processors"
notes_plat_sysinfo_060 = cores, siblings (Caution: counting these is hw and system dependent. The
notes_plat_sysinfo_065 = following excerpts from /proc/cpuinfo might not be reliable. Use with
notes_plat_sysinfo_070 = caution.)
notes_plat_sysinfo_075 = cpu cores : 8
notes_plat_sysinfo_080 = siblings : 16
notes_plat_sysinfo_085 = physical 0: cores 0 1 2 3 4 5 6 7
notes_plat_sysinfo_090 = physical 1: cores 0 1 2 3 4 5 6 7
notes_plat_sysinfo_095 = cache size : 20480 KB
notes_plat_sysinfo_100 =
notes_plat_sysinfo_105 = From /proc/meminfo
notes_plat_sysinfo_110 = MemTotal: 99026400 kB
notes_plat_sysinfo_115 = HugePages_Total: 0
notes_plat_sysinfo_120 = Hugepagesize: 2048 kB
notes_plat_sysinfo_125 =
notes_plat_sysinfo_130 = /usr/bin/lsb_release -d
notes_plat_sysinfo_135 = Red Hat Enterprise Linux Server release 6.2 (Santiago)
notes_plat_sysinfo_140 =
notes_plat_sysinfo_145 = From /etc/*release* /etc/*version*
notes_plat_sysinfo_150 = redhat-release: Red Hat Enterprise Linux Server release 6.2 (Santiago)
notes_plat_sysinfo_155 = system-release: Red Hat Enterprise Linux Server release 6.2 (Santiago)
notes_plat_sysinfo_160 = system-release-cpe: cpe:/o:redhat:enterprise_linux:6server:ga:server
notes_plat_sysinfo_165 =
notes_plat_sysinfo_170 = uname -a:
notes_plat_sysinfo_175 = Linux bl420c-cpu 2.6.32-220.el6.x86_64 #1 SMP Wed Nov 9 08:03:13 EST 2011
notes_plat_sysinfo_180 = x86_64 x86_64 x86_64 GNU/Linux
notes_plat_sysinfo_185 =
notes_plat_sysinfo_190 = run-level 3 Jul 3 03:10
notes_plat_sysinfo_195 =
notes_plat_sysinfo_200 = SPEC is set to: /mnt/store/cpu2006
notes_plat_sysinfo_205 = Filesystem Type Size Used Avail Use% Mounted on
notes_plat_sysinfo_210 = /dev/sda5 ext4 191G 19G 163G 11% /mnt/store
notes_plat_sysinfo_215 =
notes_plat_sysinfo_220 = (End of data from sysinfo program)
hw_cpu_name = Intel Xeon E5-2450
hw_disk = 2 x 146 GB RAID 0
hw_nchips = 2
prepared_by = Hewlett-Packard Company
sw_file = ext4
sw_os002 = (Santiago)
sw_os003 = 2.6.32-220.el6.x86_64
sw_state = Run level 3 (multi-user)