# Invocation command line:
# /root/cpu2006/bin/runspec -c linux64-pgi710b-k8-rate -F ./pgi710_flags.xml -r -C 8 -T all fp
# output_root was not used for this run
############################################################################
# PGI 7.1 CPU2006 Configuration File for 64-bit Linux (Dual-Core)
#
# Compiler name/version:       PGI 7.1-0
# Operating system version:    64-bit Linux
# Hardware:                    AMD Opteron (Dual-core)
# FP Base Pointer Size:        64-bit only
# FP Peak Pointer Size:        64-bit only
# INT Base Pointer Size:       32/64-bit
# INT Peak Pointer Size:       32/64-bit
# Auto Parallelization:        With FP/INT Peak
#
# Important!  Please run with your stack size set to 'unlimited'.
# Failure to do so may cause 483.xalancbmk to get a stack overflow during
# execution.
#    Using csh:  unlimit
#    Using bash: ulimit -s unlimited
#
# Set your LD_LIBRARY_PATH to the location of the PGI and Smartheap runtime
# libraries.
#
# Also be sure to adjust the submit command and makeflags to match
# the number of cores in use.
# Please adjust the SHL_DIR variable to the directory containing
# the Smartheap library.
#####################################################################
# Header Section
#####################################################################
# Global run settings.  Each setting must sit on its own line: everything
# after a '#' up to the end of the line is a comment, so a setting that shares
# a line with a comment is silently ignored.

# Extension tag for this build/run.
ext = pgi710b_k8_rate
ignore_errors = no
# Run both tuning levels.
tune = base,peak
output_format = asc,pdf,raw,flags,cfg,html
size = test,train,ref
check_md5 = yes
reportable = yes
env_vars = no
teeout = yes
teerunout = yes

# Adjust the make flag for the number of cores.
makeflags = -j 8

#####################################################################
# Macro section
####################################################################
# Modify this section to use the appropriate architecture flags.
# The two macros are referenced from the optimization settings as
# %{pgi_tp64} and %{pgi_tp32}.
%define pgi_tp64 -tp k8-64
%define pgi_tp32 -tp k8-32

####################################################################
# Include the SUT hardware and tester information
####################################################################
#include: pgi_sut.cfg
#   ----- Begin inclusion of 'pgi_sut.cfg'
############################################################################
#####################################################################
# Submit Section
#####################################################################
# RATE
# This config file is set to run these binaries on a 4-socket, 8 core system
# (the bind lines below address four memory nodes, 0-3).  If this does not
# match the description of your system, change this config file,
# specifically "bind0", "bind1", "bind2", etc. to match your system.  Use
# "man numactl" and "numactl --hardware" to better understand how to use
# this command.
#
# NOTE(review): each bindN pairs CPU N with memory node (N mod 4).  Confirm
# with "numactl --hardware" that the CPU numbering on the target machine
# really places CPU N on that node; otherwise a copy would allocate its
# memory from a remote node.
bind0 = numactl -m 0 --physcpubind=0
bind1 = numactl -m 1 --physcpubind=1
bind2 = numactl -m 2 --physcpubind=2
bind3 = numactl -m 3 --physcpubind=3
bind4 = numactl -m 0 --physcpubind=4
bind5 = numactl -m 1 --physcpubind=5
bind6 = numactl -m 2 --physcpubind=6
bind7 = numactl -m 3 --physcpubind=7

# SPEED
# Below is an example numactl command for a speed run using
# 4 threads on a single quad-core chip.
# Please adjust as needed for your system.
#
# bind0 = numactl -m 0 --physcpubind=0,1,2,3
# use_submit_for_speed = 1

# Write the benchmark command to run.sh, then launch that script under the
# bind command for this copy.
submit = echo "$command" > run.sh ; $BIND bash run.sh

####################################################################
# Tester information
####################################################################
license_num = 55
prepared_by = --
tester = Dell Inc.
test_date = Oct-2007
test_sponsor = Dell Inc.
####################################################################
# Hardware information
####################################################################
# Description of the system under test, reported for every benchmark.
# Each field must be on its own line; a field that shares a line with a
# '#' comment is treated as part of that comment.
default=default=default=default:
hw_avail = Dec-2006
hw_cpu_name = AMD Opteron 8216
hw_cpu_mhz = 2400
hw_fpu = Integrated
# 4 chips x 2 cores per chip = 8 cores, one thread per core.
hw_nchips = 4
hw_ncores = 8
hw_ncoresperchip = 2
hw_nthreadspercore = 1
hw_ncpuorder = 2,4 chips
hw_pcache = 64 KB I + 64 KB D on chip per core
hw_scache = 1 MB I+D on chip per core
hw_tcache = None
hw_ocache = None
hw_vendor = Dell Inc.
hw_model = PowerEdge 6950 (AMD Opteron 8216, 2.40 GHz)
hw_disk = 1 x 250 GB SATA 7200 RPM
hw_memory = 32 GB (16x2GB, DDR2-667 CL5 ECC Dual Rank)
hw_other = None

#####################################################################
# Notes
#####################################################################
# Free-text notes for the integer suite.
int=default=default=default:
notes100 = Environment stack size set to 'unlimited'

# Free-text notes for the floating-point suite.
fp=default=default=default:
notes_000='ulimit -s unlimited' was used to set environment stack size
notes_005 ='ulimit -l 2457600' was used to set environment locked pages in memory quantity
notes_010 ='numactl' was used to bind one copy per core, and memory to a local NUMA node
notes_015 =Set vm/nr_hugepages=1200 in /etc/sysctl.conf
notes_020 =mount -t hugetlbfs nodev /mnt/hugepages
notes_025 =Environment variable PGI_HUGE_PAGES set to 150
# NOTE(review): the two disabled notes below quote huge-page figures (896 and
# 7168) that differ from the active notes above (150 and 1200).  They look
# like leftovers from another system; confirm before re-enabling.
#notes110 = PGI_HUGE_PAGES set to 896.
#notes120 = Total number of huge pages available is 7168.
#   ---- End inclusion of '/root/cpu2006/config/pgi_sut.cfg'

############################ Software Info ############################
# Software description for the floating-point suite.
# Every FP base and peak flag set below targets %{pgi_tp64}, and the FP
# portability flag is -DSPEC_CPU_LP64, so FP pointers are 64-bit only.
fp=default=default=default:
sw_avail = Oct-2007
sw_compiler000 = The Portland Group (PGI)
sw_compiler001 = PGI pgf90 7.1-0 Fortran Compiler
sw_compiler002 = PGI pgcc 7.1-0 C Compiler
sw_compiler003 = PGI pgCC 7.1-0 C++ Compiler
sw_peak_ptrsize = 64-bit
sw_state = Multi-user, run level 3
sw_base_ptrsize = 64-bit
sw_file = ReiserFS
sw_os = 64-Bit SUSE LINUX Enterprise Server 10 SP1
sw_other = None
sw_auto_parallel = No

# Software description for the integer suite, which mixes %{pgi_tp64} C
# builds with %{pgi_tp32} C/C++ builds, hence 32/64-bit.
int=default=default=default:
sw_avail = Oct-2007
sw_compiler1 = The Portland Group (PGI)
sw_compiler3 = PGI pgcc 7.1-0 C Compiler
sw_compiler4 = PGI pgCC 7.1-0 C++ Compiler
sw_peak_ptrsize = 32/64-bit
sw_base_ptrsize = 32/64-bit
sw_auto_parallel = No
sw_other = SmartHeap 8.0 32-bit Library for Linux

default=default=default=default:
#####################################################################
# Compiler selection
#####################################################################
CC = pgcc -w
CXX = pgcpp -w
FC = pgf95 -w
# Directory containing the SmartHeap library; referenced as $(SHL_DIR) by the
# EXTRA_CXXLIBS settings below.  Adjust for your installation.
SHL_DIR = /proj/qa/smartheap/SmartHeap_8/lib

#####################################################################
# Optimization
#####################################################################
default=default=default=default:
EXTRA_LDFLAGS = -Bstatic_pgi

# FP base: the same option set for C, C++ and Fortran, all 64-bit.
fp=base=default=default:
COPTIMIZE = -fast -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:8 %{pgi_tp64}
CXXOPTIMIZE = -fast -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:8 --zc_eh %{pgi_tp64}
FOPTIMIZE = -fast -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:8 %{pgi_tp64}

# INT base: C is built 64-bit, C++ is built 32-bit and linked with SmartHeap.
int=base=default=default:
COPTIMIZE = -fast -Mipa=fast,inline,noarg -Mfprelaxed -Msmartalloc=huge:64 %{pgi_tp64}
CXXOPTIMIZE = -fastsse -Mipa=fast,inline -Mfprelaxed -Msmartalloc --zc_eh %{pgi_tp32}
EXTRA_CXXLIBS = -L$(SHL_DIR) -lsmartheap

#####################################################################
## FP Peak Flags
#####################################################################
# Per-benchmark peak tuning.  Sections with basepeak = 1 carry no peak flags
# of their own; sections with feedback = 1 supply PASS1_*/PASS2_* flags
# (-Mpfi in pass 1, -Mpfo in pass 2).
fp=peak=default=default:
EXTRA_LIBS =
basepeak = 0

410.bwaves=peak=default=default:
FOPTIMIZE = -fast -Mipa=fast,inline -Mfprelaxed -Msmartalloc %{pgi_tp64}
feedback = 0
basepeak = 0

416.gamess=peak=default=default:
FOPTIMIZE = -fast -Mipa=fast,inline -Mfprelaxed -Mvect=noaltcode -Msmartalloc=huge:64 %{pgi_tp64}
feedback = 0
basepeak = 0

433.milc=peak=default=default:
COPTIMIZE = -fast -O4 -Mdse -Mfprelaxed -Msmartalloc=huge:8 %{pgi_tp64}
PASS1_CFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CFLAGS = -Mipa=fast,inline,noarg -Mpfo
PASS2_LDFLAGS = -Mipa=fast,inline,noarg -Mpfo
feedback = 1
basepeak = 0

434.zeusmp=peak=default=default:
feedback = 0
basepeak = 1

435.gromacs=peak=default=default:
COPTIMIZE = -fast -O4 -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:16 %{pgi_tp64}
FOPTIMIZE = -fast -O4 -Mfpapprox=rsqrt -Mipa=fast,inline -Mfprelaxed -Msmartalloc=huge:16 %{pgi_tp64}
feedback = 0
basepeak = 0

436.cactusADM=peak=default=default:
feedback = 0
basepeak = 1

437.leslie3d=peak=default=default:
feedback = 0
basepeak = 1

444.namd=peak=default=default:
CXXOPTIMIZE = -fast -O4 -Mfprelaxed -Msmartalloc=huge:32 --zc_eh %{pgi_tp64}
PASS1_CXXFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CXXFLAGS = -Mpfo -Mipa=fast,inline
PASS2_LDFLAGS = -Mpfo -Mipa=fast,inline
feedback = 1
basepeak = 0

447.dealII=peak=default=default:
feedback = 0
basepeak = 1

450.soplex=peak=default=default:
feedback = 0
basepeak = 1

453.povray=peak=default=default:
CXXOPTIMIZE = -fast -Mfprelaxed -Msmartalloc=huge:32 -Mipa=fast,inline --zc_eh %{pgi_tp64}
feedback = 0
basepeak = 0

454.calculix=peak=default=default:
feedback = 0
basepeak = 1

459.GemsFDTD=peak=default=default:
feedback = 0
basepeak = 1

465.tonto=peak=default=default:
FOPTIMIZE = -fast -Mfprelaxed -Msmartalloc=huge:128 -Mipa=fast,inline -Mvect=noaltcode %{pgi_tp64}
feedback = 0
basepeak = 0

470.lbm=peak=default=default:
COPTIMIZE = -fast -Mfprelaxed -Msmartalloc=huge:8 -Mipa=fast,noarg %{pgi_tp64}
feedback = 0
basepeak = 0

481.wrf=peak=default=default:
FOPTIMIZE = -fast -Mfprelaxed -Msmartalloc=huge:32 -Mvect=noaltcode %{pgi_tp64}
COPTIMIZE = -fast -Mfprelaxed -Msmartalloc=huge:32 -Mvect=noaltcode %{pgi_tp64}
basepeak = 0
feedback = 0

482.sphinx3=peak=default=default:
feedback = 0
basepeak = 1

#####################################################################
## INT Peak Flags
#####################################################################
# The suite-level default is basepeak = 1; benchmarks with their own peak
# flags override it with basepeak = 0.
int=peak=default=default:
EXTRA_LIBS =
basepeak = 1

400.perlbench=peak=default=default:
COPTIMIZE = -fast -O4 -Mfprelaxed -Msmartalloc=huge:8 -Mnounroll %{pgi_tp64}
PASS1_CFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CFLAGS = -Mpfo -Mipa=inline
PASS2_LDFLAGS = -Mpfo -Mipa=inline
feedback = 1
basepeak = 0

401.bzip2=peak=default=default:
COPTIMIZE = -fast -O4 -Msmartalloc=huge:64 %{pgi_tp64}
PASS1_CFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CFLAGS = -Mpfo
PASS2_LDFLAGS = -Mpfo
feedback = 1
basepeak = 0

403.gcc=peak=default=default:
COPTIMIZE = -fastsse -Mfprelaxed -Msmartalloc=huge:32 -Mipa=fast,inline %{pgi_tp32}
feedback = 0
basepeak = 0

429.mcf=peak=default=default:
COPTIMIZE = -fastsse -Mipa=fast,inline -Msmartalloc=huge:16 %{pgi_tp32}
feedback = 0
basepeak = 0

445.gobmk=peak=default=default:
COPTIMIZE = -fast -O4 -Msmartalloc=huge:32 -Mfprelaxed -Mnovect %{pgi_tp64}
PASS1_CFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CFLAGS = -Mpfo -Mipa=fast
PASS2_LDFLAGS = -Mpfo -Mipa=fast
feedback = 1
basepeak = 0

456.hmmer=peak=default=default:
COPTIMIZE = -fast -Msmartalloc=huge:32 -Mfprelaxed -Msafeptr -Mipa=const,ptr,arg %{pgi_tp64}
feedback = 0
basepeak = 0

458.sjeng=peak=default=default:
COPTIMIZE = -fast -Msmartalloc=huge:32 -Mfprelaxed %{pgi_tp64}
PASS1_CFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CFLAGS = -Mipa=fast,inline,noarg -Mpfo
PASS2_LDFLAGS = -Mipa=fast,inline,noarg -Mpfo
feedback = 1
basepeak = 0

462.libquantum=peak=default=default:
feedback = 0
basepeak = 1

464.h264ref=peak=default=default:
feedback = 0
basepeak = 1

471.omnetpp=peak=default=default:
feedback = 0
basepeak = 1

473.astar=peak=default=default:
feedback = 0
basepeak = 1

483.xalancbmk=peak=default=default:
CXXOPTIMIZE = -fastsse -O4 -Mipa=fast,inline -Mfprelaxed -Msmartalloc --zc_eh %{pgi_tp32}
EXTRA_CXXLIBS = -L$(SHL_DIR) -lsmartheap
feedback = 0
basepeak = 0

#####################################################################
# Portability
#####################################################################
fp=default=default=default:
PORTABILITY = -DSPEC_CPU_LP64

int=default=default=default:
CPORTABILITY = -DSPEC_CPU_LP64

400.perlbench=default=default=default:
CPORTABILITY = -DSPEC_CPU_LP64 -DSPEC_CPU_LINUX_X64

# The 403.gcc and 429.mcf peak builds use %{pgi_tp32}, so the suite-wide
# -DSPEC_CPU_LP64 is cleared for them.
403.gcc=peak=default=default:
CPORTABILITY =

429.mcf=peak=default=default:
CPORTABILITY =

435.gromacs=default=default=default:
LDPORTABILITY = -Mnomain

436.cactusADM=default=default=default:
LDPORTABILITY = -Mnomain

454.calculix=default=default=default:
LDPORTABILITY = -Mnomain

462.libquantum=default=default=default:
CPORTABILITY = -DSPEC_CPU_LP64 -DSPEC_CPU_LINUX

481.wrf=default=default=default:
CPORTABILITY = -DSPEC_CPU_CASE_FLAG -DSPEC_CPU_LINUX

483.xalancbmk=default=default=default:
CXXPORTABILITY = -DSPEC_CPU_LINUX

# The following section was added automatically, and contains settings that
# did not appear in the original configuration file, but were added to the
# raw file after the run.
default:
flagsurl000 = http://www.spec.org/cpu2006/flags/pgi710_flags.xml