# Invocation command line:
# /home/omp2001/bin/runspec -a validate -c psc31_ompl_4985e_barc -n 3 --reportable -i ref -T base large
############################################################################
# Invocation command line:
# /home/omp2001/bin/runspec -a validate -c gh4985_2P_v2.cfg -n 3 --reportable -i ref -T base,peak medium
############################################################################
############################################################################
#
# configuration file for SPEC OMPL2001 on AMD Tyan s4985 4P config
# (4 chips x 4 cores, see hw_ncpu in the machine configuration section)
# Mar-2008
#
VENDOR = AMD
action = validate
tune = base,peak
ext = gh_psc31_ompl_667_4P
input = ref
env_vars = 1
reportable = 1
#mean_anyway = 1
output_format = asc,pdf,config
teeout = yes
teerunout = yes
check_md5 = 1

###### Compiler used #################
default=default:
CC=pathcc -gnu3 -mp
FC=pathf90 -mp

######## Portability Flags and Environment variables ##################
# NOTE(review): this section is keyed on 330.art_m, while every other
# benchmark section in this file uses the _l names (e.g. 331.art_l).
# Confirm whether these flags and notes are meant to apply to 331.art_l.
330.art_m=default=default=default:
EXTRA_CFLAGS = -DINTS_PER_CACHELINE=16 -DDBLS_PER_CACHELINE=8
notes00108 = Extra art Base Flags
notes00109 = 330.art_m (extra): -DINTS_PER_CACHELINE=16 -DDBLS_PER_CACHELINE=8

default=default=default=default:
# Each notes key must be unique within the section: the spacer and heading
# use 41001/41002 so they do not share 41003 with the first export line.
notes41001=
notes41002= Base and Peak User Environment (bash):
ENV_OMP_NUM_THREADS=16
ENV_OMP_DYNAMIC=FALSE
ENV_PSC_OMP_AFFINITY=TRUE
#ENV_PSC_OMP_AFFINITY_MAP=0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
ENV_PSC_OMP_STATIC_FAIR=TRUE
ENV_PSC_OMP_THREAD_SPIN=1000000000
notes41003= export OMP_NUM_THREADS=16
notes41004= export OMP_DYNAMIC=FALSE
notes41005= export PSC_OMP_AFFINITY=TRUE
#notes41006= export PSC_OMP_AFFINITY_MAP=0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
notes41007= export PSC_OMP_STATIC_FAIR=TRUE
notes41008= export PSC_OMP_THREAD_SPIN=1000000000
notes41010= ulimit -s unlimited
notes41011=
notes41012= Default BIOS settings used, with DRAM bank interleave set to auto
#notes41013= AMD PowerNow!(TM) disabled by use of command "powersave -f"

#################### SPEC OMPM2001 src.alt ############################
#330.art_m=default=default=default:
#srcalt = purdue1

#################### Baseline Optimization Flags ######################
large=base=default=default:
COPTIMIZE = -Ofast -mcpu=barcelona -mcmodel=medium
FOPTIMIZE = -Ofast -mcpu=barcelona -OPT:early_mp=on -CG:movnti=2500 -mcmodel=medium
#F77OPTIMIZE = -Ofast -mcpu=barcelona -OPT:early_mp=on -CG:movnti=2500 -mcmodel=medium
ONESTEP=yes

default=default=default=default:
# Report notes describing the base flags set above.
# NOTE(review): CC above is "pathcc -gnu3 -mp" but notes122 omits -gnu3;
# confirm which one is intended.
notes120 =
notes121 = Base tuning:
notes122 = C : pathcc -mp -Ofast -mcpu=barcelona -mcmodel=medium
notes123 = Fortran : pathf90 -mp -Ofast -mcpu=barcelona -OPT:early_mp=on -CG:movnti=2500 -mcmodel=medium
notes124 = ONESTEP=yes

######################### Peak Flags #############################
default=peak=default=default:
ONESTEP = yes
notes300_0 =
#notes300_1 = Peak tuning:
#notes300_2 = ONESTEP=yes for all peak tests.
notes300_3 =

311.wupwise_l=peak=default=default:
srcalt=ompl.32
#basepeak=yes
FOPTIMIZE = -mp -Ofast -msse3 -LNO:prefetch_ahead=5:prefetch=3 -OPT:unroll_times_max=8:unroll_size=128:IEEE_NaN_Inf=off:ro=3 -IPA:linear=on:plimit=50000:callee_limit=5000 -INLINE:aggressive=on
F77OPTIMIZE = -mp -Ofast -msse3 -LNO:prefetch_ahead=5:prefetch=3 -OPT:unroll_times_max=8:unroll_size=128:IEEE_NaN_Inf=off:ro=3 -IPA:linear=on:plimit=50000:callee_limit=5000 -INLINE:aggressive=on
#notes205= 311.wupwise_l: basepeak=yes
# notes205-notes208 spell out the FOPTIMIZE/F77OPTIMIZE flags above.
notes205= 311.wupwise_l: -mp -Ofast -msse3 -LNO:prefetch_ahead=5:prefetch=3
notes206= -OPT:unroll_times_max=8:unroll_size=128:IEEE_NaN_Inf=off:ro=3
notes207= -IPA:linear=on:plimit=50000:callee_limit=5000
notes208= -INLINE:aggressive=on

313.swim_l=peak=default=default:
#srcalt=ompl.32
FOPTIMIZE = -mp -O3 -OPT:Ofast -m3dnow -mcmodel=medium -CG:movnti=2500
F77OPTIMIZE = -mp -O3 -OPT:Ofast -m3dnow -mcmodel=medium -CG:movnti=2500
#notes210= 313.swim_l: -mp -O3 -OPT:Ofast -m3dnow -mcmodel=medium -LNO:simd=0
notes210= 313.swim_l: -mp -O3 -OPT:Ofast -m3dnow -mcmodel=medium -CG:movnti=2500

315.mgrid_l=peak=default=default:
#srcalt=ompl
basepeak=yes
#FOPTIMIZE = -mp -Ofast -mcpu=barcelona -OPT:early_mp=on -mcmodel=medium
#FOPTIMIZE = -mp -Ofast -CG:gcm=off:cflow=off -LNO:fusion=2:prefetch=0 -msse3 -OPT:early_mp=on:unroll_times_max=8:unroll_size=256:ro=3 -mcmodel=medium
#F77OPTIMIZE = -mp -Ofast -CG:gcm=off:cflow=off -LNO:fusion=2:prefetch=0 -msse3 -OPT:early_mp=on:unroll_times_max=8:unroll_size=256:ro=3 -mcmodel=medium
notes215= 315.mgrid_l: basepeak=yes
#notes215= 315.mgrid_l: -mp -Ofast -mcpu=barcelona -OPT:early_mp=on -mcmodel=medium
#notes215= 315.mgrid_l: -mp -Ofast -CG:gcm=off:cflow=off -LNO:fusion=2:prefetch=0 -msse3
#notes216= -OPT:early_mp=on:unroll_times_max=8:unroll_size=256:ro=3
#notes217= -mcmodel=medium

317.applu_l=peak=default=default:
#srcalt=ompl
basepeak=yes
#FOPTIMIZE = -mp -Ofast -mcmodel=medium -CG:local_fwd_sched=on -LNO:fusion=2:fission=2:full_unroll_size=10000:prefetch=3 -TENV:X=3
#F77OPTIMIZE = -mp -Ofast -mcmodel=medium -CG:local_fwd_sched=on -LNO:fusion=2:fission=2:full_unroll_size=10000:prefetch=3 -TENV:X=3
notes220= 317.applu_l: basepeak=yes
#notes220= 317.applu_l: -mp -Ofast -mcmodel=medium -CG:local_fwd_sched=on
#notes221= -LNO:fusion=2:fission=2:full_unroll_size=10000:prefetch=3
#notes222= -TENV:X=3

321.equake_l=peak=default=default:
srcalt=ompl.32
COPTIMIZE = -Ofast -mp -OPT:alias=disjoint
notes230= 321.equake_l: -Ofast -mp -OPT:alias=disjoint

325.apsi_l=peak=default=default:
#srcalt=ompl
# -TENV:X=4 is spelled identically in both flag variables and in the note.
FOPTIMIZE = -mp -O3 -OPT:Ofast -TENV:X=4 -LNO:fusion=2:prefetch=0
F77OPTIMIZE = -mp -O3 -OPT:Ofast -TENV:X=4 -LNO:fusion=2:prefetch=0
notes235= 325.apsi_l: -mp -O3 -OPT:Ofast -TENV:X=4 -LNO:fusion=2:prefetch=0

327.gafort_l=peak=default=default:
basepeak=yes
#F77OPTIMIZE = -Ofast -OPT:early_mp=on -mp -LNO:vintr=0
#FOPTIMIZE = -Ofast -OPT:early_mp=on -mp -LNO:vintr=0
notes240= 327.gafort_l: basepeak=yes
#notes240= 327.gafort_l: -Ofast -OPT:early_mp=on -mp -LNO:vintr=0

329.fma3d_l=peak=default=default:
basepeak=yes
notes245= 329.fma3d_l: basepeak=yes

331.art_l=peak=default=default:
basepeak=yes
notes250= 331.art_l: basepeak=yes

#
# machine configuration
#
default=default=default=default:
hw_vendor = Advanced Micro Devices
hw_model = Tyan s4985e
hw_cpu = Quad-Core AMD Opteron(tm) Processor 8356
hw_cpu_mhz = 2300
hw_fpu = Integrated
hw_ncpu = 16 cores, 4 chips, 4 cores/chip
hw_ncpuorder= 1,2,3,4
hw_pcache = 64KBI + 64KBD on chip per core
hw_scache = 512KB (I+D) on chip per core
hw_tcache = 2MB (I+D) on chip per chip
hw_ocache = None
hw_memory = 16x2GB, PC2-5300 CL5
hw_disk = 320GB 7200 rpm SATA
hw_avail = Mar-2008
hw_other = None
sw_os = SLES10 SP1 64bit
sw_compiler = PathScale Compiler Suite ver. 3.1
sw_Kernel_Extensions = None
sw_file = Linux/Ext3
sw_state = Multi-User
sw_avail = Nov-2007
sw_parallel = OpenMP
license_num = HPG0017
tester_name = AMD
test_date = Mar-2008
test_site = Austin TX
company_name= Advanced Micro Devices
machine_name= barctyan4895e