# Invocation command line: # /export/bmk2/keeper/omp2001/bin/runspec -c sun-ompm.cfg -a validate -n 3 -s medium ############################################################################ # Invocation command line: ######################################################################## ######################################################################## # # Sun configuration file for SPEC OMPM2001 # May 2008 # VENDOR = sun action = validate tune = base,peak ext = jf2 input = ref env_vars = 1 mean_anyway = 1 output_format = asc use_submit_for_speed=1 SPECLANG=/export/compilers/jupiter_for_fujitsu2/bin/ CC=${SPECLANG}cc -xjobs=6 FC=${SPECLANG}f90 -xjobs=6 F77=${SPECLANG}f77 -xjobs=6 ################### Baseline Optimization Flags ######################## default=base=default=default: fdo_pre0= rm -rf `pwd`/../feedback* PASS1_CFLAGS= -xprofile=collect:`pwd`/feedback PASS2_CFLAGS= -xprofile=use:`pwd`/feedback PASS1_FFLAGS= -xprofile=collect:`pwd`/feedback PASS2_FFLAGS= -xprofile=use:`pwd`/feedback PASS1_LDFLAGS= -xprofile=collect:`pwd`/feedback PASS2_LDFLAGS= -xprofile=use:`pwd`/feedback COPTIMIZE = -fast -xopenmp -xalias_level=std -xipo=2 -xprefetch_level=3 -m64 -lmtmalloc -g -xpagesize=4m -xprefetch=latx:4 FOPTIMIZE = -fast -openmp -m64 -xipo=2 -autopar -fma=fused -g -xpagesize=4m -xprefetch=latx:4 ONESTEP = yes EXTRA_LDFLAGS = EXTRA_LIBS= EXTRA_CFLAGS = -Xc notes100 = notes101 = Base Notes: notes103 = ONESTEP=yes notes104 = notes105 = C: -fast -xopenmp -xalias_level=std -xipo=2 notes106 = -xprefetch_level=3 -m64 -lmtmalloc -g notes107 = -xpagesize=4m -xprefetch=latx:4 -xprofile notes109 = f90: -fast -openmp -m64 -xipo=2 -autopar -fma=fused notes110 = -g -xpagesize=4m -xprefetch=latx:4 -xprofile notes111 = ######################### Portability Flags ############################# default=default=default=default: 310.wupwise_m=default=default=default: 312.swim_m=default=default=default: 314.mgrid_m=default=default=default: 316.applu_m=default=default=default: 
318.galgel_m=default=default=default: EXTRA_FFLAGS = -e -fixed notes113 = 318.galgel_m portability flags: -e -fixed notes114 = 320.equake_m=default=default=default: 322.facerec_m=default=default=default: 324.apsi_m=default=default=default: 326.gafort_m=default=default=default: 328.fma3d_m=default=default=default: srcalt = sqrt.init notes201 = Setting allowed defines for art: 330.art_m=default=default=default: EXTRA_CFLAGS = -DINTS_PER_CACHELINE=16 -DDBLS_PER_CACHELINE=8 notes201 = Setting allowed defines for art: notes202 = 330.art_m: -DINTS_PER_CACHELINE=16 -DDBLS_PER_CACHELINE=8 332.ammp_m=default=default=default: ######################### Peak Flags ############################# default=peak=default=default: ONESTEP = yes notes3000 = notes3001 = Peak Notes: notes3003 = ONESTEP=yes notes3004 = 310.wupwise_m=peak=default=default: fdo_pre0= rm -rf `pwd`/feedback* PASS1_FFLAGS= -xprofile=collect:`pwd`/feedback PASS2_FFLAGS= -xprofile=use:`pwd`/feedback PASS1_LDFLAGS= -xprofile=collect:`pwd`/feedback PASS2_LDFLAGS= -xprofile=use:`pwd`/feedback #FOPTIMIZE = -fast -openmp -xunroll=5 -autopar -m32 -xipo=2 -fma=fused -xpagesize=512k -xprefetch_level=3 -Qoption iropt -Athr,-Apf:l2subblock=256,-Apf:ipa=9 FOPTIMIZE = -fast -openmp -xunroll=4 -autopar -m32 -xipo=2 -fma=fused -xpagesize=512k -xprefetch_level=3 -Qoption iropt -Athr,-Apf:l2subblock=256,-Apf:ipa=9 -xprefetch=latx:5 -Qoption iropt -Rloop_dist FOPTIMIZE = -fast -openmp -xunroll=4 -autopar -m32 -xipo=2 -fma=fused -xpagesize=512k -Qoption iropt -Athr,-Apf:l2subblock=256,-Apf:ipa=9 -xprefetch=latx:3 -Qoption iropt -Rloop_dist notes3110 = 310.wupwise_m: -fast -openmp -xunroll=4 -autopar -m32 notes3111 = -xipo=2 -fma=fused -xpagesize=512k notes3112 = -Qoption iropt -Athr,-Apf:l2subblock=256,-Apf:ipa=9 notes3113 = -xprefetch=latx:3 -Qoption iropt -Rloop_dist notes3114 = -xprofile 312.swim_m=peak=default=default: #FOPTIMIZE = -fast -openmp -m64 -xipo=2 -autopar -fma=fused -g -xpagesize=4m -xprefetch=latx:4 
-xpad=common:1921 -Qoption iropt -Atile:skewp,-Ainline:cs=700 -unroll=5 FOPTIMIZE = -fast -openmp -m64 -xipo=2 -autopar -fma=fused -xpagesize=512k -xprefetch=latx:3 ##basepeak=yes srcalt = ompl.32 notes3120 = 312.swim_m: -fast -openmp -m64 -xipo=2 -autopar notes3121 = -fma=fused -xpagesize=512k -xprefetch=latx:3 notes3122 = used srcalt ompl.32 314.mgrid_m=peak=default=default: fdo_pre0= rm -rf `pwd`/feedback* PASS1_FFLAGS= -xprofile=collect:`pwd`/feedback PASS2_FFLAGS= -xprofile=use:`pwd`/feedback PASS1_LDFLAGS= -xprofile=collect:`pwd`/feedback PASS2_LDFLAGS= -xprofile=use:`pwd`/feedback FOPTIMIZE = -fast -openmp -xipo=2 -xprefetch_level=3 -m32 -xpagesize=512K -xprefetch=latx:4.8 -fma=fused -Qoption iropt -Apf:l2subblock=256 notes3140 = 314.mgrid_m: -fast -openmp -xipo=2 -xprefetch_level=3 notes3141 = -m32 -xpagesize=512K -xprefetch=latx:4.8 notes3142 = -fma=fused -Qoption iropt -Apf:l2subblock=256 notes3143 = -xprofile 316.applu_m=peak=default=default: fdo_pre0= rm -rf `pwd`/../feedback* PASS1_FFLAGS= -xprofile=collect:`pwd`/../feedback PASS2_FFLAGS= -xprofile=use:`pwd`/../feedback PASS1_LDFLAGS= -xprofile=collect:`pwd`/../feedback PASS2_LDFLAGS= -xprofile=use:`pwd`/../feedback ##FOPTIMIZE = -fast -unroll=5 -openmp -m64 -xipo=2 -autopar -fma=fused -g -xpagesize=4m -xprefetch=latx:4 -Qoption iropt -Rloop_dist FOPTIMIZE = -fast -xipo=2 -openmp -xautopar -m64 -fma=fused -xpagesize=4m -xprefetch=latx:2.8 -Qoption iropt -Rloop_dist -xunroll=3 ##basepeak=yes srcalt = ompl.32 notes3160 = 316.applu_m: -fast -xipo=2 -openmp -xautopar -m64 notes3161 = -fma=fused -xpagesize=4m -xprefetch=latx:2.8 notes3162 = -Qoption iropt -Rloop_dist -xunroll=3 -xprofile notes3163 = used srcalt ompl.32 318.galgel_m=peak=default=default: fdo_pre0= rm -rf `pwd`/../feedback* PASS1_FFLAGS= -xprofile=collect:`pwd`/../feedback PASS2_FFLAGS= -xprofile=use:`pwd`/../feedback PASS1_LDFLAGS= -xprofile=collect:`pwd`/../feedback PASS2_LDFLAGS= -xprofile=use:`pwd`/../feedback #FOPTIMIZE = -fast -xipo=2 
-openmp -autopar -m32 -fma=fused -xlic_lib=sunperf FOPTIMIZE = -fast -openmp -xipo=2 -xprefetch=latx:1 -xlic_lib=sunperf RM_SOURCES = lapak.f90 notes3180 = 318.galgel_m: -fast -openmp -xipo=2 -xprefetch=latx:1 notes3181 = -xlic_lib=sunperf -xprofile notes3183 = RM_SOURCES=lapak.f90 320.equake_m=peak=default=default: fdo_pre0= rm -rf `pwd`/feedback* PASS1_CFLAGS= -xprofile=collect:`pwd`/feedback PASS2_CFLAGS= -xprofile=use:`pwd`/feedback PASS1_LDFLAGS= -xprofile=collect:`pwd`/feedback PASS2_LDFLAGS= -xprofile=use:`pwd`/feedback COPTIMIZE = -fast -xopenmp -xprefetch_level=3 -xpagesize=64K -xprefetch=latx:2 -xipo=2 -lmtmalloc -W2,-Apf:l2subblock=256 srcalt = ompl.32 notes3210 = 320.equake_m: -fast -xopenmp -xprefetch_level=3 notes3211 = -xpagesize=64k -xprefetch=latx:2 -xipo=2 notes3212 = -lmtmalloc -W2,-Apf:l2subblock=256 notes3214 = -xprofile 324.apsi_m=peak=default=default: fdo_pre0= rm -rf `pwd`/../feedback* PASS1_FFLAGS= -xprofile=collect:`pwd`/../feedback PASS2_FFLAGS= -xprofile=use:`pwd`/../feedback PASS1_LDFLAGS= -xprofile=collect:`pwd`/../feedback PASS2_LDFLAGS= -xprofile=use:`pwd`/../feedback FOPTIMIZE = -fast -openmp -m64 -xipo=2 -autopar -fma=fused -xpagesize=4m -xprefetch=latx:3.4 -Qoption iropt -Rloop_dist ##basepeak=yes ENV_OMP_NUM_THREADS=127 ENV_SUNW_MP_PROCBIND=1-127 notes3240 = 324.apsi_m: -fast -openmp -m64 -xipo=2 -autopar notes3241 = -fma=fused -xpagesize=4m -xprefetch=latx:3.4 notes3242 = -Qoption iropt -Rloop_dist -xprofile notes3243 = OMP_NUM_THREADS=127 notes3244 = SUNW_MP_PROCBIND=1-127 326.gafort_m=peak=default=default: fdo_pre0= rm -rf `pwd`/../feedback* PASS1_FFLAGS= -xprofile=collect:`pwd`/../feedback PASS2_FFLAGS= -xprofile=use:`pwd`/../feedback PASS1_LDFLAGS= -xprofile=collect:`pwd`/../feedback PASS2_LDFLAGS= -xprofile=use:`pwd`/../feedback FOPTIMIZE = -fast -openmp -xprefetch_level=3 -m64 -xipo=2 -fma=fused FOPTIMIZE = -fast -openmp -xprefetch_level=3 -m64 -fma=fused -xprefetch=latx:0.5 notes3260 = 326.gafort_m: -fast -openmp 
-xprefetch_level=3 -m64 notes3261 = -fma=fused -xprefetch=latx:0.5 -xprofile 328.fma3d_m=peak=default=default: #fdo_pre0= rm -rf `pwd`/../feedback* #PASS1_FFLAGS= -xprofile=collect:`pwd`/../feedback #PASS2_FFLAGS= -xprofile=use:`pwd`/../feedback #PASS1_LDFLAGS= -xprofile=collect:`pwd`/../feedback #PASS2_LDFLAGS= -xprofile=use:`pwd`/../feedback #FOPTIMIZE = -fast -openmp -Qoption iropt -Athr,-Apf:pdl=1 -Qoption cg -Qlp-ip=1 -xipo=2 -xprefetch_level=3 -lmtmalloc -fma=fused -m32 #FOPTIMIZE = -fast -openmp -Qoption iropt -Athr,-Apf:pdl=1 -Qoption cg -Qlp-ip=1 -xipo=2 -xprefetch_level=3 -fma=fused -m32 FOPTIMIZE = -fast -openmp -autopar -xipo=2 -fma=fused -m32 -unroll=5 -xprefetch=latx:4 -lmtmalloc srcalt = ompl.sqrt.init notes3280 = 328.fma3d_m: -fast -openmp -autopar -xipo=2 -fma=fused notes3281 = -m32 -unroll=5 -xprefetch=latx:4 -lmtmalloc notes3286 = used srcalt ompl.sqrt.init 330.art_m=peak=default=default: fdo_pre0= rm -rf `pwd`/../feedback* PASS1_CFLAGS= -xprofile=collect:`pwd`/../feedback PASS2_CFLAGS= -xprofile=use:`pwd`/../feedback PASS1_LDFLAGS= -xprofile=collect:`pwd`/../feedback PASS2_LDFLAGS= -xprofile=use:`pwd`/../feedback #COPTIMIZE = -fast -xopenmp -xalias_level=std -xipo=2 -xprefetch_level=3 -W2,-Apf:outer=0:pdl=1 -Wc,-Qlp-ip=1 -lmtmalloc -m64 #COPTIMIZE = -fast -xopenmp -xipo=2 -xprefetch -xprefetch_level=3 -m64 -lmtmalloc -xprefetch=latx:4 COPTIMIZE = -fast -xopenmp -xipo=2 -xprefetch_level=3 -m64 -xprefetch=latx:3 ENV_OMP_NUM_THREADS=32 ENV_SUNW_MP_PROCBIND= 2 4 8 12 16 20 24 28 32 36 40 44 48 52 56 60 64 68 72 76 80 84 88 92 96 100 104 108 112 116 120 124 notes3300 = 330.art_m: -fast -xopenmp -xipo=2 -xprefetch_level=3 notes3302 = -m64 -xprefetch=latx:3 -xprofile notes3303 = OMP_NUM_THREADS=32 notes3304 = SUNW_MP_PROCBIND=2 4 8 12 16 20 24 28 notes3305 = 32 36 40 44 48 52 56 60 64 68 72 76 notes3306 = 80 84 88 92 96 100 104 108 112 116 120 124 332.ammp_m=peak=default=default: #fdo_pre0= rm -rf `pwd`/../feedback* #PASS1_CFLAGS= 
-xprofile=collect:`pwd`/../feedback #PASS2_CFLAGS= -xprofile=use:`pwd`/../feedback #PASS1_LDFLAGS= -xprofile=collect:`pwd`/../feedback #PASS2_LDFLAGS= -xprofile=use:`pwd`/../feedback #COPTIMIZE = -fast -xopenmp -xalias_level=strong -xprefetch_level=3 -lmopt -lm -lmtmalloc -m32 #COPTIMIZE = -fast -xopenmp -xalias_level=strong -xprefetch_level=3 -lmopt -lm -xpagesize=64K #COPTIMIZE = -fast -xopenmp -xalias_level=strong -xprefetch_level=3 -lm -xpagesize=64K #COPTIMIZE = -fast -xopenmp -xalias_level=strong -lm -xpagesize=64K #ENV_SUNW_MP_GUIDED_SCHED_WEIGHT=2 COPTIMIZE = -fast -xipo=2 -xopenmp -xautopar -xalias_level=strong -lm -xpagesize=512K -g ENV_OMP_NUM_THREADS=127 ENV_SUNW_MP_PROCBIND=1-127 notes3320 = 332.ammp_m: -fast -xipo=2 -xopenmp -xautopar notes3321 = -xalias_level=strong -lm -xpagesize=512K -g notes3323 = OMP_NUM_THREADS=127 notes3324 = SUNW_MP_PROCBIND=1-127 notes3325 = notes4100 = Feedback optimization (-xprofile) is done as follows, notes4101 = unless otherwise noted: notes4102 = notes4103 = fdo_pre0: rm -rf `pwd`/feedback.profile notes4104 = PASS1: -xprofile=collect:./feedback notes4105 = PASS2: -xprofile=use:./feedback notes4106 = # # machine configuration # default=default=default=default: hw_vendor = Sun Microsystems hw_model = Sun SPARC Enterprise M8000 Server hw_cpu = SPARC64 VII hw_cpu_mhz = 2520 hw_fpu = Integrated hw_ncpu = 16 chips, 64 cores, 4 cores/chip, 2 threads/core hw_ncpuorder= 1 to 4 CMUs; each CMU contains 2 or 4 chips hw_pcache = 64 KB I + 64 KB D on chip per core hw_scache = 6 MB I+D on chip per chip hw_tcache = None hw_ocache = hw_memory = 256 GB (128 x 2 GB) hw_disk0 = 673 GB RAID 1+0 created by Solaris hw_disk1 = Volume Manager with 20 x 73 GB hw_disk2 = 10,000 RPM Fujitsu MAY2073RC SAS hw_avail = Apr-2008 sw_os = Solaris 10 5/08 plus patches sw_compiler = Sun Studio 12 plus patches sw_parallel = OpenMP and automatic parallel sw_file = ufs sw_state = Multi-User sw_avail = Jul-2008 license_num = HPG0010 tester_name = Sun 
Microsystems test_date = May-2008 test_site = company_name= Sun Microsystems machine_name= default=default=default=default: notes8000 = notes8001 = Base and Peak User Environment: notes8003 = unlimit stacksize (in /bin/csh) notes8004 = setenv SUNW_MP_THR_IDLE SPIN notes8005 = setenv OMP_DYNAMIC FALSE notes8006 = setenv OMP_NUM_THREADS 64 notes8007 = setenv SUNW_MP_PROCBIND " 1 2 4 6 8 10 12 14 notes8008 = 16 18 20 22 24 26 28 30 32 34 36 38 40 42 44 46 notes8009 = 48 50 52 54 56 58 60 62 64 66 68 70 72 74 76 78 notes8010 = 80 82 84 86 88 90 92 94 96 98 100 102 104 106 108 notes8011 = 110 112 114 116 118 120 122 124 126 " notes8018 = notes8019 = With additional changes for peak runs of 324.apsi_m, 330.art_m, notes8020 = 332.ammp_m which are as noted previously notes8021 = notes8040 = Kernel Parameters (/etc/system): notes8041 = set autoup=60 notes8042 = set tune_t_fsflushr=4 notes8043 = set bufhwm=3000 notes8044 = set segmap_percent=1 notes8045 = notes8056 = Flags file description is xxx.xxx.xxx notes8058 =