# Invocation command line:
# /store/hfeng/omp2001-3.2/bin/runspec --reportable -a validate -n 3 -o asc -i ref -T base,peak -c amd-open64-v2-m.cfg medium
############################################################################
# Invocation command line:
# /store/hfeng/omp2001-3.2/bin/runspec --reportable -a validate -n 3 -o asc -i ref -T base,peak -c amd-open64-v2-m.cfg medium
############################################################################
#
# SPEC OMP2001 configuration: Open64 compilers (opencc/openf90), medium and
# large suites, base and peak tuning, 24 OpenMP threads.
#
# Layout: one "name = value" setting per line; a line of the form
# "benchmark=tuning=extension=machine:" opens a section that scopes the
# settings following it.

VENDOR = SGI
action = validate
tune = base,peak
ext = gh_open64-424_2s-v2
input = ref
# env_vars = 1 accompanies the ENV_* settings further down.
env_vars = 1
reportable = 1
#mean_anyway = 1
output_format = asc,pdf,config
#teeout = yes
#teerunout = yes
mean_anyway = 1
check_md5 = 1

###### Compiler used #################
default=default:
CC = opencc -mp
FC = openf90 -mp

######## Portability Flags and Environment variables ##################
318.galgel_m=default=default=default:
FPORTABILITY = -fixedform -col80
# NOTE(review): "Portablility" below is a typo for "Portability"; the note
# text is left unchanged here because it is emitted into the report.
notes41000 = Portablility flags:
notes41001 = 318.galgel_m : -fixedform -col80
notes41002 =

330.art_m=default=default=default:
EXTRA_CFLAGS = -DINTS_PER_CACHELINE=16 -DDBLS_PER_CACHELINE=8
notes00108 = Extra art Base Flags
notes00109 = 330.art_m (extra): -DINTS_PER_CACHELINE=16 -DDBLS_PER_CACHELINE=8

default=default=default=default:
notes41003 = Base and Peak User Environment (bash):
ENV_OMP_NUM_THREADS=24
ENV_OMP_DYNAMIC=FALSE
ENV_OMP_SLAVE_STACK_SIZE=22M
ENV_O64_OMP_SPIN_COUNT=1000000000
ENV_O64_OMP_SPIN_USER_LOCK=TRUE
ENV_O64_OMP_SET_AFFINITY=TRUE
ENV_O64_OMP_AFFINITY_MAP=" 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23"
notes41004 = export OMP_NUM_THREADS=24
notes41005 = export OMP_DYNAMIC=FALSE
notes41006 = export O64_OMP_SPIN_COUNT=1000000000
notes41007 = export O64_OMP_SPIN_USER_LOCK=TRUE
# Variable name corrected from OMP_SLAVE_STACK so that the note matches the
# ENV_OMP_SLAVE_STACK_SIZE setting above.
notes41008 = export OMP_SLAVE_STACK_SIZE=22M
notes41015 = export O64_OMP_SET_AFFINITY=TRUE
# NOTE(review): ENV_O64_OMP_AFFINITY_MAP is set above but has no matching
# "export" note; confirm whether it should be disclosed as well.
notes41010 = ulimit -s unlimited
notes41011 =

#################### Baseline Optimization Flags ######################
medium=base=default=default:
COPTIMIZE = -Ofast -march=barcelona -mcmodel=medium
FOPTIMIZE = -Ofast -march=barcelona -OPT:early_mp=on -mcmodel=medium
ONESTEP = yes

large=base=default=default:
COPTIMIZE = -Ofast -march=barcelona -mcmodel=medium
FOPTIMIZE = -Ofast -march=barcelona -OPT:early_mp=on -mcmodel=medium
ONESTEP = yes

default=default=default=default:
notes120 =
notes121 = Base tuning:
# The two flag notes now include -march=barcelona, which is part of the base
# COPTIMIZE/FOPTIMIZE above but was missing from the notes.
notes123 = Fortran : openf90 -mp -Ofast -march=barcelona -OPT:early_mp=on -mcmodel=medium
notes122 = C : opencc -mp -Ofast -march=barcelona -mcmodel=medium
notes124 = ONESTEP=yes

# alt source
314.mgrid_m=base=default=default:
srcalt = intel
notes125 = Alternate Sources:
notes126 = 314.mgrid_m (base and peak): intel

######################### Peak Flags #############################
default=peak=default=default:
ONESTEP = yes
notes200_0 =
notes200_1 = Peak tuning:
notes200_2 = ONESTEP=yes for all peak tests.
notes200_3 =

large=peak=default=default:
COPTIMIZE = -Ofast -march=barcelona -mcmodel=medium
FOPTIMIZE = -Ofast -march=barcelona -OPT:early_mp=on -mcmodel=medium
ONESTEP = yes
# The FOPTIMIZE note previously reused the key notes201_0; it now has its own
# key so that both notes are kept.
notes201_0 = COPTIMIZE = -mp -Ofast -march=barcelona -mcmodel=medium
notes201_1 = FOPTIMIZE = -mp -Ofast -march=barcelona -OPT:early_mp=on -mcmodel=medium

310.wupwise_m=peak=default=default:
FOPTIMIZE = -mp -Ofast -msse3 -OPT:early_mp=on -LNO:prefetch_ahead=5:prefetch=3 -march=barcelona -mcmodel=medium -OPT:unroll_times_max=8:unroll_size=128:IEEE_NaN_Inf=off:ro=3 -IPA:linear=on:plimit=50000:callee_limit=5000 -INLINE:aggressive=on -CG:load_exe=0
notes310_0 = 310.wupwise_m : FOPTIMIZE = -mp -Ofast -msse3 -OPT:early_mp=on -LNO:prefetch_ahead=5:prefetch=3 -march=barcelona
notes310_1 = -mcmodel=medium -OPT:unroll_times_max=8:unroll_size=128:IEEE_NaN_Inf=off:ro=3
notes310_2 = -IPA:linear=on:plimit=50000:callee_limit=5000 -INLINE:aggressive=on -CG:load_exe=0

311.wupwise_l=peak=default=default:
basepeak = yes
notes311_0 = 311.wupwise_l: basepeak=yes

312.swim_m=peak=default=default:
srcalt = ompl.32
FOPTIMIZE = -mp -O3 -OPT:Ofast -m3dnow -mcmodel=medium -LNO:simd=0
notes312_0 = 312.swim_m : srcalt=ompl.32
notes312_1 = FOPTIMIZE = -mp -O3 -OPT:Ofast -m3dnow -mcmodel=medium -LNO:simd=0

313.swim_l=peak=default=default:
FOPTIMIZE = -mp -O3 -OPT:Ofast -m3dnow -mcmodel=medium -LNO:simd=0:prefetch_ahead=5:prefetch=3
notes313_0 = 313.swim_l : FOPTIMIZE = -mp -O3 -OPT:Ofast -m3dnow -mcmodel=medium -LNO:simd=0:prefetch_ahead=5:prefetch=3

314.mgrid_m=peak=default=default:
basepeak = yes
notes314_0 = 314.mgrid_m : basepeak=yes

315.mgrid_l=peak=default=default:
basepeak = yes
notes315_0 = 315.mgrid_l : basepeak=yes

316.applu_m=peak=default=default:
srcalt = ompl
FOPTIMIZE = -Ofast -march=barcelona -OPT:early_mp=on -mcmodel=medium
notes316_0 = 316.applu_m : srcalt=ompl
notes316_1 = FOPTIMIZE =-Ofast -march=barcelona -OPT:early_mp=on -mcmodel=medium

317.applu_l=peak=default=default:
basepeak = yes
notes317_0 = 317.applu_l : basepeak=yes

318.galgel_m=peak=default=default:
basepeak = yes
notes318_0 = 318.galgel_m : basepeak=yes

320.equake_m=peak=default=default:
srcalt = ompl
COPTIMIZE = -Ofast -mp -OPT:alias=disjoint -march=barcelona -mcmodel=medium
# NOTE(review): unlike 312.swim_m and 316.applu_m, the note below does not
# mention srcalt=ompl; confirm whether it should.
notes320_0 = 320.equake_m : COPTIMIZE = -Ofast -mp -OPT:alias=disjoint -march=barcelona -mcmodel=medium

321.equake_l=peak=default=default:
basepeak = yes
notes321_0 = 321.equake_l : basepeak=yes

324.apsi_m=peak=default=default:
basepeak = yes
notes324_0 = 324.apsi_m : basepeak=yes

325.apsi_l=peak=default=default:
basepeak = yes
notes325_0 = 325.apsi_l : basepeak=yes

326.gafort_m=peak=default=default:
basepeak = yes
notes326_0 = 326.gafort_m : basepeak=yes

327.gafort_l=peak=default=default:
basepeak = yes
notes327_0 = 327.gafort_l : basepeak=yes

328.fma3d_m=peak=default=default:
basepeak = yes
notes328_0 = 328.fma3d_m : basepeak=yes

329.fma3d_l=peak=default=default:
basepeak = yes
notes329_0 = 329.fma3d_l : basepeak=yes

330.art_m=peak=default=default:
basepeak = yes
notes330_0 = 330.art_m : basepeak=yes

331.art_l=peak=default=default:
basepeak = yes
notes331_0 = 331.art_l : basepeak=yes

332.ammp_m=peak=default=default:
basepeak = yes
notes332_0 = 332.ammp_m : basepeak=yes

#
# machine configuration
#
default=default=default=default:
# NOTE(review): hw_vendor and hw_avail still hold placeholder values
# ("na", "tbd"); fill them in before the result is published.
hw_vendor = na
hw_model = dinar2
hw_cpu = Magnycours AMD Opteron(tm) Processor
hw_cpu_mhz = 2200
hw_fpu = Integrated
hw_ncpu = 24 cores, 2 chips, 12 cores/chip
hw_ncpuorder = 1-4
hw_pcache = 64 KB I + 64 KB D on chip per core
hw_scache = 512 KB I+D on chip per core
hw_tcache = 6 MB I+D on chip per chip
hw_ocache = None
hw_memory = 64GB (8x4GB, ddr3-1333, CL7 dual-rank)
hw_disk = 250GB 7200 RPM SATA
hw_avail = tbd
hw_other = None
sw_os = SLES11
sw_compiler = Open64 4.2.3
sw_Kernel_Extensions = None
sw_file = Linux/Ext3
sw_state = Multi-User
sw_avail = Sep-2009
sw_parallel = OpenMP
license_num = HPG0017
tester_name = Advanced Micro Devices
test_date = Sep-2009
test_site = Austin TX
company_name = Advanced Micro Devices
# NOTE(review): machine_name mentions "dinar3" and "sles10", while hw_model is
# "dinar2" and sw_os is "SLES11"; confirm which values are correct.
machine_name = dinar3-hpc-sles10