# Invocation command line:
# /cpu2006/bin/runspec -c amd909gh.cfg --define NCPUS=4 --rate 16 -T all fp --nopreenv --note-preenv
# output_root was not used for this run
############################################################################
# AMD SPEC CPU2006 V1.1 Configuration File for 64-bit Linux (Quad-Core)
#
# CPU2006 Version 1.1
# Compiler name/version: PGI 7.2, Pathscale 3.2
# Operating system version: 64-bit Linux
# Hardware: AMD Opteron (Quad-core)
# FP Base Pointer Size: 64-bit only
# FP Peak Pointer Size: 32/64-bit
# INT Base Pointer Size: 32/64-bit
# INT Peak Pointer Size: 32/64-bit
# Auto Parallelization: Yes
#
# Important! Please run with your stack size set to 'unlimited'.
# Failure to do so may cause 483.xalancbmk to get a stack overflow during
# execution.
# Using csh: unlimit
# Using bash: ulimit -s unlimited
#
# Your LD_LIBRARY_PATH must be set to the location of the dependent
# runtime libraries. (Though this should be taken care of by the
# preENV_LD_LIBRARY_PATH found in the AMD909gh-sut.inc file.)
#
# The NCPUS environment variable must be set for the fp run. This
# is passed to runspec by using --define NCPUS=4 on the runspec
# command and is used to set an environment variable in the
# AMD909gh-sut.inc file.
#
# If building new binaries, please adjust the SMARTHEAP_DIR variable to
# the directory containing the Smartheap library.
#
#####################################################################
# Macro section
####################################################################
# Modify this section to use the appropriate architecture flags
%define pgi_tp64 -tp barcelona-64
%define pgi_tp32 -tp barcelona-32

# Adjust the build jobs to the number of concurrent build processes
%define build_jobs 4

#####################################################################
# Header Section
#####################################################################
ext = amd909gh
ignore_errors = no
tune = base,peak
output_format = asc,raw
flagsurl000 = http://www.spec.org/cpu2006/flags/pgi72_linux_flags.xml $[top]/pathscale-flags.xml \
$[top]/amd-platform.xml
size = test,train,ref
check_md5 = yes
reportable = yes
env_vars = no
teeout = yes
mean_anyway = yes
makeflags = -j %{build_jobs}

####################################################################
# Include file containing the SUT hardware information
# as well as the submit command, tester information and notes
####################################################################
#include: AMD909gh-sut.inc
# ----- Begin inclusion of 'AMD909gh-sut.inc'
############################################################################
#####################################################################
# Pre-Environment settings
#####################################################################
# These settings require using 4GB DIMMs - 4 per socket
# For rate runs, use the following below:
# In /etc/sysctl.conf, 1P configuration, use vm/nr_hugepages=3584
# In /etc/sysctl.conf, 2P configuration, use vm/nr_hugepages=7168
# In /etc/sysctl.conf, 4P configuration, use vm/nr_hugepages=14336

# Document amount of run time system hugepages setting
# What is vm/nr_hugepages set to in /etc/sysctl.conf?
%define rt_sys_hp 14336

# Set number of sockets installed
%define num_sockets 4

# Set NCPUS environment variable for PGI autopar binaries
%ifdef %{NCPUS}
preENV_NCPUS=%{NCPUS}
%endif

# Set location of run time libraries
preENV_LD_LIBRARY_PATH = $[top]/amd909gh-libs/64:$[top]/amd909gh-libs/32

# Need this for libhugetlbfs library usage for Pathscale binaries
preENV_HUGETLB_MORECORE=yes

# Run the sync command after setup
post_setup=sync

#####################################################################
# Submit Section
#####################################################################
# This config file is set to run these binaries on a 4P, 16 core system.
# If this does not match the description of your system, change this
# config file, specifically match the socket the memory is bound (-m) to
# the physical cpu number. Use "man numactl" and "numactl --hardware" to
# better understand how to use this command.

submit0 = echo "$command" > run.sh
submit1 = if `test $SPECCOPYNUM -eq 0 `; then numactl -m 0 --physcpubind=0 sh run.sh; fi
submit2 = if `test $SPECCOPYNUM -eq 1 `; then numactl -m 0 --physcpubind=4 sh run.sh; fi
submit3 = if `test $SPECCOPYNUM -eq 2 `; then numactl -m 0 --physcpubind=8 sh run.sh; fi
submit4 = if `test $SPECCOPYNUM -eq 3 `; then numactl -m 0 --physcpubind=12 sh run.sh; fi
submit5 = if `test $SPECCOPYNUM -eq 4 `; then numactl -m 1 --physcpubind=1 sh run.sh; fi
submit6 = if `test $SPECCOPYNUM -eq 5 `; then numactl -m 1 --physcpubind=5 sh run.sh; fi
submit7 = if `test $SPECCOPYNUM -eq 6 `; then numactl -m 1 --physcpubind=9 sh run.sh; fi
submit8 = if `test $SPECCOPYNUM -eq 7 `; then numactl -m 1 --physcpubind=13 sh run.sh; fi
submit9 = if `test $SPECCOPYNUM -eq 8 `; then numactl -m 2 --physcpubind=2 sh run.sh; fi
submit10 = if `test $SPECCOPYNUM -eq 9 `; then numactl -m 2 --physcpubind=6 sh run.sh; fi
submit11 = if `test $SPECCOPYNUM -eq 10 `; then numactl -m 2 --physcpubind=10 sh run.sh; fi
submit12 = if `test $SPECCOPYNUM -eq 11 `; then numactl -m 2 --physcpubind=14 sh run.sh; fi
submit13 = if `test $SPECCOPYNUM -eq 12 `; then numactl -m 3 --physcpubind=3 sh run.sh; fi
submit14 = if `test $SPECCOPYNUM -eq 13 `; then numactl -m 3 --physcpubind=7 sh run.sh; fi
submit15 = if `test $SPECCOPYNUM -eq 14 `; then numactl -m 3 --physcpubind=11 sh run.sh; fi
submit16 = if `test $SPECCOPYNUM -eq 15 `; then numactl -m 3 --physcpubind=15 sh run.sh; fi

# SPEED
# For a speed run, the submit1 command above will be used.
# use_submit_for_speed = 1

####################################################################
# Tester information
####################################################################
license_num = 11
prepared_by = IBM Corporation
tester = IBM Corporation
test_sponsor = IBM Corporation
hw_vendor = IBM Corporation
hw_model = IBM BladeCenter LS42 (AMD Opteron 8380)

####################################################################
# Hardware information
####################################################################
default=default=default=default:
hw_avail = Nov-2008
hw_cpu_name = AMD Opteron 8380
hw_cpu_mhz = 2500
hw_fpu = Integrated
hw_nchips = 4
hw_ncores = 16
hw_ncoresperchip = 4
hw_nthreadspercore = 1
hw_ncpuorder = 1,2,3,4 chips
hw_pcache = 64 KB I + 64 KB D on chip per core
hw_scache = 512 KB I+D on chip per core
hw_tcache = 6 MB I+D on chip per chip
hw_ocache = None
hw_disk = 1 x 73 GB SAS, 10000 RPM
hw_memory = 64 GB (16 x 4 GB DDR2-6400 ECC)
hw_other = None
sw_file = ReiserFS
sw_os000 = SuSE Linux Enterprise Server 10 (x86_64) SP2,
sw_os001 = Kernel 2.6.16.60-0.21-smp
sw_state = Run level 3 (Full multiuser with network)

#####################################################################
# Notes
#####################################################################
notes_submit_000 = 'numactl' was used to bind copies to the cores

# Uncomment this if you used this for a speed run
#notes_os_045 = powersave -f was used to set the CPU frequency to its maximum.
# ---- End inclusion of '/cpu2006/config/AMD909gh-sut.inc'

############################ Software Info ############################
fp=default=default=default:
sw_base_ptrsize = 64-bit
sw_peak_ptrsize = 32/64-bit
sw_avail = Jun-2008
sw_compiler000 = PGI Server Complete Version 7.2
sw_compiler001 = PathScale Compiler Suite Version 3.2
sw_other000 = binutils 2.18
sw_other001 = 32-bit and 64-bit libhugetlbfs libraries

int=default=default=default:
sw_base_ptrsize = 32/64-bit
sw_peak_ptrsize = 32/64-bit
sw_avail = Jun-2008
sw_compiler1 = PGI Server Complete Version 7.2
sw_compiler2 = PathScale Compiler Suite Version 3.2
sw_other1 = binutils 2.18
sw_other2 = 32-bit and 64-bit libhugetlbfs libraries
sw_other3 = SmartHeap 8.1 32-bit Library for Linux

default=default=default=default:
#####################################################################
# Compiler selection
#####################################################################
CC = pgcc
CXX = pgcpp
FC = pgf95
SMARTHEAP_DIR = /root/work/libraries/SmartHeap_8.1/lib
HUGEPAGE64 = -Wl,-T/usr/share/libhugetlbfs/ldscripts/elf_x86_64.xBDT -L/usr/lib64 -lhugetlbfs
HUGEPAGE32 = -L/usr/lib -lhugetlbfs

#####################################################################
# Portability
#####################################################################
# Set for all base and peak benchmarks unless changed below
fp=default=default=default:
PORTABILITY = -DSPEC_CPU_LP64

int=default=default=default:
PORTABILITY = -DSPEC_CPU_LP64

#####################################################################
# INT Base Flags
#####################################################################
int=base=default=default:
COPTIMIZE = -fastsse -Msmartalloc=huge -Mfprelaxed -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
CXXOPTIMIZE = -fastsse -Msmartalloc=huge -Mfprelaxed --zc_eh -Mipa=jobs:%{build_jobs},fast,inline:10 %{pgi_tp32}
OPTIMIZE = -Mvect=cachesize:6291456
EXTRA_LDFLAGS = -Bstatic_pgi

#####################################################################
# FP Base Flags
#####################################################################
fp=base=default=default:
COPTIMIZE = -fastsse -Msmartalloc=huge -Mfprelaxed -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
FOPTIMIZE = -fastsse -Mfprelaxed -Msmartalloc=huge -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
CXXOPTIMIZE = -fastsse -Msmartalloc=huge -Mfprelaxed --zc_eh -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
OPTIMIZE = -Mvect=cachesize:6291456
EXTRA_LDFLAGS = -Bstatic_pgi

#####################################################################
# INT Portability Flags
#####################################################################
400.perlbench=default=default=default:
CPORTABILITY = -DSPEC_CPU_LINUX_X64

403.gcc=peak=default=default:
# Needed to avoid -DSPEC_CPU_LP64 on 32-bit codes
PORTABILITY =

429.mcf=peak=default=default:
# Needed to avoid -DSPEC_CPU_LP64 on 32-bit codes
PORTABILITY =

462.libquantum=default=default=default:
CPORTABILITY = -DSPEC_CPU_LINUX

471.omnetpp=base=default=default:
# Needed to avoid -DSPEC_CPU_LP64 on 32-bit codes
PORTABILITY =

473.astar=default=default=default:
# Needed to avoid -DSPEC_CPU_LP64 on 32-bit codes
PORTABILITY =

483.xalancbmk=default=default=default:
CXXPORTABILITY = -DSPEC_CPU_LINUX
# Needed to avoid -DSPEC_CPU_LP64 on 32-bit codes
PORTABILITY =

#####################################################################
# INT Peak Flags
#####################################################################
# PATHSCALE
400.perlbench=peak=default=default:
CC = pathcc -march=barcelona
COPTIMIZE = -Ofast -IPA:plimit=20000:field_reorder=on -LNO:opt=0 -WOPT:if_conv=0 -CG:local_sched_alg=1
PASS1_CFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata $(HUGEPAGE64)
feedback = 1
basepeak = 0

# PATHSCALE
401.bzip2=peak=default=default:
CC = pathcc -march=barcelona
COPTIMIZE=-O3 -OPT:alias=disjoint -OPT:Ofast:goto=off -INLINE:aggressive=on -CG:local_sched_alg=1 -m3dnow $(HUGEPAGE64)
feedback = 0
basepeak = 0

# PATHSCALE
403.gcc=peak=default=default:
CC = pathcc -march=barcelona
COPTIMIZE = -Ofast -OPT:malloc_alg=1 -LNO:trip_count=256:prefetch_ahead=10 -CG:prefer_lru_reg=off -m32
PASS1_CFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
feedback = 1
basepeak = 0

# PATHSCALE
429.mcf=peak=default=default:
CC = pathcc -march=barcelona
COPTIMIZE = -O3 -ipa -INLINE:aggressive=on -CG:gcm=off -GRA:prioritize_by_density=on -m32 $(HUGEPAGE32)
feedback = 0
basepeak = 0

# PATHSCALE
445.gobmk=peak=default=default:
CC = pathcc -march=barcelona
COPTIMIZE = -O3 -OPT:alias=restrict -LNO:prefetch=1:ignore_feedback=off -CG:p2align=on
PASS1_CFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata $(HUGEPAGE64)
feedback = 1
basepeak = 0

# PGI
456.hmmer=peak=default=default:
CC = pgcc
COPTIMIZE = -fastsse -Mvect=partial -Munroll=n:8 -Msmartalloc=huge -Msafeptr -Mprefetch=t0 -Mfprelaxed -Mipa=jobs:%{build_jobs},const,ptr,arg,inline %{pgi_tp64}
OPTIMIZE = -Mvect=cachesize:6291456
EXTRA_LDFLAGS = -Bstatic_pgi
feedback = 0
basepeak = 0

# PATHSCALE
458.sjeng=peak=default=default:
CC = pathcc -march=barcelona
%ifdef %{gnu3_fe}
COPTIMIZE = -O3 -ipa -LNO:ignore_feedback=off:full_unroll=10:fusion=0:fission=2 -IPA:plimit=50000:pu_reorder=2 -CG:ptr_load_use=0 -OPT:unroll_times_max=8 -INLINE:aggressive=on
%else
COPTIMIZE = -O3 -ipa -LNO:ignore_feedback=off:full_unroll=10:fusion=0:fission=2 -IPA:pu_reorder=2 -CG:ptr_load_use=0 -OPT:unroll_times_max=8 -INLINE:aggressive=on
%endif
PASS1_CFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata $(HUGEPAGE64)
feedback = 1
basepeak = 0

# PGI
462.libquantum=peak=default=default:
CC = pgcc
COPTIMIZE = -fastsse -Munroll=m:8 -Msmartalloc=huge -Mprefetch=distance:4 -Mfprelaxed -Mipa=jobs:%{build_jobs},fast,inline,noarg %{pgi_tp64}
OPTIMIZE = -Mvect=cachesize:6291456
EXTRA_LDFLAGS = -Bstatic_pgi
feedback = 0
basepeak = 0

# PATHSCALE
464.h264ref=peak=default=default:
CC = pathcc -march=barcelona
COPTIMIZE = -O3 -IPA:plimit=20000 -OPT:alias=disjoint -LNO:prefetch=0 -CG:ptr_load_use=0:push_pop_int_saved_regs=off:prefer_lru_reg=off
PASS1_CFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata $(HUGEPAGE64)
feedback = 1
basepeak = 0

# PGI
471.omnetpp=peak=default=default:
feedback = 0
basepeak = 1

# PGI
473.astar=peak=default=default:
CXX = pgcpp
CXXOPTIMIZE = -fastsse -O4 -Msmartalloc=huge -Msafeptr=global -Mfprelaxed --zc_eh %{pgi_tp32}
OPTIMIZE = -Mvect=cachesize:6291456
EXTRA_LDFLAGS = -Bstatic_pgi
PASS1_CXXFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CXXFLAGS = -Mpfo -Mipa=jobs:%{build_jobs},fast,inline:6
PASS2_LDFLAGS = -Mpfo -Mipa=jobs:%{build_jobs},fast,inline:6
feedback = 1
basepeak = 0

# PATHSCALE
483.xalancbmk=peak=default=default:
CXX = pathCC -march=barcelona
CXXOPTIMIZE = -Ofast -INLINE:aggressive=on -m32
EXTRA_CXXLIBS = -L$(SMARTHEAP_DIR) -lsmartheap
feedback = 0
basepeak = 0

#####################################################################
# FP Portability
#####################################################################
435.gromacs=base=default=default:
LDPORTABILITY = -Mnomain

436.cactusADM=default=default=default:
LDPORTABILITY = -Mnomain

447.dealII=default=default:
%ifdef %{gnu3_fe}
CXXPORTABILITY = -DSPEC_CPU_TABLE_WORKAROUND
%else
CXXPORTABILITY =
%endif

447.dealII=peak=default:
# Needed to avoid -DSPEC_CPU_LP64 on 32-bit codes
PORTABILITY =

454.calculix=default=default=default:
LDPORTABILITY = -Mnomain

450.soplex=peak=default=default:
# Needed to avoid -DSPEC_CPU_LP64 on 32-bit codes
PORTABILITY =

481.wrf=base=default=default:
CPORTABILITY = -DSPEC_CPU_CASE_FLAG -DSPEC_CPU_LINUX

481.wrf=peak=default=default:
FPORTABILITY = -fno-second-underscore
CPORTABILITY = -DSPEC_CPU_LINUX

#####################################################################
# FP Peak Flags
#####################################################################
# PGI
410.bwaves=peak=default=default:
FC = pgf95
FOPTIMIZE = -fastsse -Msmartalloc -Mprefetch=nta -Mfprelaxed -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
OPTIMIZE = -Mvect=cachesize:6291456
EXTRA_LDFLAGS = -Bstatic_pgi
feedback = 0
basepeak = 0

# PATHSCALE
416.gamess=peak=default=default:
FC = pathf95 -march=barcelona
FOPTIMIZE = -O2 -OPT:Ofast:ro=3:unroll_size=256
PASS1_FFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_FFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata $(HUGEPAGE64)
feedback = 1
basepeak = 0

# PGI
433.milc=peak=default=default:
feedback = 0
basepeak = 1

# PGI
434.zeusmp=peak=default=default:
FC = pgf95
FOPTIMIZE = -fastsse -Mfprelaxed -Mprefetch=distance:8,t0 -Msmartalloc=huge,hugebss -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
OPTIMIZE = -Mvect=cachesize:6291456
EXTRA_LDFLAGS = -Bstatic_pgi
feedback = 0
basepeak = 0

# PATHSCALE
435.gromacs=peak=default=default:
CC = pathcc -march=barcelona
FC = pathf95 -march=barcelona
COPTIMIZE = -Ofast -OPT:rsqrt=2 -OPT:malloc_alg=1 $(HUGEPAGE64)
FOPTIMIZE = -Ofast -OPT:rsqrt=2 -OPT:malloc_alg=1 $(HUGEPAGE64)
feedback = 0
basepeak = 0

# PGI
436.cactusADM=peak=default=default:
CC = pgcc
FC = pgf95
COPTIMIZE = -fastsse -Mconcur -Msmartalloc=huge -Mfprelaxed -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
FOPTIMIZE = -fastsse -Mconcur -Mfprelaxed -Msmartalloc=huge -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
OPTIMIZE = -Mvect=cachesize:6291456
EXTRA_LDFLAGS = -Bstatic_pgi
%if '%{NCPUS}' eq '4' && '%{num_sockets}' gt '1'
# 2P or 4P rate run uses submits below
copies = %{num_sockets}
%endif
# 2P speed run
%if '%{NCPUS}' eq '8'
copies = 1
CPULIST=0,1,2,3,4,5,6,7
%endif
# 4P speed run
# A 16-core system exposes CPUs 0-15, so the list must stop at 15.
%if '%{NCPUS}' eq '16'
copies = 1
CPULIST=0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15
%endif
# 1P run (same for speed or rate)
%if '%{NCPUS}' eq '4' && '%{num_sockets}' eq '1'
copies = 1
CPULIST=0,1,2,3
%endif
submit0 = echo "$command" > run.sh
# Adjust submit1 based on number of copies
submit1 = if `test $copies -eq 1 `; then numactl --physcpubind=$CPULIST sh run.sh \
else if `test $SPECCOPYNUM -eq 0 `; then numactl -m 0 --physcpubind=0,1,2,3 sh run.sh; fi; fi
submit2 = if `test $SPECCOPYNUM -eq 1 `; then numactl -m 1 --physcpubind=4,5,6,7 sh run.sh; fi
submit3 = if `test $SPECCOPYNUM -eq 2 `; then numactl -m 2 --physcpubind=8,9,10,11 sh run.sh; fi
submit4 = if `test $SPECCOPYNUM -eq 3 `; then numactl -m 3 --physcpubind=12,13,14,15 sh run.sh; fi
feedback = 0
basepeak = 0

# PGI
437.leslie3d=peak=default=default:
FC = pgf95
FOPTIMIZE = -fastsse -Mvect=fuse -Msmartalloc=huge -Mprefetch=distance:8,t0 -Mfprelaxed %{pgi_tp64}
OPTIMIZE = -Mvect=cachesize:6291456
EXTRA_LDFLAGS = -Bstatic_pgi
PASS1_FFLAGS = -Mpfi=indirect
PASS1_LDFLAGS = -Mpfi=indirect
PASS2_FFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
PASS2_LDFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
feedback = 1
basepeak = 0

# PGI
444.namd=peak=default=default:
CXX = pgcpp
CXXOPTIMIZE = -fastsse -Munroll=n:4,m:8 -Msmartalloc=huge -Mnodepchk -Mfprelaxed --zc_eh %{pgi_tp64}
OPTIMIZE = -Mvect=cachesize:6291456
EXTRA_LDFLAGS = -Bstatic_pgi
PASS1_CXXFLAGS = -Mpfi
PASS1_LDFLAGS = -Mpfi
PASS2_CXXFLAGS = -Mpfo -Mipa=jobs:%{build_jobs},fast,inline
PASS2_LDFLAGS = -Mpfo -Mipa=jobs:%{build_jobs},fast,inline
feedback = 1
basepeak = 0

# PATHSCALE
447.dealII=peak=default=default:
CXX = pathCC -march=barcelona
%ifdef %{gnu3_fe}
CXXOPTIMIZE = -Ofast -INLINE:aggressive=on -LNO:opt=0 -OPT:alias=disjoint -fno-exceptions -m32
%else
CXXOPTIMIZE = -Ofast -static -INLINE:aggressive=on -fno-exceptions -m32
LDCXXFLAGS=-lm
%endif
feedback = 0
basepeak = 0

# PATHSCALE
450.soplex=peak=default=default:
CXX = pathCC -march=barcelona
CXXOPTIMIZE = -O3 -INLINE:aggressive=on -OPT:IEEE_arith=3:IEEE_NaN_Inf=off:fold_unsigned_relops=on:malloc_alg=1 -CG:load_exe=0 -fno-exceptions -m32
PASS1_CXXFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata $(HUGEPAGE32)
feedback = 1
basepeak = 0

# PATHSCALE
453.povray=peak=default=default:
CXX = pathCC -march=barcelona
CXXOPTIMIZE = -Ofast -INLINE:aggressive=on
PASS1_CXXFLAGS = -fb_create fbdata
PASS1_LDFLAGS = -fb_create fbdata
PASS2_CXXFLAGS = -fb_opt fbdata
PASS2_LDFLAGS = -fb_opt fbdata
feedback = 1
basepeak = 0

# PGI
454.calculix=peak=default=default:
CC = pgcc
FC = pgf95
COPTIMIZE = -fastsse -Msmartalloc=huge -Mprefetch=t0 -Mpre -Mfprelaxed %{pgi_tp64}
FOPTIMIZE = -fastsse -Msmartalloc=huge -Mprefetch=t0 -Mpre -Mfprelaxed %{pgi_tp64}
OPTIMIZE = -Mvect=cachesize:6291456
EXTRA_LDFLAGS = -Bstatic_pgi
PASS1_CFLAGS = -Mpfi=indirect
PASS1_FFLAGS = -Mpfi=indirect
PASS1_LDFLAGS = -Mpfi=indirect
PASS2_CFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
PASS2_FFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
PASS2_LDFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
feedback = 1
basepeak = 0

# PATHSCALE
459.GemsFDTD=peak=default=default:
FC = pathf95 -march=barcelona
FOPTIMIZE = -Ofast -LNO:fission=2:simd=2:prefetch_ahead=1 -CG:load_exe=0 -CG:prefer_lru_reg=off -OPT:malloc_alg=1 $(HUGEPAGE64)
feedback = 0
basepeak = 0

# PATHSCALE
465.tonto=peak=default=default:
FC = pathf95 -march=barcelona
FOPTIMIZE = -Ofast -OPT:alias=no_f90_pointer_alias -LNO:blocking=off -CG:load_exe=1 -IPA:plimit=525 -OPT:malloc_alg=1 $(HUGEPAGE64)
feedback = 0
basepeak = 0

# PGI
470.lbm=peak=default=default:
CC = pgcc
COPTIMIZE = -fastsse -Msmartalloc=huge -Mprefetch=t0 -Mloop32 -Mfprelaxed -Mipa=jobs:%{build_jobs},fast,inline %{pgi_tp64}
OPTIMIZE = -Mvect=cachesize:6291456
EXTRA_LDFLAGS = -Bstatic_pgi
feedback = 0
basepeak = 0

# PATHSCALE
481.wrf=peak=default=default:
CC = pathcc -march=barcelona
FC = pathf95 -march=barcelona
COPTIMIZE = -Ofast -LNO:blocking=off:prefetch_ahead=10 -LANG:copyinout=off -IPA:callee_limit=5000 -GRA:prioritize_by_density=on -OPT:malloc_alg=1 -m3dnow $(HUGEPAGE64)
FOPTIMIZE = $(COPTIMIZE)
feedback = 0
basepeak = 0

# PGI
482.sphinx3=peak=default=default:
CC = pgcc
COPTIMIZE = -fastsse -Mfprelaxed -Msmartalloc %{pgi_tp64}
OPTIMIZE = -Mvect=cachesize:6291456
EXTRA_LDFLAGS = -Bstatic_pgi
PASS1_CFLAGS = -Mpfi=indirect
PASS1_LDFLAGS = -Mpfi=indirect
PASS2_CFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
PASS2_LDFLAGS = -Mpfo=indirect -Mipa=jobs:%{build_jobs},fast,inline
feedback = 1
basepeak = 0

# The following section was added automatically, and contains settings that
# did not appear in the original configuration file, but were added to the
# raw file after the run.
default:
flagsurl001 = http://www.spec.org/cpu2006/flags/CPU2006_flags.20090710.xml
flagsurl002 = http://www.spec.org/cpu2006/flags/amd-platform-amd909gh.20090713.xml
notes_000 = The libhugetlbfs libraries were installed using the
notes_005 = installation rpms that came with the distribution.
notes_010 =
notes_015 = 'ulimit -s unlimited' was used to set environment stack size
notes_020 = 'ulimit -l 2097152' was used to set environment locked pages in memory limit
notes_025 =
notes_030 = Set vm/nr_hugepages=14336 in /etc/sysctl.conf
notes_035 = mount -t hugetlbfs nodev /mnt/hugepages
notes_040 =
notes_045 =Environment variables set by runspec before the start of the run:
notes_050 =HUGETLB_MORECORE = "yes"
notes_055 =LD_LIBRARY_PATH = "/cpu2006/amd909gh-libs/64:/cpu2006/amd909gh-libs/32"
notes_060 =NCPUS = "4"
notes_065 =
notes_070 =Processor Performance States Disabled in BIOS
notes_075 =Memory ChipKill Disabled in BIOS