# Invocation command line:
# /home/spec/accel2023/bin/harness/runaccel --config=tta_nvhpc.cfg --tune=base --define model=acc --size=ref --reportable --iterations=3 accel
# output_root was not used for this run
############################################################################
# Invocation command line:
# runaccel -c nvhpc --reportable -T base --define model=<MODEL> accel
#
# MODEL may be one of the following options:
# 1. "acc"  - Use OpenACC (default)
# 2. "lop"  - Use OpenMP with "loop" construct
# 3. "tgt"  - Use OpenMP with "distribute" construct
# 4. "smd"  - Use OpenMP with "distribute" and inner "simd" construct
# 5. "acp"  - Use OpenACC with the "parallel" src.alt
# 6. "lops" - Use OpenMP with "loop" construct src.alt (no metadirectives)
# 7. "tgts" - Use OpenMP with "distribute" construct src.alt (no metadirectives)
# 8. "smds" - Use OpenMP with "distribute" and inner "simd" construct src.alt (no metadirectives)
#
############################################################################

%ifndef %{model}
# IF model is not set use acc
% define model acc
%endif

####################################################################
# Tester information
####################################################################
license_num = 068A
tester = Telecommunications Technology Association
test_sponsor = Telecommunications Technology Association

######################################################################
# The header section of the config file. Must appear
# before any instances of "default="
#
# label = how the binaries you generated will be identified
# tune = specify "base" or "peak" or "all"
label = nvhpc
tune = base
output_format = txt,html,pdf
teeout = yes
teerunout = yes
strict_rundir_verify=1
#output_root = /tmp/accel2023

#flagsurl=$[top]/config/flags/nvhpc_flags.xml
flagsurl000=http://www.spec.org/accel2023/flags/nv2021_flags_v1.0.3.xml

# Adjust the number of make jobs to use here
makeflags=-j 40

####################################################################
# Hardware information
####################################################################
#include: SUT.inc
# ----- Begin inclusion of 'SUT.inc'
############################################################################
##### SUT.inc ####
##### Example of required hardware information for the system under test (SUT) ####
default:
hw_avail = Sep-2025
sw_avail = Sep-2025
hw_cpu_name = INTEL(R) XEON(R) PLATINUM 8558
hw_cpu_max_mhz = 4000
hw_cpu_nominal_mhz = 2100
hw_nchips = 2
hw_ncores = 96
hw_nthreadspercore = 2
hw_ncpuorder = 2 chips
hw_pcache = 32 KB I + 48 KB D on chip per core
hw_scache = 2 MB I+D on chip per core
hw_tcache = 260 MB I+D on chip per chip
hw_ocache = None
hw_vendor = 3SCORE
hw_model = FrightPro SR800 S4
hw_disk = 1x HDD, 1.78 TiB, 7.2K RPM
hw_memory000 = 1024 GB (16 x 64 GB DDR5, 4800 MT/s, ECC)
hw_other = None
# Accelerator description
hw_accel_connect = PCIe Gen5
hw_accel_desc = NVIDIA H100 NVL 96GB HBM3 device memory
hw_accel_ecc = Yes
hw_accel_model = H100 NVL 96GB
hw_accel_name = NVIDIA H100 NVL 96GB
hw_accel_type = GPU
hw_accel_vendor = NVIDIA Corporation
sw_accel_driver = 580.82.07
# ---- End inclusion of '/home/spec/accel2023/config/SUT.inc'

####################################################################
# Software information
####################################################################
default:
CC = nvc
CXX = nvc++
FC = nvfortran
CC_VERSION_OPTION = -V
CXX_VERSION_OPTION = -V
FC_VERSION_OPTION = -V
# Add additional software description
sw_compiler = C/Fortran: Version 25.7 NVHPC SDK
fw_bios = American Megatrends Inc. 2803 04/08/2025
sw_other = None

####################################################################
# Programming-model specific settings.
# Exactly one of the blocks below is active, selected by %{model}.
# Each block starts in the "default:" section opened above.
####################################################################

# OpenACC (default model).
# The per-benchmark sections that used to live in this block were dropped:
#   * 450.md / 453.clvrleaf / 459.miniGhost re-set OPTIMIZE to the very same
#     value as the default, so they had no effect;
#   * the 457.spC PORTABILITY and 459.miniGhost EXTRA_LDFLAGS additions are
#     applied unconditionally after the %if chain below, so keeping them here
#     as well appended each flag twice when model=acc.
# NOTE(review): unlike every other model block, this one does not set pmodel
# (the 'acp' block sets pmodel=ACC). Confirm the harness default is the
# intended one before adding it here.
%if %{model} eq 'acc'
OPTIMIZE = -O3 -acc -Mfprelaxed -Mstack_arrays
%endif

# OpenACC using the "parallel" src.alt for the listed benchmarks.
%if %{model} eq 'acp'
pmodel=ACC
OPTIMIZE = -fast -acc
450.md,453.clvrleaf,455.seismic,456.spF,457.spC,459.miniGhost,463.swim,470.bt:
srcalt=acc_parallel
%endif

# OpenMP "loop" construct.
%if %{model} eq 'lop'
pmodel=LOP
OPTIMIZE = -fast -mp=gpu
403.stencil:
PORTABILITY += -DSPEC_NO_NOTHING
%endif

# OpenMP "loop" construct, src.alt without metadirectives.
%if %{model} eq 'lops'
pmodel=LOP
OPTIMIZE = -fast -mp=gpu
srcalt = omp_loop
403.stencil:
PORTABILITY += -DSPEC_NO_NOTHING
%endif

# OpenMP "distribute" construct.
%if %{model} eq 'tgt'
pmodel=TGT
OPTIMIZE = -fast -mp=gpu
403.stencil:
PORTABILITY += -DSPEC_NO_NOTHING
%endif

# OpenMP "distribute" construct, src.alt without metadirectives.
%if %{model} eq 'tgts'
pmodel=TGT
OPTIMIZE = -fast -mp=gpu
srcalt = omp_target
403.stencil:
PORTABILITY += -DSPEC_NO_NOTHING
%endif

# OpenMP "distribute" with inner "simd" construct.
%if %{model} eq 'smd'
pmodel=SMD
OPTIMIZE = -fast -mp=gpu
403.stencil:
PORTABILITY += -DSPEC_NO_NOTHING
%endif

# OpenMP "distribute" with inner "simd" construct, src.alt without metadirectives.
%if %{model} eq 'smds'
pmodel=SMD
OPTIMIZE = -fast -mp=gpu
srcalt = omp_inner_simd
403.stencil:
PORTABILITY += -DSPEC_NO_NOTHING
%endif

# Per-benchmark settings applied for every model.
457.spC:
PORTABILITY += -mcmodel=medium -Wl,--no-relax
459.miniGhost:
EXTRA_LDFLAGS += -Mnomain

# The following settings were obtained by running the sysinfo_program
# 'specperl $[top]/bin/sysinfo' (sysinfo:SHA:ac6f2b38b7dec295b8795065d3a13319ea78b9367f95037a5e6ed5e46e487861)
default:
notes_plat_sysinfo_000 =
notes_plat_sysinfo_005 = Sysinfo program /home/spec/accel2023/bin/sysinfo
notes_plat_sysinfo_010 = Rev: r6622 of 2021-04-07 b1a7d5f8f71be5aff70a755cad7211a0
notes_plat_sysinfo_015 = running on Client-1 Fri Sep 19 17:05:38 2025
notes_plat_sysinfo_020 =
notes_plat_sysinfo_025 = SUT (System Under Test) info as seen by some common utilities.
notes_plat_sysinfo_030 = For more information on this section, see
notes_plat_sysinfo_035 = https://www.spec.org/cpu2017/Docs/config.html#sysinfo
notes_plat_sysinfo_040 =
notes_plat_sysinfo_045 = From /proc/cpuinfo
notes_plat_sysinfo_050 = model name : INTEL(R) XEON(R) PLATINUM 8558
notes_plat_sysinfo_055 = 2 "physical id"s (chips)
notes_plat_sysinfo_060 = 192 "processors"
notes_plat_sysinfo_065 = cores, siblings (Caution: counting these is hw and system dependent. The following
notes_plat_sysinfo_070 = excerpts from /proc/cpuinfo might not be reliable. Use with caution.)
notes_plat_sysinfo_075 = cpu cores : 48
notes_plat_sysinfo_080 = siblings : 96
notes_plat_sysinfo_085 = physical 0: cores 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
notes_plat_sysinfo_090 = 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47
notes_plat_sysinfo_095 = physical 1: cores 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
notes_plat_sysinfo_100 = 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47
notes_plat_sysinfo_105 =
notes_plat_sysinfo_110 = From lscpu from util-linux 2.37.4:
notes_plat_sysinfo_115 = Architecture: x86_64
notes_plat_sysinfo_120 = CPU op-mode(s): 32-bit, 64-bit
notes_plat_sysinfo_125 = Address sizes: 46 bits physical, 57 bits virtual
notes_plat_sysinfo_130 = Byte Order: Little Endian
notes_plat_sysinfo_135 = CPU(s): 192
notes_plat_sysinfo_140 = On-line CPU(s) list: 0-191
notes_plat_sysinfo_145 = Vendor ID: GenuineIntel
notes_plat_sysinfo_150 = Model name: INTEL(R) XEON(R) PLATINUM 8558
notes_plat_sysinfo_155 = CPU family: 6
notes_plat_sysinfo_160 = Model: 207
notes_plat_sysinfo_165 = Thread(s) per core: 2
notes_plat_sysinfo_170 = Core(s) per socket: 48
notes_plat_sysinfo_175 = Socket(s): 2
notes_plat_sysinfo_180 = Stepping: 2
notes_plat_sysinfo_185 = CPU(s) scaling MHz: 25%
notes_plat_sysinfo_190 = CPU max MHz: 4000.0000
notes_plat_sysinfo_195 = CPU min MHz: 800.0000
notes_plat_sysinfo_200 = BogoMIPS: 4200.00
notes_plat_sysinfo_205 = Flags: fpu vme de pse tsc msr pae mce cx8 apic sep
notes_plat_sysinfo_210 = mtrr pge mca cmov pat pse36 clflush dts acpi mmx fxsr sse sse2 ss ht tm pbe syscall
notes_plat_sysinfo_215 = nx pdpe1gb rdtscp lm constant_tsc art arch_perfmon pebs bts rep_good nopl xtopology
notes_plat_sysinfo_220 = nonstop_tsc cpuid aperfmperf tsc_known_freq pni pclmulqdq dtes64 monitor ds_cpl vmx
notes_plat_sysinfo_225 = smx est tm2 ssse3 sdbg fma cx16 xtpr pdcm pcid dca sse4_1 sse4_2 x2apic movbe popcnt
notes_plat_sysinfo_230 = tsc_deadline_timer aes xsave avx f16c rdrand lahf_lm abm 3dnowprefetch cpuid_fault
notes_plat_sysinfo_235 = epb cat_l3 cat_l2 cdp_l3 intel_ppin cdp_l2 ssbd mba ibrs ibpb stibp ibrs_enhanced
notes_plat_sysinfo_240 = tpr_shadow flexpriority ept vpid ept_ad fsgsbase tsc_adjust bmi1 avx2 smep bmi2 erms
notes_plat_sysinfo_245 = invpcid cqm rdt_a avx512f avx512dq rdseed adx smap avx512ifma clflushopt clwb
notes_plat_sysinfo_250 = intel_pt avx512cd sha_ni avx512bw avx512vl xsaveopt xsavec xgetbv1 xsaves cqm_llc
notes_plat_sysinfo_255 = cqm_occup_llc cqm_mbm_total cqm_mbm_local split_lock_detect avx_vnni avx512_bf16
notes_plat_sysinfo_260 = wbnoinvd dtherm ida arat pln pts hwp hwp_act_window hwp_epp hwp_pkg_req vnmi
notes_plat_sysinfo_265 = avx512vbmi umip pku ospke waitpkg avx512_vbmi2 gfni vaes vpclmulqdq avx512_vnni
notes_plat_sysinfo_270 = avx512_bitalg tme avx512_vpopcntdq la57 rdpid bus_lock_detect cldemote movdiri
notes_plat_sysinfo_275 = movdir64b enqcmd fsrm md_clear serialize tsxldtrk pconfig arch_lbr ibt amx_bf16
notes_plat_sysinfo_280 = avx512_fp16 amx_tile amx_int8 flush_l1d arch_capabilities
notes_plat_sysinfo_285 = Virtualization: VT-x
notes_plat_sysinfo_290 = L1d cache: 4.5 MiB (96 instances)
notes_plat_sysinfo_295 = L1i cache: 3 MiB (96 instances)
notes_plat_sysinfo_300 = L2 cache: 192 MiB (96 instances)
notes_plat_sysinfo_305 = L3 cache: 520 MiB (2 instances)
# sysinfo notes 310-465: remaining lscpu output (NUMA node CPU lists and
# vulnerability status), the 'lscpu --cache' table, and the /proc/cpuinfo
# cache size. One setting per line.
notes_plat_sysinfo_310 = NUMA node(s): 4
notes_plat_sysinfo_315 = NUMA node0 CPU(s): 0-23,96-119
notes_plat_sysinfo_320 = NUMA node1 CPU(s): 24-47,120-143
notes_plat_sysinfo_325 = NUMA node2 CPU(s): 48-71,144-167
notes_plat_sysinfo_330 = NUMA node3 CPU(s): 72-95,168-191
notes_plat_sysinfo_335 = Vulnerability Gather data sampling: Not affected
notes_plat_sysinfo_340 = Vulnerability Itlb multihit: Not affected
notes_plat_sysinfo_345 = Vulnerability L1tf: Not affected
notes_plat_sysinfo_350 = Vulnerability Mds: Not affected
notes_plat_sysinfo_355 = Vulnerability Meltdown: Not affected
notes_plat_sysinfo_360 = Vulnerability Mmio stale data: Not affected
notes_plat_sysinfo_365 = Vulnerability Reg file data sampling: Not affected
notes_plat_sysinfo_370 = Vulnerability Retbleed: Not affected
notes_plat_sysinfo_375 = Vulnerability Spec rstack overflow: Not affected
notes_plat_sysinfo_380 = Vulnerability Spec store bypass: Mitigation; Speculative Store Bypass disabled
notes_plat_sysinfo_385 = via prctl
notes_plat_sysinfo_390 = Vulnerability Spectre v1: Mitigation; usercopy/swapgs barriers and
notes_plat_sysinfo_395 = __user pointer sanitization
notes_plat_sysinfo_400 = Vulnerability Spectre v2: Mitigation; Enhanced / Automatic IBRS; IBPB
notes_plat_sysinfo_405 = conditional; RSB filling; PBRSB-eIBRS SW sequence; BHI BHI_DIS_S
notes_plat_sysinfo_410 = Vulnerability Srbds: Not affected
notes_plat_sysinfo_415 = Vulnerability Tsx async abort: Not affected
notes_plat_sysinfo_420 =
notes_plat_sysinfo_425 = From lscpu --cache:
notes_plat_sysinfo_430 = NAME ONE-SIZE ALL-SIZE WAYS TYPE LEVEL SETS PHY-LINE COHERENCY-SIZE
notes_plat_sysinfo_435 = L1d 48K 4.5M 12 Data 1 64 1 64
notes_plat_sysinfo_440 = L1i 32K 3M 8 Instruction 1 64 1 64
notes_plat_sysinfo_445 = L2 2M 192M 16 Unified 2 2048 1 64
notes_plat_sysinfo_450 = L3 260M 520M 20 Unified 3 212992 1 64
notes_plat_sysinfo_455 =
notes_plat_sysinfo_460 = /proc/cpuinfo cache data
notes_plat_sysinfo_465 = cache size : 266240 KB
# sysinfo notes 470-630: 'numactl --hardware' output (per-node CPU lists,
# memory sizes and the node distance matrix) followed by the first
# /proc/meminfo entries. One setting per line.
notes_plat_sysinfo_470 =
notes_plat_sysinfo_475 = From numactl --hardware
notes_plat_sysinfo_480 = WARNING: a numactl 'node' might or might not correspond to a physical chip.
notes_plat_sysinfo_485 = available: 4 nodes (0-3)
notes_plat_sysinfo_490 = node 0 cpus: 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 96 97 98 99
notes_plat_sysinfo_495 = 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119
notes_plat_sysinfo_500 = node 0 size: 257156 MB
notes_plat_sysinfo_505 = node 0 free: 253926 MB
notes_plat_sysinfo_510 = node 1 cpus: 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47
notes_plat_sysinfo_515 = 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141
notes_plat_sysinfo_520 = 142 143
notes_plat_sysinfo_525 = node 1 size: 258035 MB
notes_plat_sysinfo_530 = node 1 free: 255879 MB
notes_plat_sysinfo_535 = node 2 cpus: 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71
notes_plat_sysinfo_540 = 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165
notes_plat_sysinfo_545 = 166 167
notes_plat_sysinfo_550 = node 2 size: 258035 MB
notes_plat_sysinfo_555 = node 2 free: 254200 MB
notes_plat_sysinfo_560 = node 3 cpus: 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95
notes_plat_sysinfo_565 = 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189
notes_plat_sysinfo_570 = 190 191
notes_plat_sysinfo_575 = node 3 size: 257974 MB
notes_plat_sysinfo_580 = node 3 free: 240794 MB
notes_plat_sysinfo_585 = node distances:
notes_plat_sysinfo_590 = node 0 1 2 3
notes_plat_sysinfo_595 = 0: 10 12 21 21
notes_plat_sysinfo_600 = 1: 12 10 21 21
notes_plat_sysinfo_605 = 2: 21 21 10 12
notes_plat_sysinfo_610 = 3: 21 21 12 10
notes_plat_sysinfo_615 =
notes_plat_sysinfo_620 = From /proc/meminfo
notes_plat_sysinfo_625 = MemTotal: 1055951048 kB
notes_plat_sysinfo_630 = HugePages_Total: 0
# sysinfo notes 635-950: hugepage size, cpufreq scaling governor, OS release
# files, 'uname -a', kernel self-reported vulnerability status, run level,
# SPEC install filesystem, DMI identification and the BIOS vendor.
# One setting per line.
notes_plat_sysinfo_635 = Hugepagesize: 2048 kB
notes_plat_sysinfo_640 =
notes_plat_sysinfo_645 = /sys/devices/system/cpu/cpu*/cpufreq/scaling_governor has
notes_plat_sysinfo_650 = performance
notes_plat_sysinfo_655 =
notes_plat_sysinfo_660 = From /etc/*release* /etc/*version*
notes_plat_sysinfo_665 = os-release:
notes_plat_sysinfo_670 = NAME="Rocky Linux"
notes_plat_sysinfo_675 = VERSION="9.6 (Blue Onyx)"
notes_plat_sysinfo_680 = ID="rocky"
notes_plat_sysinfo_685 = ID_LIKE="rhel centos fedora"
notes_plat_sysinfo_690 = VERSION_ID="9.6"
notes_plat_sysinfo_695 = PLATFORM_ID="platform:el9"
notes_plat_sysinfo_700 = PRETTY_NAME="Rocky Linux 9.6 (Blue Onyx)"
notes_plat_sysinfo_705 = ANSI_COLOR="0;32"
notes_plat_sysinfo_710 = redhat-release: Rocky Linux release 9.6 (Blue Onyx)
notes_plat_sysinfo_715 = rocky-release: Rocky Linux release 9.6 (Blue Onyx)
notes_plat_sysinfo_720 = rocky-release-upstream: Derived from Red Hat Enterprise Linux 9.6
notes_plat_sysinfo_725 = system-release: Rocky Linux release 9.6 (Blue Onyx)
notes_plat_sysinfo_730 = system-release-cpe: cpe:/o:rocky:rocky:9::baseos
notes_plat_sysinfo_735 =
notes_plat_sysinfo_740 = uname -a:
notes_plat_sysinfo_745 = Linux Client-1 5.14.0-570.17.1.el9_6.x86_64 #1 SMP PREEMPT_DYNAMIC Fri May 23 22:47:01
notes_plat_sysinfo_750 = UTC 2025 x86_64 x86_64 x86_64 GNU/Linux
notes_plat_sysinfo_755 =
notes_plat_sysinfo_760 = Kernel self-reported vulnerability status:
notes_plat_sysinfo_765 =
notes_plat_sysinfo_770 = gather_data_sampling: Not affected
notes_plat_sysinfo_775 = CVE-2018-12207 (iTLB Multihit): Not affected
notes_plat_sysinfo_780 = CVE-2018-3620 (L1 Terminal Fault): Not affected
notes_plat_sysinfo_785 = Microarchitectural Data Sampling: Not affected
notes_plat_sysinfo_790 = CVE-2017-5754 (Meltdown): Not affected
notes_plat_sysinfo_795 = mmio_stale_data: Not affected
notes_plat_sysinfo_800 = reg_file_data_sampling: Not affected
notes_plat_sysinfo_805 = retbleed: Not affected
notes_plat_sysinfo_810 = spec_rstack_overflow: Not affected
notes_plat_sysinfo_815 = CVE-2018-3639 (Speculative Store Bypass): Mitigation: Speculative Store
notes_plat_sysinfo_820 = Bypass disabled via prctl
notes_plat_sysinfo_825 = CVE-2017-5753 (Spectre variant 1): Mitigation: usercopy/swapgs
notes_plat_sysinfo_830 = barriers and __user pointer
notes_plat_sysinfo_835 = sanitization
notes_plat_sysinfo_840 = CVE-2017-5715 (Spectre variant 2): Mitigation: Enhanced / Automatic
notes_plat_sysinfo_845 = IBRS; IBPB: conditional; RSB
notes_plat_sysinfo_850 = filling; PBRSB-eIBRS: SW sequence;
notes_plat_sysinfo_855 = BHI: BHI_DIS_S
notes_plat_sysinfo_860 = CVE-2020-0543 (Special Register Buffer Data Sampling): Not affected
notes_plat_sysinfo_865 = CVE-2019-11135 (TSX Asynchronous Abort): Not affected
notes_plat_sysinfo_870 =
notes_plat_sysinfo_875 = run-level 3 Sep 12 13:20
notes_plat_sysinfo_880 =
notes_plat_sysinfo_885 = SPEC is set to: /home/spec/accel2023
notes_plat_sysinfo_890 = Filesystem Type Size Used Avail Use% Mounted on
notes_plat_sysinfo_895 = /dev/mapper/rl-home xfs 1.7T 19G 1.7T 2% /home
notes_plat_sysinfo_900 =
notes_plat_sysinfo_905 = From /sys/devices/virtual/dmi/id
notes_plat_sysinfo_910 = Vendor: ASUSTeK COMPUTER INC.
notes_plat_sysinfo_915 = Product: ESC8000-E11
notes_plat_sysinfo_920 = Product Family: Server
notes_plat_sysinfo_925 =
notes_plat_sysinfo_930 = Cannot run dmidecode; consider saying (as root)
notes_plat_sysinfo_935 = chmod +s /usr/sbin/dmidecode
notes_plat_sysinfo_940 =
notes_plat_sysinfo_945 = BIOS:
notes_plat_sysinfo_950 = BIOS Vendor: American Megatrends Inc.
# Final sysinfo notes (BIOS version/date and the end-of-data marker).
notes_plat_sysinfo_955 = BIOS Version: 2803
notes_plat_sysinfo_960 = BIOS Date: 04/08/2025
notes_plat_sysinfo_965 =
notes_plat_sysinfo_970 = (End of data from sysinfo program)
# Report fields appended after the sysinfo data.
# NOTE(review): hw_cpu_name is also set in the inlined SUT.inc section as
# "INTEL(R) XEON(R) PLATINUM 8558"; the spelling here differs. Presumably the
# later assignment wins - confirm which spelling should be reported.
hw_cpu_name = INTEL XEON PLATINUM 8558
# NOTE(review): hw_disk is also set in the inlined SUT.inc section as
# "1x HDD, 1.78 TiB, 7.2K RPM", which contradicts the value below - confirm
# which description matches the system and drop the other.
hw_disk = 1.92TB NVMe SSD
# hw_nchips repeats the value already given in the SUT.inc section (2).
hw_nchips = 2
prepared_by = spec (is never output, only tags rawfile)
sw_file = xfs
sw_os000 = Rocky Linux release 9.6 (Blue Onyx)
sw_os001 = 5.14.0-570.17.1.el9_6.x86_64
sw_state = Run level 3 (multi-user)
# End of settings added by sysinfo_program