# Invocation command line: # /var/data0/sandbox/nvuser/SPECACCEL/bin/harness/runaccel --configfile nvhpc_acc_2311 --reportable --iterations 2 --nopower --runmode speed --tune base --size ref accel # output_root was not used for this run ############################################################################ # Invocation command line: # runaccel -c nvhpc --reportable -T base --define model=<MODEL> accel # # MODEL may be one of the following options: # 1. "acc" - Use OpenACC (default) # 2. "lop" - Use OpenMP with "loop" construct # 3. "tgt" - Use OpenMP with "distribute" construct # 4. "smd" - Use OpenMP with "distribute" and inner "simd" construct # 5. "acp" - Use OpenACC with the "parallel" src.alt # 6. "lops" - Use OpenMP with "loop" construct src.alt (no metadirectives) # 7. "tgts" - Use OpenMP with "distribute" construct src.alt (no metadirectives) # 8. "smds" - Use OpenMP with "distribute" and inner "simd" construct src.alt (no metadirectives) # ############################################################################ # The following setting was inserted automatically as a result of # post-run basepeak application. basepeak = 1 %ifndef %{model} # IF model is not set use acc % define model acc %endif #################################################################### # Tester information #################################################################### license_num = 9045 tester = NVIDIA Corporation test_sponsor = NVIDIA Corporation ###################################################################### # The header section of the config file. 
Must appear # before any instances of "default=" # # label = how the binaries you generated will be identified # tune = specify "base" or "peak" or "all" label = nvhpc_acc_2311 tune = base output_format = txt,html,pdf teeout = yes teerunout = yes strict_rundir_verify=1 #output_root = /tmp/accel2023 flagsurl000=http://www.spec.org/accel2023/flags/nv2023_flags_v2.xml # Adjust the number of make jobs to use here makeflags=-j 40 #################################################################### # Hardware information #################################################################### #include: SUT.inc # ----- Begin inclusion of 'SUT.inc' ############################################################################ ##### SUT.inc #### ##### Example of required hardware information for the system under test (SUT) #### default: hw_avail = Jul-2023 sw_avail = Nov-2023 hw_cpu_name = CPU Name hw_cpu_max_mhz = 3800 hw_cpu_nominal_mhz = 2000 hw_nchips = 1 hw_ncores = 112 hw_nthreadspercore = 2 hw_ncpuorder = 2 chips hw_pcache = 32 KB I + 48 KB D on chip per core hw_scache = 2 MB I+D on chip per core hw_tcache = 105 MB I+D on chip per chip hw_ocache = None hw_vendor = NVIDIA Corporation hw_model = DGX-H100 hw_disk = 1x NVME, 1000 GB, 99999 RPM hw_memory000 = 2 TB (32 x 64 GB 2Rx8 PC5-4800B-R) hw_other = None # Accelerator description hw_accel_connect = NVLink 4 hw_accel_desc000 = System contains 8 H100 SXM with GPU 0 used for hw_accel_desc001 = measurement. Each GPU contains 80GB of memory. 
hw_accel_ecc = Yes hw_accel_model = H100 SXM 80GB hw_accel_name = Tesla H100 SXM 80GB hw_accel_type = GPU hw_accel_vendor = NVIDIA # ---- End inclusion of '/var/data0/sandbox/nvuser/SPECACCEL/config/SUT.inc' #################################################################### # Software information #################################################################### default: CC = nvc CXX = nvc++ FC = nvfortran CC_VERSION_OPTION = -V CXX_VERSION_OPTION = -V FC_VERSION_OPTION = -V preENV_LD_LIBRARY_PATH=$[top]/nv2311_libs OPTIMIZE = -Ofast -acc -Mfprelaxed -Mstack_arrays -static-nvidia 457.spC: PORTABILITY += -mcmodel=medium -Wl,--no-relax 459.miniGhost: EXTRA_LDFLAGS += -Mnomain # The following settings were obtained by running the sysinfo_program # 'specperl $[top]/bin/sysinfo' (sysinfo:SHA:ac6f2b38b7dec295b8795065d3a13319ea78b9367f95037a5e6ed5e46e487861) default: notes_plat_sysinfo_000 = notes_plat_sysinfo_005 = Sysinfo program /var/data0/sandbox/nvuser/SPECACCEL/bin/sysinfo notes_plat_sysinfo_010 = Rev: r6622 of 2021-04-07 b1a7d5f8f71be5aff70a755cad7211a0 notes_plat_sysinfo_015 = running on VIKING80-DVT-800 Thu Oct 19 14:11:28 2023 notes_plat_sysinfo_020 = notes_plat_sysinfo_025 = SUT (System Under Test) info as seen by some common utilities. notes_plat_sysinfo_030 = For more information on this section, see notes_plat_sysinfo_035 = https://www.spec.org/cpu2017/Docs/config.html#sysinfo notes_plat_sysinfo_040 = notes_plat_sysinfo_045 = From /proc/cpuinfo notes_plat_sysinfo_050 = model name : Intel(R) Xeon(R) Platinum 8480CL notes_plat_sysinfo_055 = 2 "physical id"s (chips) notes_plat_sysinfo_060 = 224 "processors" notes_plat_sysinfo_065 = cores, siblings (Caution: counting these is hw and system dependent. The following notes_plat_sysinfo_070 = excerpts from /proc/cpuinfo might not be reliable. Use with caution.) 
notes_plat_sysinfo_075 = cpu cores : 56 notes_plat_sysinfo_080 = siblings : 112 notes_plat_sysinfo_085 = physical 0: cores 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 notes_plat_sysinfo_090 = 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 notes_plat_sysinfo_095 = 53 54 55 notes_plat_sysinfo_100 = physical 1: cores 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 notes_plat_sysinfo_105 = 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 notes_plat_sysinfo_110 = 53 54 55 notes_plat_sysinfo_115 = notes_plat_sysinfo_120 = From lscpu from util-linux 2.37.2: notes_plat_sysinfo_125 = Architecture: x86_64 notes_plat_sysinfo_130 = CPU op-mode(s): 32-bit, 64-bit notes_plat_sysinfo_135 = Address sizes: 52 bits physical, 57 bits virtual notes_plat_sysinfo_140 = Byte Order: Little Endian notes_plat_sysinfo_145 = CPU(s): 224 notes_plat_sysinfo_150 = On-line CPU(s) list: 0-223 notes_plat_sysinfo_155 = Vendor ID: GenuineIntel notes_plat_sysinfo_160 = Model name: Intel(R) Xeon(R) Platinum 8480CL notes_plat_sysinfo_165 = CPU family: 6 notes_plat_sysinfo_170 = Model: 143 notes_plat_sysinfo_175 = Thread(s) per core: 2 notes_plat_sysinfo_180 = Core(s) per socket: 56 notes_plat_sysinfo_185 = Socket(s): 2 notes_plat_sysinfo_190 = Stepping: 7 notes_plat_sysinfo_195 = CPU max MHz: 3800.0000 notes_plat_sysinfo_200 = CPU min MHz: 800.0000 notes_plat_sysinfo_205 = BogoMIPS: 4000.00 notes_plat_sysinfo_210 = Flags: fpu vme de pse tsc msr pae mce cx8 apic sep mtrr notes_plat_sysinfo_215 = pge mca cmov pat pse36 clflush dts acpi mmx fxsr sse sse2 ss ht tm pbe syscall nx notes_plat_sysinfo_220 = pdpe1gb rdtscp lm constant_tsc art arch_perfmon pebs bts rep_good nopl xtopology notes_plat_sysinfo_225 = nonstop_tsc cpuid aperfmperf tsc_known_freq pni pclmulqdq dtes64 monitor ds_cpl smx notes_plat_sysinfo_230 = est tm2 ssse3 sdbg fma cx16 xtpr pdcm pcid dca sse4_1 sse4_2 x2apic movbe popcnt 
notes_plat_sysinfo_235 = tsc_deadline_timer aes xsave avx f16c rdrand lahf_lm abm 3dnowprefetch cpuid_fault notes_plat_sysinfo_240 = epb cat_l3 cat_l2 cdp_l3 invpcid_single intel_ppin cdp_l2 ssbd mba ibrs ibpb stibp notes_plat_sysinfo_245 = ibrs_enhanced fsgsbase tsc_adjust bmi1 avx2 smep bmi2 erms invpcid cqm rdt_a avx512f notes_plat_sysinfo_250 = avx512dq rdseed adx smap avx512ifma clflushopt clwb intel_pt avx512cd sha_ni notes_plat_sysinfo_255 = avx512bw avx512vl xsaveopt xsavec xgetbv1 xsaves cqm_llc cqm_occup_llc cqm_mbm_total notes_plat_sysinfo_260 = cqm_mbm_local split_lock_detect avx_vnni avx512_bf16 wbnoinvd dtherm ida arat pln notes_plat_sysinfo_265 = pts hwp hwp_act_window hwp_epp hwp_pkg_req avx512vbmi umip pku ospke waitpkg notes_plat_sysinfo_270 = avx512_vbmi2 gfni vaes vpclmulqdq avx512_vnni avx512_bitalg tme avx512_vpopcntdq notes_plat_sysinfo_275 = la57 rdpid bus_lock_detect cldemote movdiri movdir64b enqcmd fsrm md_clear serialize notes_plat_sysinfo_280 = tsxldtrk pconfig arch_lbr amx_bf16 avx512_fp16 amx_tile amx_int8 flush_l1d notes_plat_sysinfo_285 = arch_capabilities notes_plat_sysinfo_290 = L1d cache: 5.3 MiB (112 instances) notes_plat_sysinfo_295 = L1i cache: 3.5 MiB (112 instances) notes_plat_sysinfo_300 = L2 cache: 224 MiB (112 instances) notes_plat_sysinfo_305 = L3 cache: 210 MiB (2 instances) notes_plat_sysinfo_310 = NUMA node(s): 2 notes_plat_sysinfo_315 = NUMA node0 CPU(s): 0-55,112-167 notes_plat_sysinfo_320 = NUMA node1 CPU(s): 56-111,168-223 notes_plat_sysinfo_325 = Vulnerability Itlb multihit: Not affected notes_plat_sysinfo_330 = Vulnerability L1tf: Not affected notes_plat_sysinfo_335 = Vulnerability Mds: Not affected notes_plat_sysinfo_340 = Vulnerability Meltdown: Not affected notes_plat_sysinfo_345 = Vulnerability Mmio stale data: Not affected notes_plat_sysinfo_350 = Vulnerability Retbleed: Not affected notes_plat_sysinfo_355 = Vulnerability Spec store bypass: Mitigation; Speculative Store Bypass disabled via 
notes_plat_sysinfo_360 = prctl and seccomp notes_plat_sysinfo_365 = Vulnerability Spectre v1: Mitigation; usercopy/swapgs barriers and __user notes_plat_sysinfo_370 = pointer sanitization notes_plat_sysinfo_375 = Vulnerability Spectre v2: Mitigation; Enhanced IBRS, IBPB conditional, RSB notes_plat_sysinfo_380 = filling, PBRSB-eIBRS SW sequence notes_plat_sysinfo_385 = Vulnerability Srbds: Not affected notes_plat_sysinfo_390 = Vulnerability Tsx async abort: Not affected notes_plat_sysinfo_395 = notes_plat_sysinfo_400 = From lscpu --cache: notes_plat_sysinfo_405 = NAME ONE-SIZE ALL-SIZE WAYS TYPE LEVEL SETS PHY-LINE COHERENCY-SIZE notes_plat_sysinfo_410 = L1d 48K 5.3M 12 Data 1 64 1 64 notes_plat_sysinfo_415 = L1i 32K 3.5M 8 Instruction 1 64 1 64 notes_plat_sysinfo_420 = L2 2M 224M 16 Unified 2 2048 1 64 notes_plat_sysinfo_425 = L3 105M 210M 15 Unified 3 114688 1 64 notes_plat_sysinfo_430 = notes_plat_sysinfo_435 = /proc/cpuinfo cache data notes_plat_sysinfo_440 = cache size : 107520 KB notes_plat_sysinfo_445 = notes_plat_sysinfo_450 = From numactl --hardware notes_plat_sysinfo_455 = WARNING: a numactl 'node' might or might not correspond to a physical chip. 
notes_plat_sysinfo_460 = available: 2 nodes (0-1) notes_plat_sysinfo_465 = node 0 cpus: 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 notes_plat_sysinfo_470 = 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 112 notes_plat_sysinfo_475 = 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 notes_plat_sysinfo_480 = 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 notes_plat_sysinfo_485 = 157 158 159 160 161 162 163 164 165 166 167 notes_plat_sysinfo_490 = node 0 size: 1031795 MB notes_plat_sysinfo_495 = node 0 free: 854000 MB notes_plat_sysinfo_500 = node 1 cpus: 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 notes_plat_sysinfo_505 = 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 notes_plat_sysinfo_510 = 107 108 109 110 111 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 notes_plat_sysinfo_515 = 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 notes_plat_sysinfo_520 = 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 notes_plat_sysinfo_525 = node 1 size: 1032154 MB notes_plat_sysinfo_530 = node 1 free: 950860 MB notes_plat_sysinfo_535 = node distances: notes_plat_sysinfo_540 = node 0 1 notes_plat_sysinfo_545 = 0: 10 21 notes_plat_sysinfo_550 = 1: 21 10 notes_plat_sysinfo_555 = notes_plat_sysinfo_560 = From /proc/meminfo notes_plat_sysinfo_565 = MemTotal: 2113484880 kB notes_plat_sysinfo_570 = HugePages_Total: 0 notes_plat_sysinfo_575 = Hugepagesize: 2048 kB notes_plat_sysinfo_580 = notes_plat_sysinfo_585 = /sys/devices/system/cpu/cpu*/cpufreq/scaling_governor has notes_plat_sysinfo_590 = performance notes_plat_sysinfo_595 = notes_plat_sysinfo_600 = /usr/bin/lsb_release -d notes_plat_sysinfo_605 = Ubuntu 22.04.2 LTS notes_plat_sysinfo_610 = notes_plat_sysinfo_615 = From /etc/*release* 
/etc/*version* notes_plat_sysinfo_620 = debian_version: bookworm/sid notes_plat_sysinfo_625 = dgx-release: notes_plat_sysinfo_630 = DGX_NAME="DGX Server" notes_plat_sysinfo_635 = DGX_PRETTY_NAME="NVIDIA DGX Server" notes_plat_sysinfo_640 = DGX_SWBUILD_DATE="2023-05-16-16-18-31" notes_plat_sysinfo_645 = DGX_SWBUILD_VERSION="6.0.11" notes_plat_sysinfo_650 = DGX_COMMIT_ID="d0b730d" notes_plat_sysinfo_655 = DGX_PLATFORM="DGX Server for DGX H100" notes_plat_sysinfo_660 = DGX_SERIAL_NUMBER="1661623000112" notes_plat_sysinfo_665 = os-release: notes_plat_sysinfo_670 = PRETTY_NAME="Ubuntu 22.04.2 LTS" notes_plat_sysinfo_675 = NAME="Ubuntu" notes_plat_sysinfo_680 = VERSION_ID="22.04" notes_plat_sysinfo_685 = VERSION="22.04.2 LTS (Jammy Jellyfish)" notes_plat_sysinfo_690 = VERSION_CODENAME=jammy notes_plat_sysinfo_695 = ID=ubuntu notes_plat_sysinfo_700 = ID_LIKE=debian notes_plat_sysinfo_705 = HOME_URL="https://www.ubuntu.com/" notes_plat_sysinfo_710 = notes_plat_sysinfo_715 = uname -a: notes_plat_sysinfo_720 = Linux VIKING80-DVT-800 5.15.0-1025-nvidia #25-Ubuntu SMP Fri Apr 21 21:46:57 UTC 2023 notes_plat_sysinfo_725 = x86_64 x86_64 x86_64 GNU/Linux notes_plat_sysinfo_730 = notes_plat_sysinfo_735 = Kernel self-reported vulnerability status: notes_plat_sysinfo_740 = notes_plat_sysinfo_745 = CVE-2018-12207 (iTLB Multihit): Not affected notes_plat_sysinfo_750 = CVE-2018-3620 (L1 Terminal Fault): Not affected notes_plat_sysinfo_755 = Microarchitectural Data Sampling: Not affected notes_plat_sysinfo_760 = CVE-2017-5754 (Meltdown): Not affected notes_plat_sysinfo_765 = mmio_stale_data: Not affected notes_plat_sysinfo_770 = retbleed: Not affected notes_plat_sysinfo_775 = CVE-2018-3639 (Speculative Store Bypass): Mitigation: Speculative Store notes_plat_sysinfo_780 = Bypass disabled via prctl and notes_plat_sysinfo_785 = seccomp notes_plat_sysinfo_790 = CVE-2017-5753 (Spectre variant 1): Mitigation: usercopy/swapgs notes_plat_sysinfo_795 = barriers and __user pointer 
notes_plat_sysinfo_800 = sanitization notes_plat_sysinfo_805 = CVE-2017-5715 (Spectre variant 2): Mitigation: Enhanced IBRS, IBPB: notes_plat_sysinfo_810 = conditional, RSB filling, notes_plat_sysinfo_815 = PBRSB-eIBRS: SW sequence notes_plat_sysinfo_820 = CVE-2020-0543 (Special Register Buffer Data Sampling): Not affected notes_plat_sysinfo_825 = CVE-2019-11135 (TSX Asynchronous Abort): Not affected notes_plat_sysinfo_830 = notes_plat_sysinfo_835 = run-level 3 Oct 19 05:44 notes_plat_sysinfo_840 = notes_plat_sysinfo_845 = SPEC is set to: /var/data0/sandbox/nvuser/SPECACCEL notes_plat_sysinfo_850 = Filesystem Type Size Used Avail Use% Mounted on notes_plat_sysinfo_855 = /dev/md127 ext4 28T 11T 16T 41% /raid notes_plat_sysinfo_860 = notes_plat_sysinfo_865 = From /sys/devices/virtual/dmi/id notes_plat_sysinfo_870 = Vendor: NVIDIA notes_plat_sysinfo_875 = Product: DGXH100 notes_plat_sysinfo_880 = Product Family: DGX notes_plat_sysinfo_885 = notes_plat_sysinfo_890 = Cannot run dmidecode; consider saying (as root) notes_plat_sysinfo_895 = chmod +s /usr/sbin/dmidecode notes_plat_sysinfo_900 = notes_plat_sysinfo_905 = BIOS: notes_plat_sysinfo_910 = BIOS Vendor: NVIDIA notes_plat_sysinfo_915 = BIOS Version: 1.1.1 notes_plat_sysinfo_920 = BIOS Date: 07/31/2023 notes_plat_sysinfo_925 = notes_plat_sysinfo_930 = (End of data from sysinfo program) hw_cpu_name = Intel Xeon Platinum 8480CL hw_disk000 = OS: 2x 1.9TB NVMe M.2 hw_disk001 = Internal storage: 8x 3.84TB NVMe U.2 hw_nchips = 2 prepared_by = nvuser (is never output, only tags rawfile) sw_compiler = C/Fortran: Version 23.11 of NVHPC SDK fw_bios = 1.1.1 07/31/2023 sw_file = ext4 sw_os000 = Ubuntu 22.04.2 LTS sw_os001 = 5.15.0-1025-nvidia sw_state = Run level 3 (multi-user) sw_other = None # End of settings added by sysinfo_program # The following section was added automatically, and contains settings that # did not appear in the original configuration file, but were added to the # raw file after the run. 
default: notes_000 =Environment variables set by runaccel before the start of the run: notes_005 =LD_LIBRARY_PATH = "/var/data0/sandbox/nvuser/SPECACCEL/nv2311_libs" notes_010 =Set to the location of the NVHPC compiler runtime libraries. sw_accel_driver000 = NVIDIA UNIX Open Kernel Module for x86_64 sw_accel_driver001 = 535.104.05 notes_os_000 =Shell stacksize set to unlimited via "limit stacksize unlimited"