292 lines
10 KiB
JSON
292 lines
10 KiB
JSON
{
|
|
"timestamp": "2026-05-22T15:26:29.511252",
|
|
"gpu_info": {
|
|
"driver_version": "580.159.03",
|
|
"cuda_version": "13.0",
|
|
"gpu_count": 8,
|
|
"gpus": [
|
|
{
|
|
"index": 0,
|
|
"name": "NVIDIA H100 80GB HBM3",
|
|
"uuid": "GPU-dfbc9513-255d-4fe7-2b77-7b1ec3972e75",
|
|
"pci_bus_id": "00000000:18:00.0",
|
|
"pcie_link_gen": 5,
|
|
"pcie_link_width": 16,
|
|
"vram_total_mb": 81559,
|
|
"vram_used_mb": 4,
|
|
"vram_free_mb": 81076,
|
|
"power_draw": 69.81,
|
|
"power_limit": 700.0,
|
|
"clock_sm": 345,
|
|
"clock_mem": 2619,
|
|
"temperature": 20,
|
|
"fan_speed": 0,
|
|
"persistence_mode": false,
|
|
"compute_mode": "Default",
|
|
"serial_number": "1651924016120",
|
|
"ecc_errors_single": 0,
|
|
"ecc_errors_double": 0
|
|
},
|
|
{
|
|
"index": 1,
|
|
"name": "NVIDIA H100 80GB HBM3",
|
|
"uuid": "GPU-bb845ef7-d7b5-f011-9395-ea74274e2282",
|
|
"pci_bus_id": "00000000:2A:00.0",
|
|
"pcie_link_gen": 5,
|
|
"pcie_link_width": 16,
|
|
"vram_total_mb": 81559,
|
|
"vram_used_mb": 0,
|
|
"vram_free_mb": 81079,
|
|
"power_draw": 67.45,
|
|
"power_limit": 700.0,
|
|
"clock_sm": 345,
|
|
"clock_mem": 2619,
|
|
"temperature": 20,
|
|
"fan_speed": 0,
|
|
"persistence_mode": false,
|
|
"compute_mode": "Default",
|
|
"serial_number": "1651924015483",
|
|
"ecc_errors_single": 0,
|
|
"ecc_errors_double": 0
|
|
},
|
|
{
|
|
"index": 2,
|
|
"name": "NVIDIA H100 80GB HBM3",
|
|
"uuid": "GPU-3720cf13-2a34-be38-27be-0a7adc4addc4",
|
|
"pci_bus_id": "00000000:3A:00.0",
|
|
"pcie_link_gen": 5,
|
|
"pcie_link_width": 16,
|
|
"vram_total_mb": 81559,
|
|
"vram_used_mb": 0,
|
|
"vram_free_mb": 81079,
|
|
"power_draw": 66.69,
|
|
"power_limit": 700.0,
|
|
"clock_sm": 345,
|
|
"clock_mem": 2619,
|
|
"temperature": 21,
|
|
"fan_speed": 0,
|
|
"persistence_mode": false,
|
|
"compute_mode": "Default",
|
|
"serial_number": "1651924025595",
|
|
"ecc_errors_single": 0,
|
|
"ecc_errors_double": 0
|
|
},
|
|
{
|
|
"index": 3,
|
|
"name": "NVIDIA H100 80GB HBM3",
|
|
"uuid": "GPU-87080b2d-ac43-be0d-d574-c193078850ae",
|
|
"pci_bus_id": "00000000:5D:00.0",
|
|
"pcie_link_gen": 5,
|
|
"pcie_link_width": 16,
|
|
"vram_total_mb": 81559,
|
|
"vram_used_mb": 0,
|
|
"vram_free_mb": 81079,
|
|
"power_draw": 66.86,
|
|
"power_limit": 700.0,
|
|
"clock_sm": 345,
|
|
"clock_mem": 2619,
|
|
"temperature": 20,
|
|
"fan_speed": 0,
|
|
"persistence_mode": false,
|
|
"compute_mode": "Default",
|
|
"serial_number": "1651924016862",
|
|
"ecc_errors_single": 0,
|
|
"ecc_errors_double": 0
|
|
},
|
|
{
|
|
"index": 4,
|
|
"name": "NVIDIA H100 80GB HBM3",
|
|
"uuid": "GPU-599bd883-cc5c-a5dd-6c33-c15f7049da48",
|
|
"pci_bus_id": "00000000:9A:00.0",
|
|
"pcie_link_gen": 5,
|
|
"pcie_link_width": 16,
|
|
"vram_total_mb": 81559,
|
|
"vram_used_mb": 0,
|
|
"vram_free_mb": 81079,
|
|
"power_draw": 67.07,
|
|
"power_limit": 700.0,
|
|
"clock_sm": 345,
|
|
"clock_mem": 2619,
|
|
"temperature": 20,
|
|
"fan_speed": 0,
|
|
"persistence_mode": false,
|
|
"compute_mode": "Default",
|
|
"serial_number": "1651924025670",
|
|
"ecc_errors_single": 0,
|
|
"ecc_errors_double": 0
|
|
},
|
|
{
|
|
"index": 5,
|
|
"name": "NVIDIA H100 80GB HBM3",
|
|
"uuid": "GPU-a1c6bba4-61b0-e623-06c9-9c88635e26fe",
|
|
"pci_bus_id": "00000000:AB:00.0",
|
|
"pcie_link_gen": 5,
|
|
"pcie_link_width": 16,
|
|
"vram_total_mb": 81559,
|
|
"vram_used_mb": 0,
|
|
"vram_free_mb": 81079,
|
|
"power_draw": 69.12,
|
|
"power_limit": 700.0,
|
|
"clock_sm": 345,
|
|
"clock_mem": 2619,
|
|
"temperature": 22,
|
|
"fan_speed": 0,
|
|
"persistence_mode": false,
|
|
"compute_mode": "Default",
|
|
"serial_number": "1651924027166",
|
|
"ecc_errors_single": 0,
|
|
"ecc_errors_double": 0
|
|
},
|
|
{
|
|
"index": 6,
|
|
"name": "NVIDIA H100 80GB HBM3",
|
|
"uuid": "GPU-98745a0c-39bd-3e56-d6ca-54ba3647ab6d",
|
|
"pci_bus_id": "00000000:BA:00.0",
|
|
"pcie_link_gen": 5,
|
|
"pcie_link_width": 16,
|
|
"vram_total_mb": 81559,
|
|
"vram_used_mb": 0,
|
|
"vram_free_mb": 81079,
|
|
"power_draw": 67.61,
|
|
"power_limit": 700.0,
|
|
"clock_sm": 345,
|
|
"clock_mem": 2619,
|
|
"temperature": 20,
|
|
"fan_speed": 0,
|
|
"persistence_mode": false,
|
|
"compute_mode": "Default",
|
|
"serial_number": "1651924026234",
|
|
"ecc_errors_single": 0,
|
|
"ecc_errors_double": 0
|
|
},
|
|
{
|
|
"index": 7,
|
|
"name": "NVIDIA H100 80GB HBM3",
|
|
"uuid": "GPU-8c73bd8b-666b-357e-ac5d-c75ac7a759db",
|
|
"pci_bus_id": "00000000:DB:00.0",
|
|
"pcie_link_gen": 5,
|
|
"pcie_link_width": 16,
|
|
"vram_total_mb": 81559,
|
|
"vram_used_mb": 0,
|
|
"vram_free_mb": 81079,
|
|
"power_draw": 66.19,
|
|
"power_limit": 700.0,
|
|
"clock_sm": 345,
|
|
"clock_mem": 2619,
|
|
"temperature": 20,
|
|
"fan_speed": 0,
|
|
"persistence_mode": false,
|
|
"compute_mode": "Default",
|
|
"serial_number": "1651924027255",
|
|
"ecc_errors_single": 0,
|
|
"ecc_errors_double": 0
|
|
}
|
|
],
|
|
"topology": "\t\u001b[4mGPU0\tGPU1\tGPU2\tGPU3\tGPU4\tGPU5\tGPU6\tGPU7\tNIC0\tNIC1\tNIC2\tNIC3\tNIC4\tNIC5\tNIC6\tNIC7\tNIC8\tNIC9\tCPU Affinity\tNUMA Affinity\tGPU NUMA ID\u001b[0m\nGPU0\t X \tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\tPIX\tNODE\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t0-55,112-167\t0\t\tN/A\nGPU1\tNV18\t X \tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\tNODE\tPIX\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t0-55,112-167\t0\t\tN/A\nGPU2\tNV18\tNV18\t X \tNV18\tNV18\tNV18\tNV18\tNV18\tNODE\tNODE\tPIX\tPIX\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t0-55,112-167\t0\t\tN/A\nGPU3\tNV18\tNV18\tNV18\t X \tNV18\tNV18\tNV18\tNV18\tNODE\tNODE\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t0-55,112-167\t0\t\tN/A\nGPU4\tNV18\tNV18\tNV18\tNV18\t X \tNV18\tNV18\tNV18\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tPIX\tNODE\tNODE\tNODE\t56-111,168-223\t1\t\tN/A\nGPU5\tNV18\tNV18\tNV18\tNV18\tNV18\t X \tNV18\tNV18\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tPIX\tNODE\tNODE\t56-111,168-223\t1\t\tN/A\nGPU6\tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\t X \tNV18\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\tPIX\t56-111,168-223\t1\t\tN/A\nGPU7\tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\t X \tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tNODE\tNODE\t56-111,168-223\t1\t\tN/A\nNIC0\tPIX\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t X \tNODE\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC1\tNODE\tPIX\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\t X \tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC2\tNODE\tNODE\tPIX\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\t X \tPIX\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC3\tNODE\tNODE\tPIX\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\t X \tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC4\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tNODE\tNODE\t X \tPIX\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC5\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tNODE\tNODE\tPIX\t X \tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC6\tSYS\tSYS\tSYS\tSYS\tPIX\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\t X \tNODE\tNODE\tNODE\t\t\t\t\nNIC7\tSYS\tSYS\tSYS\tSYS\tNODE\tPIX\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\t X \tNODE\tNODE\t\t\t\t\nNIC8\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\tNODE\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\t X \tPIX\t\t\t\t\nNIC9\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\tNODE\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\t X \t\t\t\t\n\nLegend:\n\n X = Self\n SYS = Connection traversing PCIe as well as the SMP interconnect between NUMA nodes (e.g., QPI/UPI)\n NODE = Connection traversing PCIe as well as the interconnect between PCIe Host Bridges within a NUMA node\n PHB = Connection traversing PCIe as well as a PCIe Host Bridge (typically the CPU)\n PXB = Connection traversing multiple PCIe bridges (without traversing the PCIe Host Bridge)\n PIX = Connection traversing at most a single PCIe bridge\n NV# = Connection traversing a bonded set of # NVLinks\n\nNIC Legend:\n\n NIC0: mlx5_0\n NIC1: mlx5_1\n NIC2: mlx5_2\n NIC3: mlx5_3\n NIC4: mlx5_4\n NIC5: mlx5_5\n NIC6: mlx5_6\n NIC7: mlx5_7\n NIC8: mlx5_8\n NIC9: mlx5_9\n\n",
|
|
"timestamp": "2026-05-22T15:26:36.627805",
|
|
"detected_gpu_type": "h100",
|
|
"gpu_label": "H100 SXM5"
|
|
},
|
|
"memory_bench": {
|
|
"memory": {
|
|
"source": "pytorch",
|
|
"h2d_bandwidth_gbps": 11.8,
|
|
"d2h_bandwidth_gbps": 10.1,
|
|
"d2d_bandwidth_gbps": 829.0,
|
|
"peak_bandwidth_gbps": 3400,
|
|
"efficiency_pct": 24.4,
|
|
"test_sizes_mb": [
|
|
1,
|
|
4,
|
|
16,
|
|
64,
|
|
256,
|
|
1024,
|
|
4096
|
|
],
|
|
"bandwidth_by_size": {
|
|
"1": {
|
|
"h2d_gbps": 3.6,
|
|
"d2h_gbps": 1.4,
|
|
"d2d_gbps": 40.3
|
|
},
|
|
"4": {
|
|
"h2d_gbps": 7.7,
|
|
"d2h_gbps": 10.1,
|
|
"d2d_gbps": 159.5
|
|
},
|
|
"16": {
|
|
"h2d_gbps": 10.9,
|
|
"d2h_gbps": 1.9,
|
|
"d2d_gbps": 439.5
|
|
},
|
|
"64": {
|
|
"h2d_gbps": 11.8,
|
|
"d2h_gbps": 1.4,
|
|
"d2d_gbps": 740.5
|
|
},
|
|
"256": {
|
|
"h2d_gbps": 9.0,
|
|
"d2h_gbps": 1.4,
|
|
"d2d_gbps": 792.1
|
|
},
|
|
"1024": {
|
|
"h2d_gbps": 8.4,
|
|
"d2h_gbps": 1.4,
|
|
"d2d_gbps": 818.9
|
|
},
|
|
"4096": {
|
|
"h2d_gbps": 6.1,
|
|
"d2h_gbps": 1.4,
|
|
"d2d_gbps": 829.0
|
|
}
|
|
},
|
|
"per_gpu": []
|
|
}
|
|
},
|
|
"compute_bench": {
|
|
"compute": {
|
|
"per_dtype_tflops": {
|
|
"fp32": 51.9,
|
|
"tf32": 357.8,
|
|
"fp16": 667.2,
|
|
"bf16": 699.1,
|
|
"fp8": 1146.2
|
|
},
|
|
"peak_tflops": {
|
|
"fp32": 67,
|
|
"tf32": 495,
|
|
"fp16": 990,
|
|
"bf16": 990,
|
|
"fp8": 1979
|
|
},
|
|
"efficiency_pct": {
|
|
"fp32": 77.5,
|
|
"tf32": 72.3,
|
|
"fp16": 67.4,
|
|
"bf16": 70.6,
|
|
"fp8": 57.9
|
|
},
|
|
"pass_thresholds_tflops": {
|
|
"fp32": 54,
|
|
"tf32": 444,
|
|
"fp16": 734,
|
|
"bf16": 745,
|
|
"fp8": 1400
|
|
},
|
|
"per_gpu": [
|
|
{
|
|
"index": 0,
|
|
"fp32": 51.9,
|
|
"tf32": 357.8,
|
|
"fp16": 667.2,
|
|
"bf16": 699.1,
|
|
"fp8": 1146.2
|
|
}
|
|
],
|
|
"matrix_size": 8192,
|
|
"warmup": 50,
|
|
"iterations": 500
|
|
}
|
|
}
|
|
} |