{ "timestamp": "2026-05-22T15:26:26.973586", "gpu_info": { "driver_version": "580.159.03", "cuda_version": "13.0", "gpu_count": 8, "gpus": [ { "index": 0, "name": "NVIDIA H100 80GB HBM3", "uuid": "GPU-7658c03c-7659-9886-041e-545c21d53e12", "pci_bus_id": "00000000:18:00.0", "pcie_link_gen": 5, "pcie_link_width": 16, "vram_total_mb": 81559, "vram_used_mb": 4, "vram_free_mb": 81076, "power_draw": 69.72, "power_limit": 700.0, "clock_sm": 345, "clock_mem": 2619, "temperature": 25, "fan_speed": 0, "persistence_mode": false, "compute_mode": "Default", "serial_number": "1654923030411", "ecc_errors_single": 0, "ecc_errors_double": 0 }, { "index": 1, "name": "NVIDIA H100 80GB HBM3", "uuid": "GPU-6392d40b-893b-9fc2-4284-a3f1d8c4d7f1", "pci_bus_id": "00000000:2A:00.0", "pcie_link_gen": 5, "pcie_link_width": 16, "vram_total_mb": 81559, "vram_used_mb": 0, "vram_free_mb": 81079, "power_draw": 73.17, "power_limit": 700.0, "clock_sm": 345, "clock_mem": 2619, "temperature": 25, "fan_speed": 0, "persistence_mode": false, "compute_mode": "Default", "serial_number": "1654724063165", "ecc_errors_single": 0, "ecc_errors_double": 0 }, { "index": 2, "name": "NVIDIA H100 80GB HBM3", "uuid": "GPU-2ae38735-10de-fb0b-fb20-9d1b5b434558", "pci_bus_id": "00000000:3A:00.0", "pcie_link_gen": 5, "pcie_link_width": 16, "vram_total_mb": 81559, "vram_used_mb": 0, "vram_free_mb": 81079, "power_draw": 68.71, "power_limit": 700.0, "clock_sm": 345, "clock_mem": 2619, "temperature": 26, "fan_speed": 0, "persistence_mode": false, "compute_mode": "Default", "serial_number": "1654823036530", "ecc_errors_single": 0, "ecc_errors_double": 0 }, { "index": 3, "name": "NVIDIA H100 80GB HBM3", "uuid": "GPU-ec62123f-0c48-6dbd-49e4-8b231b3fed0e", "pci_bus_id": "00000000:5D:00.0", "pcie_link_gen": 5, "pcie_link_width": 16, "vram_total_mb": 81559, "vram_used_mb": 0, "vram_free_mb": 81079, "power_draw": 69.73, "power_limit": 700.0, "clock_sm": 345, "clock_mem": 2619, "temperature": 25, "fan_speed": 0, "persistence_mode": false, "compute_mode": "Default", "serial_number": "1654923021638", "ecc_errors_single": 0, "ecc_errors_double": 0 }, { "index": 4, "name": "NVIDIA H100 80GB HBM3", "uuid": "GPU-b64fc270-109e-1543-fb0c-be7feecf14f1", "pci_bus_id": "00000000:9A:00.0", "pcie_link_gen": 5, "pcie_link_width": 16, "vram_total_mb": 81559, "vram_used_mb": 0, "vram_free_mb": 81079, "power_draw": 68.84, "power_limit": 700.0, "clock_sm": 345, "clock_mem": 2619, "temperature": 24, "fan_speed": 0, "persistence_mode": false, "compute_mode": "Default", "serial_number": "1655023033179", "ecc_errors_single": 0, "ecc_errors_double": 0 }, { "index": 5, "name": "NVIDIA H100 80GB HBM3", "uuid": "GPU-15ab7baf-9010-7cf3-5462-eeb09f8dbe65", "pci_bus_id": "00000000:AB:00.0", "pcie_link_gen": 5, "pcie_link_width": 16, "vram_total_mb": 81559, "vram_used_mb": 0, "vram_free_mb": 81079, "power_draw": 69.94, "power_limit": 700.0, "clock_sm": 345, "clock_mem": 2619, "temperature": 27, "fan_speed": 0, "persistence_mode": false, "compute_mode": "Default", "serial_number": "1655023034225", "ecc_errors_single": 0, "ecc_errors_double": 0 }, { "index": 6, "name": "NVIDIA H100 80GB HBM3", "uuid": "GPU-225f6f3c-6fef-d1e2-5428-d90f665fb3d3", "pci_bus_id": "00000000:BA:00.0", "pcie_link_gen": 5, "pcie_link_width": 16, "vram_total_mb": 81559, "vram_used_mb": 0, "vram_free_mb": 81079, "power_draw": 70.46, "power_limit": 700.0, "clock_sm": 345, "clock_mem": 2619, "temperature": 25, "fan_speed": 0, "persistence_mode": false, "compute_mode": "Default", "serial_number": "1654923078278", "ecc_errors_single": 0, "ecc_errors_double": 0 }, { "index": 7, "name": "NVIDIA H100 80GB HBM3", "uuid": "GPU-79aeb6a8-c00c-6edb-956f-779ef56950a3", "pci_bus_id": "00000000:DB:00.0", "pcie_link_gen": 5, "pcie_link_width": 16, "vram_total_mb": 81559, "vram_used_mb": 0, "vram_free_mb": 81079, "power_draw": 71.76, "power_limit": 700.0, "clock_sm": 345, "clock_mem": 2619, "temperature": 24, "fan_speed": 0, "persistence_mode": false, "compute_mode": "Default", "serial_number": "1654024031464", "ecc_errors_single": 0, "ecc_errors_double": 0 } ], "topology": "\t\u001b[4mGPU0\tGPU1\tGPU2\tGPU3\tGPU4\tGPU5\tGPU6\tGPU7\tNIC0\tNIC1\tNIC2\tNIC3\tNIC4\tNIC5\tNIC6\tNIC7\tNIC8\tNIC9\tCPU Affinity\tNUMA Affinity\tGPU NUMA ID\u001b[0m\nGPU0\t X \tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\tPIX\tNODE\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t0-55,112-167\t0\t\tN/A\nGPU1\tNV18\t X \tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\tNODE\tPIX\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t0-55,112-167\t0\t\tN/A\nGPU2\tNV18\tNV18\t X \tNV18\tNV18\tNV18\tNV18\tNV18\tNODE\tNODE\tPIX\tPIX\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t0-55,112-167\t0\t\tN/A\nGPU3\tNV18\tNV18\tNV18\t X \tNV18\tNV18\tNV18\tNV18\tNODE\tNODE\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t0-55,112-167\t0\t\tN/A\nGPU4\tNV18\tNV18\tNV18\tNV18\t X \tNV18\tNV18\tNV18\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tPIX\tNODE\tNODE\tNODE\t56-111,168-223\t1\t\tN/A\nGPU5\tNV18\tNV18\tNV18\tNV18\tNV18\t X \tNV18\tNV18\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tPIX\tNODE\tNODE\t56-111,168-223\t1\t\tN/A\nGPU6\tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\t X \tNV18\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\tPIX\t56-111,168-223\t1\t\tN/A\nGPU7\tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\t X \tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tNODE\tNODE\t56-111,168-223\t1\t\tN/A\nNIC0\tPIX\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t X \tNODE\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC1\tNODE\tPIX\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\t X \tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC2\tNODE\tNODE\tPIX\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\t X \tPIX\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC3\tNODE\tNODE\tPIX\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\t X \tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC4\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tNODE\tNODE\t X \tPIX\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC5\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tNODE\tNODE\tPIX\t X \tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC6\tSYS\tSYS\tSYS\tSYS\tPIX\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\t X \tNODE\tNODE\tNODE\t\t\t\t\nNIC7\tSYS\tSYS\tSYS\tSYS\tNODE\tPIX\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\t X \tNODE\tNODE\t\t\t\t\nNIC8\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\tNODE\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\t X \tPIX\t\t\t\t\nNIC9\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\tNODE\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\t X \t\t\t\t\n\nLegend:\n\n X = Self\n SYS = Connection traversing PCIe as well as the SMP interconnect between NUMA nodes (e.g., QPI/UPI)\n NODE = Connection traversing PCIe as well as the interconnect between PCIe Host Bridges within a NUMA node\n PHB = Connection traversing PCIe as well as a PCIe Host Bridge (typically the CPU)\n PXB = Connection traversing multiple PCIe bridges (without traversing the PCIe Host Bridge)\n PIX = Connection traversing at most a single PCIe bridge\n NV# = Connection traversing a bonded set of # NVLinks\n\nNIC Legend:\n\n NIC0: mlx5_0\n NIC1: mlx5_1\n NIC2: mlx5_2\n NIC3: mlx5_3\n NIC4: mlx5_4\n NIC5: mlx5_5\n NIC6: mlx5_6\n NIC7: mlx5_7\n NIC8: mlx5_8\n NIC9: mlx5_9\n\n", "timestamp": "2026-05-22T15:26:34.187409", "detected_gpu_type": "h100", "gpu_label": "H100 SXM5" }, "memory_bench": { "memory": { "source": "pytorch", "h2d_bandwidth_gbps": 11.8, "d2h_bandwidth_gbps": 9.9, "d2d_bandwidth_gbps": 829.1, "peak_bandwidth_gbps": 3400, "efficiency_pct": 24.4, "test_sizes_mb": [ 1, 4, 16, 64, 256, 1024, 4096 ], "bandwidth_by_size": { "1": { "h2d_gbps": 3.8, "d2h_gbps": 1.4, "d2d_gbps": 40.6 }, "4": { "h2d_gbps": 7.6, "d2h_gbps": 9.9, "d2d_gbps": 141.5 }, "16": { "h2d_gbps": 11.0, "d2h_gbps": 1.9, "d2d_gbps": 450.3 }, "64": { "h2d_gbps": 11.8, "d2h_gbps": 1.4, "d2d_gbps": 726.5 }, "256": { "h2d_gbps": 9.0, "d2h_gbps": 1.4, "d2d_gbps": 793.8 }, "1024": { "h2d_gbps": 5.5, "d2h_gbps": 1.4, "d2d_gbps": 821.2 }, "4096": { "h2d_gbps": 5.9, "d2h_gbps": 1.4, "d2d_gbps": 829.1 } }, "per_gpu": [] } }, "compute_bench": { "compute": { "per_dtype_tflops": { "fp32": 52.0, "tf32": 362.3, "fp16": 691.0, "bf16": 713.0, "fp8": 1148.8 }, "peak_tflops": { "fp32": 67, "tf32": 495, "fp16": 990, "bf16": 990, "fp8": 1979 }, "efficiency_pct": { "fp32": 77.6, "tf32": 73.2, "fp16": 69.8, "bf16": 72.0, "fp8": 58.0 }, "pass_thresholds_tflops": { "fp32": 54, "tf32": 444, "fp16": 734, "bf16": 745, "fp8": 1400 }, "per_gpu": [ { "index": 0, "fp32": 52.0, "tf32": 362.3, "fp16": 691.0, "bf16": 713.0, "fp8": 1148.8 } ], "matrix_size": 8192, "warmup": 50, "iterations": 500 } } }