test_gpu_scripts/reports_single_gpu_aikubeworker0012.json

292 lines
10 KiB
JSON

{
"timestamp": "2026-05-22T15:26:26.973586",
"gpu_info": {
"driver_version": "580.159.03",
"cuda_version": "13.0",
"gpu_count": 8,
"gpus": [
{
"index": 0,
"name": "NVIDIA H100 80GB HBM3",
"uuid": "GPU-7658c03c-7659-9886-041e-545c21d53e12",
"pci_bus_id": "00000000:18:00.0",
"pcie_link_gen": 5,
"pcie_link_width": 16,
"vram_total_mb": 81559,
"vram_used_mb": 4,
"vram_free_mb": 81076,
"power_draw": 69.72,
"power_limit": 700.0,
"clock_sm": 345,
"clock_mem": 2619,
"temperature": 25,
"fan_speed": 0,
"persistence_mode": false,
"compute_mode": "Default",
"serial_number": "1654923030411",
"ecc_errors_single": 0,
"ecc_errors_double": 0
},
{
"index": 1,
"name": "NVIDIA H100 80GB HBM3",
"uuid": "GPU-6392d40b-893b-9fc2-4284-a3f1d8c4d7f1",
"pci_bus_id": "00000000:2A:00.0",
"pcie_link_gen": 5,
"pcie_link_width": 16,
"vram_total_mb": 81559,
"vram_used_mb": 0,
"vram_free_mb": 81079,
"power_draw": 73.17,
"power_limit": 700.0,
"clock_sm": 345,
"clock_mem": 2619,
"temperature": 25,
"fan_speed": 0,
"persistence_mode": false,
"compute_mode": "Default",
"serial_number": "1654724063165",
"ecc_errors_single": 0,
"ecc_errors_double": 0
},
{
"index": 2,
"name": "NVIDIA H100 80GB HBM3",
"uuid": "GPU-2ae38735-10de-fb0b-fb20-9d1b5b434558",
"pci_bus_id": "00000000:3A:00.0",
"pcie_link_gen": 5,
"pcie_link_width": 16,
"vram_total_mb": 81559,
"vram_used_mb": 0,
"vram_free_mb": 81079,
"power_draw": 68.71,
"power_limit": 700.0,
"clock_sm": 345,
"clock_mem": 2619,
"temperature": 26,
"fan_speed": 0,
"persistence_mode": false,
"compute_mode": "Default",
"serial_number": "1654823036530",
"ecc_errors_single": 0,
"ecc_errors_double": 0
},
{
"index": 3,
"name": "NVIDIA H100 80GB HBM3",
"uuid": "GPU-ec62123f-0c48-6dbd-49e4-8b231b3fed0e",
"pci_bus_id": "00000000:5D:00.0",
"pcie_link_gen": 5,
"pcie_link_width": 16,
"vram_total_mb": 81559,
"vram_used_mb": 0,
"vram_free_mb": 81079,
"power_draw": 69.73,
"power_limit": 700.0,
"clock_sm": 345,
"clock_mem": 2619,
"temperature": 25,
"fan_speed": 0,
"persistence_mode": false,
"compute_mode": "Default",
"serial_number": "1654923021638",
"ecc_errors_single": 0,
"ecc_errors_double": 0
},
{
"index": 4,
"name": "NVIDIA H100 80GB HBM3",
"uuid": "GPU-b64fc270-109e-1543-fb0c-be7feecf14f1",
"pci_bus_id": "00000000:9A:00.0",
"pcie_link_gen": 5,
"pcie_link_width": 16,
"vram_total_mb": 81559,
"vram_used_mb": 0,
"vram_free_mb": 81079,
"power_draw": 68.84,
"power_limit": 700.0,
"clock_sm": 345,
"clock_mem": 2619,
"temperature": 24,
"fan_speed": 0,
"persistence_mode": false,
"compute_mode": "Default",
"serial_number": "1655023033179",
"ecc_errors_single": 0,
"ecc_errors_double": 0
},
{
"index": 5,
"name": "NVIDIA H100 80GB HBM3",
"uuid": "GPU-15ab7baf-9010-7cf3-5462-eeb09f8dbe65",
"pci_bus_id": "00000000:AB:00.0",
"pcie_link_gen": 5,
"pcie_link_width": 16,
"vram_total_mb": 81559,
"vram_used_mb": 0,
"vram_free_mb": 81079,
"power_draw": 69.94,
"power_limit": 700.0,
"clock_sm": 345,
"clock_mem": 2619,
"temperature": 27,
"fan_speed": 0,
"persistence_mode": false,
"compute_mode": "Default",
"serial_number": "1655023034225",
"ecc_errors_single": 0,
"ecc_errors_double": 0
},
{
"index": 6,
"name": "NVIDIA H100 80GB HBM3",
"uuid": "GPU-225f6f3c-6fef-d1e2-5428-d90f665fb3d3",
"pci_bus_id": "00000000:BA:00.0",
"pcie_link_gen": 5,
"pcie_link_width": 16,
"vram_total_mb": 81559,
"vram_used_mb": 0,
"vram_free_mb": 81079,
"power_draw": 70.46,
"power_limit": 700.0,
"clock_sm": 345,
"clock_mem": 2619,
"temperature": 25,
"fan_speed": 0,
"persistence_mode": false,
"compute_mode": "Default",
"serial_number": "1654923078278",
"ecc_errors_single": 0,
"ecc_errors_double": 0
},
{
"index": 7,
"name": "NVIDIA H100 80GB HBM3",
"uuid": "GPU-79aeb6a8-c00c-6edb-956f-779ef56950a3",
"pci_bus_id": "00000000:DB:00.0",
"pcie_link_gen": 5,
"pcie_link_width": 16,
"vram_total_mb": 81559,
"vram_used_mb": 0,
"vram_free_mb": 81079,
"power_draw": 71.76,
"power_limit": 700.0,
"clock_sm": 345,
"clock_mem": 2619,
"temperature": 24,
"fan_speed": 0,
"persistence_mode": false,
"compute_mode": "Default",
"serial_number": "1654024031464",
"ecc_errors_single": 0,
"ecc_errors_double": 0
}
],
"topology": "\t\u001b[4mGPU0\tGPU1\tGPU2\tGPU3\tGPU4\tGPU5\tGPU6\tGPU7\tNIC0\tNIC1\tNIC2\tNIC3\tNIC4\tNIC5\tNIC6\tNIC7\tNIC8\tNIC9\tCPU Affinity\tNUMA Affinity\tGPU NUMA ID\u001b[0m\nGPU0\t X \tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\tPIX\tNODE\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t0-55,112-167\t0\t\tN/A\nGPU1\tNV18\t X \tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\tNODE\tPIX\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t0-55,112-167\t0\t\tN/A\nGPU2\tNV18\tNV18\t X \tNV18\tNV18\tNV18\tNV18\tNV18\tNODE\tNODE\tPIX\tPIX\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t0-55,112-167\t0\t\tN/A\nGPU3\tNV18\tNV18\tNV18\t X \tNV18\tNV18\tNV18\tNV18\tNODE\tNODE\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t0-55,112-167\t0\t\tN/A\nGPU4\tNV18\tNV18\tNV18\tNV18\t X \tNV18\tNV18\tNV18\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tPIX\tNODE\tNODE\tNODE\t56-111,168-223\t1\t\tN/A\nGPU5\tNV18\tNV18\tNV18\tNV18\tNV18\t X \tNV18\tNV18\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tPIX\tNODE\tNODE\t56-111,168-223\t1\t\tN/A\nGPU6\tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\t X \tNV18\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\tPIX\t56-111,168-223\t1\t\tN/A\nGPU7\tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\tNV18\t X \tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tNODE\tNODE\t56-111,168-223\t1\t\tN/A\nNIC0\tPIX\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t X \tNODE\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC1\tNODE\tPIX\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\t X \tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC2\tNODE\tNODE\tPIX\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\t X \tPIX\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC3\tNODE\tNODE\tPIX\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\t X \tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC4\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tNODE\tNODE\t X \tPIX\tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC5\tNODE\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tNODE\tNODE\tPIX\t X \tSYS\tSYS\tSYS\tSYS\t\t\t\t\nNIC6\tSYS\tSYS\tSYS\tSYS\tPIX\tNODE\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\t X \tNODE\tNODE\tNODE\t\t\t\t\nNIC7\tSYS\tSYS\tSYS\tSYS\tNODE\tPIX\tNODE\tNODE\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\t X \tNODE\tNODE\t\t\t\t\nNIC8\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\tNODE\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\t X \tPIX\t\t\t\t\nNIC9\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\tNODE\tSYS\tSYS\tSYS\tSYS\tSYS\tSYS\tNODE\tNODE\tPIX\t X \t\t\t\t\n\nLegend:\n\n X = Self\n SYS = Connection traversing PCIe as well as the SMP interconnect between NUMA nodes (e.g., QPI/UPI)\n NODE = Connection traversing PCIe as well as the interconnect between PCIe Host Bridges within a NUMA node\n PHB = Connection traversing PCIe as well as a PCIe Host Bridge (typically the CPU)\n PXB = Connection traversing multiple PCIe bridges (without traversing the PCIe Host Bridge)\n PIX = Connection traversing at most a single PCIe bridge\n NV# = Connection traversing a bonded set of # NVLinks\n\nNIC Legend:\n\n NIC0: mlx5_0\n NIC1: mlx5_1\n NIC2: mlx5_2\n NIC3: mlx5_3\n NIC4: mlx5_4\n NIC5: mlx5_5\n NIC6: mlx5_6\n NIC7: mlx5_7\n NIC8: mlx5_8\n NIC9: mlx5_9\n\n",
"timestamp": "2026-05-22T15:26:34.187409",
"detected_gpu_type": "h100",
"gpu_label": "H100 SXM5"
},
"memory_bench": {
"memory": {
"source": "pytorch",
"h2d_bandwidth_gbps": 11.8,
"d2h_bandwidth_gbps": 9.9,
"d2d_bandwidth_gbps": 829.1,
"peak_bandwidth_gbps": 3400,
"efficiency_pct": 24.4,
"test_sizes_mb": [
1,
4,
16,
64,
256,
1024,
4096
],
"bandwidth_by_size": {
"1": {
"h2d_gbps": 3.8,
"d2h_gbps": 1.4,
"d2d_gbps": 40.6
},
"4": {
"h2d_gbps": 7.6,
"d2h_gbps": 9.9,
"d2d_gbps": 141.5
},
"16": {
"h2d_gbps": 11.0,
"d2h_gbps": 1.9,
"d2d_gbps": 450.3
},
"64": {
"h2d_gbps": 11.8,
"d2h_gbps": 1.4,
"d2d_gbps": 726.5
},
"256": {
"h2d_gbps": 9.0,
"d2h_gbps": 1.4,
"d2d_gbps": 793.8
},
"1024": {
"h2d_gbps": 5.5,
"d2h_gbps": 1.4,
"d2d_gbps": 821.2
},
"4096": {
"h2d_gbps": 5.9,
"d2h_gbps": 1.4,
"d2d_gbps": 829.1
}
},
"per_gpu": []
}
},
"compute_bench": {
"compute": {
"per_dtype_tflops": {
"fp32": 52.0,
"tf32": 362.3,
"fp16": 691.0,
"bf16": 713.0,
"fp8": 1148.8
},
"peak_tflops": {
"fp32": 67,
"tf32": 495,
"fp16": 990,
"bf16": 990,
"fp8": 1979
},
"efficiency_pct": {
"fp32": 77.6,
"tf32": 73.2,
"fp16": 69.8,
"bf16": 72.0,
"fp8": 58.0
},
"pass_thresholds_tflops": {
"fp32": 54,
"tf32": 444,
"fp16": 734,
"bf16": 745,
"fp8": 1400
},
"per_gpu": [
{
"index": 0,
"fp32": 52.0,
"tf32": 362.3,
"fp16": 691.0,
"bf16": 713.0,
"fp8": 1148.8
}
],
"matrix_size": 8192,
"warmup": 50,
"iterations": 500
}
}
}