Add device limit for B200 GPU (#207)

zhxchen17 · web-flow · commit ea2a7d637818 · 2025-10-23T20:16:54.000+02:00
diff --git a/autoparallel/compute_estimation.py b/autoparallel/compute_estimation.py
@@ -76,6 +76,21 @@ class DeviceLimit:
             torch.int8: 3958 // 2,
         },
     ),
+    DeviceLimit(
+        "B200",
+        "https://nvdam.widen.net/s/wwnsxrhm2w/blackwell-datasheet-3384703",
+        sm=(10, 0),
+        gmem_bandwidth=7.7 * (1024**4),
+        gemm_tflops={
+            torch.float64: 37,
+            # NOTE: NVIDIA quotes the numbers below "with 2:4 sparsity",
+            # but we want the dense (full) GEMM numbers, hence the `// 2`
+            torch.float32: 2200 // 2,
+            torch.float16: 4500 // 2,
+            torch.bfloat16: 4500 // 2,
+            torch.int8: 9000 // 2,
+        },
+    ),
     DeviceLimit(
         "A100",
         "https://www.nvidia.com/content/dam/en-zz/Solutions/Data-Center/a100/pdf/nvidia-a100-datasheet-us-nvidia-1758950-r4-web.pdf",