[V1] Move usage stats to worker and start logging TPU hardware #16211

Merged Apr 25, 2025 · 58 commits
Changes from 13 commits
f9d82ea
Track TPU usages in vLLM's data dashboards
dyli-google Mar 27, 2025
731b68a
Merge branch 'vllm-project:main' into main
dyli-google Mar 27, 2025
d2d9b9e
Make the code more robust
dyli-google Mar 27, 2025
f168647
Merge branch 'main' of https://github.com/dyli-google/vllm
dyli-google Mar 27, 2025
ee00cf7
Merge branch 'vllm-project:main' into main
dyli-google Apr 7, 2025
39d610f
Your descriptive message about the changes you made
dyli-google Apr 7, 2025
558c60f
format
dyli-google Apr 7, 2025
639f77b
use new API
dyli-google Apr 7, 2025
d5e7533
Merge branch 'vllm-project:main' into main
dyli-google Apr 7, 2025
d9b9d61
Merge branch 'vllm-project:main' into main
dyli-google Apr 7, 2025
8f055c9
address Simon's comments
dyli-google Apr 7, 2025
63bea36
Silence ImportError
dyli-google Apr 7, 2025
25fa30b
Merge branch 'vllm-project:main' into main
dyli-google Apr 8, 2025
8124c99
Merge branch 'vllm-project:main' into main
dyli-google Apr 9, 2025
6a4eea4
Use torch_xla.tpu.get_tpu_type() to get TPU version
dyli-google Apr 9, 2025
ae2f5a6
Merge branch 'vllm-project:main' into main
dyli-google Apr 10, 2025
5d2f2b6
Merge branch 'vllm-project:main' into main
dyli-google Apr 11, 2025
9b3a67c
Merge branch 'vllm-project:main' into main
dyli-google Apr 14, 2025
35fb26b
Merge branch 'vllm-project:main' into main
dyli-google Apr 14, 2025
b0912f0
Merge branch 'vllm-project:main' into main
dyli-google Apr 20, 2025
88dd6c6
Merge branch 'vllm-project:main' into main
dyli-google Apr 22, 2025
727bed5
Add usage to more engines
dyli-google Apr 22, 2025
4f94631
Merge branch 'vllm-project:main' into main
dyli-google Apr 22, 2025
619e496
fix error
dyli-google Apr 22, 2025
a1ae7ff
format
dyli-google Apr 23, 2025
1667fab
Merge branch 'vllm-project:main' into main
dyli-google Apr 23, 2025
9f725f6
Revert "format"
dyli-google Apr 23, 2025
b17dbc9
format
dyli-google Apr 23, 2025
5286466
Merge branch 'vllm-project:main' into main
dyli-google Apr 23, 2025
3bd0c9b
Use import torch_xla
dyli-google Apr 23, 2025
625d21c
Merge branch 'main' of https://github.com/dyli-google/vllm
dyli-google Apr 23, 2025
718729a
format
dyli-google Apr 23, 2025
6e61fba
format
dyli-google Apr 23, 2025
737646d
format
dyli-google Apr 23, 2025
0e093cc
Merge branch 'vllm-project:main' into main
dyli-google Apr 23, 2025
9940dad
Merge branch 'vllm-project:main' into main
dyli-google Apr 23, 2025
f825349
Try Qiliang's idea
dyli-google Apr 23, 2025
7798bde
Merge branch 'vllm-project:main' into main
dyli-google Apr 23, 2025
bbd7f5a
Use Yarong's 2nd idea
dyli-google Apr 24, 2025
5bf9f34
Merge branch 'main' into main
dyli-google Apr 24, 2025
4e38e67
revert vllm/engine/async_llm_engine.py
dyli-google Apr 24, 2025
fc18a7a
simplify code
dyli-google Apr 24, 2025
cf7997a
simplify
dyli-google Apr 24, 2025
3bd5730
fix typo
dyli-google Apr 24, 2025
4374c3c
format
dyli-google Apr 24, 2025
6829371
simplify
dyli-google Apr 24, 2025
3c55fc7
silence error
dyli-google Apr 24, 2025
bbee546
Suppress all exceptions
dyli-google Apr 24, 2025
429b6aa
format
dyli-google Apr 24, 2025
8939235
remove comment
dyli-google Apr 24, 2025
bc284db
Merge branch 'vllm-project:main' into main
dyli-google Apr 24, 2025
bac067a
report usage of TPU and GPU during worker init time
dyli-google Apr 24, 2025
3ad33a2
remove useless import
dyli-google Apr 24, 2025
5b0ab6d
format
dyli-google Apr 24, 2025
1f592e4
Merge branch 'vllm-project:main' into main
dyli-google Apr 24, 2025
98e7ae0
Merge branch 'vllm-project:main' into main
dyli-google Apr 24, 2025
689d343
Merge branch 'vllm-project:main' into main
dyli-google Apr 25, 2025
4eea0a9
Merge branch 'vllm-project:main' into main
dyli-google Apr 25, 2025
9 changes: 9 additions & 0 deletions vllm/usage/usage_lib.py
@@ -174,6 +174,15 @@ def _report_usage_once(self, model_architecture: str,
             self.gpu_memory_per_device = device_property.total_memory
         if current_platform.is_cuda():
             self.cuda_runtime = torch.version.cuda
+        if current_platform.is_tpu():
+            try:
+                import torch_xla.runtime as xr
+                from torch_xla.core import xla_model as xm
+                self.gpu_count = xr.world_size()
+                self.gpu_type = xm.xla_device_hw(xm.xla_device())
+                self.gpu_memory_per_device = xm.get_memory_info().bytes_limit
Collaborator: xm.xla_device_hw(xm.xla_device()) returns TPU as the result. Or do we want something like v6e, v5e?

Contributor Author: @yarongmu-google @simon-mo What do you think? I believe TPU should be OK?

Collaborator: A version number will be useful.

Contributor Author: Thanks Simon. @yaochengji Do we have a way to get the version number?

Collaborator: You can use torch_xla.tpu.get_tpu_type()

Contributor Author: Cool, thanks. I just updated the code to use torch_xla.tpu.get_tpu_type()
+            except ImportError:
+                pass
         self.provider = _detect_cloud_provider()
         self.architecture = platform.machine()
         self.platform = platform.platform()
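The review thread converged on torch_xla.tpu.get_tpu_type() for the TPU generation, and a later commit ("Suppress all exceptions") broadened the error handling so usage reporting can never crash the worker. A minimal sketch of that best-effort lookup, assuming torch_xla exposes tpu.get_tpu_type() as discussed above; the helper name detect_tpu_hardware is illustrative and not part of vLLM's actual API:

```python
import contextlib


def detect_tpu_hardware():
    """Best-effort TPU generation lookup (e.g. 'v5e').

    Returns None when torch_xla is absent or the lookup fails for any
    reason; all exceptions are suppressed so usage logging stays
    non-fatal, mirroring the PR's "Suppress all exceptions" commit.
    """
    tpu_type = None
    with contextlib.suppress(Exception):
        import torch_xla.tpu as tpu  # only present on TPU installs
        tpu_type = tpu.get_tpu_type()
    return tpu_type
```

On a machine without torch_xla, detect_tpu_hardware() simply returns None rather than raising, which is the behavior the PR wants for opportunistic telemetry.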