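Fix dataclass: add the missing `float` type annotation to `gpu_memory_utilization` so it is treated as a dataclass field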

octoml · masahi · Feb 23, 2024 · Feb 21, 2024 · Feb 21, 2024 · Feb 22, 2024
commit 48af6d5b263b26b86750bc650d136188bfd316ab
diff --git a/serve/mlc_serve/engine/base.py b/serve/mlc_serve/engine/base.py
@@ -36,7 +36,7 @@ class MLCServeEngineConfig:
     init_timeout: int = 120
     model_type: str = "tvm"  # "tvm", "torch"
     num_shards: Optional[int] = None  # Need to be specified for if model_type is "torch"
-    gpu_memory_utilization=0.9
+    gpu_memory_utilization: float = 0.9
 
     @classmethod
     def _from_json(config_cls, json_obj: Dict[Any, Any]):