Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
14 changes: 7 additions & 7 deletions sagemaker-serve/src/sagemaker/serve/model_builder_servers.py
Comment thread
aviruthen marked this conversation as resolved.
Copy link
Copy Markdown
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Nice, only one more failed unit test! Can you resolve this error too? The failed sagemaker-core integration tests are again unrelated!

FAILED tests/unit/test_model_builder_servers_hf_model_id.py::TestBuildForTransformersHfModelId::test_preserves_with_inference_spec - FileNotFoundError: [Errno 2] No such file or directory: '/tmp/test_model_path/code/serve.pkl'

Original file line number Diff line number Diff line change
Expand Up @@ -136,7 +136,7 @@ def _build_for_torchserve(self) -> Model:
if isinstance(self.model, str):
# Configure HuggingFace model support
if not self._is_jumpstart_model_id():
self.env_vars.update({"HF_MODEL_ID": self.model})
self.env_vars.setdefault("HF_MODEL_ID", self.model)
Comment thread
aviruthen marked this conversation as resolved.

# Add HuggingFace token if available
if self.env_vars.get("HUGGING_FACE_HUB_TOKEN"):
Expand Down Expand Up @@ -212,7 +212,7 @@ def _build_for_tgi(self) -> Model:

if isinstance(self.model, str) and not self._is_jumpstart_model_id():
# Configure HuggingFace model for TGI
self.env_vars.update({"HF_MODEL_ID": self.model})
self.env_vars.setdefault("HF_MODEL_ID", self.model)

self.hf_model_config = _get_model_config_properties_from_hf(
self.model, self.env_vars.get("HUGGING_FACE_HUB_TOKEN")
Expand Down Expand Up @@ -320,7 +320,7 @@ def _build_for_djl(self) -> Model:

if isinstance(self.model, str) and not self._is_jumpstart_model_id():
# Configure HuggingFace model for DJL
self.env_vars.update({"HF_MODEL_ID": self.model})
self.env_vars.setdefault("HF_MODEL_ID", self.model)

# Get model configuration for DJL optimization
self.hf_model_config = _get_model_config_properties_from_hf(
Expand Down Expand Up @@ -426,7 +426,7 @@ def _build_for_triton(self) -> Model:
self.env_vars.update({"HF_TASK": model_task})

# Configure HuggingFace authentication
self.env_vars.update({"HF_MODEL_ID": self.model})
self.env_vars.setdefault("HF_MODEL_ID", self.model)
if self.env_vars.get("HUGGING_FACE_HUB_TOKEN"):
self.env_vars["HF_TOKEN"] = self.env_vars.get("HUGGING_FACE_HUB_TOKEN")

Expand Down Expand Up @@ -532,7 +532,7 @@ def _build_for_tei(self) -> Model:

if isinstance(self.model, str) and not self._is_jumpstart_model_id():
# Configure HuggingFace model for TEI
self.env_vars.update({"HF_MODEL_ID": self.model})
self.env_vars.setdefault("HF_MODEL_ID", self.model)

self.hf_model_config = _get_model_config_properties_from_hf(
self.model, self.env_vars.get("HUGGING_FACE_HUB_TOKEN")
Expand Down Expand Up @@ -676,7 +676,7 @@ def _build_for_transformers(self) -> Model:
if self.inference_spec is not None:
hf_model_id = self.inference_spec.get_model()
if isinstance(hf_model_id, str): # Only if it's a valid HF model ID
self.env_vars.update({"HF_MODEL_ID": hf_model_id})
self.env_vars.setdefault("HF_MODEL_ID", hf_model_id)
# Get HF config only for string model IDs
if hasattr(self.env_vars, "HF_API_TOKEN"):
self.hf_model_config = _get_model_config_properties_from_hf(
Expand All @@ -695,7 +695,7 @@ def _build_for_transformers(self) -> Model:
if model_task:
self.env_vars.update({"HF_TASK": model_task})

self.env_vars.update({"HF_MODEL_ID": self.model})
self.env_vars.setdefault("HF_MODEL_ID", self.model)

# Add HuggingFace token if available
if self.env_vars.get("HUGGING_FACE_HUB_TOKEN"):
Expand Down
Loading
Loading