diff --git a/open-models/serving/vertex_ai_tgi_gemma_multi_lora_adapters_deployment.ipynb b/open-models/serving/vertex_ai_tgi_gemma_multi_lora_adapters_deployment.ipynb index 2f68245d2e0..d7796eaf93b 100644 --- a/open-models/serving/vertex_ai_tgi_gemma_multi_lora_adapters_deployment.ipynb +++ b/open-models/serving/vertex_ai_tgi_gemma_multi_lora_adapters_deployment.ipynb @@ -1162,7 +1162,7 @@ "model = Model.upload(\n", " display_name=\"google--gemma2-tgi-multi-lora-model\",\n", " artifact_uri=str(serve_uri),\n", - " serving_container_image_uri=\"us-docker.pkg.dev/deeplearning-platform-release/gcr.io/huggingface-text-generation-inference-cu124.2-3.ubuntu2204.py311\",\n", + " serving_container_image_uri=\"us-docker.pkg.dev/deeplearning-platform-release/gcr.io/huggingface-pytorch-inference-cu121.2-3.transformers.4-46.ubuntu2204.py311\",\n", " serving_container_ports=[8080],\n", " serving_container_environment_variables={\n", " \"HUGGING_FACE_HUB_TOKEN\": get_token(),\n",