File tree Expand file tree Collapse file tree 3 files changed +6
-3
lines changed
tests/entrypoints/sagemaker Expand file tree Collapse file tree 3 files changed +6
-3
lines changed Original file line number Diff line number Diff line change @@ -497,5 +497,5 @@ ENTRYPOINT ["./sagemaker-entrypoint.sh"]
497497
498498FROM vllm-openai-base AS vllm-openai
499499
500- ENTRYPOINT ["vllm" , "serve" ]
500+ ENTRYPOINT ["standard-supervisor" , "vllm" , "serve" ]
501501# ################### OPENAI API SERVER ####################
Original file line number Diff line number Diff line change @@ -49,4 +49,4 @@ cbor2 # Required for cross-language serialization of hashable objects
4949setproctitle # Used to set process names for better debugging and monitoring
5050openai-harmony >= 0.0.3 # Required for gpt-oss
5151anthropic == 0.71.0
52- model-hosting-container-standards < 1.0.0
52+ model-hosting-container-standards >= 0.1.7, < 1.0.0 # Required for SageMaker integration
Original file line number Diff line number Diff line change @@ -46,7 +46,10 @@ def basic_server_with_lora(smollm2_lora_files):
4646 "64" ,
4747 ]
4848
49- envs = {"VLLM_ALLOW_RUNTIME_LORA_UPDATING" : "True" }
49+ envs = {
50+ "VLLM_ALLOW_RUNTIME_LORA_UPDATING" : "True" ,
51+ "SAGEMAKER_ENABLE_STATEFUL_SESSIONS" : "True" ,
52+ }
5053 with RemoteOpenAIServer (MODEL_NAME_SMOLLM , args , env_dict = envs ) as remote_server :
5154 yield remote_server
5255
You can’t perform that action at this time.
0 commit comments