Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
5 changes: 4 additions & 1 deletion docker/Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -593,5 +593,8 @@ ENTRYPOINT ["./sagemaker-entrypoint.sh"]

FROM vllm-openai-base AS vllm-openai

# Copy the launcher script with its executable mode set in the same layer.
# COPY --chmod avoids the extra layer a follow-up `RUN chmod +x` would create
# (requires BuildKit).
COPY --chmod=755 docker/entrypoint.sh .

# Exactly one ENTRYPOINT per stage: only the last one in a stage takes effect.
# The wrapper script execs `vllm serve` (optionally under standard-supervisor)
# and forwards the container arguments to it.
ENTRYPOINT ["./entrypoint.sh"]
#################### OPENAI API SERVER ####################
22 changes: 22 additions & 0 deletions docker/entrypoint.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,22 @@
#!/bin/bash
# Container launcher for `vllm serve`.
#
# All arguments given to this script are forwarded unchanged to `vllm serve`.
#
# The server can optionally be started under standard-supervisor (from
# github.com/aws/model-hosting-container-standards), which provides:
#   - process supervision and automatic restart
#   - conversion of environment variables to CLI arguments (VLLM_ARG_* -> --arg)
#   - graceful shutdown handling
#
# VLLM_USE_STANDARD_SUPERVISOR selects the launch mode:
#   "true"           -> run under standard-supervisor with all of its features
#   "false" (default) or any other value -> run `vllm serve` directly
# Possible future extension: selective feature flags such as
# "env-conversion-only".

# Abort on the first failing command.
set -o errexit

# Fall back to "false" when the variable is unset or empty.
: "${VLLM_USE_STANDARD_SUPERVISOR:=false}"

# `exec` replaces this shell, so the launched program takes over the process.
case "$VLLM_USE_STANDARD_SUPERVISOR" in
    true)
        # Supervised launch with every standard-supervisor feature enabled.
        exec standard-supervisor vllm serve "$@"
        ;;
    *)
        # Plain launch, no supervisor in front of the server.
        exec vllm serve "$@"
        ;;
esac
2 changes: 1 addition & 1 deletion requirements/common.txt
Original file line number Diff line number Diff line change
Expand Up @@ -50,4 +50,4 @@ ijson # Required for mistral streaming tool parser
setproctitle # Used to set process names for better debugging and monitoring
openai-harmony >= 0.0.3 # Required for gpt-oss
anthropic == 0.71.0
model-hosting-container-standards >= 0.1.9, < 1.0.0
model-hosting-container-standards >= 0.1.9, < 1.0.0 # Required for SageMaker integration