Skip to content

Commit f6ad5a1

Browse files
committed
[Refactor] [1/N] to simplify the vLLM serving architecture
Signed-off-by: chaunceyjiang <[email protected]>
1 parent 063e5a8 commit f6ad5a1

File tree

4 files changed, with 3 additions (+3) and 3 deletions (-3).

vllm/entrypoints/openai/api_server.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -82,7 +82,7 @@
82 | 82 |   from vllm.entrypoints.serve.elastic_ep.middleware import (
83 | 83 |       ScalingMiddleware,
84 | 84 |   )
85 |    | - from vllm.entrypoints.serve.tokenize.protocol import OpenAIServingTokenization
   | 85 | + from vllm.entrypoints.serve.tokenize.serving import OpenAIServingTokenization
86 | 86 |   from vllm.entrypoints.tool_server import DemoToolServer, MCPToolServer, ToolServer
87 | 87 |   from vllm.entrypoints.utils import (
88 | 88 |       cli_env_setup,

vllm/entrypoints/serve/disagg/api_router.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -21,7 +21,7 @@
21 | 21 |   from vllm.entrypoints.serve.disagg.serving import (
22 | 22 |       ServingTokens,
23 | 23 |   )
24 |    | - from vllm.entrypoints.serve.tokenize.protocol import OpenAIServingTokenization
   | 24 | + from vllm.entrypoints.serve.tokenize.serving import OpenAIServingTokenization
25 | 25 |   from vllm.entrypoints.utils import (
26 | 26 |       load_aware_call,
27 | 27 |       with_cancellation,

vllm/entrypoints/serve/tokenize/api_router.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,7 @@
17 | 17 |       TokenizeRequest,
18 | 18 |       TokenizeResponse,
19 | 19 |   )
20 |    | - from vllm.entrypoints.serve.tokenize.protocol import OpenAIServingTokenization
   | 20 | + from vllm.entrypoints.serve.tokenize.serving import OpenAIServingTokenization
21 | 21 |   from vllm.entrypoints.utils import (
22 | 22 |       with_cancellation,
23 | 23 |   )

0 commit comments

Comments
 (0)