Skip to content

Commit 5a458d3

Browse files
committed
feat: add MRoPE op and Qwen2.5-VL skeleton
1 parent 5890741 commit 5a458d3

File tree

7 files changed

+1037
-5
lines changed

7 files changed

+1037
-5
lines changed

python/mlc_llm/__init__.py

Lines changed: 27 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -3,11 +3,35 @@
33
MLC Chat is the app runtime of MLC LLM.
44
"""
55

6-
from tvm import register_func
6+
import logging
7+
import tvm
8+
9+
if hasattr(tvm, "register_func"):
10+
register_func = tvm.register_func # type: ignore[attr-defined]
11+
else: # pragma: no cover
12+
from tvm_ffi.registry import register_global_func as register_func # type: ignore
13+
14+
setattr(tvm, "register_func", register_func)
15+
16+
AsyncMLCEngine = None # type: ignore
17+
MLCEngine = None # type: ignore
18+
19+
try:
20+
from . import protocol as protocol # type: ignore
21+
except RuntimeError as err: # pragma: no cover
22+
logging.getLogger(__name__).debug("MLC-LLM protocol unavailable: %s", err)
23+
protocol = None # type: ignore
24+
25+
try:
26+
from . import serve as serve # type: ignore
27+
except RuntimeError as err: # pragma: no cover
28+
logging.getLogger(__name__).debug("MLC-LLM serve unavailable: %s", err)
29+
serve = None # type: ignore
30+
else:
31+
AsyncMLCEngine = serve.AsyncMLCEngine
32+
MLCEngine = serve.MLCEngine
733

8-
from . import protocol, serve
934
from .libinfo import __version__
10-
from .serve import AsyncMLCEngine, MLCEngine
1135

1236

1337
@register_func("runtime.disco.create_socket_session_local_workers", override=True)

python/mlc_llm/base.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -24,7 +24,7 @@ def _load_mlc_llm_lib():
2424
return ctypes.CDLL(lib_path[0]), lib_path[0]
2525

2626

27-
@tvm.register_func("mlc.debug_cuda_profiler_start")
27+
@tvm.register_func("mlc.debug_cuda_profiler_start", override=True)
2828
def _debug_cuda_profiler_start() -> None:
2929
"""Start cuda profiler."""
3030
import cuda # pylint: disable=import-outside-toplevel
@@ -33,7 +33,7 @@ def _debug_cuda_profiler_start() -> None:
3333
cuda.cudart.cudaProfilerStart() # pylint: disable=c-extension-no-member
3434

3535

36-
@tvm.register_func("mlc.debug_cuda_profiler_stop")
36+
@tvm.register_func("mlc.debug_cuda_profiler_stop", override=True)
3737
def _debug_cuda_profiler_stop() -> None:
3838
"""Stop cuda profiler."""
3939
import cuda # pylint: disable=import-outside-toplevel
Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
"\"\"\"Qwen2.5-VL architecture entry.\"\"\"\n+\n+from .qwen2_5_vl_model import ( # noqa: F401\n+ Qwen25VLConfig,\n+ Qwen25VLLMHeadModel,\n+)\n*** End Patch"/>

0 commit comments

Comments
 (0)