-
Notifications
You must be signed in to change notification settings - Fork 3.6k
[rollout] chore: bump up trtllm image version to 1.3.0rc10 #5841
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
base: main
Are you sure you want to change the base?
Changes from 16 commits
1f97889
bcc4019
67e3889
ed9aedd
495766d
2ae5c3e
a95f3c3
c3c5123
559d20f
28810ce
4efee51
f58f143
132d4e1
096f77a
1eefcf5
029b394
522b7fa
af0fe9d
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -29,6 +29,11 @@ | |
| import ray | ||
| import torch | ||
| import torch.distributed as dist | ||
|
|
||
| try: | ||
| from tensorrt_llm.llmapi.llm_args import ExecutorMemoryType | ||
| except ImportError: | ||
| ExecutorMemoryType = None | ||
| from torch.distributed.device_mesh import DeviceMesh, init_device_mesh | ||
| from torch.multiprocessing.reductions import reduce_tensor | ||
|
|
||
|
|
@@ -260,16 +265,25 @@ async def update_weights(self, weights: dict[str, str]): | |
|
|
||
|
|
||
| class ServerAdapter(BaseRollout): | ||
| _WEIGHTS_TAGS = [ | ||
| "sampler", | ||
| "drafter", | ||
| "guided_decoder", | ||
| "spec_resource_manager", | ||
| "model_extra", | ||
| "executor_extra", | ||
| "model", | ||
| "draft_model", | ||
| ] | ||
| # All releasable/resumable weight tags: every ExecutorMemoryType except kv_cache | ||
| # (handled separately) and internal tags prefixed with "_". | ||
| # Fall back to a hard-coded list for trtllm versions that don't export ExecutorMemoryType. | ||
| _WEIGHTS_TAGS = ( | ||
| [t.value for t in ExecutorMemoryType if t is not ExecutorMemoryType.KV_CACHE and not t.value.startswith("_")] | ||
| if ExecutorMemoryType is not None | ||
| else [ | ||
| "sampler", | ||
| "drafter", | ||
| "guided_decoder", | ||
| "spec_resource_manager", | ||
| "model_extra", | ||
| "executor_extra", | ||
| "model", | ||
| "model_weights", | ||
|
||
| "draft_model", | ||
| "draft_model_weights", | ||
| ] | ||
| ) | ||
|
|
||
| @staticmethod | ||
| def get_full_tags() -> list[str]: | ||
|
|
||
Uh oh!
There was an error while loading. Please reload this page.