File tree Expand file tree Collapse file tree 1 file changed +4
-2
lines changed Expand file tree Collapse file tree 1 file changed +4
-2
lines changed Original file line number Diff line number Diff line change @@ -75,6 +75,9 @@ def __init__(
75
75
vllm_config .model_config )
76
76
77
77
self .attn_metadata_builder : Optional [AttentionMetadataBuilder ] = None
78
+ self .draft_indexer_metadata_builder : Optional [AttentionMetadataBuilder ] = None
79
+ self .attn_layer_names : list [str ] = []
80
+ self .indexer_layer_names : list [str ] = []
78
81
79
82
self .use_cuda_graph = (not current_platform .is_xpu ()
80
83
and self .vllm_config .compilation_config .level
@@ -214,8 +217,7 @@ def propose(
214
217
self .runner .attn_groups [0 ][0 ].metadata_builders [ubatch_id ]
215
218
attn_metadata = attn_metadata_builder .build_for_drafting (
216
219
common_attn_metadata = common_attn_metadata , draft_index = 0 )
217
- # FIXME: support hybrid kv for draft model (remove separate indexer)
218
- if self .draft_indexer_metadata_builder :
220
+ if getattr (self , "draft_indexer_metadata_builder" , None ):
219
221
draft_indexer_metadata = (
220
222
self .draft_indexer_metadata_builder .build_for_drafting (
221
223
common_attn_metadata = common_attn_metadata ,
You can’t perform that action at this time.
0 commit comments