1 file changed: +2 -4 lines changed
Original file line number | Diff line number | Diff line change
@@ -2317,15 +2317,13 @@ def _dummy_run(
2317
2317
2318
2318
# If force_attention is True, we always capture attention. Otherwise,
2319
2319
# it only happens for cudagraph_runtime_mode=FULL.
2320
- if force_attention or cudagraph_runtime_mode == \
2321
- CUDAGraphMode .FULL :
2320
+ if force_attention or cudagraph_runtime_mode == CUDAGraphMode .FULL :
2322
2321
attn_metadata = {}
2323
2322
2324
2323
# Make sure max_model_len is used at the graph capture time.
2325
2324
self .seq_lens_np [:num_reqs ] = self .max_model_len
2326
2325
self .seq_lens_np [num_reqs :] = 0
2327
- self .seq_lens [:num_reqs ].copy_ (self .seq_lens_cpu [:num_reqs ],
2328
- non_blocking = True )
2326
+ self .seq_lens .copy_ (self .seq_lens_cpu , non_blocking = True )
2329
2327
2330
2328
for kv_cache_group_id , kv_cache_group_spec in enumerate (
2331
2329
self .kv_cache_config .kv_cache_groups ):
You can’t perform that action at this time.
0 commit comments