File tree: 1 file changed, +2 -2 lines changed
python/sglang/srt/layers/attention: 1 file changed, +2 -2 lines changed
Columns: original file line number | diff line number | diff line change
@@ -535,7 +535,7 @@ def _replay_metadata(
535 535 self.query_start_loc_list[bs - 1][: bs - num_padding].copy_(
536 536 self.cached_cuda_graph_decode_query_start_loc[: bs - num_padding]
537 537 )
538 - self.query_start_loc_list[bs - 1][bs - num_padding :].copy_(
538 + self.query_start_loc_list[bs - 1][bs - num_padding :].fill_(
539 539 bs - num_padding
540 540 )
541 541 elif forward_mode.is_target_verify():
@@ -547,7 +547,7 @@ def _replay_metadata(
547 547 self.query_start_loc_list[bs - 1][: bs - num_padding].copy_(
548 548 self.cached_cuda_graph_verify_query_start_loc[: bs - num_padding]
549 549 )
550 - self.query_start_loc_list[bs - 1][bs - num_padding :].copy_(
550 + self.query_start_loc_list[bs - 1][bs - num_padding :].fill_(
551 551 (bs - num_padding) * spec_info.draft_token_num
552 552 )
553 553 else:
You can’t perform that action at this time.
0 commit comments