We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent dcc63dc, commit 5d185ef (Copy full SHA for 5d185ef)
python/sglang/srt/dllm/mixin/scheduler.py
@@ -192,6 +192,18 @@ def _create_dllm_batch(
192
new_batch.prepare_for_extend()
193
new_batch.forward_mode = forward_mode
194
new_batch.decoding_reqs = None
195
+
196
+ # Record prefill stats for logging after forward
197
+ from sglang.srt.managers.scheduler_metrics_mixin import PrefillStats
198
199
+ new_batch.prefill_stats = PrefillStats(
200
+ log_input_tokens=self.adder.log_input_tokens,
201
+ log_hit_tokens=self.adder.log_hit_tokens,
202
+ new_token_ratio=self.adder.new_token_ratio,
203
+ running_bs=len(self.running_batch.reqs),
204
+ num_new_seqs=len(can_run_list),
205
+ )
206
207
return new_batch
208
209
def process_dllm_incoming_reqs(
0 commit comments