Add comment explaining in-place add requirement for symmetric memory

nvcastet · nvcastet · commit 5352aa10c377 · 2026-02-18T15:46:33.000-06:00
diff --git a/python/sglang/srt/models/qwen2_moe.py b/python/sglang/srt/models/qwen2_moe.py
@@ -324,6 +324,10 @@ def forward(
             final_hidden_states = self._forward_router_experts(hidden_states)
 
         if shared_output is not None:
+            # In-place add is required to keep final_hidden_states in the
+            # symmetric memory pool (when --enable-symm-mem is used).
+            # An out-of-place add would allocate a new tensor outside the
+            # symmetric memory pool, breaking subsequent symmetric collectives.
             final_hidden_states += shared_output
         if self.tp_size > 1 and not use_reduce_scatter:
             final_hidden_states = tensor_model_parallel_all_reduce(final_hidden_states)