Skip to content

Commit 2aa0db7

Browse files
authored
[Diffusion] [NPU] Fix CI run (#18921)
1 parent 8bb1037 commit 2aa0db7

File tree

4 files changed

+9
-9
lines changed

4 files changed

+9
-9
lines changed

.github/workflows/pr-test-npu.yml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -28,9 +28,9 @@ jobs:
28 28
check-changes:
29 29
runs-on: ubuntu-latest
30 30
outputs:
31-
changes_exist: ${{ steps.filter.outputs.main_package || steps.filter.outputs.multimodal_gen || steps.run-mode.outputs.run_all_tests}}
32-
main_package: ${{ steps.filter.outputs.main_package || steps.run-mode.outputs.run_all_tests }}
33-
multimodal_gen: ${{ steps.filter.outputs.multimodal_gen || steps.run-mode.outputs.run_all_tests }}
31+
changes_exist: ${{ steps.filter.outputs.main_package == 'true' || steps.filter.outputs.multimodal_gen == 'true' || steps.run-mode.outputs.run_all_tests == 'true'}}
32+
main_package: ${{ steps.filter.outputs.main_package == 'true' || steps.run-mode.outputs.run_all_tests == 'true' }}
33+
multimodal_gen: ${{ steps.filter.outputs.multimodal_gen == 'true' || steps.run-mode.outputs.run_all_tests == 'true' }}
34 34
steps:
35 35
- name: Checkout code
36 36
uses: actions/checkout@v4

python/sglang/multimodal_gen/runtime/managers/gpu_worker.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -154,8 +154,8 @@ def do_mem_analysis(self, output_batch: OutputBatch):
154 154
output_batch.timings.record_memory_snapshot("mem_analysis", final_snapshot)
155 155

156 156
# for details on max_memory_reserved: https://docs.pytorch.org/docs/stable/generated/torch.cuda.memory.max_memory_reserved.html
157-
peak_reserved_bytes = torch.cuda.max_memory_reserved()
158-
peak_allocated_bytes = torch.cuda.max_memory_allocated()
157+
peak_reserved_bytes = torch.get_device_module().max_memory_reserved()
158+
peak_allocated_bytes = torch.get_device_module().max_memory_allocated()
159 159

160 160
output_batch.peak_memory_mb = peak_reserved_bytes / (1024**2)
161 161
peak_reserved_gb = peak_reserved_bytes / (1024**3)

python/sglang/multimodal_gen/test/server/ascend/perf_baselines_npu.json

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -17,9 +17,9 @@
17 17
"per_frame_generation": null
18 18
},
19 19
"denoise_step_ms": {
20-
"0": 195.27,
21-
"1": 329.05,
22-
"2": 545.43,
20+
"0": 364.97,
21+
"1": 542.66,
22+
"2": 542.1,
23 23
"3": 541.3,
24 24
"4": 537.07,
25 25
"5": 537.21,

python/sglang/multimodal_gen/test/server/ascend/testcase_configs_npu.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -12,7 +12,7 @@
12 12
DiffusionServerArgs(
13 13
model_path="/root/.cache/modelscope/hub/models/Wan-AI/Wan2.1-T2V-1.3B-Diffusers",
14 14
modality="video",
15-
warmup=0,
15+
warmup=True,
16 16
custom_validator="video",
17 17
),
18 18
DiffusionSamplingParams(

0 commit comments

Comments
 (0)