Skip to content

TurboQuant TQ4 KV cache compression for Qwen 3.5 MoE

94973a3
Select commit
Loading
Failed to load commit list.
Merged

TurboQuant TQ4 KV cache compression for Qwen 3.5 MoE #18687

TurboQuant TQ4 KV cache compression for Qwen 3.5 MoE
94973a3
Select commit
Loading
Failed to load commit list.
PyTorch Bot / Dr.CI completed Apr 5, 2026 in 0s

Dr.CI classification results

{"FAILED":[{"workflowId":23990279264,"workflowUniqueId":69064392,"id":69968661115,"runnerName":"GitHub Actions 1013453707","authorEmail":"mnachin@meta.com","name":"Lint / lintrunner-mypy","jobName":"lintrunner-mypy","conclusion":"failure","completed_at":"2026-04-05T00:01:09.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/23990279264/job/69968661115","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/69968661115","head_branch":"mergennachin/turboquant","pr_number":18687,"head_sha":"94973a3437ce742c733bb7d97f6701c524a55bc7","head_sha_timestamp":"2026-04-04T23:56:40.000000000Z","failure_captures":[">>> Lint for backends/arm/test/modules/test_static_cache.py:"],"failure_lines":[">>> Lint for backends/arm/test/modules/test_static_cache.py:"],"failure_context":[],"time":"2026-04-04T23:58:04.000000000Z"},{"workflowId":23990279403,"workflowUniqueId":63454257,"id":69968690369,"runnerName":"i-05ae668f99a28b4e5","authorEmail":"mnachin@meta.com","name":"pull / unittest / macos / macos-job","jobName":"unittest / macos / macos-job","conclusion":"failure","completed_at":"2026-04-05T00:30:44.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/23990279403/job/69968690369","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/69968690369","head_branch":"mergennachin/turboquant","pr_number":18687,"head_sha":"94973a3437ce742c733bb7d97f6701c524a55bc7","head_sha_timestamp":"2026-04-04T23:56:40.000000000Z","failure_captures":["export/tests/test_target_recipes.py::TestTargetRecipes::test_mv3_model"],"failure_lines":["FAILED export/tests/test_target_recipes.py::TestTargetRecipes::test_mv3_model - AssertionError: Model 'mv3' Recipe: ios-arm64-coreml-fp16, tolerance check failed"],"failure_context":[],"time":"2026-04-04T23:59:00.000000000Z"},{"workflowId":23990279417,"workflowUniqueId":71492439,"id":69968760750,"runnerName":"i-06ff69a70c80933fc","authorEmail":"mnachin@meta.com","name":"trunk / unittest-release / macos / macos-job","jobName":"unittest-release / macos / macos-job","conclusion":"failure","completed_at":"2026-04-05T00:33:10.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/23990279417/job/69968760750","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/69968760750","head_branch":"mergennachin/turboquant","pr_number":18687,"head_sha":"94973a3437ce742c733bb7d97f6701c524a55bc7","head_sha_timestamp":"2026-04-04T23:56:40.000000000Z","failure_captures":["export/tests/test_target_recipes.py::TestTargetRecipes::test_mv3_model"],"failure_lines":["FAILED export/tests/test_target_recipes.py::TestTargetRecipes::test_mv3_model - AssertionError: Model 'mv3' Recipe: ios-arm64-coreml-fp16, tolerance check failed"],"failure_context":[],"time":"2026-04-05T00:00:42.000000000Z"},{"workflowId":23990279417,"workflowUniqueId":71492439,"id":69968760499,"runnerName":"i-0444b5e92ef3ef806","authorEmail":"mnachin@meta.com","name":"trunk / test-arm-backend-ethos-u (test_memory_allocation) / linux-job","jobName":"test-arm-backend-ethos-u (test_memory_allocation) / linux-job","conclusion":"failure","completed_at":"2026-04-05T00:10:03.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/23990279417/job/69968760499","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/69968760499","head_branch":"mergennachin/turboquant","pr_number":18687,"head_sha":"94973a3437ce742c733bb7d97f6701c524a55bc7","head_sha_timestamp":"2026-04-04T23:56:40.000000000Z","failure_captures":["RuntimeError: Command docker exec -t 44e3c9967bf775dc010c4bfd2569ceea5bc0caa527bc07b1df9c489a78db6474 /exec failed with exit code 92"],"failure_lines":["RuntimeError: Command docker exec -t 44e3c9967bf775dc010c4bfd2569ceea5bc0caa527bc07b1df9c489a78db6474 /exec failed with exit code 92"],"failure_context":[],"time":"2026-04-05T00:00:41.000000000Z"}],"FLAKY":[],"BROKEN_TRUNK":[{"workflowId":23990279403,"workflowUniqueId":63454257,"id":69968690372,"runnerName":"i-07cd6e7cbfd2d369f","authorEmail":"mnachin@meta.com","name":"pull / unittest / windows / windows-job","jobName":"unittest / windows / windows-job","conclusion":"cancelled","completed_at":"2026-04-05T02:00:26.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/23990279403/job/69968690372","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/69968690372","head_branch":"mergennachin/turboquant","pr_number":18687,"head_sha":"94973a3437ce742c733bb7d97f6701c524a55bc7","head_sha_timestamp":"2026-04-04T23:56:40.000000000Z","failure_captures":["##[error]The operation was canceled."],"failure_lines":["##[error]The operation was canceled."],"failure_context":[],"time":"2026-04-04T23:59:00.000000000Z"},{"workflowId":23990279403,"workflowUniqueId":63454257,"id":69968690258,"runnerName":"i-06797cf4394c11577","authorEmail":"mnachin@meta.com","name":"pull / unittest-editable / windows / windows-job","jobName":"unittest-editable / windows / windows-job","conclusion":"cancelled","completed_at":"2026-04-05T02:00:22.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/23990279403/job/69968690258","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/69968690258","head_branch":"mergennachin/turboquant","pr_number":18687,"head_sha":"94973a3437ce742c733bb7d97f6701c524a55bc7","head_sha_timestamp":"2026-04-04T23:56:40.000000000Z","failure_captures":["##[error]The operation was canceled."],"failure_lines":["##[error]The operation was canceled."],"failure_context":[],"time":"2026-04-04T23:59:00.000000000Z"},{"workflowId":23990279417,"workflowUniqueId":71492439,"id":69968760760,"runnerName":"i-06fd1ec60e398e69a","authorEmail":"mnachin@meta.com","name":"trunk / unittest-release / windows / windows-job","jobName":"unittest-release / windows / windows-job","conclusion":"cancelled","completed_at":"2026-04-05T02:01:10.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/23990279417/job/69968760760","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/69968760760","head_branch":"mergennachin/turboquant","pr_number":18687,"head_sha":"94973a3437ce742c733bb7d97f6701c524a55bc7","head_sha_timestamp":"2026-04-04T23:56:40.000000000Z","failure_captures":["##[error]The operation was canceled."],"failure_lines":["##[error]The operation was canceled."],"failure_context":[],"time":"2026-04-05T00:00:42.000000000Z"}],"UNSTABLE":[],"AWAITING_APPROVAL":[]}