Skip to content

extension/llm/server: serving docs and comment cleanup#20193

Open
mergennachin wants to merge 3 commits into
gh/mergennachin/11/headfrom
gh/mergennachin/12/head
Open

extension/llm/server: serving docs and comment cleanup#20193
mergennachin wants to merge 3 commits into
gh/mergennachin/11/headfrom
gh/mergennachin/12/head

[UPDATE] Update

10e471e
Select commit
Loading
Failed to load commit list.
PyTorch Bot / Dr.CI completed Jun 11, 2026 in 0s

Dr.CI classification results

{"FAILED":[{"workflowId":27308068154,"workflowUniqueId":216132948,"id":80690604237,"runnerName":"i-0cd7f8458442d20a2","authorEmail":"mnachin@meta.com","name":"Test CUDA Windows Export and E2E / test-model-cuda-windows-e2e (facebook, dinov2-small-imagenet1k-1-layer, non-quantized) / windows-job","jobName":"test-model-cuda-windows-e2e (facebook, dinov2-small-imagenet1k-1-layer, non-quantized) / windows-job","conclusion":"failure","completed_at":"2026-06-11T00:35:59.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/27308068154/job/80690604237","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/80690604237","head_branch":"gh/mergennachin/12/head","pr_number":20193,"head_sha":"10e471e20368827ed5e27747e532648137390331","head_sha_timestamp":"2026-06-10T21:38:26Z","failure_captures":["Process completed with exit code 1."],"failure_lines":["##[error]Process completed with exit code 1."],"failure_context":[],"time":"2026-06-10T23:53:38.000000000Z"},{"workflowId":27308068377,"workflowUniqueId":63454257,"id":80671057131,"runnerName":"i-0052bdd51d77bda7b","authorEmail":"mnachin@meta.com","name":"pull / unittest / macos / macos-job","jobName":"unittest / macos / macos-job","conclusion":"failure","completed_at":"2026-06-10T23:25:27.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/27308068377/job/80671057131","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/80671057131","head_branch":"gh/mergennachin/12/head","pr_number":20193,"head_sha":"10e471e20368827ed5e27747e532648137390331","head_sha_timestamp":"2026-06-10T21:38:26Z","failure_captures":["RuntimeError: Command bash /Users/ec2-user/runner/_work/_temp/exec_script failed with exit code 1"],"failure_lines":["RuntimeError: Command bash /Users/ec2-user/runner/_work/_temp/exec_script failed with exit code 1"],"failure_context":[],"time":"2026-06-10T21:38:59.000000000Z"},{"workflowId":27308068377,"workflowUniqueId":63454257,"id":80671057111,"runnerName":"i-075b57e8ac70ff3fe","authorEmail":"mnachin@meta.com","name":"pull / unittest / linux / linux-job","jobName":"unittest / linux / linux-job","conclusion":"failure","completed_at":"2026-06-10T22:47:42.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/27308068377/job/80671057111","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/80671057111","head_branch":"gh/mergennachin/12/head","pr_number":20193,"head_sha":"10e471e20368827ed5e27747e532648137390331","head_sha_timestamp":"2026-06-10T21:38:26Z","failure_captures":["RuntimeError: Command docker exec -t 2e8343d355655d6e03f56fdc5c892a2a1720d24be253a85fb4cc601a69507ce3 /exec failed with exit code 1"],"failure_lines":["RuntimeError: Command docker exec -t 2e8343d355655d6e03f56fdc5c892a2a1720d24be253a85fb4cc601a69507ce3 /exec failed with exit code 1"],"failure_context":[],"time":"2026-06-10T21:38:59.000000000Z"},{"workflowId":27308068377,"workflowUniqueId":63454257,"id":80671056884,"runnerName":"i-0fa38d4bff080af45","authorEmail":"mnachin@meta.com","name":"pull / unittest-editable / linux / linux-job","jobName":"unittest-editable / linux / linux-job","conclusion":"failure","completed_at":"2026-06-10T22:36:50.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/27308068377/job/80671056884","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/80671056884","head_branch":"gh/mergennachin/12/head","pr_number":20193,"head_sha":"10e471e20368827ed5e27747e532648137390331","head_sha_timestamp":"2026-06-10T21:38:26Z","failure_captures":["RuntimeError: Command docker exec -t 8566bcb5621ecca6aadeb60a56fa916e710955f9072a7ae8618290c71ddfad74 /exec failed with exit code 1"],"failure_lines":["RuntimeError: Command docker exec -t 8566bcb5621ecca6aadeb60a56fa916e710955f9072a7ae8618290c71ddfad74 /exec failed with exit code 1"],"failure_context":[],"time":"2026-06-10T21:38:59.000000000Z"},{"workflowId":27308068377,"workflowUniqueId":63454257,"id":80671056954,"runnerName":"i-0ca8ecc8412dd9412","authorEmail":"mnachin@meta.com","name":"pull / unittest-editable / macos / macos-job","jobName":"unittest-editable / macos / macos-job","conclusion":"failure","completed_at":"2026-06-10T23:23:49.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/27308068377/job/80671056954","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/80671056954","head_branch":"gh/mergennachin/12/head","pr_number":20193,"head_sha":"10e471e20368827ed5e27747e532648137390331","head_sha_timestamp":"2026-06-10T21:38:26Z","failure_captures":["RuntimeError: Command bash /Users/ec2-user/runner/_work/_temp/exec_script failed with exit code 1"],"failure_lines":["RuntimeError: Command bash /Users/ec2-user/runner/_work/_temp/exec_script failed with exit code 1"],"failure_context":[],"time":"2026-06-10T21:38:59.000000000Z"}],"FLAKY":[],"BROKEN_TRUNK":[{"workflowId":27308068377,"workflowUniqueId":63454257,"id":80671056085,"runnerName":"16-core-ubuntu-1018646152","authorEmail":"mnachin@meta.com","name":"pull / android / build-android","jobName":"android / build-android","conclusion":"failure","completed_at":"2026-06-10T21:49:12.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/27308068377/job/80671056085","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/80671056085","head_branch":"gh/mergennachin/12/head","pr_number":20193,"head_sha":"10e471e20368827ed5e27747e532648137390331","head_sha_timestamp":"2026-06-10T21:38:26Z","failure_captures":["Process completed with exit code 1."],"failure_lines":["##[error]Process completed with exit code 1."],"failure_context":[],"time":"2026-06-10T21:38:59.000000000Z"}],"UNSTABLE":[],"UNKNOWN":[{"workflowId":27308068272,"workflowUniqueId":185593211,"id":80671053156,"runnerName":"i-0a8404474f55531a9","authorEmail":"mnachin@meta.com","name":"Build Windows Wheels / pytorch/executorch / build-wheel-py3_10-cpu","jobName":"pytorch/executorch / build-wheel-py3_10-cpu","conclusion":"failure","completed_at":"2026-06-10T21:52:41.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/27308068272/job/80671053156","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/80671053156","head_branch":"gh/mergennachin/12/head","pr_number":20193,"head_sha":"10e471e20368827ed5e27747e532648137390331","head_sha_timestamp":"2026-06-10T21:38:26Z","failure_captures":[],"failure_lines":[],"failure_context":[],"time":"2026-06-10T21:38:58.000000000Z"},{"workflowId":27308068272,"workflowUniqueId":185593211,"id":80673406567,"runnerName":"GitHub Actions 1018648335","authorEmail":"mnachin@meta.com","name":"Build Windows Wheels / pytorch/executorch / upload / upload-wheel-py3_10-cpu","jobName":"pytorch/executorch / upload / upload-wheel-py3_10-cpu","conclusion":"failure","completed_at":"2026-06-10T21:53:05.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/27308068272/job/80673406567","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/80673406567","head_branch":"gh/mergennachin/12/head","pr_number":20193,"head_sha":"10e471e20368827ed5e27747e532648137390331","head_sha_timestamp":"2026-06-10T21:38:26Z","failure_captures":["Unable to download artifact(s): Artifact not found for name: pytorch_executorch__3.10_cpu_x64"],"failure_lines":["##[error]Unable to download artifact(s): Artifact not found for name: pytorch_executorch__3.10_cpu_x64"],"failure_context":[],"time":"2026-06-10T21:52:41.000000000Z"},{"workflowId":27308068188,"workflowUniqueId":236455973,"id":80671119524,"runnerName":"GitHub Actions 1018647126","authorEmail":"mnachin@meta.com","name":"MLX / test-mlx-voxtral-realtime / test-mlx-voxtral-realtime","jobName":"test-mlx-voxtral-realtime / test-mlx-voxtral-realtime","conclusion":"failure","completed_at":"2026-06-10T21:58:20.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/27308068188/job/80671119524","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/80671119524","head_branch":"gh/mergennachin/12/head","pr_number":20193,"head_sha":"10e471e20368827ed5e27747e532648137390331","head_sha_timestamp":"2026-06-10T21:38:26Z","failure_captures":["RuntimeError: Command bash /Users/runner/work/_temp/exec_script failed with exit code 1"],"failure_lines":["RuntimeError: Command bash /Users/runner/work/_temp/exec_script failed with exit code 1"],"failure_context":[],"time":"2026-06-10T21:39:21.000000000Z"},{"workflowId":27308068177,"workflowUniqueId":195669493,"id":80870061052,"runnerName":"i-01eb92369eec9ae68","authorEmail":"mnachin@meta.com","name":"Test CUDA Builds / unittest-cuda / linux-job","jobName":"unittest-cuda / linux-job","conclusion":"failure","completed_at":"2026-06-11T18:59:38.000000000Z","html_url":"https://github.com/pytorch/executorch/actions/runs/27308068177/job/80870061052","logUrl":"https://ossci-raw-job-status.s3.amazonaws.com/log/pytorch/executorch/80870061052","head_branch":"gh/mergennachin/12/head","pr_number":20193,"head_sha":"10e471e20368827ed5e27747e532648137390331","head_sha_timestamp":"2026-06-10T21:38:26Z","failure_captures":["examples/models/gemma4_31b/tests/test_cuda_pipeline.py::TestGgufCudaPipeline::test_load_converts_weights"],"failure_lines":["FAILED examples/models/gemma4_31b/tests/test_cuda_pipeline.py::TestGgufCudaPipeline::test_load_converts_weights - AssertionError: CudaCoalescedInt4Tensor(qdata=tensor([[200, 26, 118, ..., 58, 133, 38],"],"failure_context":[],"time":"2026-06-11T18:03:52.000000000Z"}],"AWAITING_APPROVAL":[]}