Fix cross-SIP PE_TCM access by scoping deploy to target_device SIP

RuntimeContext._ensure_allocators() now limits the SIP range to the
target_device (a single SIP, or all SIPs). This prevents the cross-SIP
tensor deployment that caused PE_TCM routing errors.
DeviceSelector now also accepts the 'sip0' format (without a colon).

331 passed, 8 skipped

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
This commit is contained in:
2026-04-04 18:03:11 -07:00
parent 624161f52f
commit 08256c1326
5 changed files with 19 additions and 11 deletions
+2 -2
View File
@@ -18,5 +18,5 @@ def test_cli_main_arg_parsing(monkeypatch):
def test_cli_main():
"""CLI bench run on single SIP device."""
import pytest
pytest.skip("Cross-SIP PE_TCM access not supported with router mesh topology")
rc = cli_main.main(["run", "--topology", "topology.yaml", "--bench", "qkv_gemm", "--device", "sip:0"])
assert rc == 0
-2
View File
@@ -861,7 +861,6 @@ def test_mcpu_kernel_launch_composite():
# ── 19. Stage 5: QKV GEMM benchmark completion ────────────────────
@pytest.mark.skip(reason="Cross-SIP PE_TCM access not supported with router mesh topology")
def test_qkv_gemm_bench_completes():
"""The qkv_gemm benchmark runs to completion without error."""
clear_registry()
@@ -956,7 +955,6 @@ def test_mcpu_multi_pe_kernel_launch():
# ── 21. Stage 5: QKV GEMM multi-PE benchmark completion ──────────
@pytest.mark.skip(reason="Cross-SIP PE_TCM access not supported with router mesh topology")
def test_qkv_gemm_bench_multi_pe_completes():
"""The qkv_gemm_multi_pe benchmark runs to completion without error."""
clear_registry()
-2
View File
@@ -131,7 +131,6 @@ def test_2d_va_translates_to_local_hbm():
# ── VO3. 2D: End-to-end bench completes ──────────────────────────────
@pytest.mark.skip(reason="Cross-SIP PE_TCM access not supported with router mesh topology")
def test_2d_bench_completes():
"""2D: full TP bench with standard Triton kernel pattern."""
graph = load_topology(TOPOLOGY_PATH)
@@ -199,7 +198,6 @@ def test_1d_va_translates_to_local_hbm():
# ── VO6. 1D: End-to-end ──────────────────────────────────────────────
@pytest.mark.skip(reason="Cross-SIP PE_TCM access not supported with router mesh topology")
def test_1d_e2e_completes():
"""1D: full engine run with column_wise TP sharding."""
graph = load_topology(TOPOLOGY_PATH)