Add persistent task workspace alpha

Start the first workspace milestone toward the task-oriented product without changing the existing one-shot vm_run/pyro run contract. Add a disk-backed task registry in the manager, auto-started task workspaces rooted at /workspace, repeated non-cleaning exec, and persisted command journals exposed through task create/exec/status/logs/delete across the CLI, Python SDK, and MCP server. Update the public contract, docs, examples, and version/catalog metadata for 2.1.0, and cover the new surface with manager, CLI, SDK, and MCP tests. Validation: UV_CACHE_DIR=.uv-cache make check and UV_CACHE_DIR=.uv-cache make dist-check.
2026-03-11 20:10:10 -03:00 · 2026-03-11 20:10:10 -03:00 · 58df176148
commit 58df176148
parent 6e16e74fd5
19 changed files with 1730 additions and 48 deletions
--- a/tests/test_server.py
+++ b/tests/test_server.py
@@ -31,6 +31,8 @@ def test_create_server_registers_vm_tools(tmp_path: Path) -> None:
    assert "vm_network_info" in tool_names
    assert "vm_run" in tool_names
    assert "vm_status" in tool_names
+    assert "task_create" in tool_names
+    assert "task_logs" in tool_names


 def test_vm_run_round_trip(tmp_path: Path) -> None:
@@ -161,3 +163,50 @@ def test_server_main_runs_stdio_transport(monkeypatch: pytest.MonkeyPatch) -> No
    monkeypatch.setattr(server_module, "create_server", lambda: StubServer())
    server_module.main()
    assert called == {"transport": "stdio"}
+
+
+def test_task_tools_round_trip(tmp_path: Path) -> None:  # create/exec/logs/delete via call_tool
+    manager = VmManager(  # mock backend; state lives under tmp_path
+        backend_name="mock",
+        base_dir=tmp_path / "vms",
+        network_manager=TapNetworkManager(enabled=False),  # network manager disabled
+    )
+
+    def _extract_structured(raw_result: object) -> dict[str, Any]:  # unwrap call_tool output
+        if not isinstance(raw_result, tuple) or len(raw_result) != 2:  # must be a 2-tuple
+            raise TypeError("unexpected call_tool result shape")
+        _, structured = raw_result  # first element is ignored
+        if not isinstance(structured, dict):  # second element must be a dict
+            raise TypeError("expected structured dictionary result")
+        return cast(dict[str, Any], structured)
+
+    async def _run() -> tuple[dict[str, Any], dict[str, Any], dict[str, Any], dict[str, Any]]:
+        server = create_server(manager=manager)  # server built on the manager above
+        created = _extract_structured(
+            await server.call_tool(
+                "task_create",
+                {
+                    "environment": "debian:12-base",
+                    "allow_host_compat": True,
+                },
+            )
+        )
+        task_id = str(created["task_id"])  # reused by every later tool call
+        executed = _extract_structured(
+            await server.call_tool(
+                "task_exec",
+                {
+                    "task_id": task_id,
+                    "command": "printf 'ok\\n'",  # literal backslash-n, left for printf to expand
+                },
+            )
+        )
+        logs = _extract_structured(await server.call_tool("task_logs", {"task_id": task_id}))
+        deleted = _extract_structured(await server.call_tool("task_delete", {"task_id": task_id}))
+        return created, executed, logs, deleted  # order: create, exec, logs, delete
+
+    created, executed, logs, deleted = asyncio.run(_run())  # run the coroutine to completion
+    assert created["state"] == "started"  # task_create reports a started task
+    assert executed["stdout"] == "ok\n"
+    assert logs["count"] == 1  # exactly one task_exec was issued above
+    assert deleted["deleted"] is True