from __future__ import annotations import asyncio import sys import tempfile import time import unittest from pathlib import Path import httpx sys.path.insert(0, str(Path(__file__).resolve().parents[3])) from backend.app.dependencies import get_copy_task_service, get_task_service from backend.app.db.task_repository import TaskRepository from backend.app.main import app from backend.app.security.path_guard import PathGuard from backend.app.services.copy_task_service import CopyTaskService from backend.app.services.task_service import TaskService from backend.app.tasks_runner import TaskRunner from backend.app.fs.filesystem_adapter import FilesystemAdapter class FailingFilesystemAdapter(FilesystemAdapter): def copy_file(self, source: str, destination: str, on_progress: callable | None = None) -> None: raise OSError("forced copy failure") class CopyApiGoldenTest(unittest.TestCase): def setUp(self) -> None: self.temp_dir = tempfile.TemporaryDirectory() self.root = Path(self.temp_dir.name) / "root" self.root.mkdir(parents=True, exist_ok=True) self.repo = TaskRepository(str(Path(self.temp_dir.name) / "tasks.db")) path_guard = PathGuard({"storage1": str(self.root), "storage2": str(self.root)}) self._set_services(path_guard=path_guard, filesystem=FilesystemAdapter()) def tearDown(self) -> None: app.dependency_overrides.clear() self.temp_dir.cleanup() def _set_services(self, path_guard: PathGuard, filesystem: FilesystemAdapter) -> None: runner = TaskRunner(repository=self.repo, filesystem=filesystem) copy_service = CopyTaskService(path_guard=path_guard, repository=self.repo, runner=runner) task_service = TaskService(repository=self.repo) async def _override_copy_service() -> CopyTaskService: return copy_service async def _override_task_service() -> TaskService: return task_service app.dependency_overrides[get_copy_task_service] = _override_copy_service app.dependency_overrides[get_task_service] = _override_task_service def _request(self, method: str, url: str, payload: dict | None = None) -> httpx.Response: async def _run() -> httpx.Response: transport = httpx.ASGITransport(app=app) async with httpx.AsyncClient(transport=transport, base_url="http://testserver") as client: if method == "POST": return await client.post(url, json=payload) return await client.get(url) return asyncio.run(_run()) def _wait_task(self, task_id: str, timeout_s: float = 2.0) -> dict: deadline = time.time() + timeout_s while time.time() < deadline: response = self._request("GET", f"/api/tasks/{task_id}") body = response.json() if body["status"] in {"completed", "failed"}: return body time.sleep(0.02) self.fail("task did not reach terminal state in time") def test_copy_success_create_task_shape(self) -> None: src = self.root / "source.txt" src.write_text("hello", encoding="utf-8") response = self._request( "POST", "/api/files/copy", {"source": "storage1/source.txt", "destination": "storage1/copy.txt"}, ) self.assertEqual(response.status_code, 202) body = response.json() self.assertIn("task_id", body) self.assertEqual(body["status"], "queued") detail = self._wait_task(body["task_id"]) self.assertEqual(detail["status"], "completed") self.assertEqual(detail["total_bytes"], 5) self.assertEqual(detail["done_bytes"], 5) self.assertTrue((self.root / "copy.txt").exists()) self.assertEqual((self.root / "copy.txt").read_text(encoding="utf-8"), "hello") def test_copy_source_not_found(self) -> None: response = self._request( "POST", "/api/files/copy", {"source": "storage1/missing.txt", "destination": "storage1/out.txt"}, ) self.assertEqual(response.status_code, 404) self.assertEqual( response.json(), { "error": { "code": "path_not_found", "message": "Requested path was not found", "details": {"path": "storage1/missing.txt"}, } }, ) def test_copy_source_is_directory_type_conflict(self) -> None: (self.root / "dir").mkdir() response = self._request( "POST", "/api/files/copy", {"source": "storage1/dir", "destination": "storage1/out.txt"}, ) self.assertEqual(response.status_code, 409) self.assertEqual(response.json()["error"]["code"], "type_conflict") def test_copy_destination_exists_already_exists(self) -> None: (self.root / "source.txt").write_text("x", encoding="utf-8") (self.root / "exists.txt").write_text("y", encoding="utf-8") response = self._request( "POST", "/api/files/copy", {"source": "storage1/source.txt", "destination": "storage1/exists.txt"}, ) self.assertEqual(response.status_code, 409) self.assertEqual( response.json(), { "error": { "code": "already_exists", "message": "Target path already exists", "details": {"path": "storage1/exists.txt"}, } }, ) def test_copy_traversal_source(self) -> None: response = self._request( "POST", "/api/files/copy", {"source": "storage1/../etc/passwd", "destination": "storage1/out.txt"}, ) self.assertEqual(response.status_code, 403) self.assertEqual(response.json()["error"]["code"], "path_traversal_detected") def test_copy_traversal_destination(self) -> None: (self.root / "source.txt").write_text("x", encoding="utf-8") response = self._request( "POST", "/api/files/copy", {"source": "storage1/source.txt", "destination": "storage1/../etc/out.txt"}, ) self.assertEqual(response.status_code, 403) self.assertEqual(response.json()["error"]["code"], "path_traversal_detected") def test_copy_source_symlink_rejected(self) -> None: target = self.root / "real.txt" target.write_text("x", encoding="utf-8") link = self.root / "link.txt" link.symlink_to(target) response = self._request( "POST", "/api/files/copy", {"source": "storage1/link.txt", "destination": "storage1/out.txt"}, ) self.assertEqual(response.status_code, 409) self.assertEqual(response.json()["error"]["code"], "type_conflict") def test_copy_runtime_io_error_failed_task_shape(self) -> None: src = self.root / "source.txt" src.write_text("hello", encoding="utf-8") path_guard = PathGuard({"storage1": str(self.root), "storage2": str(self.root)}) self._set_services(path_guard=path_guard, filesystem=FailingFilesystemAdapter()) response = self._request( "POST", "/api/files/copy", {"source": "storage1/source.txt", "destination": "storage1/copy.txt"}, ) self.assertEqual(response.status_code, 202) task_id = response.json()["task_id"] detail = self._wait_task(task_id) self.assertEqual(detail["status"], "failed") self.assertEqual(detail["error_code"], "io_error") self.assertEqual(detail["failed_item"], str(src)) if __name__ == "__main__": unittest.main()