feat: implement 8 OpenSpec proposals for security, reliability, and UX improvements
## Security Enhancements (P0)
- Add input validation with max_length and numeric range constraints
- Implement WebSocket token authentication via first message
- Add path traversal prevention in file storage service

## Permission Enhancements (P0)
- Add project member management for cross-department access
- Implement is_department_manager flag for workload visibility

## Cycle Detection (P0)
- Add DFS-based cycle detection for task dependencies
- Add formula field circular reference detection
- Display user-friendly cycle path visualization

## Concurrency & Reliability (P1)
- Implement optimistic locking with version field (409 Conflict on mismatch)
- Add trigger retry mechanism with exponential backoff (1s, 2s, 4s)
- Implement cascade restore for soft-deleted tasks

## Rate Limiting (P1)
- Add tiered rate limits: standard (60/min), sensitive (20/min), heavy (5/min)
- Apply rate limits to tasks, reports, attachments, and comments

## Frontend Improvements (P1)
- Add responsive sidebar with hamburger menu for mobile
- Improve touch-friendly UI with proper tap target sizes
- Complete i18n translations for all components

## Backend Reliability (P2)
- Configure database connection pool (size=10, overflow=20)
- Add Redis fallback mechanism with message queue
- Add blocker check before task deletion

## API Enhancements (P3)
- Add standardized response wrapper utility
- Add /health/ready and /health/live endpoints
- Implement project templates with status/field copying

## Tests Added
- test_input_validation.py - Schema and path traversal tests
- test_concurrency_reliability.py - Optimistic locking and retry tests
- test_backend_reliability.py - Connection pool and Redis tests
- test_api_enhancements.py - Health check and template tests

Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
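As a point of reference for the retry item under Concurrency & Reliability, a minimal sketch of an exponential-backoff retry (1s, 2s, 4s) is shown below. It is illustrative only, not the code from this commit; `run_trigger` and the retry count are assumptions.

```python
import asyncio
import logging

logger = logging.getLogger(__name__)


async def run_with_backoff(run_trigger, max_retries: int = 3):
    """Retry a failed trigger, sleeping 1s, 2s, then 4s between attempts.

    `run_trigger` is a hypothetical async callable standing in for the real
    trigger runner; only the backoff schedule is the point here.
    """
    for attempt in range(max_retries + 1):
        try:
            return await run_trigger()
        except Exception as exc:  # the real code may catch narrower errors
            if attempt == max_retries:
                raise
            delay = 2 ** attempt  # 1s, 2s, 4s
            logger.warning("Trigger attempt %d failed (%s); retrying in %ds",
                           attempt + 1, exc, delay)
            await asyncio.sleep(delay)
```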
@@ -1,26 +1,271 @@
import os
import hashlib
import shutil
import logging
import tempfile
from pathlib import Path
from typing import BinaryIO, Optional, Tuple
from fastapi import UploadFile, HTTPException
from app.core.config import settings


logger = logging.getLogger(__name__)


class PathTraversalError(Exception):
    """Raised when a path traversal attempt is detected."""
    pass


class StorageValidationError(Exception):
    """Raised when storage validation fails."""
    pass


class FileStorageService:
    """Service for handling file storage operations."""

    # Common NAS mount points to detect
    NAS_MOUNT_INDICATORS = [
        "/mnt/", "/mount/", "/nas/", "/nfs/", "/smb/", "/cifs/",
        "/Volumes/", "/media/", "/srv/", "/storage/"
    ]

    def __init__(self):
        self.base_dir = Path(settings.UPLOAD_DIR)
        self._ensure_base_dir()
        self.base_dir = Path(settings.UPLOAD_DIR).resolve()
        self._storage_status = {
            "validated": False,
            "path_exists": False,
            "writable": False,
            "is_nas": False,
            "error": None,
        }
        self._validate_storage_on_init()

    def _validate_storage_on_init(self):
        """Validate storage configuration on service initialization."""
        try:
            # Step 1: Ensure directory exists
            self._ensure_base_dir()
            self._storage_status["path_exists"] = True

            # Step 2: Check write permissions
            self._check_write_permissions()
            self._storage_status["writable"] = True

            # Step 3: Check if using NAS
            is_nas = self._detect_nas_storage()
            self._storage_status["is_nas"] = is_nas

            if not is_nas:
                logger.warning(
                    "Storage directory '%s' appears to be local storage, not NAS. "
                    "Consider configuring UPLOAD_DIR to a NAS mount point for production use.",
                    self.base_dir
                )

            self._storage_status["validated"] = True
            logger.info(
                "Storage validated successfully: path=%s, is_nas=%s",
                self.base_dir, is_nas
            )

        except StorageValidationError as e:
            self._storage_status["error"] = str(e)
            logger.error("Storage validation failed: %s", e)
            raise
        except Exception as e:
            self._storage_status["error"] = str(e)
            logger.error("Unexpected error during storage validation: %s", e)
            raise StorageValidationError(f"Storage validation failed: {e}")

    def _check_write_permissions(self):
        """Check if the storage directory has write permissions."""
        test_file = self.base_dir / f".write_test_{os.getpid()}"
        try:
            # Try to create and write to a test file
            test_file.write_text("write_test")
            # Verify we can read it back
            content = test_file.read_text()
            if content != "write_test":
                raise StorageValidationError(
                    f"Write verification failed for directory: {self.base_dir}"
                )
            # Clean up
            test_file.unlink()
            logger.debug("Write permission check passed for %s", self.base_dir)
        except PermissionError as e:
            raise StorageValidationError(
                f"No write permission for storage directory '{self.base_dir}': {e}"
            )
        except OSError as e:
            raise StorageValidationError(
                f"Failed to verify write permissions for '{self.base_dir}': {e}"
            )
        finally:
            # Ensure test file is removed even on partial failure
            if test_file.exists():
                try:
                    test_file.unlink()
                except Exception:
                    pass

    def _detect_nas_storage(self) -> bool:
        """
        Detect if the storage directory appears to be on a NAS mount.

        This is a best-effort detection based on common mount point patterns.
        """
        path_str = str(self.base_dir)

        # Check common NAS mount point patterns
        for indicator in self.NAS_MOUNT_INDICATORS:
            if indicator in path_str:
                logger.debug("NAS storage detected: path contains '%s'", indicator)
                return True

        # Check if it's a mount point (Unix-like systems)
        try:
            if self.base_dir.is_mount():
                logger.debug("NAS storage detected: path is a mount point")
                return True
        except Exception:
            pass

        # Check mount info on Linux
        try:
            with open("/proc/mounts", "r") as f:
                mounts = f.read()
                if path_str in mounts:
                    # Check for network filesystem types
                    for line in mounts.splitlines():
                        if path_str in line:
                            fs_type = line.split()[2] if len(line.split()) > 2 else ""
                            if fs_type in ["nfs", "nfs4", "cifs", "smb", "smbfs"]:
                                logger.debug("NAS storage detected: mounted as %s", fs_type)
                                return True
        except FileNotFoundError:
            pass  # Not on Linux
        except Exception as e:
            logger.debug("Could not check /proc/mounts: %s", e)

        return False

    def get_storage_status(self) -> dict:
        """Get current storage status for health checks."""
        return {
            **self._storage_status,
            "base_dir": str(self.base_dir),
            "exists": self.base_dir.exists(),
            "is_directory": self.base_dir.is_dir() if self.base_dir.exists() else False,
        }

    def _ensure_base_dir(self):
        """Ensure the base upload directory exists."""
        self.base_dir.mkdir(parents=True, exist_ok=True)

    def _validate_path_component(self, component: str, component_name: str) -> None:
        """
        Validate a path component to prevent path traversal attacks.

        Args:
            component: The path component to validate (e.g., project_id, task_id)
            component_name: Name of the component for error messages

        Raises:
            PathTraversalError: If the component contains path traversal patterns
        """
        if not component:
            raise PathTraversalError(f"Empty {component_name} is not allowed")

        # Check for path traversal patterns
        dangerous_patterns = ['..', '/', '\\', '\x00']
        for pattern in dangerous_patterns:
            if pattern in component:
                logger.warning(
                    "Path traversal attempt detected in %s: %r",
                    component_name,
                    component
                )
                raise PathTraversalError(
                    f"Invalid characters in {component_name}: path traversal not allowed"
                )

        # Additional check: component should not start with special characters
        if component.startswith('.') or component.startswith('-'):
            logger.warning(
                "Suspicious path component in %s: %r",
                component_name,
                component
            )
            raise PathTraversalError(
                f"Invalid {component_name}: cannot start with '.' or '-'"
            )

    def _validate_path_in_base_dir(self, path: Path, context: str = "") -> Path:
        """
        Validate that a resolved path is within the base directory.

        Args:
            path: The path to validate
            context: Additional context for logging

        Returns:
            The resolved path if valid

        Raises:
            PathTraversalError: If the path is outside the base directory
        """
        resolved_path = path.resolve()

        # Check if the resolved path is within the base directory
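        # Path.relative_to() raises ValueError when the resolved path is not
        # under base_dir; that case is treated as a traversal attempt below.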
        try:
            resolved_path.relative_to(self.base_dir)
        except ValueError:
            logger.warning(
                "Path traversal attempt detected: path %s is outside base directory %s. Context: %s",
                resolved_path,
                self.base_dir,
                context
            )
            raise PathTraversalError(
                "Access denied: path is outside the allowed directory"
            )

        return resolved_path

    def _get_file_path(self, project_id: str, task_id: str, attachment_id: str, version: int) -> Path:
        """Generate the file path for an attachment version."""
        return self.base_dir / project_id / task_id / attachment_id / str(version)
        """
        Generate the file path for an attachment version.

        Args:
            project_id: The project ID
            task_id: The task ID
            attachment_id: The attachment ID
            version: The version number

        Returns:
            Safe path within the base directory

        Raises:
            PathTraversalError: If any component contains path traversal patterns
        """
        # Validate all path components
        self._validate_path_component(project_id, "project_id")
        self._validate_path_component(task_id, "task_id")
        self._validate_path_component(attachment_id, "attachment_id")

        if version < 0:
            raise PathTraversalError("Version must be non-negative")

        # Build the path
        path = self.base_dir / project_id / task_id / attachment_id / str(version)

        # Validate the final path is within base directory
        return self._validate_path_in_base_dir(
            path,
            f"project={project_id}, task={task_id}, attachment={attachment_id}, version={version}"
        )

    @staticmethod
    def calculate_checksum(file: BinaryIO) -> str:
@@ -89,6 +334,10 @@ class FileStorageService:
        """
        Save uploaded file to storage.
        Returns (file_path, file_size, checksum).

        Raises:
            PathTraversalError: If path traversal is detected
            HTTPException: If file validation fails
        """
        # Validate file
        extension, _ = self.validate_file(file)
@@ -96,14 +345,22 @@ class FileStorageService:
        # Calculate checksum first
        checksum = self.calculate_checksum(file.file)

        # Create directory structure
        dir_path = self._get_file_path(project_id, task_id, attachment_id, version)
        # Create directory structure (path validation is done in _get_file_path)
        try:
            dir_path = self._get_file_path(project_id, task_id, attachment_id, version)
        except PathTraversalError as e:
            logger.error("Path traversal attempt during file save: %s", e)
            raise HTTPException(status_code=400, detail=str(e))

        dir_path.mkdir(parents=True, exist_ok=True)

        # Save file with original extension
        filename = f"file.{extension}" if extension else "file"
        file_path = dir_path / filename

        # Final validation of the file path
        self._validate_path_in_base_dir(file_path, f"saving file {filename}")

        # Get file size
        file.file.seek(0, 2)
        file_size = file.file.tell()
@@ -125,8 +382,15 @@ class FileStorageService:
        """
        Get the file path for an attachment version.
        Returns None if file doesn't exist.

        Raises:
            PathTraversalError: If path traversal is detected
        """
        dir_path = self._get_file_path(project_id, task_id, attachment_id, version)
        try:
            dir_path = self._get_file_path(project_id, task_id, attachment_id, version)
        except PathTraversalError as e:
            logger.error("Path traversal attempt during file retrieval: %s", e)
            return None

        if not dir_path.exists():
            return None
@@ -139,21 +403,48 @@ class FileStorageService:
        return files[0]

    def get_file_by_path(self, file_path: str) -> Optional[Path]:
        """Get file by stored path. Handles both absolute and relative paths."""
        """
        Get file by stored path. Handles both absolute and relative paths.

        This method validates that the requested path is within the base directory
        to prevent path traversal attacks.

        Args:
            file_path: The stored file path

        Returns:
            Path object if file exists and is within base directory, None otherwise
        """
        if not file_path:
            return None

        path = Path(file_path)

        # If path is absolute and exists, return it directly
        if path.is_absolute() and path.exists():
            return path
        # For absolute paths, validate they are within base_dir
        if path.is_absolute():
            try:
                validated_path = self._validate_path_in_base_dir(
                    path,
                    f"get_file_by_path absolute: {file_path}"
                )
                if validated_path.exists():
                    return validated_path
            except PathTraversalError:
                return None
            return None

        # If path is relative, try prepending base_dir
        # For relative paths, resolve from base_dir
        full_path = self.base_dir / path
        if full_path.exists():
            return full_path

        # Fallback: check if original path exists (e.g., relative from current dir)
        if path.exists():
            return path
        try:
            validated_path = self._validate_path_in_base_dir(
                full_path,
                f"get_file_by_path relative: {file_path}"
            )
            if validated_path.exists():
                return validated_path
        except PathTraversalError:
            return None

        return None
@@ -168,13 +459,29 @@ class FileStorageService:
        Delete file(s) from storage.
        If version is None, deletes all versions.
        Returns True if successful.

        Raises:
            PathTraversalError: If path traversal is detected
        """
        if version is not None:
            # Delete specific version
            dir_path = self._get_file_path(project_id, task_id, attachment_id, version)
        else:
            # Delete all versions (attachment directory)
            dir_path = self.base_dir / project_id / task_id / attachment_id
        try:
            if version is not None:
                # Delete specific version
                dir_path = self._get_file_path(project_id, task_id, attachment_id, version)
            else:
                # Delete all versions (attachment directory)
                # Validate components first
                self._validate_path_component(project_id, "project_id")
                self._validate_path_component(task_id, "task_id")
                self._validate_path_component(attachment_id, "attachment_id")

                dir_path = self.base_dir / project_id / task_id / attachment_id
                dir_path = self._validate_path_in_base_dir(
                    dir_path,
                    f"delete attachment: project={project_id}, task={task_id}, attachment={attachment_id}"
                )
        except PathTraversalError as e:
            logger.error("Path traversal attempt during file deletion: %s", e)
            return False

        if dir_path.exists():
            shutil.rmtree(dir_path)
@@ -182,8 +489,26 @@ class FileStorageService:
        return False

    def delete_task_files(self, project_id: str, task_id: str) -> bool:
        """Delete all files for a task."""
        dir_path = self.base_dir / project_id / task_id
        """
        Delete all files for a task.

        Raises:
            PathTraversalError: If path traversal is detected
        """
        try:
            # Validate components
            self._validate_path_component(project_id, "project_id")
            self._validate_path_component(task_id, "task_id")

            dir_path = self.base_dir / project_id / task_id
            dir_path = self._validate_path_in_base_dir(
                dir_path,
                f"delete task files: project={project_id}, task={task_id}"
            )
        except PathTraversalError as e:
            logger.error("Path traversal attempt during task file deletion: %s", e)
            return False

        if dir_path.exists():
            shutil.rmtree(dir_path)
        return True
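The commit message lists test_input_validation.py as covering the path traversal checks added above. Those tests are not part of this diff; a minimal sketch of what such a test could look like (module path, setup, and test names are assumptions) is:

```python
import pytest

# Assumed import path; the real project layout may differ.
from app.services.file_storage import FileStorageService, PathTraversalError


def test_get_file_path_rejects_parent_directory_components():
    # Assumes settings.UPLOAD_DIR points at a writable directory in the test env.
    service = FileStorageService()
    with pytest.raises(PathTraversalError):
        service._get_file_path("project-1", "../../etc", "attach-1", 1)


def test_get_file_path_stays_inside_base_dir():
    service = FileStorageService()
    path = service._get_file_path("project-1", "task-1", "attach-1", 1)
    assert str(path).startswith(str(service.base_dir))
```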