From 4eb81a5bca269453a692af50c9b4bb899bf36314 Mon Sep 17 00:00:00 2001
From: lintsinghua <lintsinghua@users.noreply.github.com>
Date: Tue, 9 Dec 2025 15:38:17 +0800
Subject: [PATCH] fix(scan): normalize file paths for cross-platform
 compatibility

- Add normalize_path() utility function to convert backslashes to forward slashes
- Ensure consistent path separators across Windows, Unix, and Mac platforms
- Apply path normalization to relative paths extracted from ZIP files
- Normalize target file paths before matching against scan configuration
- Update file filtering logic to use normalized path set for accurate matching
- Add inline comments explaining cross-platform path handling requirements
---
 backend/app/api/v1/endpoints/scan.py | 18 +++++++++++++++---
 1 file changed, 15 insertions(+), 3 deletions(-)

diff --git a/backend/app/api/v1/endpoints/scan.py b/backend/app/api/v1/endpoints/scan.py
index 6b20767..75b0aa4 100644
--- a/backend/app/api/v1/endpoints/scan.py
+++ b/backend/app/api/v1/endpoints/scan.py
@@ -27,6 +27,15 @@ from app.core.config import settings
 router = APIRouter()
 
 
+def normalize_path(path: str) -> str:
+    """
+    统一路径分隔符为正斜杠，确保跨平台兼容性
+    Windows 使用反斜杠 (\)，Unix/Mac 使用正斜杠 (/)
+    统一转换为正斜杠以保证一致性
+    """
+    return path.replace("\\", "/")
+
+
 # 支持的文件扩展名
 TEXT_EXTENSIONS = [
     ".js", ".ts", ".tsx", ".jsx", ".py", ".java", ".go", ".rs",
@@ -65,7 +74,8 @@ async def process_zip_task(task_id: str, file_path: str, db_session_factory, use
                 
                 for file in files:
                     full_path = Path(root) / file
-                    rel_path = str(full_path.relative_to(extract_dir))
+                    # 统一使用正斜杠，确保跨平台兼容性
+                    rel_path = normalize_path(str(full_path.relative_to(extract_dir)))
                     
                     # 检查文件类型和排除规则
                     if is_text_file(rel_path) and not should_exclude(rel_path):
@@ -83,8 +93,10 @@ async def process_zip_task(task_id: str, file_path: str, db_session_factory, use
             # 如果指定了特定文件，则只分析这些文件
             target_files = (user_config or {}).get('scan_config', {}).get('file_paths', [])
             if target_files:
-                print(f"🎯 ZIP任务: 指定分析 {len(target_files)} 个文件")
-                files_to_scan = [f for f in files_to_scan if f['path'] in target_files]
+                # 统一目标文件路径的分隔符，确保匹配一致性
+                normalized_targets = {normalize_path(p) for p in target_files}
+                print(f"🎯 ZIP任务: 指定分析 {len(normalized_targets)} 个文件")
+                files_to_scan = [f for f in files_to_scan if f['path'] in normalized_targets]
             else:
                 files_to_scan = files_to_scan[:settings.MAX_ANALYZE_FILES]