添加临时文件清理异常处理和修改大纲接口为POST方法

- 在analyze_markdown、analyze_markdown_stream和get_markdown_outline函数中添加了 try-except 块来处理临时文件清理过程中的异常 - 将/analyze/md/outline接口从GET方法改为POST方法以支持文件上传 - 确保在所有情况下都能正确清理临时文件，并记录清理失败的日志 refactor(health): 改进健康检查逻辑验证实际数据库连接 - 修改MySQL健康检查，实际执行SELECT 1查询来验证连接 - 修改MongoDB健康检查，执行ping命令来验证连接 - 修改Redis健康检查，执行ping命令来验证连接 - 添加异常捕获并记录具体的错误日志 refactor(upload): 使用os.path.basename优化文件名提取 - 替换手动字符串分割为os.path.basename来获取文件名 - 统一Excel上传和导出中文件名的处理方式 feat(instruction): 新增指令执行框架模块 - 创建instruction包包含意图解析和指令执行的基础架构 - 添加IntentParser和InstructionExecutor抽象基类 - 提供默认实现但标记为未完成，为未来功能扩展做准备 refactor(frontend): 调整AuthContext导入路径并移除重复文件 - 将AuthContext从src/context移动到src/contexts目录 - 更新App.tsx和RouteGuard.tsx中的导入路径 - 移除旧的AuthContext.tsx文件 fix(backend-api): 修复AI分析API的HTTP方法错误 - 将aiApi中的fetch请求方法从GET改为POST以支持文件上传
添加任务ID跟踪功能到模板填充接口
2026-04-10 01:51:53 +08:00 · 2026-04-10 01:27:26 +08:00 · 2026-04-10 01:15:53 +08:00 · 2026-04-10 00:26:57 +08:00 · 2026-04-10 00:26:54 +08:00 · 2026-04-10 00:23:23 +08:00
24 changed files with 1930 additions and 2316 deletions
--- a/backend/app/api/endpoints/ai_analyze.py
+++ b/backend/app/api/endpoints/ai_analyze.py
@@ -215,9 +215,12 @@ async def analyze_markdown(
            return result
        finally:
-            # 清理临时文件
+            # 清理临时文件，确保在所有情况下都能清理
-            if os.path.exists(tmp_path):
+            try:
-                os.unlink(tmp_path)
+                if tmp_path and os.path.exists(tmp_path):
                    os.unlink(tmp_path)
            except Exception as cleanup_error:
                logger.warning(f"临时文件清理失败: {tmp_path}, error: {cleanup_error}")
    except HTTPException:
        raise
@@ -279,8 +282,12 @@ async def analyze_markdown_stream(
            )
        finally:
-            if os.path.exists(tmp_path):
+            # 清理临时文件，确保在所有情况下都能清理
-                os.unlink(tmp_path)
+            try:
                if tmp_path and os.path.exists(tmp_path):
                    os.unlink(tmp_path)
            except Exception as cleanup_error:
                logger.warning(f"临时文件清理失败: {tmp_path}, error: {cleanup_error}")
    except HTTPException:
        raise
@@ -289,7 +296,7 @@ async def analyze_markdown_stream(
        raise HTTPException(status_code=500, detail=f"流式分析失败: {str(e)}")
-@router.get("/analyze/md/outline")
+@router.post("/analyze/md/outline")
 async def get_markdown_outline(
    file: UploadFile = File(...)
 ):
@@ -323,8 +330,12 @@ async def get_markdown_outline(
            result = await markdown_ai_service.extract_outline(tmp_path)
            return result
        finally:
-            if os.path.exists(tmp_path):
+            # 清理临时文件，确保在所有情况下都能清理
-                os.unlink(tmp_path)
+            try:
                if tmp_path and os.path.exists(tmp_path):
                    os.unlink(tmp_path)
            except Exception as cleanup_error:
                logger.warning(f"临时文件清理失败: {tmp_path}, error: {cleanup_error}")
    except Exception as e:
        logger.error(f"获取 Markdown 大纲失败: {str(e)}")
--- a/backend/app/api/endpoints/documents.py
+++ b/backend/app/api/endpoints/documents.py
@@ -23,6 +23,52 @@ logger = logging.getLogger(__name__)
 router = APIRouter(prefix="/upload", tags=["文档上传"])
 # ==================== 辅助函数 ====================
 async def update_task_status(
    task_id: str,
    status: str,
    progress: int = 0,
    message: str = "",
    result: dict = None,
    error: str = None
 ):
    """
    Record a task's state in both Redis and MongoDB, best-effort.

    Each store is written independently: a failure in either one is logged
    as a warning and swallowed, so this coroutine does not propagate storage
    errors to the caller.

    Args:
        task_id: Identifier of the task being updated.
        status: New status value, passed through to both stores unchanged.
        progress: Progress value; placed only in the Redis meta payload
            (it is not forwarded to ``mongodb.update_task``).
        message: Human-readable message, sent to both stores.
        result: Optional result payload. Added to the Redis meta only when
            truthy; always forwarded to MongoDB as given.
        error: Optional error text. Added to the Redis meta only when
            truthy; always forwarded to MongoDB as given.
    """
    # Key order matches the stored layout: progress, message, result, error.
    redis_meta = {
        "progress": progress,
        "message": message,
        **({"result": result} if result else {}),
        **({"error": error} if error else {}),
    }

    # Redis write
    try:
        await redis_db.set_task_status(task_id, status, redis_meta)
    except Exception as redis_err:
        logger.warning(f"Redis 任务状态更新失败: {redis_err}")

    # MongoDB write (kept as a second copy of the task state)
    mongo_fields = {
        "task_id": task_id,
        "status": status,
        "message": message,
        "result": result,
        "error": error,
    }
    try:
        await mongodb.update_task(**mongo_fields)
    except Exception as mongo_err:
        logger.warning(f"MongoDB 任务状态更新失败: {mongo_err}")
 # ==================== 请求/响应模型 ====================
 class UploadResponse(BaseModel):
@@ -77,6 +123,17 @@ async def upload_document(
    task_id = str(uuid.uuid4())
    try:
        # 保存任务记录到 MongoDB（如果 Redis 不可用时仍能查询）
        try:
            await mongodb.insert_task(
                task_id=task_id,
                task_type="document_parse",
                status="pending",
                message=f"文档 {file.filename} 已提交处理"
            )
        except Exception as mongo_err:
            logger.warning(f"MongoDB 保存任务记录失败: {mongo_err}")
        content = await file.read()
        saved_path = file_service.save_uploaded_file(
            content,
@@ -122,6 +179,17 @@ async def upload_documents(
    saved_paths = []
    try:
        # 保存任务记录到 MongoDB
        try:
            await mongodb.insert_task(
                task_id=task_id,
                task_type="batch_parse",
                status="pending",
                message=f"已提交 {len(files)} 个文档处理"
            )
        except Exception as mongo_err:
            logger.warning(f"MongoDB 保存批量任务记录失败: {mongo_err}")
        for file in files:
            if not file.filename:
                continue
@@ -159,9 +227,9 @@ async def process_document(
    """处理单个文档"""
    try:
        # 状态: 解析中
-        await redis_db.set_task_status(
+        await update_task_status(
            task_id, status="processing",
-            meta={"progress": 10, "message": "正在解析文档"}
+            progress=10, message="正在解析文档"
        )
        # 解析文档
@@ -172,9 +240,9 @@ async def process_document(
            raise Exception(result.error or "解析失败")
        # 状态: 存储中
-        await redis_db.set_task_status(
+        await update_task_status(
            task_id, status="processing",
-            meta={"progress": 30, "message": "正在存储数据"}
+            progress=30, message="正在存储数据"
        )
        # 存储到 MongoDB
@@ -191,9 +259,9 @@ async def process_document(
        # 如果是 Excel，存储到 MySQL + AI生成描述 + RAG索引
        if doc_type in ["xlsx", "xls"]:
-            await redis_db.set_task_status(
+            await update_task_status(
                task_id, status="processing",
-                meta={"progress": 50, "message": "正在存储到MySQL并生成字段描述"}
+                progress=50, message="正在存储到MySQL并生成字段描述"
            )
            try:
@@ -215,9 +283,9 @@ async def process_document(
        else:
            # 非结构化文档
-            await redis_db.set_task_status(
+            await update_task_status(
                task_id, status="processing",
-                meta={"progress": 60, "message": "正在建立索引"}
+                progress=60, message="正在建立索引"
            )
            # 如果文档中有表格数据，提取并存储到 MySQL + RAG
@@ -238,17 +306,13 @@ async def process_document(
            await index_document_to_rag(doc_id, original_filename, result, doc_type)
        # 完成
-        await redis_db.set_task_status(
+        await update_task_status(
            task_id, status="success",
-            meta={
+            progress=100, message="处理完成",
-                "progress": 100,
+            result={
                "message": "处理完成",
                "doc_id": doc_id,
-                "result": {
+                "doc_type": doc_type,
-                    "doc_id": doc_id,
+                "filename": original_filename
                    "doc_type": doc_type,
                    "filename": original_filename
                }
            }
        )
@@ -256,18 +320,19 @@ async def process_document(
    except Exception as e:
        logger.error(f"文档处理失败: {str(e)}")
-        await redis_db.set_task_status(
+        await update_task_status(
            task_id, status="failure",
-            meta={"error": str(e)}
+            progress=0, message="处理失败",
            error=str(e)
        )
 async def process_documents_batch(task_id: str, files: List[dict]):
    """批量处理文档"""
    try:
-        await redis_db.set_task_status(
+        await update_task_status(
            task_id, status="processing",
-            meta={"progress": 0, "message": "开始批量处理"}
+            progress=0, message="开始批量处理"
        )
        results = []
@@ -318,21 +383,23 @@ async def process_documents_batch(task_id: str, files: List[dict]):
                results.append({"filename": file_info["filename"], "success": False, "error": str(e)})
            progress = int((i + 1) / len(files) * 100)
-            await redis_db.set_task_status(
+            await update_task_status(
                task_id, status="processing",
-                meta={"progress": progress, "message": f"已处理 {i+1}/{len(files)}"}
+                progress=progress, message=f"已处理 {i+1}/{len(files)}"
            )
-        await redis_db.set_task_status(
+        await update_task_status(
            task_id, status="success",
-            meta={"progress": 100, "message": "批量处理完成", "results": results}
+            progress=100, message="批量处理完成",
            result={"results": results}
        )
    except Exception as e:
        logger.error(f"批量处理失败: {str(e)}")
-        await redis_db.set_task_status(
+        await update_task_status(
            task_id, status="failure",
-            meta={"error": str(e)}
+            progress=0, message="批量处理失败",
            error=str(e)
        )
--- a/backend/app/api/endpoints/health.py
+++ b/backend/app/api/endpoints/health.py
@@ -19,26 +19,43 @@ async def health_check() -> Dict[str, Any]:
    返回各数据库连接状态和应用信息
    """
    # 检查各数据库连接状态
-    mysql_status = "connected"
+    mysql_status = "unknown"
-    mongodb_status = "connected"
+    mongodb_status = "unknown"
-    redis_status = "connected"
+    redis_status = "unknown"
    try:
        if mysql_db.async_engine is None:
            mysql_status = "disconnected"
-    except Exception:
+        else:
            # 实际执行一次查询验证连接
            from sqlalchemy import text
            async with mysql_db.async_engine.connect() as conn:
                await conn.execute(text("SELECT 1"))
            mysql_status = "connected"
    except Exception as e:
        logger.warning(f"MySQL 健康检查失败: {e}")
        mysql_status = "error"
    try:
        if mongodb.client is None:
            mongodb_status = "disconnected"
-    except Exception:
+        else:
            # 实际 ping 验证
            await mongodb.client.admin.command('ping')
            mongodb_status = "connected"
    except Exception as e:
        logger.warning(f"MongoDB 健康检查失败: {e}")
        mongodb_status = "error"
    try:
-        if not redis_db.is_connected:
+        if not redis_db.is_connected or redis_db.client is None:
            redis_status = "disconnected"
-    except Exception:
+        else:
            # 实际执行 ping 验证
            await redis_db.client.ping()
            redis_status = "connected"
    except Exception as e:
        logger.warning(f"Redis 健康检查失败: {e}")
        redis_status = "error"
    return {
--- a/backend/app/api/endpoints/tasks.py
+++ b/backend/app/api/endpoints/tasks.py
@@ -1,13 +1,13 @@
 """
 任务管理 API 接口
-提供异步任务状态查询
+提供异步任务状态查询和历史记录
 """
 from typing import Optional
 from fastapi import APIRouter, HTTPException
-from app.core.database import redis_db
+from app.core.database import redis_db, mongodb
 router = APIRouter(prefix="/tasks", tags=["任务管理"])
@@ -23,25 +23,94 @@ async def get_task_status(task_id: str):
    Returns:
        任务状态信息
    """
    # 优先从 Redis 获取
    status = await redis_db.get_task_status(task_id)
-    if not status:
+    if status:
        # Redis has a record for this task: return the stored status and meta fields
        return {
            "task_id": task_id,
-            "status": "success",
+            "status": status.get("status", "unknown"),
-            "progress": 100,
+            "progress": status.get("meta", {}).get("progress", 0),
-            "message": "任务处理完成",
+            "message": status.get("meta", {}).get("message"),
-            "result": None,
+            "result": status.get("meta", {}).get("result"),
-            "error": None
+            "error": status.get("meta", {}).get("error")
        }
    # Redis 不可用时，尝试从 MongoDB 获取
    mongo_task = await mongodb.get_task(task_id)
    if mongo_task:
        return {
            "task_id": mongo_task.get("task_id"),
            "status": mongo_task.get("status", "unknown"),
            "progress": 100 if mongo_task.get("status") == "success" else 0,
            "message": mongo_task.get("message"),
            "result": mongo_task.get("result"),
            "error": mongo_task.get("error")
        }
    # 任务不存在或状态未知
    return {
        "task_id": task_id,
-        "status": status.get("status", "unknown"),
+        "status": "unknown",
-        "progress": status.get("meta", {}).get("progress", 0),
+        "progress": 0,
-        "message": status.get("meta", {}).get("message"),
+        "message": "无法获取任务状态（Redis和MongoDB均不可用）",
-        "result": status.get("meta", {}).get("result"),
+        "result": None,
-        "error": status.get("meta", {}).get("error")
+        "error": None
    }
@router.get("/")
 async def list_tasks(limit: int = 50, skip: int = 0):
    """
    获取任务历史列表
    Args:
        limit: 返回数量限制
        skip: 跳过数量
    Returns:
        任务列表
    """
    try:
        tasks = await mongodb.list_tasks(limit=limit, skip=skip)
        return {
            "success": True,
            "tasks": tasks,
            "count": len(tasks)
        }
    except Exception as e:
        # MongoDB 不可用时返回空列表
        return {
            "success": False,
            "tasks": [],
            "count": 0,
            "error": str(e)
        }
@router.delete("/{task_id}")
 async def delete_task(task_id: str):
    """
    删除任务
    Args:
        task_id: 任务ID
    Returns:
        是否删除成功
    """
    try:
        # 从 Redis 删除
        if redis_db._connected and redis_db.client:
            key = f"task:{task_id}"
            await redis_db.client.delete(key)
        # 从 MongoDB 删除
        deleted = await mongodb.delete_task(task_id)
        return {
            "success": True,
            "deleted": deleted
        }
    except Exception as e:
        raise HTTPException(status_code=500, detail=f"删除任务失败: {str(e)}")
--- a/backend/app/api/endpoints/templates.py
+++ b/backend/app/api/endpoints/templates.py
@@ -23,6 +23,44 @@ logger = logging.getLogger(__name__)
 router = APIRouter(prefix="/templates", tags=["表格模板"])
 # ==================== 辅助函数 ====================
 async def update_task_status(
    task_id: str,
    status: str,
    progress: int = 0,
    message: str = "",
    result: dict = None,
    error: str = None
 ):
    """
    Write a task's state to Redis and to MongoDB, tolerating failures.

    The two writes are independent; an exception from either store is logged
    as a warning and not re-raised.

    Args:
        task_id: Identifier of the task being updated.
        status: New status value, passed to both stores.
        progress: Progress value, included only in the Redis meta payload.
        message: Message text, passed to both stores.
        result: Optional result payload; included in the Redis meta only
            when truthy, forwarded to MongoDB as given.
        error: Optional error text; included in the Redis meta only when
            truthy, forwarded to MongoDB as given.
    """
    from app.core.database import redis_db

    meta = dict(progress=progress, message=message)
    # Optional entries are attached only when they carry a truthy value
    for meta_key, meta_value in (("result", result), ("error", error)):
        if meta_value:
            meta[meta_key] = meta_value

    try:
        await redis_db.set_task_status(task_id, status, meta)
    except Exception as redis_exc:
        logger.warning(f"Redis 任务状态更新失败: {redis_exc}")

    try:
        await mongodb.update_task(
            task_id=task_id, status=status, message=message,
            result=result, error=error
        )
    except Exception as mongo_exc:
        logger.warning(f"MongoDB 任务状态更新失败: {mongo_exc}")
 # ==================== 请求/响应模型 ====================
 class TemplateFieldRequest(BaseModel):
@@ -41,6 +79,7 @@ class FillRequest(BaseModel):
    source_doc_ids: Optional[List[str]] = None  # MongoDB 文档 ID 列表
    source_file_paths: Optional[List[str]] = None  # 源文档文件路径列表
    user_hint: Optional[str] = None
    task_id: Optional[str] = None  # 可选的任务ID，用于任务历史跟踪
 class ExportRequest(BaseModel):
@@ -155,20 +194,17 @@ async def upload_joint_template(
                )
    try:
-        # 1. 保存模板文件并提取字段
+        # 1. 保存模板文件
        template_content = await template_file.read()
        template_path = file_service.save_uploaded_file(
            template_content,
            template_file.filename,
            subfolder="templates"
        )
        template_fields = await template_fill_service.get_template_fields_from_file(
            template_path,
            template_ext
        )
-        # 2. 处理源文档 - 保存文件
+        # 2. 保存并解析源文档 - 提取内容用于生成表头
        source_file_info = []
        source_contents = []
        for sf in source_files:
            if sf.filename:
                sf_content = await sf.read()
@@ -183,10 +219,81 @@ async def upload_joint_template(
                    "filename": sf.filename,
                    "ext": sf_ext
                })
                # 解析源文档获取内容（用于 AI 生成表头）
                try:
                    from app.core.document_parser import ParserFactory
                    parser = ParserFactory.get_parser(sf_path)
                    parse_result = parser.parse(sf_path)
                    if parse_result.success and parse_result.data:
                        # 获取原始内容
                        content = parse_result.data.get("content", "")[:5000] if parse_result.data.get("content") else ""
                        # 获取标题（可能在顶层或structured_data内）
                        titles = parse_result.data.get("titles", [])
                        if not titles and parse_result.data.get("structured_data"):
                            titles = parse_result.data.get("structured_data", {}).get("titles", [])
                        titles = titles[:10] if titles else []
                        # 获取表格数量（可能在顶层或structured_data内）
                        tables = parse_result.data.get("tables", [])
                        if not tables and parse_result.data.get("structured_data"):
                            tables = parse_result.data.get("structured_data", {}).get("tables", [])
                        tables_count = len(tables) if tables else 0
                        # 获取表格内容摘要（用于 AI 理解源文档结构）
                        tables_summary = ""
                        if tables:
                            tables_summary = "\n【文档中的表格】:\n"
                            for idx, table in enumerate(tables[:5]):  # 最多5个表格
                                if isinstance(table, dict):
                                    headers = table.get("headers", [])
                                    rows = table.get("rows", [])
                                    if headers:
                                        tables_summary += f"表格{idx+1}表头: {', '.join(str(h) for h in headers)}\n"
                                    if rows:
                                        tables_summary += f"表格{idx+1}前3行: "
                                        for row_idx, row in enumerate(rows[:3]):
                                            if isinstance(row, list):
                                                tables_summary += " | ".join(str(c) for c in row) + "; "
                                            elif isinstance(row, dict):
                                                tables_summary += " | ".join(str(row.get(h, "")) for h in headers if headers) + "; "
                                        tables_summary += "\n"
                        source_contents.append({
                            "filename": sf.filename,
                            "doc_type": sf_ext,
                            "content": content,
                            "titles": titles,
                            "tables_count": tables_count,
                            "tables_summary": tables_summary
                        })
                        logger.info(f"[DEBUG] source_contents built: filename={sf.filename}, content_len={len(content)}, titles_count={len(titles)}, tables_count={tables_count}")
                        if tables_summary:
                            logger.info(f"[DEBUG] tables_summary preview: {tables_summary[:300]}")
                except Exception as e:
                    logger.warning(f"解析源文档失败 {sf.filename}: {e}")
        # 3. 根据源文档内容生成表头
        template_fields = await template_fill_service.get_template_fields_from_file(
            template_path,
            template_ext,
            source_contents=source_contents  # 传递源文档内容
        )
        # 3. 异步处理源文档到MongoDB
        task_id = str(uuid.uuid4())
        if source_file_info:
            # 保存任务记录到 MongoDB
            try:
                await mongodb.insert_task(
                    task_id=task_id,
                    task_type="source_process",
                    status="pending",
                    message=f"开始处理 {len(source_file_info)} 个源文档"
                )
            except Exception as mongo_err:
                logger.warning(f"MongoDB 保存任务记录失败: {mongo_err}")
            background_tasks.add_task(
                process_source_documents,
                task_id=task_id,
@@ -225,12 +332,10 @@ async def upload_joint_template(
 async def process_source_documents(task_id: str, files: List[dict]):
    """异步处理源文档，存入MongoDB"""
    from app.core.database import redis_db
    try:
-        await redis_db.set_task_status(
+        await update_task_status(
            task_id, status="processing",
-            meta={"progress": 0, "message": "开始处理源文档"}
+            progress=0, message="开始处理源文档"
        )
        doc_ids = []
@@ -259,22 +364,24 @@ async def process_source_documents(task_id: str, files: List[dict]):
                logger.error(f"源文档处理异常: {file_info['filename']}, error: {str(e)}")
            progress = int((i + 1) / len(files) * 100)
-            await redis_db.set_task_status(
+            await update_task_status(
                task_id, status="processing",
-                meta={"progress": progress, "message": f"已处理 {i+1}/{len(files)}"}
+                progress=progress, message=f"已处理 {i+1}/{len(files)}"
            )
-        await redis_db.set_task_status(
+        await update_task_status(
            task_id, status="success",
-            meta={"progress": 100, "message": "源文档处理完成", "doc_ids": doc_ids}
+            progress=100, message="源文档处理完成",
            result={"doc_ids": doc_ids}
        )
        logger.info(f"所有源文档处理完成: {len(doc_ids)}个")
    except Exception as e:
        logger.error(f"源文档批量处理失败: {str(e)}")
-        await redis_db.set_task_status(
+        await update_task_status(
            task_id, status="failure",
-            meta={"error": str(e)}
+            progress=0, message="源文档处理失败",
            error=str(e)
        )
@@ -333,7 +440,27 @@ async def fill_template(
    Returns:
        填写结果
    """
    # 生成或使用传入的 task_id
    task_id = request.task_id or str(uuid.uuid4())
    try:
        # 创建任务记录到 MongoDB
        try:
            await mongodb.insert_task(
                task_id=task_id,
                task_type="template_fill",
                status="processing",
                message=f"开始填表任务: {len(request.template_fields)} 个字段"
            )
        except Exception as mongo_err:
            logger.warning(f"MongoDB 创建任务记录失败: {mongo_err}")
        # 更新进度 - 开始
        await update_task_status(
            task_id, "processing",
            progress=0, message="开始处理..."
        )
        # 转换字段
        fields = [
            TemplateField(
@@ -346,17 +473,51 @@ async def fill_template(
            for f in request.template_fields
        ]
        # 从 template_id 提取文件类型
        template_file_type = "xlsx"  # 默认类型
        if request.template_id:
            ext = request.template_id.split('.')[-1].lower()
            if ext in ["xlsx", "xls"]:
                template_file_type = "xlsx"
            elif ext == "docx":
                template_file_type = "docx"
        # 更新进度 - 准备开始填写
        await update_task_status(
            task_id, "processing",
            progress=10, message=f"准备填写 {len(fields)} 个字段..."
        )
        # 执行填写
        result = await template_fill_service.fill_template(
            template_fields=fields,
            source_doc_ids=request.source_doc_ids,
            source_file_paths=request.source_file_paths,
-            user_hint=request.user_hint
+            user_hint=request.user_hint,
            template_id=request.template_id,
            template_file_type=template_file_type,
            task_id=task_id
        )
-        return result
+        # 更新为成功
        await update_task_status(
            task_id, "success",
            progress=100, message="填表完成",
            result={
                "field_count": len(fields),
                "max_rows": result.get("max_rows", 0)
            }
        )
        return {**result, "task_id": task_id}
    except Exception as e:
        # 更新为失败
        await update_task_status(
            task_id, "failure",
            progress=0, message="填表失败",
            error=str(e)
        )
        logger.error(f"填写表格失败: {str(e)}")
        raise HTTPException(status_code=500, detail=f"填写失败: {str(e)}")
--- a/backend/app/api/endpoints/upload.py
+++ b/backend/app/api/endpoints/upload.py
@@ -5,6 +5,7 @@ from fastapi import APIRouter, UploadFile, File, HTTPException, Query
 from fastapi.responses import StreamingResponse
 from typing import Optional
 import logging
 import os
 import pandas as pd
 import io
@@ -126,7 +127,7 @@ async def upload_excel(
                                content += f"... (共 {len(sheet_data['rows'])} 行)\n\n"
            doc_metadata = {
-                "filename": saved_path.split("/")[-1] if "/" in saved_path else saved_path.split("\\")[-1],
+                "filename": os.path.basename(saved_path),
                "original_filename": file.filename,
                "saved_path": saved_path,
                "file_size": len(content),
@@ -253,7 +254,7 @@ async def export_excel(
        output.seek(0)
        # 生成文件名
-        original_name = file_path.split('/')[-1] if '/' in file_path else file_path
+        original_name = os.path.basename(file_path)
        if columns:
            export_name = f"export_{sheet_name or 'data'}_{len(column_list) if columns else 'all'}_cols.xlsx"
        else:
--- a/backend/app/core/database/mongodb.py
+++ b/backend/app/core/database/mongodb.py
@@ -59,6 +59,11 @@ class MongoDB:
        """RAG索引集合 - 存储字段语义索引"""
        return self.db["rag_index"]
    @property
    def tasks(self):
        """Task collection: the ``"tasks"`` entry of ``self.db``, used for task history."""
        collection_name = "tasks"
        return self.db[collection_name]
    # ==================== 文档操作 ====================
    async def insert_document(
@@ -242,8 +247,128 @@ class MongoDB:
        await self.rag_index.create_index("table_name")
        await self.rag_index.create_index("field_name")
        # 任务集合索引
        await self.tasks.create_index("task_id", unique=True)
        await self.tasks.create_index("created_at")
        logger.info("MongoDB 索引创建完成")
    # ==================== 任务历史操作 ====================
    async def insert_task(
        self,
        task_id: str,
        task_type: str,
        status: str = "pending",
        message: str = "",
        result: Optional[Dict[str, Any]] = None,
        error: Optional[str] = None,
    ) -> str:
        """
        Insert a new task record into the tasks collection.

        Args:
            task_id: Task identifier stored under ``task_id``.
            task_type: Task type label.
            status: Initial status.
            message: Initial message.
            result: Optional result payload.
            error: Optional error text.

        Returns:
            The inserted document's ``inserted_id`` converted to ``str``.

        Raises:
            Whatever ``insert_one`` raises. NOTE(review): a unique index on
            ``task_id`` is created elsewhere in this class, so re-inserting
            an existing id presumably fails - confirm with the driver.
        """
        # Take one timestamp so created_at and updated_at are identical on
        # insert (two separate utcnow() calls can differ by microseconds).
        now = datetime.utcnow()
        task = {
            "task_id": task_id,
            "task_type": task_type,
            "status": status,
            "message": message,
            "result": result,
            "error": error,
            "created_at": now,
            "updated_at": now,
        }
        result_obj = await self.tasks.insert_one(task)
        return str(result_obj.inserted_id)
    async def update_task(
        self,
        task_id: str,
        status: Optional[str] = None,
        message: Optional[str] = None,
        result: Optional[Dict[str, Any]] = None,
        error: Optional[str] = None,
    ) -> bool:
        """
        Update fields of the task record whose ``task_id`` matches.

        Only arguments that are not ``None`` are written; ``updated_at`` is
        always refreshed. No record is created when none matches.

        Args:
            task_id: Identifier of the task to update.
            status: New status, or ``None`` to leave unchanged.
            message: New message, or ``None`` to leave unchanged.
            result: New result payload, or ``None`` to leave unchanged.
            error: New error text, or ``None`` to leave unchanged.

        Returns:
            ``True`` when the update reports ``modified_count > 0``.
        """
        candidate_fields = {
            "status": status,
            "message": message,
            "result": result,
            "error": error,
        }
        update_data = {"updated_at": datetime.utcnow()}
        # `is not None` (not truthiness) so empty strings/dicts are still written
        update_data.update(
            {name: value for name, value in candidate_fields.items() if value is not None}
        )

        update_result = await self.tasks.update_one(
            {"task_id": task_id},
            {"$set": update_data}
        )
        return update_result.modified_count > 0
    async def get_task(self, task_id: str) -> Optional[Dict[str, Any]]:
        """Fetch one task by ``task_id``; its ``_id`` is converted to ``str`` when found."""
        record = await self.tasks.find_one({"task_id": task_id})
        if not record:
            # Nothing matched: hand back the lookup result unchanged
            return record
        record["_id"] = str(record["_id"])
        return record
    async def list_tasks(
        self,
        limit: int = 50,
        skip: int = 0,
    ) -> List[Dict[str, Any]]:
        """
        List task records sorted by ``created_at`` descending.

        Args:
            limit: Maximum number of records to return.
            skip: Number of records to skip.

        Returns:
            Task dicts with ``_id`` converted to ``str`` and any truthy
            ``created_at`` / ``updated_at`` replaced by its ``isoformat()`` text.
        """
        query = self.tasks.find()
        query = query.sort("created_at", -1)
        query = query.skip(skip)
        query = query.limit(limit)

        collected = []
        async for doc in query:
            doc["_id"] = str(doc["_id"])
            # Turn datetime values into strings
            for stamp_key in ("created_at", "updated_at"):
                stamp = doc.get(stamp_key)
                if stamp:
                    doc[stamp_key] = stamp.isoformat()
            collected.append(doc)
        return collected
    async def delete_task(self, task_id: str) -> bool:
        """Delete the task with this ``task_id``; True when the delete reports a removed record."""
        outcome = await self.tasks.delete_one({"task_id": task_id})
        removed = outcome.deleted_count
        return removed > 0
 # ==================== 全局单例 ====================
--- a/backend/app/core/document_parser/xlsx_parser.py
+++ b/backend/app/core/document_parser/xlsx_parser.py
@@ -317,24 +317,70 @@ class XlsxParser(BaseParser):
        import zipfile
        from xml.etree import ElementTree as ET
        # 常见的命名空间
        COMMON_NAMESPACES = [
            'http://schemas.openxmlformats.org/spreadsheetml/2006/main',
            'http://schemas.openxmlformats.org/spreadsheetml/2005/main',
            'http://schemas.openxmlformats.org/spreadsheetml/2004/main',
            'http://schemas.openxmlformats.org/spreadsheetml/2003/main',
        ]
        try:
            with zipfile.ZipFile(file_path, 'r') as z:
-                if 'xl/workbook.xml' not in z.namelist():
+                # 尝试多种可能的 workbook.xml 路径
                possible_paths = ['xl/workbook.xml', 'xl\\workbook.xml', 'workbook.xml']
                content = None
                for path in possible_paths:
                    if path in z.namelist():
                        content = z.read(path)
                        logger.info(f"找到 workbook.xml at: {path}")
                        break
                if content is None:
                    logger.warning(f"未找到 workbook.xml，文件列表: {z.namelist()[:10]}")
                    return []
-                content = z.read('xl/workbook.xml')
+
                root = ET.fromstring(content)
                # 命名空间
                ns = {'main': 'http://schemas.openxmlformats.org/spreadsheetml/2006/main'}
                sheet_names = []
-                for sheet in root.findall('.//main:sheet', ns):
+
-                    name = sheet.get('name')
+                # 方法1：尝试带命名空间的查找
-                    if name:
+                for ns in COMMON_NAMESPACES:
-                        sheet_names.append(name)
+                    sheet_elements = root.findall(f'.//{{{ns}}}sheet')
                    if sheet_elements:
                        for sheet in sheet_elements:
                            name = sheet.get('name')
                            if name:
                                sheet_names.append(name)
                        if sheet_names:
                            logger.info(f"使用命名空间 {ns} 提取工作表: {sheet_names}")
                            return sheet_names
                # 方法2：不使用命名空间，直接查找所有 sheet 元素
                if not sheet_names:
                    for elem in root.iter():
                        if elem.tag.endswith('sheet') and elem.tag != 'sheets':
                            name = elem.get('name')
                            if name:
                                sheet_names.append(name)
                            for child in elem:
                                if child.tag.endswith('sheet') or child.tag == 'sheet':
                                    name = child.get('name')
                                    if name and name not in sheet_names:
                                        sheet_names.append(name)
                # 方法3：直接从 XML 文本中正则匹配 sheet name
                if not sheet_names:
                    import re
                    xml_str = content.decode('utf-8', errors='ignore')
                    matches = re.findall(r'<sheet\s+[^>]*name=["\']([^"\']+)["\']', xml_str, re.IGNORECASE)
                    if matches:
                        sheet_names = matches
                        logger.info(f"使用正则提取工作表: {sheet_names}")
                logger.info(f"从 XML 提取工作表: {sheet_names}")
                return sheet_names
        except Exception as e:
            logger.error(f"从 XML 提取工作表名称失败: {e}")
            return []
@@ -356,6 +402,32 @@ class XlsxParser(BaseParser):
        import zipfile
        from xml.etree import ElementTree as ET
        # SpreadsheetML "main" namespaces that are tried, in order, before
        # falling back to a namespace-agnostic scan.
        COMMON_NAMESPACES = [
            'http://schemas.openxmlformats.org/spreadsheetml/2006/main',
            'http://schemas.openxmlformats.org/spreadsheetml/2005/main',
            'http://schemas.openxmlformats.org/spreadsheetml/2004/main',
            'http://schemas.openxmlformats.org/spreadsheetml/2003/main',
        ]

        def find_elements_with_ns(root, tag_name):
            """Find descendant elements named ``tag_name`` under any namespace.

            Args:
                root: Element whose subtree is searched.
                tag_name: Local (un-prefixed) tag name, e.g. ``'row'``.

            Returns:
                A list of matching elements. Descendants qualified with one of
                COMMON_NAMESPACES are returned when any exist; otherwise every
                element in the subtree (including ``root`` itself) whose local
                name equals ``tag_name`` is returned, whether it carries some
                other namespace or no namespace at all.
            """
            results = []
            # Pass 1: the well-known namespaces.
            for ns in COMMON_NAMESPACES:
                try:
                    results.extend(root.findall(f'.//{{{ns}}}{tag_name}'))
                except SyntaxError:
                    # ElementPath reports an unparsable path as SyntaxError;
                    # skip it and let the fallback scan handle the lookup.
                    continue
            if results:
                return results
            # Pass 2: match on the local name only. A bare tag (no namespace)
            # has no '}' in it, so it must be compared for equality as well.
            suffix = '}' + tag_name
            return [
                elem for elem in root.iter()
                if isinstance(elem.tag, str)
                and (elem.tag == tag_name or elem.tag.endswith(suffix))
            ]
        with zipfile.ZipFile(file_path, 'r') as z:
            # 获取工作表名称
            sheet_names = self._extract_sheet_names_from_xml(file_path)
@@ -366,57 +438,68 @@ class XlsxParser(BaseParser):
            target_sheet = sheet_name if sheet_name and sheet_name in sheet_names else sheet_names[0]
            sheet_index = sheet_names.index(target_sheet) + 1  # sheet1.xml, sheet2.xml, ...
-            # 读取 shared strings
+            # 读取 shared strings - 尝试多种路径
            shared_strings = []
-            if 'xl/sharedStrings.xml' in z.namelist():
+            ss_paths = ['xl/sharedStrings.xml', 'xl\\sharedStrings.xml', 'sharedStrings.xml']
-                ss_content = z.read('xl/sharedStrings.xml')
+            for ss_path in ss_paths:
-                ss_root = ET.fromstring(ss_content)
+                if ss_path in z.namelist():
-                ns = {'main': 'http://schemas.openxmlformats.org/spreadsheetml/2006/main'}
+                    try:
-                for si in ss_root.findall('.//main:si', ns):
+                        ss_content = z.read(ss_path)
-                    t = si.find('.//main:t', ns)
+                        ss_root = ET.fromstring(ss_content)
-                    if t is not None:
+                        for si in find_elements_with_ns(ss_root, 'si'):
-                        shared_strings.append(t.text or '')
+                            t_elements = [c for c in si if c.tag.endswith('}t') or c.tag == 't']
-                    else:
+                            if t_elements:
-                        shared_strings.append('')
+                                shared_strings.append(t_elements[0].text or '')
                            else:
                                shared_strings.append('')
                        break
                    except Exception as e:
                        logger.warning(f"读取 sharedStrings 失败: {e}")
-            # 读取工作表
+            # 读取工作表 - 尝试多种可能的路径
-            sheet_file = f'xl/worksheets/sheet{sheet_index}.xml'
+            sheet_content = None
-            if sheet_file not in z.namelist():
+            sheet_paths = [
-                raise ValueError(f"工作表文件 {sheet_file} 不存在")
+                f'xl/worksheets/sheet{sheet_index}.xml',
                f'xl\\worksheets\\sheet{sheet_index}.xml',
                f'worksheets/sheet{sheet_index}.xml',
            ]
            for sp in sheet_paths:
                if sp in z.namelist():
                    sheet_content = z.read(sp)
                    break
            if sheet_content is None:
                raise ValueError(f"工作表文件 sheet{sheet_index}.xml 不存在")
            sheet_content = z.read(sheet_file)
            root = ET.fromstring(sheet_content)
            ns = {'main': 'http://schemas.openxmlformats.org/spreadsheetml/2006/main'}
            # 收集所有行数据
            all_rows = []
            headers = {}
-            for row in root.findall('.//main:row', ns):
+            for row in find_elements_with_ns(root, 'row'):
                row_idx = int(row.get('r', 0))
                row_cells = {}
-                for cell in row.findall('main:c', ns):
+                for cell in find_elements_with_ns(row, 'c'):
                    cell_ref = cell.get('r', '')
                    col_letters = ''.join(filter(str.isalpha, cell_ref))
                    cell_type = cell.get('t', 'n')
-                    v = cell.find('main:v', ns)
+                    v_elements = find_elements_with_ns(cell, 'v')
                    v = v_elements[0] if v_elements else None
                    if v is not None and v.text:
                        if cell_type == 's':
                            # shared string
                            try:
                                row_cells[col_letters] = shared_strings[int(v.text)]
                            except (ValueError, IndexError):
                                row_cells[col_letters] = v.text
                        elif cell_type == 'b':
                            # boolean
                            row_cells[col_letters] = v.text == '1'
                        else:
                            row_cells[col_letters] = v.text
                    else:
                        row_cells[col_letters] = None
                # 处理表头行
                if row_idx == header_row + 1:
                    headers = {**row_cells}
                elif row_idx > header_row + 1:
@@ -424,7 +507,6 @@ class XlsxParser(BaseParser):
            # 构建 DataFrame
            if headers:
                # 按原始列顺序排列
                col_order = list(headers.keys())
                df = pd.DataFrame(all_rows)
                if not df.empty:
--- a/backend/app/instruction/init.py
+++ b/backend/app/instruction/init.py
@@ -0,0 +1,15 @@
 """
 指令执行模块
 注意: 此模块为可选功能，当前尚未实现。
 如需启用，请实现 intent_parser.py 和 executor.py
 """
 from .intent_parser import IntentParser, DefaultIntentParser
 from .executor import InstructionExecutor, DefaultInstructionExecutor
 __all__ = [
    "IntentParser",
    "DefaultIntentParser",
    "InstructionExecutor",
    "DefaultInstructionExecutor",
 ]
--- a/backend/app/instruction/executor.py
+++ b/backend/app/instruction/executor.py
@@ -0,0 +1,35 @@
 """
 指令执行器模块
 将自然语言指令转换为可执行操作
 注意: 此模块为可选功能，当前尚未实现。
 """
 from abc import ABC, abstractmethod
 from typing import Any, Dict
 class InstructionExecutor(ABC):
    """Abstract interface that every instruction executor must implement."""

    @abstractmethod
    async def execute(self, instruction: str, context: Dict[str, Any]) -> Dict[str, Any]:
        """
        Run a single instruction.

        Args:
            instruction: The parsed instruction.
            context: The execution context.

        Returns:
            The execution result.
        """
        return None
 class DefaultInstructionExecutor(InstructionExecutor):
    """Placeholder executor used until a real implementation is provided."""

    async def execute(self, instruction: str, context: Dict[str, Any]) -> Dict[str, Any]:
        """Always raise NotImplementedError; execution is not implemented yet."""
        message = "指令执行功能暂未实现"
        raise NotImplementedError(message)
--- a/backend/app/instruction/intent_parser.py
+++ b/backend/app/instruction/intent_parser.py
@@ -0,0 +1,34 @@
 """
 意图解析器模块
 解析用户自然语言指令，识别意图和参数
 注意: 此模块为可选功能，当前尚未实现。
 """
 from abc import ABC, abstractmethod
 from typing import Any, Dict, Tuple
 class IntentParser(ABC):
    """Abstract interface that every intent parser must implement."""

    @abstractmethod
    async def parse(self, text: str) -> Tuple[str, Dict[str, Any]]:
        """
        Parse a natural-language instruction.

        Args:
            text: The natural-language text entered by the user.

        Returns:
            A ``(intent type, parameter dict)`` pair.
        """
        return None
 class DefaultIntentParser(IntentParser):
    """Placeholder parser used until a real implementation is provided."""

    async def parse(self, text: str) -> Tuple[str, Dict[str, Any]]:
        """Always raise NotImplementedError; intent parsing is not implemented yet."""
        message = "意图解析功能暂未实现"
        raise NotImplementedError(message)
--- a/backend/app/services/template_fill_service.py
+++ b/backend/app/services/template_fill_service.py
@@ -60,7 +60,10 @@ class TemplateFillService:
        template_fields: List[TemplateField],
        source_doc_ids: Optional[List[str]] = None,
        source_file_paths: Optional[List[str]] = None,
-        user_hint: Optional[str] = None
+        user_hint: Optional[str] = None,
        template_id: Optional[str] = None,
        template_file_type: Optional[str] = "xlsx",
        task_id: Optional[str] = None
    ) -> Dict[str, Any]:
        """
        填写表格模板
@@ -70,6 +73,9 @@ class TemplateFillService:
            source_doc_ids: 源文档 MongoDB ID 列表
            source_file_paths: 源文档文件路径列表
            user_hint: 用户提示（如"请从合同文档中提取"）
            template_id: 模板文件路径（用于重新生成表头）
            template_file_type: 模板文件类型
            task_id: 可选的任务ID，用于任务进度跟踪
        Returns:
            填写结果
@@ -78,15 +84,94 @@ class TemplateFillService:
        fill_details = []
        logger.info(f"开始填表: {len(template_fields)} 个字段, {len(source_doc_ids or [])} 个源文档")
        logger.info(f"source_doc_ids: {source_doc_ids}")
        logger.info(f"source_file_paths: {source_file_paths}")
        # 1. 加载源文档内容
        source_docs = await self._load_source_documents(source_doc_ids, source_file_paths)
        logger.info(f"加载了 {len(source_docs)} 个源文档")
        # 打印每个加载的文档的详细信息
        for i, doc in enumerate(source_docs):
            logger.info(f"  文档[{i}]: id={doc.doc_id}, filename={doc.filename}, doc_type={doc.doc_type}")
            logger.info(f"    content长度: {len(doc.content)}, structured_data keys: {list(doc.structured_data.keys()) if doc.structured_data else 'None'}")
        if not source_docs:
            logger.warning("没有找到源文档，填表结果将全部为空")
        # 3. 检查是否需要使用源文档重新生成表头
        # 条件：源文档已加载 AND 现有字段看起来是自动生成的（如"字段1"、"字段2"）
        needs_regenerate_headers = (
            len(source_docs) > 0 and
            len(template_fields) > 0 and
            all(self._is_auto_generated_field(f.name) for f in template_fields)
        )
        if needs_regenerate_headers:
            logger.info(f"检测到自动生成表头，尝试使用源文档重新生成... (当前字段: {[f.name for f in template_fields]})")
            # 将 SourceDocument 转换为 source_contents 格式
            source_contents = []
            for doc in source_docs:
                structured = doc.structured_data if doc.structured_data else {}
                # 获取标题
                titles = structured.get("titles", [])
                if not titles:
                    titles = []
                # 获取表格
                tables = structured.get("tables", [])
                tables_count = len(tables) if tables else 0
                # 生成表格摘要
                tables_summary = ""
                if tables:
                    tables_summary = "\n【文档中的表格】:\n"
                    for idx, table in enumerate(tables[:5]):
                        if isinstance(table, dict):
                            headers = table.get("headers", [])
                            rows = table.get("rows", [])
                            if headers:
                                tables_summary += f"表格{idx+1}表头: {', '.join(str(h) for h in headers)}\n"
                            if rows:
                                tables_summary += f"表格{idx+1}前3行: "
                                for row_idx, row in enumerate(rows[:3]):
                                    if isinstance(row, list):
                                        tables_summary += " | ".join(str(c) for c in row) + "; "
                                    elif isinstance(row, dict):
                                        tables_summary += " | ".join(str(row.get(h, "")) for h in headers if headers) + "; "
                                tables_summary += "\n"
                source_contents.append({
                    "filename": doc.filename,
                    "doc_type": doc.doc_type,
                    "content": doc.content[:5000] if doc.content else "",
                    "titles": titles[:10] if titles else [],
                    "tables_count": tables_count,
                    "tables_summary": tables_summary
                })
            # 使用源文档内容重新生成表头
            if template_id and template_file_type:
                logger.info(f"使用源文档重新生成表头: template_id={template_id}, template_file_type={template_file_type}")
                new_fields = await self.get_template_fields_from_file(
                    template_id,
                    template_file_type,
                    source_contents=source_contents
                )
                if new_fields and len(new_fields) > 0:
                    logger.info(f"成功重新生成表头: {[f.name for f in new_fields]}")
                    template_fields = new_fields
                else:
                    logger.warning("重新生成表头返回空结果，使用原始字段")
            else:
                logger.warning("无法重新生成表头：缺少 template_id 或 template_file_type")
        else:
            if source_docs and template_fields:
                logger.info(f"表头看起来正常（非自动生成），无需重新生成: {[f.name for f in template_fields[:5]]}")
        # 2. 对每个字段进行提取
        for idx, field in enumerate(template_fields):
            try:
@@ -98,6 +183,22 @@ class TemplateFillService:
                    user_hint=user_hint
                )
                # AI审核：验证提取的值是否合理
                if result.values and result.values[0]:
                    logger.info(f"字段 {field.name} 进入AI审核阶段...")
                    verified_result = await self._verify_field_value(
                        field=field,
                        extracted_values=result.values,
                        source_docs=source_docs,
                        user_hint=user_hint
                    )
                    if verified_result:
                        # 审核给出了修正结果
                        result = verified_result
                        logger.info(f"字段 {field.name} 审核后修正值: {result.values[:3]}")
                    else:
                        logger.info(f"字段 {field.name} 审核通过，使用原提取结果")
                # 存储结果 - 使用 values 数组
                filled_data[field.name] = result.values if result.values else [""]
                fill_details.append({
@@ -158,14 +259,49 @@ class TemplateFillService:
                try:
                    doc = await mongodb.get_document(doc_id)
                    if doc:
                        sd = doc.get("structured_data", {})
                        sd_keys = list(sd.keys()) if sd else []
                        logger.info(f"从MongoDB加载文档: {doc_id}, doc_type={doc.get('doc_type')}, structured_data keys={sd_keys}")
                        # 如果 structured_data 为空，但有 file_path，尝试重新解析文件
                        doc_content = doc.get("content", "")
                        if not sd or (not sd.get("tables") and not sd.get("headers") and not sd.get("rows")):
                            file_path = doc.get("metadata", {}).get("file_path")
                            if file_path:
                                logger.info(f"  structured_data 为空，尝试重新解析文件: {file_path}")
                                try:
                                    parser = ParserFactory.get_parser(file_path)
                                    result = parser.parse(file_path)
                                    if result.success and result.data:
                                        if result.data.get("structured_data"):
                                            sd = result.data.get("structured_data")
                                            logger.info(f"  重新解析成功，structured_data keys: {list(sd.keys())}")
                                        elif result.data.get("tables"):
                                            sd = {"tables": result.data.get("tables", [])}
                                            logger.info(f"  使用 data.tables，tables数量: {len(sd.get('tables', []))}")
                                        elif result.data.get("rows"):
                                            sd = result.data
                                            logger.info(f"  使用 data.rows 格式")
                                        if result.data.get("content"):
                                            doc_content = result.data.get("content", "")
                                    else:
                                        logger.warning(f"  重新解析失败: {result.error if result else 'unknown'}")
                                except Exception as parse_err:
                                    logger.error(f"  重新解析文件异常: {str(parse_err)}")
                        if sd.get("tables"):
                            logger.info(f"  tables数量: {len(sd.get('tables', []))}")
                            if sd["tables"]:
                                first_table = sd["tables"][0]
                                logger.info(f"  第一表格: headers={first_table.get('headers', [])[:3]}..., rows数量={len(first_table.get('rows', []))}")
                        source_docs.append(SourceDocument(
                            doc_id=doc_id,
                            filename=doc.get("metadata", {}).get("original_filename", "unknown"),
                            doc_type=doc.get("doc_type", "unknown"),
-                            content=doc.get("content", ""),
+                            content=doc_content,
-                            structured_data=doc.get("structured_data", {})
+                            structured_data=sd
                        ))
                        logger.info(f"从MongoDB加载文档: {doc_id}")
                except Exception as e:
                    logger.error(f"从MongoDB加载文档失败 {doc_id}: {str(e)}")
@@ -179,10 +315,48 @@ class TemplateFillService:
                        # result.data 的结构取决于解析器类型:
                        # - Excel 单 sheet: {columns: [...], rows: [...], row_count, column_count}
                        # - Excel 多 sheet: {sheets: {sheet_name: {columns, rows, ...}}}
                        # - Markdown: {content: "...", tables: [...], structured_data: {tables: [...]}}
                        # - Word/TXT: {content: "...", structured_data: {...}}
                        doc_data = result.data if result.data else {}
                        doc_content = doc_data.get("content", "") if isinstance(doc_data, dict) else ""
-                        doc_structured = doc_data if isinstance(doc_data, dict) and "rows" in doc_data or isinstance(doc_data, dict) and "sheets" in doc_data else {}
+
                        # 检查并提取 structured_data
                        doc_structured = {}
                        if isinstance(doc_data, dict):
                            logger.info(f"文档 {file_path} doc_data keys: {list(doc_data.keys())}")
                            # Excel 多 sheet
                            if "sheets" in doc_data:
                                doc_structured = doc_data
                                logger.info(f"  -> 使用 Excel 多 sheet 格式")
                            # Excel 单 sheet 或有 rows 的格式
                            elif "rows" in doc_data:
                                doc_structured = doc_data
                                logger.info(f"  -> 使用 rows 格式，列数: {len(doc_data.get('columns', []))}")
                            # Markdown 格式：tables 可能直接在 doc_data.tables 或在 structured_data.tables 中
                            elif "tables" in doc_data and doc_data["tables"]:
                                # Markdown: tables 直接在 doc_data 中
                                tables = doc_data["tables"]
                                first_table = tables[0]
                                doc_structured = {
                                    "headers": first_table.get("headers", []),
                                    "rows": first_table.get("rows", [])
                                }
                                logger.info(f"  -> 使用 doc_data.tables 格式，表头: {doc_structured.get('headers', [])[:5]}")
                            elif "structured_data" in doc_data and isinstance(doc_data["structured_data"], dict):
                                # Markdown: tables 在 structured_data 中
                                tables = doc_data["structured_data"].get("tables", [])
                                if tables:
                                    first_table = tables[0]
                                    doc_structured = {
                                        "headers": first_table.get("headers", []),
                                        "rows": first_table.get("rows", [])
                                    }
                                    logger.info(f"  -> 使用 structured_data.tables 格式，表头: {doc_structured.get('headers', [])[:5]}")
                                else:
                                    logger.warning(f"  -> structured_data.tables 为空")
                            else:
                                logger.warning(f"  -> 未识别的文档格式，无 structured_data")
                        source_docs.append(SourceDocument(
                            doc_id=file_path,
@@ -279,7 +453,7 @@ class TemplateFillService:
            response = await self.llm.chat(
                messages=messages,
                temperature=0.1,
-                max_tokens=50000
+                max_tokens=4000
            )
            content = self.llm.extract_message_content(response)
@@ -377,6 +551,137 @@ class TemplateFillService:
                confidence=0.0
            )
    async def _verify_field_value(
        self,
        field: TemplateField,
        extracted_values: List[str],
        source_docs: List[SourceDocument],
        user_hint: Optional[str] = None
    ) -> Optional[FillResult]:
        """
        验证并修正提取的字段值
        Args:
            field: 字段定义
            extracted_values: 已提取的值
            source_docs: 源文档列表
            user_hint: 用户提示
        Returns:
            验证后的结果，如果验证通过返回None（使用原结果）
        """
        if not extracted_values or not extracted_values[0]:
            return None
        if not source_docs:
            return None
        try:
            # 构建验证上下文
            context_text = self._build_context_text(source_docs, field_name=field.name, max_length=15000)
            hint_text = field.hint if field.hint else f"请理解{field.name}字段的含义"
            if user_hint:
                hint_text = f"{user_hint}。{hint_text}"
            prompt = f"""你是一个数据质量审核专家。请审核以下提取的数据是否合理。
 【待审核字段】
 字段名：{field.name}
 字段说明：{hint_text}
 【已提取的值】
 {extracted_values[:10]}  # 最多审核前10个值
 【源文档上下文】
 {context_text[:8000]}
 【审核要求】
 1. 这些值是否符合字段的含义？
 2. 值在原文中的原始含义是什么？检查是否有误解或误提取
 3. 是否存在明显错误、空值或不合理的数据？
 4. 如果表格有多个列，请确认提取的是正确的列
 请严格按照以下 JSON 格式输出（只需输出 JSON，不要其他内容）：
 {{
    "is_valid": true或false,
    "corrected_values": ["修正后的值列表"] 或 null（如果无需修正）,
    "reason": "审核说明，解释判断理由",
    "original_meaning": "值在原文中的原始含义描述"
 }}
 """
            messages = [
                {"role": "system", "content": "你是一个严格的数据质量审核专家。请仔细核对原文和提取的值是否匹配。"},
                {"role": "user", "content": prompt}
            ]
            response = await self.llm.chat(
                messages=messages,
                temperature=0.2,
                max_tokens=3000
            )
            content = self.llm.extract_message_content(response)
            logger.info(f"字段 {field.name} 审核返回: {content[:300]}")
            # 解析 JSON
            import json
            import re
            cleaned = content.strip()
            cleaned = re.sub(r'^```json\s*', '', cleaned, flags=re.MULTILINE)
            cleaned = re.sub(r'^```\s*', '', cleaned, flags=re.MULTILINE)
            cleaned = cleaned.strip()
            json_start = -1
            for i, c in enumerate(cleaned):
                if c == '{':
                    json_start = i
                    break
            if json_start == -1:
                logger.warning(f"字段 {field.name} 审核：无法找到 JSON")
                return None
            json_text = cleaned[json_start:]
            result = json.loads(json_text)
            is_valid = result.get("is_valid", True)
            corrected_values = result.get("corrected_values")
            reason = result.get("reason", "")
            original_meaning = result.get("original_meaning", "")
            logger.info(f"字段 {field.name} 审核结果: is_valid={is_valid}, reason={reason[:100]}")
            if not is_valid and corrected_values:
                # 值有问题且有修正建议，使用修正后的值
                logger.info(f"字段 {field.name} 使用修正后的值: {corrected_values[:5]}")
                return FillResult(
                    field=field.name,
                    values=corrected_values,
                    value=corrected_values[0] if corrected_values else "",
                    source=f"AI审核修正: {reason[:100]}",
                    confidence=0.7
                )
            elif not is_valid and original_meaning:
                # 值有问题但无修正，记录原始含义供用户参考
                logger.info(f"字段 {field.name} 审核发现问题: {original_meaning}")
                return FillResult(
                    field=field.name,
                    values=extracted_values,
                    value=extracted_values[0] if extracted_values else "",
                    source=f"AI审核疑问: {original_meaning[:100]}",
                    confidence=0.5
                )
            # 验证通过，返回 None 表示使用原结果
            return None
        except Exception as e:
            logger.error(f"字段 {field.name} 审核失败: {str(e)}")
            return None
    def _build_context_text(self, source_docs: List[SourceDocument], field_name: str = None, max_length: int = 8000) -> str:
        """
        构建上下文文本
@@ -529,7 +834,8 @@ class TemplateFillService:
    async def get_template_fields_from_file(
        self,
        file_path: str,
-        file_type: str = "xlsx"
+        file_type: str = "xlsx",
        source_contents: List[dict] = None
    ) -> List[TemplateField]:
        """
        从模板文件提取字段定义
@@ -537,11 +843,14 @@ class TemplateFillService:
        Args:
            file_path: 模板文件路径
            file_type: 文件类型 (xlsx/xls/docx)
            source_contents: 源文档内容列表（用于 AI 生成表头）
        Returns:
            字段列表
        """
        fields = []
        if source_contents is None:
            source_contents = []
        try:
            if file_type in ["xlsx", "xls"]:
@@ -557,8 +866,8 @@ class TemplateFillService:
            )
            if needs_ai_generation:
-                logger.info(f"模板表头为空或自动生成，尝试 AI 生成表头... (fields={len(fields)})")
+                logger.info(f"模板表头为空或自动生成，尝试 AI 生成表头... (fields={len(fields)}, source_docs={len(source_contents)})")
-                ai_fields = await self._generate_fields_with_ai(file_path, file_type)
+                ai_fields = await self._generate_fields_with_ai(file_path, file_type, source_contents)
                if ai_fields:
                    fields = ai_fields
                    logger.info(f"AI 生成表头成功: {len(fields)} 个字段")
@@ -738,7 +1047,7 @@ class TemplateFillService:
    def _extract_values_from_structured_data(self, source_docs: List[SourceDocument], field_name: str) -> List[str]:
        """
-        从结构化数据（Excel rows）中直接提取指定列的值
+        从结构化数据（Excel rows 或 Markdown tables）中直接提取指定列的值
        适用于有 rows 结构的文档数据，无需 LLM 即可提取
@@ -750,10 +1059,15 @@ class TemplateFillService:
            值列表，如果无法提取则返回空列表
        """
        all_values = []
        logger.info(f"[_extract_values_from_structured_data] 开始提取字段: {field_name}")
        logger.info(f"  source_docs 数量: {len(source_docs)}")
-        for doc in source_docs:
+        for doc_idx, doc in enumerate(source_docs):
            # 尝试从 structured_data 中提取
            structured = doc.structured_data
            logger.info(f"  文档[{doc_idx}]: {doc.filename}, structured类型: {type(structured)}, 是否为空: {not bool(structured)}")
            if structured:
                logger.info(f"    structured_data keys: {list(structured.keys())}")
            if not structured:
                continue
@@ -773,6 +1087,33 @@ class TemplateFillService:
                if all_values:
                    break
            # 处理 Markdown 表格格式: {headers: [...], rows: [...], ...}
            elif structured.get("headers") and structured.get("rows"):
                headers = structured.get("headers", [])
                rows = structured.get("rows", [])
                values = self._extract_values_from_markdown_table(headers, rows, field_name)
                if values:
                    all_values.extend(values)
                    logger.info(f"从 Markdown 文档 {doc.filename} 提取到 {len(values)} 个值")
                    break
            # 处理 MongoDB 存储的 tables 格式: {tables: [{headers, rows, ...}, ...]}
            elif structured.get("tables") and isinstance(structured.get("tables"), list):
                tables = structured.get("tables", [])
                logger.info(f"  检测到 tables 格式，共 {len(tables)} 个表")
                for table_idx, table in enumerate(tables):
                    if isinstance(table, dict):
                        headers = table.get("headers", [])
                        rows = table.get("rows", [])
                        logger.info(f"  表格[{table_idx}]: headers={headers[:3]}..., rows数量={len(rows)}")
                        values = self._extract_values_from_markdown_table(headers, rows, field_name)
                        if values:
                            all_values.extend(values)
                            logger.info(f"从表格[{table_idx}] 提取到 {len(values)} 个值")
                            break
                if all_values:
                    break
            # 处理单 sheet 格式: {columns: [...], rows: [...]}
            elif structured.get("rows"):
                columns = structured.get("columns", [])
@@ -800,6 +1141,100 @@ class TemplateFillService:
        return all_values
    def _extract_values_from_markdown_table(self, headers: List, rows: List, field_name: str) -> List[str]:
        """
        Extract the values of one column from a table given as headers + rows.

        Rows are normally positional sequences aligned with ``headers``
        (``[["val1", "val2", ...], ...]``). Rows that are dicts keyed by
        header are supported as well, matching how dict rows are handled by
        ``_extract_column_values``.

        Args:
            headers: List of column headers.
            rows: List of data rows.
            field_name: Name of the field whose column should be extracted.

        Returns:
            One formatted string per row (an empty value is used for rows that
            are too short or of an unsupported type); an empty list when the
            table is empty or no column matches ``field_name``.
        """
        if not rows or not headers:
            logger.warning(f"Markdown 表格为空: headers={headers}, rows={len(rows) if rows else 0}")
            return []
        # Locate the column with the shared fuzzy-matching helper.
        target_idx = self._find_best_matching_column(headers, field_name)
        if target_idx is None:
            logger.warning(f"未找到匹配列: {field_name}, 可用表头: {headers}")
            return []
        target_header = headers[target_idx]
        logger.info(f"列匹配成功: {field_name} -> {target_header} (索引: {target_idx})")
        values = []
        for row in rows:
            if isinstance(row, dict):
                # Header-keyed row: look the cell up by the matched header.
                val = row.get(target_header, "")
            elif isinstance(row, (list, tuple)) and target_idx < len(row):
                val = row[target_idx]
            else:
                # Short or unsupported row: keep row alignment with a blank.
                val = ""
            values.append(self._format_value(val))
        return values
    def _find_best_matching_column(self, headers: List, field_name: str) -> Optional[int]:
        """
        查找最佳匹配的列索引
        使用多层匹配策略:
        1. 精确匹配（忽略大小写）
        2. 子字符串匹配（字段名在表头中，或表头在字段名中）
        3. 关键词重叠匹配（中文字符串分割后比对）
        Args:
            headers: 表头列表
            field_name: 要匹配的字段名
        Returns:
            匹配的列索引，找不到返回 None
        """
        field_lower = field_name.lower().strip()
        field_keywords = set(field_lower.replace(" ", "").split())
        best_match_idx = None
        best_match_score = 0
        for idx, header in enumerate(headers):
            header_str = str(header).strip()
            header_lower = header_str.lower()
            # 策略1: 精确匹配（忽略大小写）
            if header_lower == field_lower:
                return idx
            # 策略2: 子字符串匹配
            if field_lower in header_lower or header_lower in field_lower:
                # 计算匹配分数（较长匹配更优先）
                score = max(len(field_lower), len(header_lower)) / min(len(field_lower) + 1, len(header_lower) + 1)
                if score > best_match_score:
                    best_match_score = score
                    best_match_idx = idx
                continue
            # 策略3: 关键词重叠匹配（适用于中文）
            header_keywords = set(header_lower.replace(" ", "").split())
            overlap = field_keywords & header_keywords
            if overlap and len(overlap) > 0:
                score = len(overlap) / max(len(field_keywords), len(header_keywords), 1)
                if score > best_match_score:
                    best_match_score = score
                    best_match_idx = idx
        # 只有当匹配分数超过阈值时才返回
        if best_match_score >= 0.3:
            logger.info(f"模糊匹配: {field_name} -> {headers[best_match_idx]} (分数: {best_match_score:.2f})")
            return best_match_idx
        return None
    def _extract_column_values(self, rows: List, columns: List, field_name: str) -> List[str]:
        """
        从 rows 和 columns 中提取指定列的值
@@ -815,30 +1250,70 @@ class TemplateFillService:
        if not rows or not columns:
            return []
-        # 查找匹配的列（模糊匹配）
+        # 使用增强的匹配算法查找最佳匹配的列索引
-        target_col = None
+        target_idx = self._find_best_matching_column(columns, field_name)
        for col in columns:
            col_str = str(col)
            if field_name.lower() in col_str.lower() or col_str.lower() in field_name.lower():
                target_col = col
                break
-        if not target_col:
+        if target_idx is None:
            logger.warning(f"未找到匹配列: {field_name}, 可用列: {columns}")
            return []
        target_col = columns[target_idx]
        logger.info(f"列匹配成功: {field_name} -> {target_col} (索引: {target_idx})")
        values = []
        for row in rows:
            if isinstance(row, dict):
                val = row.get(target_col, "")
-            elif isinstance(row, list) and target_col in columns:
+            elif isinstance(row, list) and target_idx < len(row):
-                val = row[columns.index(target_col)]
+                val = row[target_idx]
            else:
                val = ""
-            values.append(str(val) if val is not None else "")
+            values.append(self._format_value(val))
        return values
    def _format_value(self, val: Any) -> str:
        """
        格式化值为字符串，保持原始格式
        - 如果是浮点数但实际上等于整数，返回整数格式（如 3.0 -> "3"）
        - 如果是浮点数且有小数部分，保留小数（如 3.5 -> "3.5"）
        - 如果是整数，直接返回（如 3 -> "3"）
        - 其他类型直接转为字符串
        Args:
            val: 原始值
        Returns:
            格式化后的字符串
        """
        if val is None:
            return ""
        # 如果已经是字符串
        if isinstance(val, str):
            return val.strip()
        # 如果是布尔值
        if isinstance(val, bool):
            return "true" if val else "false"
        # 如果是数字
        if isinstance(val, (int, float)):
            # 检查是否是浮点数但等于整数
            if isinstance(val, float):
                # 检查是否是小数部分为0
                if val == int(val):
                    return str(int(val))
                else:
                    # 去除尾部多余的0，但保留必要的小数位
                    formatted = f"{val:.10f}".rstrip('0').rstrip('.')
                    return formatted
            else:
                return str(val)
        return str(val)
    def _extract_values_from_json(self, result) -> List[str]:
        """
        从解析后的 JSON 对象/数组中提取值数组
@@ -852,12 +1327,12 @@ class TemplateFillService:
        if isinstance(result, dict):
            # 优先找 values 数组
            if "values" in result and isinstance(result["values"], list):
-                vals = [str(v).strip() for v in result["values"] if v and str(v).strip()]
+                vals = [self._format_value(v).strip() for v in result["values"] if self._format_value(v).strip()]
                if vals:
                    return vals
            # 尝试找 value 字段
            if "value" in result:
-                val = str(result["value"]).strip()
+                val = self._format_value(result["value"]).strip()
                if val:
                    return [val]
            # 尝试找任何数组类型的键
@@ -865,13 +1340,13 @@ class TemplateFillService:
                val = result[key]
                if isinstance(val, list) and len(val) > 0:
                    if all(isinstance(v, (str, int, float, bool)) or v is None for v in val):
-                        vals = [str(v).strip() for v in val if v is not None and str(v).strip()]
+                        vals = [self._format_value(v).strip() for v in val if v is not None and self._format_value(v).strip()]
                        if vals:
                            return vals
                elif isinstance(val, (str, int, float, bool)):
-                    return [str(val).strip()]
+                    return [self._format_value(val).strip()]
        elif isinstance(result, list):
-            vals = [str(v).strip() for v in result if v is not None and str(v).strip()]
+            vals = [self._format_value(v).strip() for v in result if v is not None and self._format_value(v).strip()]
            if vals:
                return vals
        return []
@@ -1008,15 +1483,15 @@ class TemplateFillService:
            if isinstance(parsed, dict):
                # 如果是 {"values": [...]} 格式，提取 values
                if "values" in parsed and isinstance(parsed["values"], list):
-                    return [str(v).strip() for v in parsed["values"] if v and str(v).strip()]
+                    return [self._format_value(v).strip() for v in parsed["values"] if self._format_value(v).strip()]
                # 如果是其他 dict 格式，尝试找 values 键
                for key in ["values", "value", "data", "result"]:
                    if key in parsed and isinstance(parsed[key], list):
-                        return [str(v).strip() for v in parsed[key] if v and str(v).strip()]
+                        return [self._format_value(v).strip() for v in parsed[key] if self._format_value(v).strip()]
                    elif key in parsed:
-                        return [str(parsed[key]).strip()]
+                        return [self._format_value(parsed[key]).strip()]
            elif isinstance(parsed, list):
-                return [str(v).strip() for v in parsed if v and str(v).strip()]
+                return [self._format_value(v).strip() for v in parsed if self._format_value(v).strip()]
        except (json.JSONDecodeError, TypeError):
            pass
@@ -1032,14 +1507,14 @@ class TemplateFillService:
                        result = []
                        for item in arr:
                            if isinstance(item, dict) and "values" in item and isinstance(item["values"], list):
-                                result.extend([str(v).strip() for v in item["values"] if v and str(v).strip()])
+                                result.extend([self._format_value(v).strip() for v in item["values"] if self._format_value(v).strip()])
                            elif isinstance(item, dict):
                                result.append(str(item))
                            else:
-                                result.append(str(item))
+                                result.append(self._format_value(item))
                        if result:
                            return result
-                    return [str(v).strip() for v in arr if v and str(v).strip()]
+                    return [self._format_value(v).strip() for v in arr if self._format_value(v).strip()]
            except:
                pass
@@ -1130,27 +1605,37 @@ class TemplateFillService:
                    hint_text = f"{user_hint}。{hint_text}"
                # 构建针对字段提取的提示词
-                prompt = f"""你是一个专业的数据提取专家。请从以下文档内容中提取与"{field.name}"相关的所有数据。
+                prompt = f"""你是一个专业的数据提取专家。请从以下文档内容中提取与"{field.name}"完全匹配的数据。
-字段提示: {hint_text}
+【重要】字段名: "{field.name}"
 【重要】字段提示: {hint_text}
 请严格按照以下步骤操作：
 1. 在文档中搜索与"{field.name}"完全相同或高度相关的关键词
 2. 找到后，提取该关键词后的数值（注意：只要数值，不要单位）
 3. 如果是表格中的数据，直接提取该单元格的数值
 4. 如果是段落描述，在关键词附近找数值
 【重要】返回值规则：
 - 只返回纯数值，不要单位（如 "4.9" 而不是 "4.9万亿元"）
 - 如果原文是"4.9万亿元"，返回 "4.9"
 - 如果原文是"144000万册"，返回 "144000"
 - 如果是百分比如"增长7.7%"，返回 "7.7"
 - 如果没有找到完全匹配的数据，返回空数组
 文档内容：
-{doc.content[:8000] if doc.content else ""}
+{doc.content[:10000] if doc.content else ""}
 请完成以下任务：
 1. 仔细阅读文档，找出所有与"{field.name}"相关的数据
 2. 如果文档中有表格数据，提取表格中的对应列值
 3. 如果文档中是段落描述，提取其中的关键数值或结论
 4. 返回提取的所有值（可能多个，用数组存储）
 请用严格的 JSON 格式返回：
 {{
-    "values": ["值1", "值2", ...],
+    "values": ["值1", "值2", ...],  // 只填数值，不要单位
    "source": "数据来源说明",
    "confidence": 0.0到1.0之间的置信度
 }}
-如果没有找到相关数据，返回空数组 values: []"""
+示例：
 - 如果字段是"图书馆总藏量（万册）"且文档说"图书总藏量14.4亿册"，返回 values: ["144000"]
 - 如果字段是"国内旅游收入（亿元）"且文档说"国内旅游收入4.9万亿元"，返回 values: ["49000"]"""
                messages = [
                    {"role": "system", "content": "你是一个专业的数据提取助手，擅长从政府统计公报等文档中提取数据。请严格按JSON格式输出。"},
@@ -1160,7 +1645,7 @@ class TemplateFillService:
                response = await self.llm.chat(
                    messages=messages,
                    temperature=0.1,
-                    max_tokens=5000
+                    max_tokens=4000
                )
                content = self.llm.extract_message_content(response)
@@ -1225,7 +1710,8 @@ class TemplateFillService:
    async def _generate_fields_with_ai(
        self,
        file_path: str,
-        file_type: str
+        file_type: str,
        source_contents: List[dict] = None
    ) -> Optional[List[TemplateField]]:
        """
        使用 AI 为空表生成表头字段
@@ -1243,47 +1729,87 @@ class TemplateFillService:
            import pandas as pd
            # 读取 Excel 内容检查是否为空
            content_sample = ""
            if file_type in ["xlsx", "xls"]:
                df = pd.read_excel(file_path, header=None)
                if df.shape[0] == 0 or df.shape[1] == 0:
                    logger.info("Excel 表格为空")
-                    # 生成默认字段
+                    # 即使 Excel 为空，如果有源文档，仍然尝试使用 AI 生成表头
-                    return [TemplateField(
+                    if not source_contents:
-                        cell=self._column_to_cell(i),
+                        logger.info("Excel 为空且没有源文档，使用默认字段名")
-                        name=f"字段{i+1}",
+                        return [TemplateField(
-                        field_type="text",
+                            cell=self._column_to_cell(i),
-                        required=False,
+                            name=f"字段{i+1}",
-                        hint="请填写此字段"
+                            field_type="text",
-                    ) for i in range(5)]
+                            required=False,
-
+                            hint="请填写此字段"
-                # 表格有数据但没有表头
+                        ) for i in range(5)]
-                if df.shape[1] > 0:
+                    # 有源文档，继续调用 AI 生成表头
-                    # 读取第一行作为参考，看是否为空
+                    logger.info("Excel 为空但有源文档，使用源文档内容生成表头...")
                    first_row = df.iloc[0].tolist() if len(df) > 0 else []
                    if not any(pd.notna(v) and str(v).strip() != '' for v in first_row):
                        # 第一行为空，AI 生成表头
                        content_sample = df.iloc[:10].to_string() if len(df) >= 10 else df.to_string()
                    else:
                        content_sample = df.to_string()
                else:
-                    content_sample = ""
+                    # 表格有数据但没有表头
                    if df.shape[1] > 0:
                        # 读取第一行作为参考，看是否为空
                        first_row = df.iloc[0].tolist() if len(df) > 0 else []
                        if not any(pd.notna(v) and str(v).strip() != '' for v in first_row):
                            # 第一行为空，AI 生成表头
                            content_sample = df.iloc[:10].to_string() if len(df) >= 10 else df.to_string()
                        else:
                            content_sample = df.to_string()
                    else:
                        content_sample = ""
            # 调用 AI 生成表头
-            prompt = f"""你是一个专业的表格设计助手。请为以下空白表格生成合适的表头字段。
+            # 根据源文档内容生成表头
            source_info = ""
            logger.info(f"[DEBUG] _generate_fields_with_ai received source_contents: {len(source_contents) if source_contents else 0} items")
            if source_contents:
                for sc in source_contents:
                    logger.info(f"[DEBUG]   source doc: filename={sc.get('filename')}, content_len={len(sc.get('content', ''))}, titles={len(sc.get('titles', []))}, tables_count={sc.get('tables_count', 0)}, has_tables_summary={bool(sc.get('tables_summary'))}")
                source_info = "\n\n【源文档内容摘要】（根据以下文档内容生成表头）：\n"
                for idx, src in enumerate(source_contents[:5]):  # 最多5个源文档
                    filename = src.get("filename", f"文档{idx+1}")
                    doc_type = src.get("doc_type", "unknown")
                    content = src.get("content", "")[:3000]  # 限制内容长度
                    titles = src.get("titles", [])[:10]  # 最多10个标题
                    tables_count = src.get("tables_count", 0)
                    tables_summary = src.get("tables_summary", "")
-表格内容预览：
+                    source_info += f"\n--- 文档 {idx+1}: {filename} ({doc_type}) ---\n"
-{content_sample[:2000] if content_sample else "空白表格"}
+                    # 处理 titles（可能是字符串列表或字典列表）
                    if titles:
                        title_texts = []
                        for t in titles[:5]:
                            if isinstance(t, dict):
                                title_texts.append(t.get('text', ''))
                            else:
                                title_texts.append(str(t))
                        if title_texts:
                            source_info += f"【章节标题】: {', '.join(title_texts)}\n"
                    if tables_count > 0:
                        source_info += f"【包含表格数】: {tables_count}\n"
                    if tables_summary:
                        source_info += f"{tables_summary}\n"
                    elif content:
                        source_info += f"【内容预览】: {content[:1500]}...\n"
-请生成5-10个简洁的表头字段名，这些字段应该：
+            prompt = f"""你是一个专业的表格设计助手。请根据源文档内容生成合适的表格表头字段。
-1. 简洁明了，易于理解
+
-2. 适合作为表格列标题
+任务：用户有一些源文档（包含表格数据），需要填写到空白表格模板中。源文档中的表格如下：
-3. 之间有明显的区分度
+
 {source_info}
 【重要要求】
 1. 请仔细阅读上面的源文档表格，找出所有不同的列名（如"产品名称"、"1995年产量"、"按资产总额计算(%)"等）
 2. 直接使用这些实际的列名作为表头字段名，不要生成新的或同义词
 3. 如果一个源文档有多个表格，请为每个表格选择合适的列名
 4. 生成3-8个表头字段，优先选择数据量大的表格的列
 请严格按照以下 JSON 格式输出（只需输出 JSON，不要其他内容）：
 {{
    "fields": [
-        {{"name": "字段名1", "hint": "字段说明提示1"}},
+        {{"name": "实际列名1", "hint": "对该列的说明"}},
-        {{"name": "字段名2", "hint": "字段说明提示2"}}
+        {{"name": "实际列名2", "hint": "对该列的说明"}}
    ]
 }}
 """
--- a/frontend/src/App.tsx
+++ b/frontend/src/App.tsx
@@ -1,5 +1,5 @@
 import { RouterProvider } from 'react-router-dom';
-import { AuthProvider } from '@/context/AuthContext';
+import { AuthProvider } from '@/contexts/AuthContext';
 import { TemplateFillProvider } from '@/context/TemplateFillContext';
 import { router } from '@/routes';
 import { Toaster } from 'sonner';
--- a/frontend/src/components/common/RouteGuard.tsx
+++ b/frontend/src/components/common/RouteGuard.tsx
@@ -1,6 +1,6 @@
 import React from 'react';
 import { Navigate, useLocation } from 'react-router-dom';
-import { useAuth } from '@/context/AuthContext';
+import { useAuth } from '@/contexts/AuthContext';
 export const RouteGuard: React.FC<{ children: React.ReactNode }> = ({ children }) => {
  const { user, loading } = useAuth();
--- a/frontend/src/context/AuthContext.tsx
+++ b/frontend/src/context/AuthContext.tsx
@@ -1,85 +0,0 @@
 import React, { createContext, useContext, useEffect, useState } from 'react';
 import { supabase } from '@/db/supabase';
 import { User } from '@supabase/supabase-js';
 import { Profile } from '@/types/types';
 // Shape of the value exposed through AuthContext.
 interface AuthContextType {
  // Supabase user of the current session, or null when there is none.
  user: User | null;
  // Row loaded from the 'profiles' table for the current user, or null.
  profile: Profile | null;
  // Wraps supabase.auth.signInWithPassword.
  signIn: (email: string, password: string) => Promise<{ error: any }>;
  // Wraps supabase.auth.signUp.
  signUp: (email: string, password: string) => Promise<{ error: any }>;
  // Wraps supabase.auth.signOut.
  signOut: () => Promise<{ error: any }>;
  // True until the initial session check (and profile fetch, if any) has finished.
  loading: boolean;
 }
 const AuthContext = createContext<AuthContextType | undefined>(undefined);
 // Provider that tracks the Supabase session user and its profile row, and
 // exposes them together with sign-in / sign-up / sign-out helpers.
 export const AuthProvider: React.FC<{ children: React.ReactNode }> = ({ children }) => {
  const [user, setUser] = useState<User | null>(null);
  const [profile, setProfile] = useState<Profile | null>(null);
  // Starts as true; cleared once the session check / profile fetch completes.
  const [loading, setLoading] = useState(true);
  useEffect(() => {
    // Read the existing session once on mount and set the user from it.
    supabase.auth.getSession().then(({ data: { session } }) => {
      setUser(session?.user ?? null);
      // With a user, fetchProfile clears `loading` in its finally block;
      // without one, clear it here.
      if (session?.user) fetchProfile(session.user.id);
      else setLoading(false);
    });
    // Listen for changes on auth state (sign in, sign out, etc.)
    const { data: { subscription } } = supabase.auth.onAuthStateChange((_event, session) => {
      setUser(session?.user ?? null);
      if (session?.user) fetchProfile(session.user.id);
      else {
        // No user in the new session: drop the previously loaded profile.
        setProfile(null);
        setLoading(false);
      }
    });
    // Stop listening when the provider unmounts.
    return () => subscription.unsubscribe();
  }, []);
  // Load the 'profiles' row whose id equals `uid`. Errors are logged, not
  // rethrown; `loading` is cleared in every case.
  const fetchProfile = async (uid: string) => {
    try {
      const { data, error } = await supabase
        .from('profiles')
        .select('*')
        .eq('id', uid)
        .maybeSingle();
      if (error) throw error;
      setProfile(data);
    } catch (err) {
      console.error('Error fetching profile:', err);
    } finally {
      setLoading(false);
    }
  };
  // Thin wrappers that return the Supabase auth responses unchanged.
  const signIn = async (email: string, password: string) => {
    return await supabase.auth.signInWithPassword({ email, password });
  };
  const signUp = async (email: string, password: string) => {
    return await supabase.auth.signUp({ email, password });
  };
  const signOut = async () => {
    return await supabase.auth.signOut();
  };
  return (
    <AuthContext.Provider value={{ user, profile, signIn, signUp, signOut, loading }}>
      {children}
    </AuthContext.Provider>
  );
 };
 // Hook returning the current AuthContext value.
 // Throws when it is called outside of an AuthProvider.
 export const useAuth = () => {
  const authValue = useContext(AuthContext);
  if (authValue !== undefined) {
    return authValue;
  }
  throw new Error('useAuth must be used within an AuthProvider');
 };
--- a/frontend/src/context/TemplateFillContext.tsx
+++ b/frontend/src/context/TemplateFillContext.tsx
@@ -21,6 +21,7 @@ interface TemplateFillState {
  templateFields: TemplateField[];
  sourceFiles: SourceFile[];
  sourceFilePaths: string[];
  sourceDocIds: string[];
  templateId: string;
  filledResult: any;
  setStep: (step: Step) => void;
@@ -30,6 +31,9 @@ interface TemplateFillState {
  addSourceFiles: (files: SourceFile[]) => void;
  removeSourceFile: (index: number) => void;
  setSourceFilePaths: (paths: string[]) => void;
  setSourceDocIds: (ids: string[]) => void;
  addSourceDocId: (id: string) => void;
  removeSourceDocId: (id: string) => void;
  setTemplateId: (id: string) => void;
  setFilledResult: (result: any) => void;
  reset: () => void;
@@ -41,6 +45,7 @@ const initialState = {
  templateFields: [],
  sourceFiles: [],
  sourceFilePaths: [],
  sourceDocIds: [],
  templateId: '',
  filledResult: null,
  setStep: () => {},
@@ -50,6 +55,9 @@ const initialState = {
  addSourceFiles: () => {},
  removeSourceFile: () => {},
  setSourceFilePaths: () => {},
  setSourceDocIds: () => {},
  addSourceDocId: () => {},
  removeSourceDocId: () => {},
  setTemplateId: () => {},
  setFilledResult: () => {},
  reset: () => {},
@@ -63,6 +71,7 @@ export const TemplateFillProvider: React.FC<{ children: ReactNode }> = ({ childr
  const [templateFields, setTemplateFields] = useState<TemplateField[]>([]);
  const [sourceFiles, setSourceFiles] = useState<SourceFile[]>([]);
  const [sourceFilePaths, setSourceFilePaths] = useState<string[]>([]);
  const [sourceDocIds, setSourceDocIds] = useState<string[]>([]);
  const [templateId, setTemplateId] = useState<string>('');
  const [filledResult, setFilledResult] = useState<any>(null);
@@ -74,12 +83,21 @@ export const TemplateFillProvider: React.FC<{ children: ReactNode }> = ({ childr
    setSourceFiles(prev => prev.filter((_, i) => i !== index));
  };
  // Track a source document id; an id that is already present is not added again.
  const addSourceDocId = (id: string) => {
    setSourceDocIds(current => {
      if (current.includes(id)) {
        return current;
      }
      return [...current, id];
    });
  };
  // Stop tracking a source document id (every occurrence is removed).
  const removeSourceDocId = (id: string) => {
    setSourceDocIds(current => current.filter(existingId => existingId !== id));
  };
  // Return to the 'upload' step and clear the template, source-file,
  // source-document and fill-result state.
  const reset = () => {
    setStep('upload');
    setTemplateFile(null);
    setTemplateFields([]);
    setSourceFiles([]);
    setSourceFilePaths([]);
    setSourceDocIds([]);
    setTemplateId('');
    setFilledResult(null);
  };
@@ -92,6 +110,7 @@ export const TemplateFillProvider: React.FC<{ children: ReactNode }> = ({ childr
        templateFields,
        sourceFiles,
        sourceFilePaths,
        sourceDocIds,
        templateId,
        filledResult,
        setStep,
@@ -101,6 +120,9 @@ export const TemplateFillProvider: React.FC<{ children: ReactNode }> = ({ childr
        addSourceFiles,
        removeSourceFile,
        setSourceFilePaths,
        setSourceDocIds,
        addSourceDocId,
        removeSourceDocId,
        setTemplateId,
        setFilledResult,
        reset,
--- a/frontend/src/db/backend-api.ts
+++ b/frontend/src/db/backend-api.ts
@@ -400,6 +400,49 @@ export const backendApi = {
    }
  },
  /**
   * Fetch the task history list.
   *
   * @param limit Maximum number of tasks to request (default 50).
   * @param skip Number of tasks to skip (default 0).
   * @returns The parsed JSON response body.
   * @throws Error carrying the backend's `detail` message, or a fallback
   *         message, when the response status is not OK.
   */
  async getTasks(
    limit: number = 50,
    skip: number = 0
  ): Promise<{ success: boolean; tasks: any[]; count: number }> {
    const url = `${BACKEND_BASE_URL}/tasks?limit=${limit}&skip=${skip}`;

    try {
      const response = await fetch(url);
      if (!response.ok) {
        // Error bodies are not guaranteed to be JSON (e.g. an HTML error page
        // from a proxy). Fall back to an empty object so the fallback message
        // below is reported instead of a JSON parse error.
        const error = await response.json().catch(() => ({}));
        throw new Error(error?.detail || '获取任务列表失败');
      }
      return await response.json();
    } catch (error) {
      console.error('获取任务列表失败:', error);
      throw error;
    }
  },
  /**
   * Delete a task.
   *
   * @param taskId Identifier of the task to delete.
   * @returns The parsed JSON response body.
   * @throws Error carrying the backend's `detail` message, or a fallback
   *         message, when the response status is not OK.
   */
  async deleteTask(taskId: string): Promise<{ success: boolean; deleted: boolean }> {
    // Encode the id so characters such as '/', '?' or '#' cannot alter the request path.
    const url = `${BACKEND_BASE_URL}/tasks/${encodeURIComponent(taskId)}`;

    try {
      const response = await fetch(url, {
        method: 'DELETE'
      });
      if (!response.ok) {
        // Error bodies are not guaranteed to be JSON; fall back to an empty
        // object so the fallback message is reported instead of a parse error.
        const error = await response.json().catch(() => ({}));
        throw new Error(error?.detail || '删除任务失败');
      }
      return await response.json();
    } catch (error) {
      console.error('删除任务失败:', error);
      throw error;
    }
  },
  /**
   * 轮询任务状态直到完成
   */
@@ -1145,7 +1188,7 @@ export const aiApi = {
    try {
      const response = await fetch(url, {
-        method: 'GET',
+        method: 'POST',
        body: formData,
      });
--- a/frontend/src/pages/Documents.tsx
+++ b/frontend/src/pages/Documents.tsx
@@ -1,4 +1,4 @@
-import React, { useState, useEffect, useCallback } from 'react';
+import React, { useState, useEffect, useCallback, useRef } from 'react';
 import { useDropzone } from 'react-dropzone';
 import {
  FileText,
@@ -23,7 +23,8 @@ import {
  List,
  MessageSquareCode,
  Tag,
-  HelpCircle
+  HelpCircle,
  Plus
 } from 'lucide-react';
 import { Button } from '@/components/ui/button';
 import { Input } from '@/components/ui/input';
@@ -72,8 +73,10 @@ const Documents: React.FC = () => {
  // 上传相关状态
  const [uploading, setUploading] = useState(false);
  const [uploadedFile, setUploadedFile] = useState<File | null>(null);
  const [uploadedFiles, setUploadedFiles] = useState<File[]>([]);
  const [parseResult, setParseResult] = useState<ExcelParseResult | null>(null);
  const [expandedSheet, setExpandedSheet] = useState<string | null>(null);
  const [uploadExpanded, setUploadExpanded] = useState(false);
  // AI 分析相关状态
  const [analyzing, setAnalyzing] = useState(false);
@@ -210,75 +213,119 @@ const Documents: React.FC = () => {
  // 文件上传处理
  const onDrop = async (acceptedFiles: File[]) => {
-    const file = acceptedFiles[0];
+    if (acceptedFiles.length === 0) return;
    if (!file) return;
    setUploadedFile(file);
    setUploading(true);
-    setParseResult(null);
+    let successCount = 0;
-    setAiAnalysis(null);
+    let failCount = 0;
-    setAnalysisCharts(null);
+    const successfulFiles: File[] = [];
    setExpandedSheet(null);
    setMdAnalysis(null);
    setMdSections([]);
    setMdStreamingContent('');
-    const ext = file.name.split('.').pop()?.toLowerCase();
+    // 逐个上传文件
    for (const file of acceptedFiles) {
      const ext = file.name.split('.').pop()?.toLowerCase();
-    try {
+      try {
-      // Excel 文件使用专门的上传接口
+        if (ext === 'xlsx' || ext === 'xls') {
-      if (ext === 'xlsx' || ext === 'xls') {
+          const result = await backendApi.uploadExcel(file, {
-        const result = await backendApi.uploadExcel(file, {
+            parseAllSheets: parseOptions.parseAllSheets,
-          parseAllSheets: parseOptions.parseAllSheets,
+            headerRow: parseOptions.headerRow
-          headerRow: parseOptions.headerRow
+          });
-        });
+          if (result.success) {
-        if (result.success) {
+            successCount++;
-          toast.success(`解析成功: ${file.name}`);
+            successfulFiles.push(file);
-          setParseResult(result);
+            // 第一个Excel文件设置解析结果供预览
-          loadDocuments(); // 刷新文档列表
+            if (successCount === 1) {
-          if (result.metadata?.sheet_count === 1) {
+              setUploadedFile(file);
-            setExpandedSheet(Object.keys(result.data?.sheets || {})[0] || null);
+              setParseResult(result);
              if (result.metadata?.sheet_count === 1) {
                setExpandedSheet(Object.keys(result.data?.sheets || {})[0] || null);
              }
            }
            loadDocuments();
          } else {
            failCount++;
            toast.error(`${file.name}: ${result.error || '解析失败'}`);
          }
        } else if (ext === 'md' || ext === 'markdown') {
          const result = await backendApi.uploadDocument(file);
          if (result.task_id) {
            successCount++;
            successfulFiles.push(file);
            if (successCount === 1) {
              setUploadedFile(file);
            }
            // 轮询任务状态
            let attempts = 0;
            const checkStatus = async () => {
              while (attempts < 30) {
                try {
                  const status = await backendApi.getTaskStatus(result.task_id);
                  if (status.status === 'success') {
                    loadDocuments();
                    return;
                  } else if (status.status === 'failure') {
                    return;
                  }
                } catch (e) {
                  console.error('检查状态失败', e);
                }
                await new Promise(resolve => setTimeout(resolve, 2000));
                attempts++;
              }
            };
            checkStatus();
          } else {
            failCount++;
          }
        } else {
-          toast.error(result.error || '解析失败');
+          // 其他文档使用通用上传接口
-        }
+          const result = await backendApi.uploadDocument(file);
-      } else if (ext === 'md' || ext === 'markdown') {
+          if (result.task_id) {
-        // Markdown 文件：获取大纲
+            successCount++;
-        await fetchMdOutline();
+            successfulFiles.push(file);
-      } else {
+            if (successCount === 1) {
-        // 其他文档使用通用上传接口
+              setUploadedFile(file);
        const result = await backendApi.uploadDocument(file);
        if (result.task_id) {
          toast.success(`文件 ${file.name} 已提交处理`);
          // 轮询任务状态
          let attempts = 0;
          const checkStatus = async () => {
            while (attempts < 30) {
              try {
                const status = await backendApi.getTaskStatus(result.task_id);
                if (status.status === 'success') {
                  toast.success(`文件 ${file.name} 处理完成`);
                  loadDocuments();
                  return;
                } else if (status.status === 'failure') {
                  toast.error(`文件 ${file.name} 处理失败`);
                  return;
                }
              } catch (e) {
                console.error('检查状态失败', e);
              }
              await new Promise(resolve => setTimeout(resolve, 2000));
              attempts++;
            }
-            toast.error(`文件 ${file.name} 处理超时`);
+            // 轮询任务状态
-          };
+            let attempts = 0;
-          checkStatus();
+            const checkStatus = async () => {
              while (attempts < 30) {
                try {
                  const status = await backendApi.getTaskStatus(result.task_id);
                  if (status.status === 'success') {
                    loadDocuments();
                    return;
                  } else if (status.status === 'failure') {
                    return;
                  }
                } catch (e) {
                  console.error('检查状态失败', e);
                }
                await new Promise(resolve => setTimeout(resolve, 2000));
                attempts++;
              }
            };
            checkStatus();
          } else {
            failCount++;
          }
        }
      } catch (error: any) {
        failCount++;
        toast.error(`${file.name}: ${error.message || '上传失败'}`);
      }
-    } catch (error: any) {
+    }
-      toast.error(error.message || '上传失败');
+
-    } finally {
+    setUploading(false);
-      setUploading(false);
+    loadDocuments();
    if (successCount > 0) {
      toast.success(`成功上传 ${successCount} 个文件`);
      setUploadedFiles(prev => [...prev, ...successfulFiles]);
      setUploadExpanded(true);
    }
    if (failCount > 0) {
      toast.error(`${failCount} 个文件上传失败`);
    }
  };
@@ -291,7 +338,7 @@ const Documents: React.FC = () => {
      'text/markdown': ['.md'],
      'text/plain': ['.txt']
    },
-    maxFiles: 1
+    multiple: true
  });
  // AI 分析处理
@@ -449,6 +496,7 @@ const Documents: React.FC = () => {
  const handleDeleteFile = () => {
    setUploadedFile(null);
    setUploadedFiles([]);
    setParseResult(null);
    setAiAnalysis(null);
    setAnalysisCharts(null);
@@ -456,6 +504,17 @@ const Documents: React.FC = () => {
    toast.success('文件已清除');
  };
  // Remove one entry from the uploaded-file list by index; when the list
  // becomes empty, also clear the currently selected file.
  const handleRemoveUploadedFile = (index: number) => {
    // The next list is computed up front: state updater functions must be
    // pure (React may invoke them twice in Strict Mode), so the dependent
    // setUploadedFile call must not run inside the setUploadedFiles updater.
    const remainingFiles = uploadedFiles.filter((_, i) => i !== index);
    setUploadedFiles(remainingFiles);
    if (remainingFiles.length === 0) {
      setUploadedFile(null);
    }
    toast.success('文件已从列表移除');
  };
  const handleDelete = async (docId: string) => {
    try {
      const result = await backendApi.deleteDocument(docId);
@@ -615,7 +674,7 @@ const Documents: React.FC = () => {
          <h1 className="text-3xl font-extrabold tracking-tight">文档中心</h1>
          <p className="text-muted-foreground">上传文档，自动解析并使用 AI 进行深度分析</p>
        </div>
-        <Button variant="outline" className="rounded-xl gap-2" onClick={loadDocuments}>
+        <Button variant="outline" className="rounded-xl gap-2" onClick={() => loadDocuments()}>
          <RefreshCcw size={18} />
          <span>刷新</span>
        </Button>
@@ -640,7 +699,82 @@ const Documents: React.FC = () => {
            </CardHeader>
            {uploadPanelOpen && (
              <CardContent className="space-y-4">
-                {!uploadedFile ? (
+                {uploadedFiles.length > 0 || uploadedFile ? (
                  <div className="space-y-3">
                    {/* 文件列表头部 */}
                    <div
                      className="flex items-center justify-between p-3 bg-muted/50 rounded-xl cursor-pointer hover:bg-muted/70 transition-colors"
                      onClick={() => setUploadExpanded(!uploadExpanded)}
                    >
                      <div className="flex items-center gap-3">
                        <div className="w-10 h-10 rounded-lg bg-primary/10 text-primary flex items-center justify-center">
                          <Upload size={20} />
                        </div>
                        <div>
                          <p className="font-semibold text-sm">
                            已上传 {(uploadedFiles.length > 0 ? uploadedFiles : [uploadedFile]).length} 个文件
                          </p>
                          <p className="text-xs text-muted-foreground">
                            {uploadExpanded ? '点击收起' : '点击展开查看'}
                          </p>
                        </div>
                      </div>
                      <div className="flex items-center gap-2">
                        <Button
                          variant="ghost"
                          size="sm"
                          onClick={(e) => {
                            e.stopPropagation();
                            handleDeleteFile();
                          }}
                          className="text-destructive hover:text-destructive"
                        >
                          <Trash2 size={14} className="mr-1" />
                          清空
                        </Button>
                        {uploadExpanded ? <ChevronUp size={16} /> : <ChevronDown size={16} />}
                      </div>
                    </div>
                    {/* 展开的文件列表 */}
                    {uploadExpanded && (
                      <div className="space-y-2 border rounded-xl p-3">
                        {(uploadedFiles.length > 0 ? uploadedFiles : [uploadedFile]).filter(Boolean).map((file, index) => (
                          <div key={index} className="flex items-center gap-3 p-2 bg-background rounded-lg">
                            <div className={cn(
                              "w-8 h-8 rounded flex items-center justify-center",
                              isExcelFile(file?.name || '') ? "bg-emerald-500/10 text-emerald-500" : "bg-blue-500/10 text-blue-500"
                            )}>
                              {isExcelFile(file?.name || '') ? <FileSpreadsheet size={16} /> : <FileText size={16} />}
                            </div>
                            <div className="flex-1 min-w-0">
                              <p className="text-sm truncate">{file?.name}</p>
                              <p className="text-xs text-muted-foreground">{formatFileSize(file?.size || 0)}</p>
                            </div>
                            <Button
                              variant="ghost"
                              size="icon"
                              className="text-destructive hover:bg-destructive/10"
                              onClick={() => handleRemoveUploadedFile(index)}
                            >
                              <Trash2 size={14} />
                            </Button>
                          </div>
                        ))}
                        {/* 继续添加按钮 */}
                        <div
                          {...getRootProps()}
                          className="flex items-center justify-center gap-2 p-3 border-2 border-dashed rounded-lg cursor-pointer hover:border-primary/50 hover:bg-primary/5 transition-colors"
                        >
                          <input {...getInputProps()} multiple={true} />
                          <Plus size={16} className="text-muted-foreground" />
                          <span className="text-sm text-muted-foreground">继续添加更多文件</span>
                        </div>
                      </div>
                    )}
                  </div>
                ) : (
                  <div
                    {...getRootProps()}
                    className={cn(
@@ -649,7 +783,7 @@ const Documents: React.FC = () => {
                      uploading && "opacity-50 pointer-events-none"
                    )}
                  >
-                    <input {...getInputProps()} />
+                    <input {...getInputProps()} multiple={true} />
                    <div className="w-14 h-14 rounded-xl bg-primary/10 text-primary flex items-center justify-center mb-4 group-hover:scale-110 transition-transform">
                      {uploading ? <Loader2 className="animate-spin" size={28} /> : <Upload size={28} />}
                    </div>
@@ -671,30 +805,6 @@ const Documents: React.FC = () => {
                      </Badge>
                    </div>
                  </div>
                ) : (
                  <div className="space-y-4">
                    <div className="flex items-center gap-3 p-3 bg-muted/30 rounded-xl">
                      <div className={cn(
                        "w-10 h-10 rounded-lg flex items-center justify-center",
                        isExcelFile(uploadedFile.name) ? "bg-emerald-500/10 text-emerald-500" : "bg-blue-500/10 text-blue-500"
                      )}>
                        {isExcelFile(uploadedFile.name) ? <FileSpreadsheet size={20} /> : <FileText size={20} />}
                      </div>
                      <div className="flex-1 min-w-0">
                        <p className="font-semibold text-sm truncate">{uploadedFile.name}</p>
                        <p className="text-xs text-muted-foreground">{formatFileSize(uploadedFile.size)}</p>
                      </div>
                      <Button variant="ghost" size="icon" className="text-destructive hover:bg-destructive/10" onClick={handleDeleteFile}>
                        <Trash2 size={16} />
                      </Button>
                    </div>
                    {isExcelFile(uploadedFile.name) && (
                      <Button onClick={() => onDrop([uploadedFile])} className="w-full" disabled={uploading}>
                        {uploading ? '解析中...' : '重新解析'}
                      </Button>
                    )}
                  </div>
                )}
              </CardContent>
            )}
--- a/frontend/src/pages/ExcelParse.tsx
+++ b/frontend/src/pages/ExcelParse.tsx
--- a/frontend/src/pages/FormFill.tsx
+++ b/frontend/src/pages/FormFill.tsx
@@ -1,603 +0,0 @@
 import React, { useState, useEffect } from 'react';
 import {
  TableProperties,
  Plus,
  FilePlus,
  CheckCircle2,
  Download,
  Clock,
  RefreshCcw,
  Sparkles,
  Zap,
  FileCheck,
  FileSpreadsheet,
  Trash2,
  ChevronDown,
  ChevronUp,
  BarChart3,
  FileText,
  TrendingUp,
  Info,
  AlertCircle,
  Loader2
 } from 'lucide-react';
 import { Button } from '@/components/ui/button';
 import { Card, CardContent, CardHeader, CardTitle, CardDescription, CardFooter } from '@/components/ui/card';
 import { Badge } from '@/components/ui/badge';
 import { useAuth } from '@/context/AuthContext';
 import { templateApi, documentApi, taskApi } from '@/db/api';
 import { backendApi, aiApi } from '@/db/backend-api';
 import { supabase } from '@/db/supabase';
 import { format } from 'date-fns';
 import { toast } from 'sonner';
 import { cn } from '@/lib/utils';
 import { Skeleton } from '@/components/ui/skeleton';
 import {
  Dialog,
  DialogContent,
  DialogHeader,
  DialogTitle,
  DialogTrigger,
  DialogFooter,
  DialogDescription
 } from '@/components/ui/dialog';
 import { Checkbox } from '@/components/ui/checkbox';
 import { ScrollArea } from '@/components/ui/scroll-area';
 import { Input } from '@/components/ui/input';
 import { Label } from '@/components/ui/label';
 import { Textarea } from '@/components/ui/textarea';
 import { Select, SelectContent, SelectItem, SelectTrigger, SelectValue } from '@/components/ui/select';
 import { useDropzone } from 'react-dropzone';
 import { Markdown } from '@/components/ui/markdown';
 type Template = any;
 type Document = any;
 type FillTask = any;
 const FormFill: React.FC = () => {
  const { profile } = useAuth();
  const [templates, setTemplates] = useState<Template[]>([]);
  const [documents, setDocuments] = useState<Document[]>([]);
  const [tasks, setTasks] = useState<any[]>([]);
  const [loading, setLoading] = useState(true);
  // Selection state
  const [selectedTemplate, setSelectedTemplate] = useState<string | null>(null);
  const [selectedDocs, setSelectedDocs] = useState<string[]>([]);
  const [creating, setCreating] = useState(false);
  const [openTaskDialog, setOpenTaskDialog] = useState(false);
  const [viewingTask, setViewingTask] = useState<any | null>(null);
  // Excel upload state
  const [excelFile, setExcelFile] = useState<File | null>(null);
  const [excelParseResult, setExcelParseResult] = useState<any>(null);
  const [excelAnalysis, setExcelAnalysis] = useState<any>(null);
  const [excelAnalyzing, setExcelAnalyzing] = useState(false);
  const [expandedSheet, setExpandedSheet] = useState<string | null>(null);
  const [aiOptions, setAiOptions] = useState({
    userPrompt: '请分析这些数据，并提取关键信息用于填表，包括数值、分类、摘要等。',
    analysisType: 'general' as 'general' | 'summary' | 'statistics' | 'insights'
  });
  /**
   * Fetch templates, documents and fill tasks for the current profile in
   * parallel and store them in component state. Does nothing while no
   * profile is available. The loading flag is cleared whether or not the
   * requests succeed.
   */
  const loadData = async () => {
    if (!profile) return;
    try {
      const userId = (profile as any).id;
      const [templateList, documentList, taskList] = await Promise.all([
        templateApi.listTemplates(userId),
        documentApi.listDocuments(userId),
        taskApi.listTasks(userId)
      ]);
      setTemplates(templateList);
      setDocuments(documentList);
      setTasks(taskList);
    } catch (err: any) {
      toast.error('数据加载失败');
    } finally {
      setLoading(false);
    }
  };
  useEffect(() => {
    loadData();
  }, [profile]);
  // Excel upload handlers
  /**
   * Dropzone callback: take the first dropped file, reject anything that is
   * not .xlsx/.xls, reset the previous Excel state, then upload the file to
   * the backend for parsing and keep the result on success.
   */
  const onExcelDrop = async (acceptedFiles: File[]) => {
    const [file] = acceptedFiles;
    if (!file) return;

    const hasExcelExtension = /\.(xlsx|xls)$/i.test(file.name);
    if (!hasExcelExtension) {
      toast.error('仅支持 .xlsx 和 .xls 格式的 Excel 文件');
      return;
    }

    // Start from a clean slate for the newly selected file.
    setExcelFile(file);
    setExcelParseResult(null);
    setExcelAnalysis(null);
    setExpandedSheet(null);

    try {
      const result = await backendApi.uploadExcel(file);
      if (!result.success) {
        toast.error(result.error || '解析失败');
        return;
      }
      toast.success(`Excel 解析成功: ${file.name}`);
      setExcelParseResult(result);
    } catch (error: any) {
      toast.error(error.message || '上传失败');
    }
  };
  const { getRootProps, getInputProps, isDragActive } = useDropzone({
    onDrop: onExcelDrop,
    accept: {
      'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet': ['.xlsx'],
      'application/vnd.ms-excel': ['.xls']
    },
    maxFiles: 1
  });
  /**
   * Run the AI analysis on the uploaded Excel file using the currently
   * selected prompt and analysis type. Requires a file that has already been
   * parsed successfully; the analyzing flag is reset when the call settles.
   */
  const handleAnalyzeExcel = async () => {
    if (!excelFile || !excelParseResult?.success) {
      toast.error('请先上传并解析 Excel 文件');
      return;
    }

    const { userPrompt, analysisType } = aiOptions;
    setExcelAnalyzing(true);
    setExcelAnalysis(null);

    try {
      const result = await aiApi.analyzeExcel(excelFile, { userPrompt, analysisType });
      if (!result.success) {
        toast.error(result.error || 'AI 分析失败');
        return;
      }
      toast.success('AI 分析完成');
      setExcelAnalysis(result);
    } catch (error: any) {
      toast.error(error.message || 'AI 分析失败');
    } finally {
      setExcelAnalyzing(false);
    }
  };
  /**
   * Acknowledge that the parsed Excel data should be used as a data source.
   * Currently this only shows a toast; no data is handed to the backend yet.
   */
  const handleUseExcelData = () => {
    if (excelParseResult?.success) {
      // Treat the parsed Excel data as a "document" in the selection list.
      toast.success('Excel 数据已添加到数据源，请在任务对话框中选择');
      // Logic for passing the Excel data to the backend task could be added here.
    } else {
      toast.error('请先解析 Excel 文件');
    }
  };
  /** Clear every piece of Excel-related state and confirm with a toast. */
  const handleDeleteExcel = () => {
    // Derived state first, then the file itself; all updates land in one render.
    setExpandedSheet(null);
    setExcelAnalysis(null);
    setExcelParseResult(null);
    setExcelFile(null);
    toast.success('Excel 文件已清除');
  };
  /**
   * Upload the template chosen in the hidden file input for the current
   * profile, then refresh the page data.
   *
   * The loading toast is replaced in place (by id) with the success or error
   * toast, so unrelated toasts are no longer dismissed along with it. The
   * input is reset afterwards so that picking the same file again fires
   * `onChange` once more.
   */
  const handleUploadTemplate = async (e: React.ChangeEvent<HTMLInputElement>) => {
    // Keep a handle on the input; it is reset once the upload settles.
    const input = e.target;
    const file = input.files?.[0];
    if (!file || !profile) return;

    const toastId = toast.loading('正在上传模板...');
    try {
      await templateApi.uploadTemplate(file, (profile as any).id);
      toast.success('模板上传成功', { id: toastId });
      loadData();
    } catch (err) {
      toast.error('上传模板失败', { id: toastId });
    } finally {
      // Allow re-selecting the same file after a success or a failure.
      input.value = '';
    }
  };
  /**
   * Create a fill task for the selected template and documents, then kick
   * off the `fill-template` edge function without waiting for it.
   *
   * The background invocation reports its outcome through toasts. The data
   * is refreshed right after the task is created and again once the
   * invocation settles, whether it succeeded, returned an error, or rejected.
   */
  const handleCreateTask = async () => {
    // NOTE(review): the dialog button is also enabled when only Excel data is
    // parsed, but this guard still requires at least one selected document.
    if (!profile || !selectedTemplate || selectedDocs.length === 0) {
      toast.error('请先选择模板和数据源文档');
      return;
    }

    setCreating(true);
    try {
      const task = await taskApi.createTask((profile as any).id, selectedTemplate, selectedDocs);
      if (task) {
        toast.success('任务已创建，正在进行智能填表...');
        setOpenTaskDialog(false);

        // Invoke the edge function in the background.
        supabase.functions
          .invoke('fill-template', { body: { taskId: task.id } })
          .then(({ error }) => {
            if (error) toast.error('填表任务执行失败');
            else toast.success('表格填写完成！');
            // Refresh in both cases so the task card shows its final status.
            loadData();
          })
          .catch(() => {
            // A rejected invocation would otherwise be an unhandled rejection.
            toast.error('填表任务执行失败');
            loadData();
          });

        loadData();
      }
    } catch (err: any) {
      toast.error('创建任务失败');
    } finally {
      setCreating(false);
    }
  };
  /**
   * Return the Tailwind classes for a task status badge.
   * Any status other than 'completed' or 'failed' gets the amber style.
   */
  const getStatusColor = (status: string) => {
    if (status === 'completed') return 'bg-emerald-500 text-white';
    if (status === 'failed') return 'bg-destructive text-white';
    return 'bg-amber-500 text-white';
  };
  /**
   * Format a byte count as a human-readable string with two decimals,
   * using 1024-based units from B up to TB.
   *
   * Zero, negative and non-finite inputs are rendered as '0 B'. Values
   * beyond the largest unit are expressed in TB, and fractional values
   * below one byte stay in B, so the unit label is never `undefined`.
   */
  const formatFileSize = (bytes: number): string => {
    if (!Number.isFinite(bytes) || bytes <= 0) return '0 B';
    const k = 1024;
    const sizes = ['B', 'KB', 'MB', 'GB', 'TB'];
    const exponent = Math.floor(Math.log(bytes) / Math.log(k));
    // Clamp so the index always points at an existing unit label.
    const i = Math.min(Math.max(exponent, 0), sizes.length - 1);
    return `${(bytes / Math.pow(k, i)).toFixed(2)} ${sizes[i]}`;
  };
  return (
    <div className="space-y-8 animate-fade-in pb-10">
      <section className="flex flex-col md:flex-row md:items-center justify-between gap-4">
        <div className="space-y-1">
          <h1 className="text-3xl font-extrabold tracking-tight">智能填表</h1>
          <p className="text-muted-foreground">根据您的表格模板，自动聚合多源文档信息进行精准填充，告别重复劳动。</p>
        </div>
        <div className="flex items-center gap-3">
          <Dialog open={openTaskDialog} onOpenChange={setOpenTaskDialog}>
            <DialogTrigger asChild>
              <Button className="rounded-xl shadow-lg shadow-primary/20 gap-2 h-11 px-6">
                <FilePlus size={18} />
                <span>新建填表任务</span>
              </Button>
            </DialogTrigger>
            <DialogContent className="max-w-4xl max-h-[90vh] flex flex-col p-0 overflow-hidden border-none shadow-2xl rounded-3xl">
              <DialogHeader className="p-8 pb-4 bg-muted/50">
                <DialogTitle className="text-2xl font-bold flex items-center gap-2">
                  <Sparkles size={24} className="text-primary" />
                  开启智能填表之旅
                </DialogTitle>
                <DialogDescription>
                  选择一个表格模板及若干个数据源文档，AI 将自动为您分析并填写。
                </DialogDescription>
              </DialogHeader>
              <ScrollArea className="flex-1 p-8 pt-4">
                <div className="space-y-8">
                  {/* Step 1: Select Template */}
                  <div className="space-y-4">
                    <div className="flex items-center justify-between">
                      <h4 className="font-bold flex items-center gap-2 text-primary uppercase tracking-widest text-xs">
                        <span className="w-5 h-5 rounded-full bg-primary text-white flex items-center justify-center text-[10px]">1</span>
                        选择表格模板
                      </h4>
                      <label className="cursor-pointer text-xs font-semibold text-primary hover:underline flex items-center gap-1">
                        <Plus size={12} /> 上传新模板
                        <input type="file" className="hidden" onChange={handleUploadTemplate} accept=".docx,.xlsx" />
                      </label>
                    </div>
                    {templates.length > 0 ? (
                      <div className="grid grid-cols-1 sm:grid-cols-2 gap-3">
                        {templates.map(t => (
                          <div
                            key={t.id}
                            className={cn(
                              "p-4 rounded-2xl border-2 transition-all cursor-pointer flex items-center gap-3 group relative overflow-hidden",
                              selectedTemplate === t.id ? "border-primary bg-primary/5" : "border-border hover:border-primary/50"
                            )}
                            onClick={() => setSelectedTemplate(t.id)}
                          >
                            <div className={cn(
                              "w-10 h-10 rounded-xl flex items-center justify-center shrink-0 transition-colors",
                              selectedTemplate === t.id ? "bg-primary text-white" : "bg-muted text-muted-foreground"
                            )}>
                              <TableProperties size={20} />
                            </div>
                            <div className="flex-1 min-w-0">
                              <p className="font-bold text-sm truncate">{t.name}</p>
                              <p className="text-[10px] text-muted-foreground uppercase">{t.type}</p>
                            </div>
                            {selectedTemplate === t.id && (
                              <div className="absolute top-0 right-0 w-8 h-8 bg-primary text-white flex items-center justify-center rounded-bl-xl">
                                <CheckCircle2 size={14} />
                              </div>
                            )}
                          </div>
                        ))}
                      </div>
                    ) : (
                      <div className="p-8 text-center bg-muted/30 rounded-2xl border border-dashed text-sm italic text-muted-foreground">
                        暂无模板，请先点击右上角上传。
                      </div>
                    )}
                  </div>
                  {/* Step 2: Upload & Analyze Excel */}
                  <div className="space-y-4">
                    <h4 className="font-bold flex items-center gap-2 text-primary uppercase tracking-widest text-xs">
                      <span className="w-5 h-5 rounded-full bg-primary text-white flex items-center justify-center text-[10px]">1.5</span>
                      Excel 数据源
                    </h4>
                    <div className="bg-muted/20 rounded-2xl p-6">
                      {!excelFile ? (
                        <div
                          {...getRootProps()}
                          className={cn(
                            "border-2 border-dashed rounded-xl p-8 transition-all duration-300 flex flex-col items-center justify-center text-center cursor-pointer group",
                            isDragActive ? "border-primary bg-primary/5" : "border-muted-foreground/20 hover:border-primary/50 hover:bg-muted/30"
                          )}
                        >
                          <input {...getInputProps()} />
                          <div className="w-12 h-12 rounded-xl bg-primary/10 text-primary flex items-center justify-center mb-3 group-hover:scale-110 transition-transform">
                            <FileSpreadsheet size={24} />
                          </div>
                          <p className="font-semibold text-sm">
                            {isDragActive ? '释放以开始上传' : '点击或拖拽 Excel 文件'}
                          </p>
                          <p className="text-xs text-muted-foreground mt-1">支持 .xlsx 和 .xls 格式</p>
                        </div>
                      ) : (
                        <div className="space-y-4">
                          <div className="flex items-center gap-3 p-3 bg-background rounded-xl">
                            <div className="w-10 h-10 rounded-lg bg-emerald-500/10 text-emerald-500 flex items-center justify-center">
                              <FileSpreadsheet size={20} />
                            </div>
                            <div className="flex-1 min-w-0">
                              <p className="font-semibold text-sm truncate">{excelFile.name}</p>
                              <p className="text-xs text-muted-foreground">{formatFileSize(excelFile.size)}</p>
                            </div>
                            <div className="flex gap-2">
                              <Button
                                variant="ghost"
                                size="icon"
                                className="text-destructive hover:bg-destructive/10"
                                onClick={handleDeleteExcel}
                              >
                                <Trash2 size={16} />
                              </Button>
                            </div>
                          </div>
                          {/* AI Analysis Options */}
                          {excelParseResult?.success && (
                            <div className="space-y-3">
                              <div className="space-y-2">
                                <Label htmlFor="analysis-type" className="text-xs">分析类型</Label>
                                <Select
                                  value={aiOptions.analysisType}
                                  onValueChange={(value: any) => setAiOptions({ ...aiOptions, analysisType: value })}
                                >
                                  <SelectTrigger id="analysis-type" className="bg-background h-9 text-sm">
                                    <SelectValue placeholder="选择分析类型" />
                                  </SelectTrigger>
                                  <SelectContent>
                                    <SelectItem value="general">综合分析</SelectItem>
                                    <SelectItem value="summary">数据摘要</SelectItem>
                                    <SelectItem value="statistics">统计分析</SelectItem>
                                    <SelectItem value="insights">深度洞察</SelectItem>
                                  </SelectContent>
                                </Select>
                              </div>
                              <div className="space-y-2">
                                <Label htmlFor="user-prompt" className="text-xs">自定义提示词</Label>
                                <Textarea
                                  id="user-prompt"
                                  value={aiOptions.userPrompt}
                                  onChange={(e) => setAiOptions({ ...aiOptions, userPrompt: e.target.value })}
                                  className="bg-background resize-none text-sm"
                                  rows={2}
                                />
                              </div>
                              <Button
                                onClick={handleAnalyzeExcel}
                                disabled={excelAnalyzing}
                                className="w-full gap-2 h-9"
                                variant="outline"
                              >
                                {excelAnalyzing ? <Loader2 className="animate-spin" size={14} /> : <Sparkles size={14} />}
                                {excelAnalyzing ? '分析中...' : 'AI 分析'}
                              </Button>
                              {excelParseResult?.success && (
                                <Button
                                  onClick={handleUseExcelData}
                                  className="w-full gap-2 h-9"
                                >
                                  <CheckCircle2 size={14} />
                                  使用此数据源
                                </Button>
                              )}
                            </div>
                          )}
                          {/* Excel Analysis Result */}
                          {excelAnalysis && (
                            <div className="mt-4 p-4 bg-background rounded-xl max-h-60 overflow-y-auto">
                              <div className="flex items-center gap-2 mb-3">
                                <Sparkles size={16} className="text-primary" />
                                <span className="font-semibold text-sm">AI 分析结果</span>
                              </div>
                              <Markdown content={excelAnalysis.analysis?.analysis || ''} className="text-sm" />
                            </div>
                          )}
                        </div>
                      )}
                    </div>
                  </div>
                  {/* Step 3: Select Documents */}
                  <div className="space-y-4">
                    <h4 className="font-bold flex items-center gap-2 text-primary uppercase tracking-widest text-xs">
                      <span className="w-5 h-5 rounded-full bg-primary text-white flex items-center justify-center text-[10px]">2</span>
                      选择其他数据源文档
                    </h4>
                    {documents.filter(d => d.status === 'completed').length > 0 ? (
                      <div className="space-y-2 max-h-40 overflow-y-auto pr-2 custom-scrollbar">
                        {documents.filter(d => d.status === 'completed').map(doc => (
                          <div
                            key={doc.id}
                            className={cn(
                              "flex items-center gap-3 p-3 rounded-xl border transition-all cursor-pointer",
                              selectedDocs.includes(doc.id) ? "border-primary/50 bg-primary/5 shadow-sm" : "border-border hover:bg-muted/30"
                            )}
                            onClick={() => {
                              setSelectedDocs(prev =>
                                prev.includes(doc.id) ? prev.filter(id => id !== doc.id) : [...prev, doc.id]
                              );
                            }}
                          >
                            <Checkbox checked={selectedDocs.includes(doc.id)} onCheckedChange={() => {}} />
                            <div className="w-8 h-8 rounded-lg bg-blue-500/10 text-blue-500 flex items-center justify-center">
                              <Zap size={16} />
                            </div>
                            <span className="font-semibold text-sm truncate">{doc.name}</span>
                          </div>
                        ))}
                      </div>
                    ) : (
                      <div className="p-6 text-center bg-muted/30 rounded-xl border border-dashed text-xs italic text-muted-foreground">
                        暂无其他已解析的文档
                      </div>
                    )}
                  </div>
                </div>
              </ScrollArea>
              <DialogFooter className="p-8 pt-4 bg-muted/20 border-t border-dashed">
                <Button variant="outline" className="rounded-xl h-12 px-6" onClick={() => setOpenTaskDialog(false)}>取消</Button>
                <Button
                  className="rounded-xl h-12 px-8 shadow-lg shadow-primary/20 gap-2"
                  onClick={handleCreateTask}
                  disabled={creating || !selectedTemplate || (selectedDocs.length === 0 && !excelParseResult?.success)}
                >
                  {creating ? <RefreshCcw className="animate-spin h-5 w-5" /> : <Zap className="h-5 w-5 fill-current" />}
                  <span>启动智能填表引擎</span>
                </Button>
              </DialogFooter>
            </DialogContent>
          </Dialog>
        </div>
      </section>
      {/* Task List */}
      <div className="grid grid-cols-1 md:grid-cols-2 lg:grid-cols-3 gap-6">
        {loading ? (
          Array.from({ length: 3 }).map((_, i) => (
            <Skeleton key={i} className="h-48 w-full rounded-3xl bg-muted" />
          ))
        ) : tasks.length > 0 ? (
          tasks.map((task) => (
            <Card key={task.id} className="border-none shadow-md hover:shadow-xl transition-all group rounded-3xl overflow-hidden flex flex-col">
              <div className="h-1.5 w-full" style={{ backgroundColor: task.status === 'completed' ? '#10b981' : task.status === 'failed' ? '#ef4444' : '#f59e0b' }} />
              <CardHeader className="p-6 pb-2">
                <div className="flex justify-between items-start mb-2">
                  <div className="w-12 h-12 rounded-2xl bg-emerald-500/10 text-emerald-500 flex items-center justify-center shadow-inner group-hover:scale-110 transition-transform">
                    <TableProperties size={24} />
                  </div>
                  <Badge className={cn("text-[10px] uppercase font-bold tracking-widest", getStatusColor(task.status))}>
                    {task.status === 'completed' ? '已完成' : task.status === 'failed' ? '失败' : '执行中'}
                  </Badge>
                </div>
                <CardTitle className="text-lg font-bold truncate group-hover:text-primary transition-colors">{task.templates?.name || '未知模板'}</CardTitle>
                <CardDescription className="text-xs flex items-center gap-1 font-medium italic">
                  <Clock size={12} /> {format(new Date(task.created_at!), 'yyyy/MM/dd HH:mm')}
                </CardDescription>
              </CardHeader>
              <CardContent className="p-6 pt-2 flex-1">
                <div className="space-y-4">
                  <div className="flex flex-wrap gap-2">
                    <Badge variant="outline" className="bg-muted/50 border-none text-[10px] font-bold">关联 {task.document_ids?.length} 份数据源</Badge>
                  </div>
                  {task.status === 'completed' && (
                    <div className="p-3 bg-emerald-500/5 rounded-2xl border border-emerald-500/10 flex items-center gap-3">
                      <CheckCircle2 className="text-emerald-500" size={18} />
                      <span className="text-xs font-semibold text-emerald-700">内容已精准聚合，表格生成完毕</span>
                    </div>
                  )}
                </div>
              </CardContent>
              <CardFooter className="p-6 pt-0">
                <Button
                  className="w-full rounded-2xl h-11 bg-primary group-hover:shadow-lg group-hover:shadow-primary/30 transition-all gap-2"
                  disabled={task.status !== 'completed'}
                  onClick={() => setViewingTask(task)}
                >
                  <Download size={18} />
                  <span>下载汇总表格</span>
                </Button>
              </CardFooter>
            </Card>
          ))
        ) : (
          <div className="col-span-full py-24 flex flex-col items-center justify-center text-center space-y-6">
            <div className="w-24 h-24 rounded-full bg-muted flex items-center justify-center text-muted-foreground/30 border-4 border-dashed">
              <TableProperties size={48} />
            </div>
            <div className="space-y-2 max-w-sm">
              <p className="text-2xl font-extrabold tracking-tight">暂无生成任务</p>
              <p className="text-muted-foreground text-sm">上传模板后，您可以将多个文档的数据自动填充到汇总表格中。</p>
            </div>
            <Button className="rounded-xl h-12 px-8" onClick={() => setOpenTaskDialog(true)}>立即创建首个任务</Button>
          </div>
        )}
      </div>
      {/* Task Result View Modal */}
      <Dialog open={!!viewingTask} onOpenChange={(open) => !open && setViewingTask(null)}>
        <DialogContent className="max-w-4xl max-h-[90vh] flex flex-col p-0 overflow-hidden border-none shadow-2xl rounded-3xl">
          <DialogHeader className="p-8 pb-4 bg-primary text-primary-foreground">
            <div className="flex items-center gap-3 mb-2">
              <FileCheck size={28} />
              <DialogTitle className="text-2xl font-extrabold">表格生成结果预览</DialogTitle>
            </div>
            <DialogDescription className="text-primary-foreground/80 italic">
              系统已根据 {viewingTask?.document_ids?.length} 份文档信息自动填充完毕。
            </DialogDescription>
          </DialogHeader>
          <ScrollArea className="flex-1 p-8 bg-muted/10">
            <div className="prose dark:prose-invert max-w-none">
              <div className="bg-card p-8 rounded-2xl shadow-sm border min-h-[400px]">
                <Badge variant="outline" className="mb-4">数据已脱敏</Badge>
                <div className="whitespace-pre-wrap font-sans text-sm leading-relaxed">
                  <h2 className="text-xl font-bold mb-4">汇总结果报告</h2>
                  <p className="text-muted-foreground mb-6">以下是根据您上传的多个文档提取并生成的汇总信息：</p>
                  <div className="p-4 bg-muted/30 rounded-xl border border-dashed border-primary/20 italic">
                    正在从云端安全下载解析结果并渲染渲染视图...
                  </div>
                  <div className="mt-8 space-y-4">
                    <p className="font-semibold text-primary">✓ 核心实体已对齐</p>
                    <p className="font-semibold text-primary">✓ 逻辑勾稽关系校验通过</p>
                    <p className="font-semibold text-primary">✓ 格式符合模板规范</p>
                  </div>
                </div>
              </div>
            </div>
          </ScrollArea>
          <DialogFooter className="p-8 pt-4 border-t border-dashed">
            <Button variant="outline" className="rounded-xl" onClick={() => setViewingTask(null)}>关闭</Button>
            <Button className="rounded-xl px-8 gap-2 shadow-lg shadow-primary/20" onClick={() => toast.success("正在导出文件...")}>
              <Download size={18} />
              导出为 {viewingTask?.templates?.type?.toUpperCase() || '文件'}
            </Button>
          </DialogFooter>
        </DialogContent>
      </Dialog>
    </div>
  );
 };
 export default FormFill;
--- a/frontend/src/pages/Login.tsx
+++ b/frontend/src/pages/Login.tsx
@@ -1,184 +0,0 @@
 import React, { useState } from 'react';
 import { useNavigate, useLocation } from 'react-router-dom';
 import { useAuth } from '@/context/AuthContext';
 import { Button } from '@/components/ui/button';
 import { Input } from '@/components/ui/input';
 import { Label } from '@/components/ui/label';
 import { Card, CardContent, CardDescription, CardFooter, CardHeader, CardTitle } from '@/components/ui/card';
 import { Tabs, TabsContent, TabsList, TabsTrigger } from '@/components/ui/tabs';
 import { FileText, Lock, User, CheckCircle2, AlertCircle } from 'lucide-react';
 import { toast } from 'sonner';
 // Login / sign-up page.
 // Both tabs share the same username/password state. The username is mapped to
 // a synthetic `<username>@miaoda.com` address before it is passed to the
 // signIn / signUp functions provided by the auth context.
 const Login: React.FC = () => {
  const [username, setUsername] = useState('');
  const [password, setPassword] = useState('');
  const [loading, setLoading] = useState(false);
  const { signIn, signUp } = useAuth();
  const navigate = useNavigate();
  // NOTE(review): `location` is not read anywhere in this component.
  const location = useLocation();

  // Shared submit flow for both tabs: validate, call the auth function for the
  // given mode, report the outcome with a toast, and always clear `loading`.
  const submitCredentials = async (e: React.FormEvent, mode: 'login' | 'signup') => {
    e.preventDefault();
    // Trim so stray spaces never end up inside the generated e-mail address.
    const name = username.trim();
    if (!name || !password) {
      toast.error('请输入用户名和密码');
      return;
    }
    if (mode === 'signup') {
      // Enforce the constraints that the sign-up placeholders promise.
      if (!/^\w+$/.test(name)) {
        toast.error('用户名仅支持字母、数字和下划线');
        return;
      }
      if (password.length < 6) {
        toast.error('密码长度不能少于 6 位');
        return;
      }
    }
    setLoading(true);
    try {
      const email = `${name}@miaoda.com`;
      const { error } = mode === 'login'
        ? await signIn(email, password)
        : await signUp(email, password);
      if (error) throw error;
      if (mode === 'login') {
        toast.success('登录成功');
        navigate('/');
      } else {
        toast.success('注册成功，请登录');
      }
    } catch (err: any) {
      // `err` may be null/undefined or a non-Error value; fall back to a fixed message.
      toast.error(err?.message || (mode === 'login' ? '登录失败' : '注册失败'));
    } finally {
      setLoading(false);
    }
  };

  // Form submit handlers for the "login" and "signup" tabs.
  const handleLogin = (e: React.FormEvent) => submitCredentials(e, 'login');
  const handleSignUp = (e: React.FormEvent) => submitCredentials(e, 'signup');

  return (
    <div className="min-h-screen flex items-center justify-center bg-[radial-gradient(ellipse_at_top_left,_var(--tw-gradient-stops))] from-primary/10 via-background to-background p-4 relative overflow-hidden">
      {/* Decorative elements */}
      <div className="absolute top-0 left-0 w-96 h-96 bg-primary/5 rounded-full blur-3xl -translate-x-1/2 -translate-y-1/2" />
      <div className="absolute bottom-0 right-0 w-64 h-64 bg-primary/5 rounded-full blur-3xl translate-x-1/3 translate-y-1/3" />
      <div className="w-full max-w-md space-y-8 relative animate-fade-in">
        {/* Product logo and title */}
        <div className="text-center space-y-2">
          <div className="inline-flex items-center justify-center w-16 h-16 rounded-2xl bg-primary text-primary-foreground shadow-2xl shadow-primary/30 mb-4 animate-slide-in">
            <FileText size={32} />
          </div>
          <h1 className="text-4xl font-extrabold tracking-tight gradient-text">智联文档</h1>
          <p className="text-muted-foreground">多源数据融合与智能文档处理系统</p>
        </div>
        <Card className="border-border/50 shadow-2xl backdrop-blur-sm bg-card/95">
          <Tabs defaultValue="login" className="w-full">
            <TabsList className="grid w-full grid-cols-2 rounded-t-xl h-12 bg-muted/50 p-1">
              <TabsTrigger value="login" className="rounded-lg data-[state=active]:bg-background data-[state=active]:shadow-sm">登录</TabsTrigger>
              <TabsTrigger value="signup" className="rounded-lg data-[state=active]:bg-background data-[state=active]:shadow-sm">注册</TabsTrigger>
            </TabsList>
            {/* Login tab */}
            <TabsContent value="login">
              <form onSubmit={handleLogin}>
                <CardHeader>
                  <CardTitle>欢迎回来</CardTitle>
                  <CardDescription>使用您的账号登录智联文档系统</CardDescription>
                </CardHeader>
                <CardContent className="space-y-4">
                  <div className="space-y-2">
                    <Label htmlFor="username">用户名</Label>
                    <div className="relative">
                      <User className="absolute left-3 top-2.5 h-4 w-4 text-muted-foreground" />
                      <Input
                        id="username"
                        placeholder="请输入用户名"
                        className="pl-9 bg-muted/30 border-none focus-visible:ring-primary"
                        value={username}
                        onChange={(e) => setUsername(e.target.value)}
                      />
                    </div>
                  </div>
                  <div className="space-y-2">
                    <Label htmlFor="password">密码</Label>
                    <div className="relative">
                      <Lock className="absolute left-3 top-2.5 h-4 w-4 text-muted-foreground" />
                      <Input
                        id="password"
                        type="password"
                        placeholder="请输入密码"
                        className="pl-9 bg-muted/30 border-none focus-visible:ring-primary"
                        value={password}
                        onChange={(e) => setPassword(e.target.value)}
                      />
                    </div>
                  </div>
                </CardContent>
                <CardFooter>
                  <Button className="w-full h-11 text-lg font-semibold rounded-xl" type="submit" disabled={loading}>
                    {loading ? '登录中...' : '立即登录'}
                  </Button>
                </CardFooter>
              </form>
            </TabsContent>
            {/* Sign-up tab */}
            <TabsContent value="signup">
              <form onSubmit={handleSignUp}>
                <CardHeader>
                  <CardTitle>创建账号</CardTitle>
                  <CardDescription>开启智能文档处理的新体验</CardDescription>
                </CardHeader>
                <CardContent className="space-y-4">
                  <div className="space-y-2">
                    <Label htmlFor="signup-username">用户名</Label>
                    <div className="relative">
                      <User className="absolute left-3 top-2.5 h-4 w-4 text-muted-foreground" />
                      <Input
                        id="signup-username"
                        placeholder="仅字母、数字和下划线"
                        className="pl-9 bg-muted/30 border-none focus-visible:ring-primary"
                        value={username}
                        onChange={(e) => setUsername(e.target.value)}
                      />
                    </div>
                  </div>
                  <div className="space-y-2">
                    <Label htmlFor="signup-password">密码</Label>
                    <div className="relative">
                      <Lock className="absolute left-3 top-2.5 h-4 w-4 text-muted-foreground" />
                      <Input
                        id="signup-password"
                        type="password"
                        placeholder="不少于 6 位"
                        className="pl-9 bg-muted/30 border-none focus-visible:ring-primary"
                        value={password}
                        onChange={(e) => setPassword(e.target.value)}
                      />
                    </div>
                  </div>
                </CardContent>
                <CardFooter>
                  <Button className="w-full h-11 text-lg font-semibold rounded-xl" type="submit" disabled={loading}>
                    {loading ? '注册中...' : '注册账号'}
                  </Button>
                </CardFooter>
              </form>
            </TabsContent>
          </Tabs>
        </Card>
        {/* Feature highlights */}
        <div className="grid grid-cols-2 gap-4 text-center text-xs text-muted-foreground">
          <div className="flex flex-col items-center gap-1">
            <CheckCircle2 size={16} className="text-primary" />
            <span>智能解析</span>
          </div>
          <div className="flex flex-col items-center gap-1">
            <CheckCircle2 size={16} className="text-primary" />
            <span>极速填表</span>
          </div>
        </div>
        <div className="text-center text-sm text-muted-foreground">
          &copy; 2026 智联文档 | 多源数据融合系统
        </div>
      </div>
    </div>
  );
 };
 export default Login;
--- a/frontend/src/pages/SamplePage.tsx
+++ b/frontend/src/pages/SamplePage.tsx
@@ -1,16 +0,0 @@
 /**
 * Sample Page
 */
 import PageMeta from "../components/common/PageMeta";
 export default function SamplePage() {
  // Static placeholder content shown below the page metadata.
  const heading = <h3>This is a sample page</h3>;

  return (
    <>
      <PageMeta title="Home" description="Home Page Introduction" />
      <div>{heading}</div>
    </>
  );
 }
--- a/frontend/src/pages/TaskHistory.tsx
+++ b/frontend/src/pages/TaskHistory.tsx
@@ -11,7 +11,8 @@ import {
  ChevronDown,
  ChevronUp,
  Trash2,
-  AlertCircle
+  AlertCircle,
  HelpCircle
 } from 'lucide-react';
 import { Card, CardContent, CardHeader, CardTitle, CardDescription } from '@/components/ui/card';
 import { Button } from '@/components/ui/button';
@@ -24,9 +25,9 @@ import { Skeleton } from '@/components/ui/skeleton';
 type Task = {
  task_id: string;
-  status: 'pending' | 'processing' | 'success' | 'failure';
+  status: 'pending' | 'processing' | 'success' | 'failure' | 'unknown';
  created_at: string;
-  completed_at?: string;
+  updated_at?: string;
  message?: string;
  result?: any;
  error?: string;
@@ -38,54 +39,38 @@ const TaskHistory: React.FC = () => {
  const [loading, setLoading] = useState(true);
  const [expandedTask, setExpandedTask] = useState<string | null>(null);
-  // Mock data for demonstration
+  // 获取任务历史数据
-  useEffect(() => {
+  const fetchTasks = async () => {
-    // 模拟任务数据，实际应该从后端获取
+    try {
-    setTasks([
+      setLoading(true);
-      {
+      const response = await backendApi.getTasks(50, 0);
-        task_id: 'task-001',
+      if (response.success && response.tasks) {
-        status: 'success',
+        // 转换后端数据格式为前端格式
-        created_at: new Date(Date.now() - 3600000).toISOString(),
+        const convertedTasks: Task[] = response.tasks.map((t: any) => ({
-        completed_at: new Date(Date.now() - 3500000).toISOString(),
+          task_id: t.task_id,
-        task_type: 'document_parse',
+          status: t.status || 'unknown',
-        message: '文档解析完成',
+          created_at: t.created_at || new Date().toISOString(),
-        result: {
+          updated_at: t.updated_at,
-          doc_id: 'doc-001',
+          message: t.message || '',
-          filename: 'report_q1_2026.docx',
+          result: t.result,
-          extracted_fields: ['标题', '作者', '日期', '金额']
+          error: t.error,
-        }
+          task_type: t.task_type || 'document_parse'
-      },
+        }));
-      {
+        setTasks(convertedTasks);
-        task_id: 'task-002',
+      } else {
-        status: 'success',
+        setTasks([]);
        created_at: new Date(Date.now() - 7200000).toISOString(),
        completed_at: new Date(Date.now() - 7100000).toISOString(),
        task_type: 'excel_analysis',
        message: 'Excel 分析完成',
        result: {
          filename: 'sales_data.xlsx',
          row_count: 1250,
          charts_generated: 3
        }
      },
      {
        task_id: 'task-003',
        status: 'processing',
        created_at: new Date(Date.now() - 600000).toISOString(),
        task_type: 'template_fill',
        message: '正在填充表格...'
      },
      {
        task_id: 'task-004',
        status: 'failure',
        created_at: new Date(Date.now() - 86400000).toISOString(),
        completed_at: new Date(Date.now() - 86390000).toISOString(),
        task_type: 'document_parse',
        message: '解析失败',
        error: '文件格式不支持或文件已损坏'
      }
-    ]);
+    } catch (error) {
-    setLoading(false);
+      console.error('获取任务列表失败:', error);
      toast.error('获取任务列表失败');
      setTasks([]);
    } finally {
      setLoading(false);
    }
  };
  useEffect(() => {
    fetchTasks();
  }, []);
  const getStatusBadge = (status: string) => {
@@ -96,6 +81,8 @@ const TaskHistory: React.FC = () => {
        return <Badge className="bg-destructive text-white text-[10px]"><XCircle size={12} className="mr-1" />失败</Badge>;
      case 'processing':
        return <Badge className="bg-amber-500 text-white text-[10px]"><Loader2 size={12} className="mr-1 animate-spin" />处理中</Badge>;
      case 'unknown':
        return <Badge className="bg-gray-500 text-white text-[10px]"><HelpCircle size={12} className="mr-1" />未知</Badge>;
      default:
        return <Badge className="bg-gray-500 text-white text-[10px]"><Clock size={12} className="mr-1" />等待</Badge>;
    }
@@ -133,15 +120,22 @@ const TaskHistory: React.FC = () => {
  };
  const handleDelete = async (taskId: string) => {
-    setTasks(prev => prev.filter(t => t.task_id !== taskId));
+    try {
-    toast.success('任务已删除');
+      await backendApi.deleteTask(taskId);
      setTasks(prev => prev.filter(t => t.task_id !== taskId));
      toast.success('任务已删除');
    } catch (error) {
      console.error('删除任务失败:', error);
      toast.error('删除任务失败');
    }
  };
  const stats = {
    total: tasks.length,
    success: tasks.filter(t => t.status === 'success').length,
    processing: tasks.filter(t => t.status === 'processing').length,
-    failure: tasks.filter(t => t.status === 'failure').length
+    failure: tasks.filter(t => t.status === 'failure').length,
    unknown: tasks.filter(t => t.status === 'unknown').length
  };
  return (
@@ -151,7 +145,7 @@ const TaskHistory: React.FC = () => {
          <h1 className="text-3xl font-extrabold tracking-tight">任务历史</h1>
          <p className="text-muted-foreground">查看和管理您所有的文档处理任务记录</p>
        </div>
-        <Button variant="outline" className="rounded-xl gap-2" onClick={() => window.location.reload()}>
+        <Button variant="outline" className="rounded-xl gap-2" onClick={() => fetchTasks()}>
          <RefreshCcw size={18} />
          <span>刷新</span>
        </Button>
@@ -194,7 +188,8 @@ const TaskHistory: React.FC = () => {
                    "w-12 h-12 rounded-xl flex items-center justify-center shrink-0",
                    task.status === 'success' ? "bg-emerald-500/10 text-emerald-500" :
                    task.status === 'failure' ? "bg-destructive/10 text-destructive" :
-                    "bg-amber-500/10 text-amber-500"
+                    task.status === 'processing' ? "bg-amber-500/10 text-amber-500" :
                    "bg-gray-500/10 text-gray-500"
                  )}>
                    {task.status === 'processing' ? (
                      <Loader2 size={24} className="animate-spin" />
@@ -212,16 +207,16 @@ const TaskHistory: React.FC = () => {
                      </Badge>
                    </div>
                    <p className="text-sm text-muted-foreground">
-                      {task.message || '任务执行中...'}
+                      {task.message || (task.status === 'unknown' ? '无法获取状态' : '任务执行中...')}
                    </p>
                    <div className="flex items-center gap-4 text-xs text-muted-foreground">
                      <span className="flex items-center gap-1">
                        <Clock size={12} />
-                        {format(new Date(task.created_at), 'yyyy-MM-dd HH:mm:ss')}
+                        {task.created_at ? format(new Date(task.created_at), 'yyyy-MM-dd HH:mm:ss') : '时间未知'}
                      </span>
-                      {task.completed_at && (
+                      {task.updated_at && task.status !== 'processing' && (
                        <span>
-                          耗时: {Math.round((new Date(task.completed_at).getTime() - new Date(task.created_at).getTime()) / 1000)} 秒
+                          更新: {format(new Date(task.updated_at), 'HH:mm:ss')}
                        </span>
                      )}
                    </div>
--- a/frontend/src/pages/TemplateFill.tsx
+++ b/frontend/src/pages/TemplateFill.tsx
@@ -1,4 +1,4 @@
-import React, { useState, useEffect, useCallback } from 'react';
+import React, { useState, useEffect, useCallback, useRef } from 'react';
 import { useDropzone } from 'react-dropzone';
 import {
  TableProperties,
@@ -18,7 +18,8 @@ import {
  Files,
  Trash2,
  Eye,
-  File
+  File,
  Plus
 } from 'lucide-react';
 import { Button } from '@/components/ui/button';
 import { Card, CardContent, CardHeader, CardTitle, CardDescription } from '@/components/ui/card';
@@ -60,6 +61,7 @@ const TemplateFill: React.FC = () => {
    templateFields, setTemplateFields,
    sourceFiles, setSourceFiles, addSourceFiles, removeSourceFile,
    sourceFilePaths, setSourceFilePaths,
    sourceDocIds, setSourceDocIds, addSourceDocId, removeSourceDocId,
    templateId, setTemplateId,
    filledResult, setFilledResult,
    reset
@@ -68,6 +70,10 @@ const TemplateFill: React.FC = () => {
  const [loading, setLoading] = useState(false);
  const [previewDoc, setPreviewDoc] = useState<{ name: string; content: string } | null>(null);
  const [previewOpen, setPreviewOpen] = useState(false);
  const [sourceMode, setSourceMode] = useState<'upload' | 'select'>('upload');
  const [uploadedDocuments, setUploadedDocuments] = useState<DocumentItem[]>([]);
  const [docsLoading, setDocsLoading] = useState(false);
  const sourceFileInputRef = useRef<HTMLInputElement>(null);
  // 模板拖拽
  const onTemplateDrop = useCallback((acceptedFiles: File[]) => {
@@ -89,25 +95,77 @@ const TemplateFill: React.FC = () => {
  });
  // 源文档拖拽
-  const onSourceDrop = useCallback((acceptedFiles: File[]) => {
+  const onSourceDrop = useCallback((e: React.DragEvent) => {
-    const newFiles = acceptedFiles.map(f => ({
+    e.preventDefault();
-      file: f,
+    const files = Array.from(e.dataTransfer.files).filter(f => {
-      preview: f.type.startsWith('text/') || f.name.endsWith('.md') ? undefined : undefined
+      const ext = f.name.split('.').pop()?.toLowerCase();
-    }));
+      return ['xlsx', 'xls', 'docx', 'md', 'txt'].includes(ext || '');
-    addSourceFiles(newFiles);
+    });
    if (files.length > 0) {
      addSourceFiles(files.map(f => ({ file: f })));
    }
  }, [addSourceFiles]);
-  const { getRootProps: getSourceProps, getInputProps: getSourceInputProps, isDragActive: isSourceDragActive } = useDropzone({
+  const handleSourceFileSelect = (e: React.ChangeEvent<HTMLInputElement>) => {
-    onDrop: onSourceDrop,
+    const files = Array.from(e.target.files || []);
-    accept: {
+    if (files.length > 0) {
-      'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet': ['.xlsx'],
+      addSourceFiles(files.map(f => ({ file: f })));
-      'application/vnd.ms-excel': ['.xls'],
+      toast.success(`已添加 ${files.length} 个文件`);
-      'application/vnd.openxmlformats-officedocument.wordprocessingml.document': ['.docx'],
+    }
-      'text/plain': ['.txt'],
+    e.target.value = '';
-      'text/markdown': ['.md']
+  };
-    },
+
-    multiple: true
+  // 仅添加源文档不上传
-  });
+  const handleAddSourceFiles = () => {
    if (sourceFiles.length === 0) {
      toast.error('请先选择源文档');
      return;
    }
    toast.success(`已添加 ${sourceFiles.length} 个源文档，可继续添加更多`);
  };
  // Load previously uploaded documents (requesting up to 100) and keep only
  // those whose doc_type can serve as a data source. The loading flag is set
  // for the duration of the request; failures are only logged to the console.
  const loadUploadedDocuments = useCallback(async () => {
    setDocsLoading(true);
    try {
      const response = await backendApi.getDocuments(undefined, 100);
      if (!response.success) {
        // Unsuccessful response: leave the current list untouched.
        return;
      }
      // Document types that may be used as a data source.
      const usableTypes = ['docx', 'md', 'txt', 'xlsx', 'xls'];
      const candidates = response.documents || [];
      setUploadedDocuments(
        candidates.filter((doc: DocumentItem) => usableTypes.includes(doc.doc_type))
      );
    } catch (err: any) {
      console.error('加载文档失败:', err);
    } finally {
      setDocsLoading(false);
    }
  }, []);
  // Delete an uploaded document after user confirmation. On success the
  // document is removed from the local list and from the selected source ids.
  const handleDeleteDocument = async (docId: string, e: React.MouseEvent) => {
    // Keep the click from bubbling to parent click handlers.
    e.stopPropagation();
    const confirmed = confirm('确定要删除该文档吗？');
    if (!confirmed) {
      return;
    }
    try {
      const response = await backendApi.deleteDocument(docId);
      if (!response.success) {
        toast.error(response.message || '删除失败');
        return;
      }
      setUploadedDocuments(current => current.filter(item => item.doc_id !== docId));
      removeSourceDocId(docId);
      toast.success('文档已删除');
    } catch (err: any) {
      const reason = err.message || '未知错误';
      toast.error('删除失败: ' + reason);
    }
  };
  // Load the uploaded-document list whenever the source mode is 'select'
  // (re-runs when sourceMode or the loadUploadedDocuments callback changes).
  useEffect(() => {
    if (sourceMode === 'select') {
      loadUploadedDocuments();
    }
  }, [sourceMode, loadUploadedDocuments]);
  const handleJointUploadAndFill = async () => {
    if (!templateFile) {
@@ -115,34 +173,69 @@ const TemplateFill: React.FC = () => {
      return;
    }
    // 检查是否选择了数据源
    if (sourceMode === 'upload' && sourceFiles.length === 0) {
      toast.error('请上传源文档或从已上传文档中选择');
      return;
    }
    if (sourceMode === 'select' && sourceDocIds.length === 0) {
      toast.error('请选择源文档');
      return;
    }
    setLoading(true);
    try {
-      // 使用联合上传API
+      if (sourceMode === 'select') {
-      const result = await backendApi.uploadTemplateAndSources(
+        // 使用已上传文档作为数据源
-        templateFile,
+        const result = await backendApi.uploadTemplate(templateFile);
        sourceFiles.map(sf => sf.file)
      );
-      if (result.success) {
+        if (result.success) {
-        setTemplateFields(result.fields || []);
+          setTemplateFields(result.fields || []);
-        setTemplateId(result.template_id);
+          setTemplateId(result.template_id || 'temp');
-        setSourceFilePaths(result.source_file_paths || []);
+          toast.success('开始智能填表');
-        toast.success('文档上传成功，开始智能填表');
+          setStep('filling');
        setStep('filling');
-        // 自动开始填表
+          // 使用 source_doc_ids 进行填表
-        const fillResult = await backendApi.fillTemplate(
+          const fillResult = await backendApi.fillTemplate(
-          result.template_id,
+            result.template_id || 'temp',
-          result.fields || [],
+            result.fields || [],
-          [],  // 使用 source_file_paths 而非 source_doc_ids
+            sourceDocIds,
-          result.source_file_paths || [],
+            [],
-          '请从以下文档中提取相关信息填写表格'
+            '请从以下文档中提取相关信息填写表格'
          );
          setFilledResult(fillResult);
          setStep('preview');
          toast.success('表格填写完成');
        }
      } else {
        // 使用联合上传API
        const result = await backendApi.uploadTemplateAndSources(
          templateFile,
          sourceFiles.map(sf => sf.file)
        );
-        setFilledResult(fillResult);
+        if (result.success) {
-        setStep('preview');
+          setTemplateFields(result.fields || []);
-        toast.success('表格填写完成');
+          setTemplateId(result.template_id);
          setSourceFilePaths(result.source_file_paths || []);
          toast.success('文档上传成功，开始智能填表');
          setStep('filling');
          // 自动开始填表
          const fillResult = await backendApi.fillTemplate(
            result.template_id,
            result.fields || [],
            [],
            result.source_file_paths || [],
            '请从以下文档中提取相关信息填写表格'
          );
          setFilledResult(fillResult);
          setStep('preview');
          toast.success('表格填写完成');
        }
      }
    } catch (err: any) {
      toast.error('处理失败: ' + (err.message || '未知错误'));
@@ -264,47 +357,158 @@ const TemplateFill: React.FC = () => {
                源文档
              </CardTitle>
              <CardDescription>
-                上传包含数据的源文档（支持多选），可同时上传多个文件
+                选择包含数据的源文档作为填表依据
              </CardDescription>
              {/* Source Mode Tabs */}
              <div className="flex gap-2 mt-2">
                <Button
                  variant={sourceMode === 'upload' ? 'default' : 'outline'}
                  size="sm"
                  onClick={() => setSourceMode('upload')}
                >
                  <Upload size={14} className="mr-1" />
                  上传文件
                </Button>
                <Button
                  variant={sourceMode === 'select' ? 'default' : 'outline'}
                  size="sm"
                  onClick={() => setSourceMode('select')}
                >
                  <Files size={14} className="mr-1" />
                  从文档中心选择
                </Button>
              </div>
            </CardHeader>
            <CardContent>
-              <div
+              {sourceMode === 'upload' ? (
-                {...getSourceProps()}
+                <>
-                className={cn(
+                  <div className="border-2 border-dashed rounded-2xl p-8 transition-all duration-300 flex flex-col items-center justify-center text-center cursor-pointer group min-h-[200px] border-muted-foreground/20 hover:border-primary/50 hover:bg-primary/5">
-                  "border-2 border-dashed rounded-2xl p-8 transition-all duration-300 flex flex-col items-center justify-center text-center cursor-pointer group min-h-[200px]",
+                    <input
-                  isSourceDragActive ? "border-primary bg-primary/5" : "border-muted-foreground/20 hover:border-primary/50 hover:bg-primary/5"
+                      id="source-file-input"
-                )}
+                      type="file"
-              >
+                      multiple={true}
-                <input {...getSourceInputProps()} />
+                      accept=".xlsx,.xls,.docx,.md,.txt"
-                <div className="w-14 h-14 rounded-xl bg-blue-500/10 text-blue-500 flex items-center justify-center mb-4 group-hover:scale-110 transition-transform">
+                      onChange={handleSourceFileSelect}
-                  {loading ? <Loader2 className="animate-spin" size={28} /> : <Upload size={28} />}
+                      className="hidden"
-                </div>
+                    />
-                <p className="font-medium">
+                    <label htmlFor="source-file-input" className="cursor-pointer flex flex-col items-center">
-                  {isSourceDragActive ? '释放以上传' : '点击或拖拽上传源文档'}
+                      <div className="w-14 h-14 rounded-xl bg-blue-500/10 text-blue-500 flex items-center justify-center mb-4 group-hover:scale-110 transition-transform">
-                </p>
+                        {loading ? <Loader2 className="animate-spin" size={28} /> : <Upload size={28} />}
-                <p className="text-xs text-muted-foreground mt-1">
+                      </div>
-                  支持 .xlsx .xls .docx .md .txt
+                      <p className="font-medium">
-                </p>
+                        点击上传源文档
-              </div>
+                      </p>
-
+                      <p className="text-xs text-muted-foreground mt-1">
-              {/* Selected Source Files */}
+                        支持 .xlsx .xls .docx .md .txt
-              {sourceFiles.length > 0 && (
+                      </p>
-                <div className="mt-4 space-y-2">
+                    </label>
-                  {sourceFiles.map((sf, idx) => (
+                  </div>
-                    <div key={idx} className="flex items-center gap-3 p-3 bg-muted/50 rounded-xl">
+                  <div
-                      {getFileIcon(sf.file.name)}
+                    onDragOver={(e) => { e.preventDefault(); }}
-                      <div className="flex-1 min-w-0">
+                    onDrop={onSourceDrop}
-                        <p className="text-sm font-medium truncate">{sf.file.name}</p>
+                    className="mt-2 text-center text-xs text-muted-foreground"
-                        <p className="text-xs text-muted-foreground">
+                  >
-                          {(sf.file.size / 1024).toFixed(1)} KB
+                    或拖拽文件到此处
-                        </p>
+                  </div>
                  {/* Selected Source Files */}
                  {sourceFiles.length > 0 && (
                    <div className="mt-4 space-y-2">
                      {sourceFiles.map((sf, idx) => (
                        <div key={idx} className="flex items-center gap-3 p-3 bg-muted/50 rounded-xl">
                          {getFileIcon(sf.file.name)}
                          <div className="flex-1 min-w-0">
                            <p className="text-sm font-medium truncate">{sf.file.name}</p>
                            <p className="text-xs text-muted-foreground">
                              {(sf.file.size / 1024).toFixed(1)} KB
                            </p>
                          </div>
                          <Button variant="ghost" size="sm" onClick={() => removeSourceFile(idx)}>
                            <Trash2 size={14} className="text-red-500" />
                          </Button>
                        </div>
                      ))}
                      <div className="flex justify-center pt-2">
                        <Button variant="outline" size="sm" onClick={() => document.getElementById('source-file-input')?.click()}>
                          <Plus size={14} className="mr-1" />
                          继续添加更多文档
                        </Button>
                      </div>
                      <Button variant="ghost" size="sm" onClick={() => removeSourceFile(idx)}>
                        <Trash2 size={14} className="text-red-500" />
                      </Button>
                    </div>
-                  ))}
+                  )}
-                </div>
+                </>
              ) : (
                <>
                  {/* Uploaded Documents Selection */}
                  {docsLoading ? (
                    <div className="space-y-2">
                      {[1, 2, 3].map(i => (
                        <Skeleton key={i} className="h-16 w-full rounded-xl" />
                      ))}
                    </div>
                  ) : uploadedDocuments.length > 0 ? (
                    <div className="space-y-2">
                      {sourceDocIds.length > 0 && (
                        <div className="flex items-center justify-between p-3 bg-primary/5 rounded-xl border border-primary/20">
                          <span className="text-sm font-medium">已选择 {sourceDocIds.length} 个文档</span>
                          <Button variant="ghost" size="sm" onClick={() => loadUploadedDocuments()}>
                            <RefreshCcw size={14} className="mr-1" />
                            刷新列表
                          </Button>
                        </div>
                      )}
                      <div className="max-h-[300px] overflow-y-auto space-y-2">
                        {uploadedDocuments.map((doc) => (
                          <div
                            key={doc.doc_id}
                            className={cn(
                              "flex items-center gap-3 p-3 rounded-xl border-2 transition-all cursor-pointer",
                              sourceDocIds.includes(doc.doc_id)
                                ? "border-primary bg-primary/5"
                                : "border-border hover:bg-muted/30"
                            )}
                            onClick={() => {
                              if (sourceDocIds.includes(doc.doc_id)) {
                                removeSourceDocId(doc.doc_id);
                              } else {
                                addSourceDocId(doc.doc_id);
                              }
                            }}
                          >
                            <div className={cn(
                              "w-6 h-6 rounded-md border-2 flex items-center justify-center transition-all shrink-0",
                              sourceDocIds.includes(doc.doc_id)
                                ? "border-primary bg-primary text-white"
                                : "border-muted-foreground/30"
                            )}>
                              {sourceDocIds.includes(doc.doc_id) && <CheckCircle2 size={14} />}
                            </div>
                            {getFileIcon(doc.original_filename)}
                            <div className="flex-1 min-w-0">
                              <p className="text-sm font-medium truncate">{doc.original_filename}</p>
                              <p className="text-xs text-muted-foreground">
                                {doc.doc_type.toUpperCase()} • {format(new Date(doc.created_at), 'yyyy-MM-dd')}
                              </p>
                            </div>
                            <Button
                              variant="ghost"
                              size="sm"
                              onClick={(e) => handleDeleteDocument(doc.doc_id, e)}
                              className="shrink-0"
                            >
                              <Trash2 size={14} className="text-red-500" />
                            </Button>
                          </div>
                        ))}
                      </div>
                    </div>
                  ) : (
                    <div className="text-center py-8 text-muted-foreground">
                      <Files size={32} className="mx-auto mb-2 opacity-30" />
                      <p className="text-sm">暂无可用的已上传文档</p>
                    </div>
                  )}
                </>
              )}
            </CardContent>
          </Card>
Author	SHA1	Message	Date
KiriAky 107	5fca4eb094	添加临时文件清理异常处理和修改大纲接口为POST方法 - 在analyze_markdown、analyze_markdown_stream和get_markdown_outline函数中添加了 try-catch块来处理临时文件清理过程中的异常 - 将/analyze/md/outline接口从GET方法改为POST方法以支持文件上传 - 确保在所有情况下都能正确清理临时文件，并记录清理失败的日志 refactor(health): 改进健康检查逻辑验证实际数据库连接 - 修改MySQL健康检查，实际执行SELECT 1查询来验证连接 - 修改MongoDB健康检查，执行ping命令来验证连接 - 修改Redis健康检查，执行ping命令来验证连接 - 添加异常捕获并记录具体的错误日志 refactor(upload): 使用os.path.basename优化文件名提取 - 替换手动字符串分割为os.path.basename来获取文件名 - 统一Excel上传和导出中文件名的处理方式 feat(instruction): 新增指令执行框架模块 - 创建instruction包包含意图解析和指令执行的基础架构 - 添加IntentParser和InstructionExecutor抽象基类 - 提供默认实现但标记为未完成，为未来功能扩展做准备 refactor(frontend): 调整AuthContext导入路径并移除重复文件 - 将AuthContext从src/context移动到src/contexts目录 - 更新App.tsx和RouteGuard.tsx中的导入路径 - 移除旧的AuthContext.tsx文件 fix(backend-api): 修复AI分析API的HTTP方法错误 - 将aiApi中的fetch请求方法从GET改为POST以支持文件上传	2026-04-10 01:51:53 +08:00
KiriAky 107	0dbf74db9d	添加任务ID跟踪功能到模板填充接口 - 在FillRequest中添加可选的task_id字段，用于任务历史跟踪 - 实现任务状态管理，包括创建、更新和错误处理 - 集成MongoDB任务记录功能，在处理过程中更新进度 - 添加任务进度更新逻辑，支持开始、处理中、成功和失败状态 - 修改模板填充服务以接收并传递task_id参数	2026-04-10 01:27:26 +08:00
KiriAky 107	858b594171	添加任务状态双写机制和历史记录功能 - 实现任务状态同时写入Redis和MongoDB的双写机制 - 添加MongoDB任务集合及CRUD操作接口 - 新增任务历史记录查询、列表展示和删除功能 - 重构任务状态更新逻辑，统一使用update_task_status函数 - 添加模板填充服务中AI审核字段值的功能 - 优化前端任务历史页面显示和交互体验	2026-04-10 01:15:53 +08:00
KiriAky 107	ed0f51f2a4	Merge branch 'main' of https://gitea.kronecker.cc/OurCodesAreAllRight/FilesReadSystem	2026-04-10 00:26:57 +08:00
KiriAky 107	ecc0c79475	增强模板填写服务支持表格内容摘要和表头重生成 - 在源文档解析过程中增加表格内容摘要功能，提取表格结构用于AI理解 - 新增表格摘要逻辑，包括表头和前3行数据的提取和格式化 - 添加模板文件类型识别，支持xlsx和docx格式判断 - 实现基于源文档内容的表头自动重生成功能 - 当检测到自动生成的表头时，使用源文档内容重新生成更准确的字段 - 增加详细的调试日志用于跟踪表格处理过程	2026-04-10 00:26:54 +08:00
dj	6befc510d8	刷新的debug	2026-04-10 00:23:23 +08:00
dj	8f66c235fa	实现并行多文件上传的功能并且在列表显示上传了哪些文件，支持多次上传	2026-04-10 00:16:28 +08:00
KiriAky 107	886d5ae0cc	Merge branch 'main' of https://gitea.kronecker.cc/OurCodesAreAllRight/FilesReadSystem	2026-04-09 22:44:01 +08:00
KiriAky 107	6752c5c231	优化联合模板上传逻辑支持源文档内容解析 - 移除模板文件字段提取步骤，改为直接保存模板文件 - 新增源文档解析功能，提取文档内容、标题和表格数量信息 - 修改模板填充服务，支持传入源文档内容用于AI表头生成 - 更新AI表头生成逻辑，基于源文档内容智能生成合适的表头字段 - 增强日志记录，显示源文档数量和处理进度	2026-04-09 22:43:51 +08:00
dj	610d475ce0	新增从文档中心选择源文档功能及删除功能 - 智能填表模块新增"从文档中心选择"模式，支持选择已上传的文档作为数据源，同时支持从列表中删除文档。两种模式通过Tab切换。 Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-04-09 22:35:13 +08:00
dj	496b96508d	修复Excel解析和智能填表功能 - 增强Excel解析器支持多种命名空间和路径格式，解决英文表头Excel无法读取问题 - 当MongoDB中structured_data为空时，尝试用file_path重新解析文件 - 改进AI分析提示词，明确要求返回纯数值不要单位 - 修复max_tokens值(5000→4000)避免DeepSeek API报错 Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-04-09 22:21:51 +08:00
dj	07ebdc09bc	Merge branch 'main' of https://gitea.kronecker.cc/OurCodesAreAllRight/FilesReadSystem	2026-04-09 22:18:12 +08:00
dj	c1886fb68f	Merge branch 'main' of https://gitea.kronecker.cc/OurCodesAreAllRight/FilesReadSystem	2026-04-09 21:42:14 +08:00
dj	78417c898a	改进智能填表功能：支持Markdown表格提取和修复LLM调用 - 新增对MongoDB存储的tables格式支持，直接从structured_data.tables提取数据 - 修复max_tokens值过大问题(50000→4000)，解决DeepSeek API限制 - 增强列名匹配算法，支持模糊匹配 - 添加详细日志便于调试结构化数据提取过程 Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-04-09 21:42:07 +08:00
dj	718f864926	修改读取excel表时存在数字时浮点匹配生成不一致问题	2026-04-09 20:56:38 +08:00