diff --git a/alembic/versions/4fc61e385531_add_faq_and_chunk_config.py b/alembic/versions/4fc61e385531_add_faq_and_chunk_config.py new file mode 100644 index 000000000..9fa924fc6 --- /dev/null +++ b/alembic/versions/4fc61e385531_add_faq_and_chunk_config.py @@ -0,0 +1,37 @@ +"""add chunk_config, FAQ tables and FAQ config columns + +Revision ID: 4fc61e385531 +Revises: 1432eea7c5b9 +Create Date: 2025-12-25 17:00:00.000000 + +""" +from typing import Sequence, Union + +from alembic import op +import sqlalchemy as sa + +from db.op.safe_add import safe_add_column + + +# revision identifiers, used by Alembic. +revision: str = '4fc61e385531' +down_revision: Union[str, Sequence[str], None] = '1432eea7c5b9' +branch_labels: Union[str, Sequence[str], None] = None +depends_on: Union[str, Sequence[str], None] = None + + +def upgrade() -> None: + """Upgrade schema.""" + # 1. Add chunk_config column to pai_knowledgebase_file table + safe_add_column('pai_knowledgebase_file', sa.Column('chunk_config', sa.JSON(), nullable=True)) + safe_add_column('pai_chatbot_model', sa.Column('enable_faq', sa.Boolean(), nullable=True, default=False)) + safe_add_column('pai_chatbot_model', sa.Column('faq_config', sa.JSON(), nullable=True)) + + +def downgrade() -> None: + """Downgrade schema.""" + # Remove chunk_config column from pai_knowledgebase_file table + op.drop_column('pai_knowledgebase_file', 'chunk_config') + op.drop_column('pai_chatbot_model', 'faq_config') + op.drop_column('pai_chatbot_model', 'enable_faq') + diff --git a/backend/agent/actor.py b/backend/agent/actor.py index 70e1bc30f..a1f758f9d 100644 --- a/backend/agent/actor.py +++ b/backend/agent/actor.py @@ -14,6 +14,7 @@ from common.chat.constants import MessageRole from opentelemetry import trace from utils.json_utils import parse_tool_arguments +from agent.tool_utils import check_and_handle_return_direct @retry(stop=stop_after_attempt(3), wait=wait_fixed(1)) @@ -118,6 +119,19 @@ async def gen(): state.current_tool_call = None 
observations += message_content + "\n\n" + + # Check if tool has return_direct=True, if so, return directly + tool_obj = self.tool_fn_map[tool_name] + return_chunk = check_and_handle_return_direct( + tool_obj=tool_obj, + tool_name=tool_name, + tool_content=tool_content, + tool_error=tool_error, + agent_name=self.name, + ) + if return_chunk: + yield return_chunk + return act_prompt = self.build_prompt(state) messages = [{"role": "system", "content": act_prompt}] + messages @@ -212,6 +226,19 @@ async def gen(): ) observations += message_content + "\n\n" + # Check if tool has return_direct=True, if so, return directly + tool_obj = self.tool_fn_map[function_name] + return_chunk = check_and_handle_return_direct( + tool_obj=tool_obj, + tool_name=function_name, + tool_content=tool_content, + tool_error=tool_error, + agent_name=self.name, + ) + if return_chunk: + yield return_chunk + return + # 超出步数保护 if react_step > self.max_steps: logger.warning(f"Reached max recursion steps: {self.max_steps}") diff --git a/backend/agent/actor_with_plan.py b/backend/agent/actor_with_plan.py index 440796b98..16dc5c0e0 100644 --- a/backend/agent/actor_with_plan.py +++ b/backend/agent/actor_with_plan.py @@ -10,6 +10,7 @@ from extensions.trace.base import use_current_span from opentelemetry import trace from utils.json_utils import parse_tool_arguments +from agent.tool_utils import check_and_handle_return_direct @retry(stop=stop_after_attempt(3), wait=wait_fixed(1)) @@ -157,6 +158,19 @@ async def gen(): result=tool_content, error=tool_error ) + + # Check if tool has return_direct=True, if so, return directly + tool_obj = self.tool_fn_map[function_name] + return_chunk = check_and_handle_return_direct( + tool_obj=tool_obj, + tool_name=function_name, + tool_content=tool_content, + tool_error=tool_error, + agent_name=self.name, + ) + if return_chunk: + yield return_chunk + return else: break diff --git a/backend/agent/tool_utils.py b/backend/agent/tool_utils.py new file mode 100644 index 
000000000..580f0eb36 --- /dev/null +++ b/backend/agent/tool_utils.py @@ -0,0 +1,60 @@ +"""Utility functions for handling tool calls and results.""" + +import json +from typing import Optional +from llama_index.core.tools.function_tool import FunctionTool +from common.llm.models import TextChunk +from loguru import logger + + +def check_and_handle_return_direct( + tool_obj: FunctionTool, + tool_name: str, + tool_content: Optional[str], + tool_error: Optional[str], + agent_name: str = "agent", +) -> Optional[TextChunk]: + """ + Check if a tool has return_direct=True and format the result accordingly. + + Args: + tool_obj: The FunctionTool object + tool_name: Name of the tool + tool_content: Content returned by the tool (None if error) + tool_error: Error message if tool call failed (None if success) + agent_name: Name of the agent (for logging) + + Returns: + TextChunk if return_direct=True, None otherwise + """ + return_direct = getattr(tool_obj.metadata, 'return_direct', False) + + if not return_direct: + return None + + logger.info(f"[{agent_name}] Tool {tool_name} has return_direct=True, returning tool result directly.") + + if tool_error: + return TextChunk(delta=f"工具调用失败: {tool_error}") + + if not tool_content: + return TextChunk(delta="工具调用成功,但未返回内容。") + + try: + result_data = json.loads(tool_content) + if isinstance(result_data, dict) and "result" in result_data: + # Format FAQ results or similar structured results + formatted_result = "" + for item in result_data.get("result", []): + if isinstance(item, dict): + content = item.get("content", "") + if content: + formatted_result += content + "\n\n" + if formatted_result: + return TextChunk(delta=formatted_result.strip()) + else: + return TextChunk(delta=tool_content) + else: + return TextChunk(delta=tool_content) + except (json.JSONDecodeError, Exception): + return TextChunk(delta=tool_content) diff --git a/backend/api/v1/config_apis/chatapp.py b/backend/api/v1/config_apis/chatapp.py index 
87ea7e0ce..6ee6e54d9 100644 --- a/backend/api/v1/config_apis/chatapp.py +++ b/backend/api/v1/config_apis/chatapp.py @@ -1,24 +1,502 @@ ### Embedding configuration API ### -from fastapi import APIRouter, Depends, Query +import time +import asyncio +import tempfile +import os +from datetime import datetime, timezone +from fastapi import APIRouter, Depends, Query, File, UploadFile, Form from sqlmodel import select, func from sqlmodel.ext.asyncio.session import AsyncSession from db.models.chatbot import ( ChatBotCreate, ChatBotEntity, ) +from pairag.file.models.file_item import FileItem +import uuid +import hashlib +from rag.kb_file_client import kb_file_client +from rag.parse_utils import sanitize_text +from tqdm import tqdm from db.db_context import get_db_session from sqlalchemy.exc import IntegrityError from common.chat.response_model import PagedResult, ResponseModel, success_response -from api.v1.utils.paginate import get_pagination_meta -from service.injection import get_chatapp_service, get_tenant_id +from service.injection import get_chatapp_service, get_tenant_id, get_faq_config_service, get_faq_item_service, get_rag_service, get_embedding_service, get_knowledgebase_service, get_file_service from service.tool.chatapp_service import ChatappService +from service.tool.faq_config_service import FAQConfigService +from service.tool.faq_item_service import FAQItemService +from service.injection import get_faq_item_service +from db.models.faq_item import FAQItemCreate +from service.knowledgebase.rag_service import RagService +from service.knowledgebase.knowledgebase_service import KnowledgebaseService +from service.knowledgebase.file_service import FileService +from service.model.embedding_service import EmbeddingService +from db.models.knowledgebase.knowledgebase import KnowledgebaseCreate, RetrievalConfig, ChunkConfig, TableParserConfig +from common.knowledgebase.constants import FAQ_KNOWLEDGEBASE_NAME, DEFAULT_FAQ_SIMILARITY_THRESHOLD +from 
common.knowledgebase.types import VectorIndexRetrievalType, FileStatus +from rag.file_item_utils import to_file_entity +from typing import Optional, List +from io import BytesIO +import json from api.api_exception import ApiException import traceback from loguru import logger app_router = APIRouter() +# Import FAQ dependencies +from db.models.faq_config import FAQConfigCreate +from db.models.faq_item import FAQItemCreate, FAQItemEntity + +# FAQ routes - MUST be defined before /{id} routes to avoid route conflicts +# FastAPI matches routes in order, so more specific routes must come first +@app_router.post("/{app_id}/faqs", response_model=ResponseModel[FAQItemEntity], tags=["FAQ"]) +async def create_faq_item( + app_id: str, + faq_item_create: FAQItemCreate, + tenant_id: str = Depends(get_tenant_id), + session: AsyncSession = Depends(get_db_session), + chatapp_service: ChatappService = Depends(get_chatapp_service), + faq_item_service: FAQItemService = Depends(get_faq_item_service), + rag_service: RagService = Depends(get_rag_service), +): + logger.info(f"Creating FAQ item for app_id: {app_id}") + try: + # Get chatbot by app_id to get chatbot_id + chatbot = await chatapp_service.get_chatapp_by_app_id(app_id=app_id, tenant_id=tenant_id) + if not chatbot: + raise ApiException(code=404, message=f"应用 '{app_id}' 不存在。") + + if not chatbot.enable_faq or not chatbot.faq_config: + raise ApiException(code=400, message="请先启用FAQ功能。") + + faq_item = await faq_item_service.create_faq_item( + chatbot_id=chatbot.app_id, + faq_item_data=faq_item_create, + tenant_id=tenant_id, + ) + await faq_item_service.save_faq_to_knowledgebase(faq_item, tenant_id, rag_service) + await session.commit() + await session.refresh(faq_item) + return success_response(data=faq_item, message="创建FAQ成功。") + except ValueError as e: + logger.error(f"Failed to create FAQ item: {str(e)}") + raise ApiException(code=400, message=str(e)) + except ApiException: + raise + except Exception as e: + logger.error(f"Failed 
to create FAQ item: {traceback.format_exc()}") + raise ApiException(code=500, message=f"创建FAQ失败: {traceback.format_exc()}") + +@app_router.get("/{app_id}/faqs", tags=["FAQ"]) +async def list_faq_items( + app_id: str, + page: int = Query(default=1, ge=1), + size: int = Query(default=100, le=1000), + tenant_id: str = Depends(get_tenant_id), + session: AsyncSession = Depends(get_db_session), + chatapp_service: ChatappService = Depends(get_chatapp_service), + faq_item_service: FAQItemService = Depends(get_faq_item_service), +): + logger.info(f"Listing FAQ items for app_id: {app_id}") + try: + # Get chatbot by app_id to get chatbot_id + chatbot = await chatapp_service.get_chatapp_by_app_id(app_id=app_id, tenant_id=tenant_id) + if not chatbot: + raise ApiException(code=404, message=f"应用 '{app_id}' 不存在。") + + faq_items = await faq_item_service.list_faq_items( + chatbot_id=chatbot.app_id, + tenant_id=tenant_id, + page=page, + size=size, + ) + return success_response(data=faq_items, message="查询FAQ列表成功。") + except ValueError as e: + logger.error(f"Failed to list FAQ items: {str(e)}") + raise ApiException(code=400, message=str(e)) + except ApiException: + raise + except Exception as e: + logger.error(f"Failed to list FAQ items: {traceback.format_exc()}") + raise ApiException(code=500, message=f"查询FAQ列表失败: {traceback.format_exc()}") + +@app_router.put("/{app_id}/faqs/{faq_item_id}", response_model=ResponseModel[FAQItemEntity], tags=["FAQ"]) +async def update_faq_item( + app_id: str, + faq_item_id: str, + faq_item_update: FAQItemCreate, + tenant_id: str = Depends(get_tenant_id), + session: AsyncSession = Depends(get_db_session), + faq_item_service: FAQItemService = Depends(get_faq_item_service), + rag_service: RagService = Depends(get_rag_service), +): + try: + faq_item = await faq_item_service.update_faq_item( + id=faq_item_id, update_data=faq_item_update, tenant_id=tenant_id, rag_service=rag_service + ) + await session.commit() + await session.refresh(faq_item) + return 
success_response(data=faq_item, message="更新FAQ成功。") + except ValueError as e: + logger.error(f"Failed to update FAQ item: {str(e)}") + raise ApiException(code=400, message=str(e)) + except Exception as e: + logger.error(f"Failed to update FAQ item: {traceback.format_exc()}") + raise ApiException(code=500, message=f"更新FAQ失败: {traceback.format_exc()}") + +@app_router.delete("/{app_id}/faqs/{faq_item_id}", tags=["FAQ"]) +async def delete_faq_item( + app_id: str, + faq_item_id: str, + tenant_id: str = Depends(get_tenant_id), + session: AsyncSession = Depends(get_db_session), + faq_item_service: FAQItemService = Depends(get_faq_item_service), + rag_service: RagService = Depends(get_rag_service), +): + try: + await faq_item_service.delete_faq_item(id=faq_item_id, tenant_id=tenant_id, rag_service=rag_service) + await session.commit() + return success_response(message=f"FAQ'{faq_item_id}'删除成功。") + except ValueError as e: + logger.error(f"Failed to delete FAQ item: {str(e)}") + raise ApiException(code=400, message=str(e)) + except Exception as e: + logger.error(f"Failed to delete FAQ item: {traceback.format_exc()}") + raise ApiException(code=500, message=f"删除FAQ失败: {traceback.format_exc()}") + +@app_router.get("/{app_id}/faq-config", response_model=ResponseModel[FAQConfigCreate], tags=["FAQ"]) +async def get_faq_config( + app_id: str, + tenant_id: str = Depends(get_tenant_id), + session: AsyncSession = Depends(get_db_session), + chatapp_service: ChatappService = Depends(get_chatapp_service), + faq_config_service: FAQConfigService = Depends(get_faq_config_service), +): + """Get FAQ config for an app.""" + try: + # Get chatbot by app_id to get chatbot_id + chatbot = await chatapp_service.get_chatapp_by_app_id(app_id=app_id, tenant_id=tenant_id) + if not chatbot: + raise ApiException(code=404, message=f"应用 '{app_id}' 不存在。") + + faq_config = await faq_config_service.get_or_create_faq_config( + chatbot_id=chatbot.id, tenant_id=tenant_id + ) + await session.commit() + return 
success_response(data=faq_config, message="获取FAQ配置成功。") + except ValueError as e: + logger.error(f"Failed to get FAQ config: {str(e)}") + raise ApiException(code=400, message=str(e)) + except ApiException: + raise + except Exception as e: + logger.error(f"Failed to get FAQ config: {traceback.format_exc()}") + raise ApiException(code=500, message=f"获取FAQ配置失败: {traceback.format_exc()}") + +@app_router.put("/{app_id}/faq-config", response_model=ResponseModel[FAQConfigCreate], tags=["FAQ"]) +async def update_faq_config( + app_id: str, + faq_config_data: FAQConfigCreate, + tenant_id: str = Depends(get_tenant_id), + session: AsyncSession = Depends(get_db_session), + chatapp_service: ChatappService = Depends(get_chatapp_service), + faq_config_service: FAQConfigService = Depends(get_faq_config_service), + knowledgebase_service: KnowledgebaseService = Depends(get_knowledgebase_service), +): + """Update FAQ config for an app.""" + try: + # Get chatbot by app_id to get chatbot_id + chatbot = await chatapp_service.get_chatapp_by_app_id(app_id=app_id, tenant_id=tenant_id) + if not chatbot: + raise ApiException(code=404, message=f"应用 '{app_id}' 不存在。") + + # Update FAQ config with full synchronization logic + updated_faq_config = await faq_config_service.update_faq_config_with_sync( + app_id=app_id, + chatbot_id=chatbot.id, + update_data=faq_config_data, + tenant_id=tenant_id, + knowledgebase_service=knowledgebase_service + ) + + await session.commit() + return success_response(data=updated_faq_config, message="更新FAQ配置成功。") + except ValueError as e: + logger.error(f"Failed to update FAQ config: {str(e)}") + raise ApiException(code=400, message=str(e)) + except ApiException: + raise + except Exception as e: + logger.error(f"Failed to update FAQ config: {traceback.format_exc()}") + raise ApiException(code=500, message=f"更新FAQ配置失败: {traceback.format_exc()}") + +MAX_CHECK_ATTEMPTS = 100 +CHECK_INTERVAL = 3 + +@app_router.post("/{app_id}/faq-files", tags=["FAQ"]) +async def 
upload_faq_files( + app_id: str, + files: Optional[List[UploadFile]] = File(...), + table_config: Optional[str] = Form(None, description="JSON string of table_config, shared by all files in this upload"), + session: AsyncSession = Depends(get_db_session), + chatapp_service: ChatappService = Depends(get_chatapp_service), + embedding_service: EmbeddingService = Depends(get_embedding_service), + knowledgebase_service: KnowledgebaseService = Depends(get_knowledgebase_service), + rag_service: RagService = Depends(get_rag_service), + tenant_id: str = Depends(get_tenant_id), +): + """Upload and parse FAQ files directly without storing file entity.""" + knowledgebase = None + try: + if not files: + raise ApiException(code=400, message="没有上传任何文件。") + # Get chatbot by app_id to get chatbot_id + chatbot = await chatapp_service.get_chatapp_by_app_id(app_id=app_id, tenant_id=tenant_id) + if not chatbot: + raise ApiException(code=404, message=f"应用 '{app_id}' 不存在。") + + if not chatbot.enable_faq or not chatbot.faq_config: + raise ApiException(code=400, message="请先启用FAQ功能。") + + # Get or create FAQ knowledgebase + kb_name = f"{app_id}_{FAQ_KNOWLEDGEBASE_NAME}" + knowledgebase = await knowledgebase_service.get_knowledgebase_by_name(kb_name, tenant_id=tenant_id) + default_embedding_config = await embedding_service.get_default_embedding(tenant_id=tenant_id) + + if not knowledgebase: + logger.info(f"Creating FAQ knowledgebase {kb_name} for tenant {tenant_id}") + faq_config_service = FAQConfigService(session) + faq_config = await faq_config_service.get_faq_config_by_chatbot_id( + chatbot_id=chatbot.id, tenant_id=tenant_id + ) + + if faq_config and faq_config.embedding_model: + embedding_model = faq_config.embedding_model + else: + embedding_model = default_embedding_config.model_id + + default_similarity_threshold = faq_config.similarity_threshold if faq_config else DEFAULT_FAQ_SIMILARITY_THRESHOLD + + retrieval_config = RetrievalConfig( + 
retrieval_mode=VectorIndexRetrievalType.vector, + top_k=1, + enable_rerank=False, + rerank_top_k=None, + vector_weight=1.0, + similarity_threshold=default_similarity_threshold, + ) + + kb_create = KnowledgebaseCreate( + name=kb_name, + description="FAQ知识库", + embedding_model=embedding_model, + retrieval_config=retrieval_config, + ) + knowledgebase = await knowledgebase_service.create_knowledgebase(kb_data=kb_create, tenant_id=tenant_id) + try: + await session.commit() + await session.refresh(knowledgebase) + await knowledgebase_service.write_cache_after_commit(knowledgebase, tenant_id) + logger.info(f"Created FAQ knowledgebase {knowledgebase.id} for tenant {tenant_id}") + except IntegrityError: + await session.rollback() + if knowledgebase: + await knowledgebase_service.delete_cache_on_rollback(knowledgebase.id, tenant_id, kb_create.name) + knowledgebase = await knowledgebase_service.get_knowledgebase_by_name(kb_name, tenant_id=tenant_id) + if not knowledgebase: + raise ApiException(code=500, message="无法创建或获取FAQ知识库: 并发创建冲突") + logger.info(f"Retrieved existing FAQ knowledgebase {knowledgebase.id} for tenant {tenant_id}") + except Exception: + await session.rollback() + if knowledgebase: + await knowledgebase_service.delete_cache_on_rollback(knowledgebase.id, tenant_id, kb_create.name) + raise + else: + logger.info(f"Found existing FAQ knowledgebase {knowledgebase.id} for tenant {tenant_id}") + + + + parsed_chunk_config = knowledgebase.chunk_config + parsed_chunk_config = ChunkConfig.model_validate(parsed_chunk_config) + + # Parse and validate table_config if provided + parsed_table_config = None + if table_config: + try: + table_config_dict = json.loads(table_config) + if not isinstance(table_config_dict, dict): + raise ValueError("table_config must be a JSON object") + parsed_table_config = TableParserConfig.model_validate(table_config_dict) + if parsed_chunk_config.table_config: + table_config_dict_merged = parsed_chunk_config.table_config.model_dump() + 
table_config_dict_merged.update(table_config_dict) + parsed_chunk_config.table_config = TableParserConfig.model_validate(table_config_dict_merged) + else: + parsed_chunk_config.table_config = parsed_table_config + except json.JSONDecodeError as e: + raise ApiException(code=400, message=f"table_config 格式错误: {e}") + except Exception as e: + raise ApiException(code=400, message=f"table_config 验证失败: {e}") + + + + # Process each file + response_data = [] + total_chunks = 0 + + for file in files: + temp_file_path = None + try: + file_content = await file.read() + file_content_io = BytesIO(file_content) + file_extension = "." + (file.filename.split(".")[-1] if "." in file.filename else "") + + # Create temporary file to store file content + temp_file = tempfile.NamedTemporaryFile( + mode='wb', + suffix=file_extension, + delete=False, + prefix=f"faq_upload_{uuid.uuid4().hex}_" + ) + temp_file_path = temp_file.name + temp_file.write(file_content) + temp_file.close() + + # Create FileItem for parsing + file_id = uuid.uuid4().hex + file_md5 = hashlib.md5(file_content).hexdigest() + + file_item = FileItem( + id=file_id, + file_path=temp_file_path, + file=file_content_io, + kb_id=knowledgebase.id, + file_extension=file_extension, + file_name=file.filename or f"faq_file_{file_id}", + file_md5=file_md5, + file_size=len(file_content), + tenant_id=tenant_id, + ) + + logger.info(f"Parsing FAQ file {file_item.file_name} from temporary path {temp_file_path}...") + file_entity = to_file_entity(file_item=file_item) + # Convert ChunkConfig object to dict for file_entity + file_entity.chunk_config = parsed_chunk_config.model_dump() + file_parser = await kb_file_client.create_file_parser(knowledgebase, file_entity) + documents, nodes = file_parser.parse(file_item, is_attachment=False) + + if not nodes: + logger.warning(f"No nodes parsed from file {file_item.file_name}.") + response_data.append({"file_name": file_item.file_name, "items_count": 0}) + continue + + # Sanitize text + for node 
in nodes: + node.text = sanitize_text(node.text) + + logger.info(f"Parsed {len(nodes)} documents from FAQ file {file_item.file_name}.") + + # Save FAQ items to database from node metadata + faq_item_service = FAQItemService(session) + saved_faq_count = 0 + + # Prepare FAQ items data from all nodes + faq_items_to_create = [] + for node in nodes: + question = node.metadata.get("question", "").strip() if node.metadata else "" + answer = node.metadata.get("answer", "").strip() if node.metadata else "" + + # Skip if both question and answer are empty + if not question and not answer: + logger.warning(f"Skipping node with empty question and answer from file {file_item.file_name}") + continue + + faq_item_data = FAQItemCreate( + question=question, + answer=answer, + chatbot_id=chatbot.app_id, + file_id=file_id, + active=True, + ) + faq_items_to_create.append(faq_item_data) + + if faq_items_to_create: + created_faq_items = [] + for faq_item_data in tqdm(faq_items_to_create, desc=f"Creating FAQ Items for file {file_item.file_name}"): + try: + faq_item = await faq_item_service.create_faq_item( + chatbot_id=chatbot.app_id, + faq_item_data=faq_item_data, + tenant_id=tenant_id, + ) + created_faq_items.append(faq_item) + except Exception as create_error: + logger.error(f"Failed to create FAQ item: {create_error}") + continue + + # Save to knowledgebase in parallel batches + if created_faq_items: + save_tasks = [ + faq_item_service.save_faq_to_knowledgebase(faq_item, tenant_id, rag_service) + for faq_item in created_faq_items + ] + + if save_tasks: + # Process save tasks in batches to avoid overwhelming the system + save_batch_size = 50 + for j in tqdm(range(0, len(save_tasks), save_batch_size), desc=f"Saving FAQ Items to KB for file {file_item.file_name}"): + save_batch = save_tasks[j:j + save_batch_size] + await asyncio.gather(*save_batch, return_exceptions=True) + + saved_faq_count = len(created_faq_items) + + # Commit all FAQ items + await session.commit() + + # Refresh all 
created items (skip if refresh fails) + for faq_item in created_faq_items: + try: + await session.refresh(faq_item) + except Exception as refresh_error: + logger.debug(f"Could not refresh FAQ item {faq_item.id} (may not be persistent): {refresh_error}") + + logger.info(f"Saved {saved_faq_count}/{len(nodes)} FAQ items to database from file {file_item.file_name}.") + + # Add successful result to response_data + response_data.append({ + "file_name": file_item.file_name, + "items_count": saved_faq_count + }) + total_chunks += saved_faq_count + except Exception as file_error: + logger.error(f"Failed to process FAQ file {file.filename}: {traceback.format_exc()}") + response_data.append({ + "file_name": file.filename, + "items_count": 0, + "error": str(file_error) + }) + # Continue processing other files even if one fails + finally: + # Clean up temporary file + if temp_file_path and os.path.exists(temp_file_path): + try: + os.unlink(temp_file_path) + logger.debug(f"Deleted temporary file: {temp_file_path}") + except Exception as cleanup_error: + logger.warning(f"Failed to delete temporary file {temp_file_path}: {cleanup_error}") + + await session.commit() + + logger.info(f"Uploaded {len(files)} FAQ files successfully, total chunks: {total_chunks}.") + return success_response( + data=response_data, + message=f"成功上传并解析 {len(files)} 个文件,共提取 {total_chunks} 个片段。" + ) + except Exception as e: + logger.error(f"Failed to process FAQ file: {traceback.format_exc()}") + raise ApiException(code=400, message=f"文件处理失败: {e}") + @app_router.post("", response_model=ResponseModel[ChatBotEntity]) async def create_chatbot( @@ -29,6 +507,8 @@ async def create_chatbot( ): try: chatbot = await chatapp_service.create_chatapp(app_data=chatbot_create, tenant_id=tenant_id) + await session.commit() + await session.refresh(chatbot) return success_response(data=chatbot, message="创建应用成功。") except ValueError as e: logger.error(f"Failed to create chatapp: {str(e)}") @@ -89,9 +569,11 @@ async def 
delete_chatbot( tenant_id: str = Depends(get_tenant_id), session: AsyncSession = Depends(get_db_session), chatapp_service: ChatappService = Depends(get_chatapp_service), + rag_service: RagService = Depends(get_rag_service), ): try: - await chatapp_service.delete_chatapp(id=id, tenant_id=tenant_id) + await chatapp_service.delete_chatapp(id=id, tenant_id=tenant_id, rag_service=rag_service) + await session.commit() return success_response(message=f"应用'{id}'删除成功。") except ValueError as e: logger.error(f"Failed to delete chatapp: {str(e)}") diff --git a/backend/api/v1/config_apis/knowledgebase.py b/backend/api/v1/config_apis/knowledgebase.py index 2c879bfa4..3bb7f6ee5 100644 --- a/backend/api/v1/config_apis/knowledgebase.py +++ b/backend/api/v1/config_apis/knowledgebase.py @@ -4,7 +4,8 @@ import traceback from typing import List, Optional from common.knowledgebase.types import FileStatus -from fastapi import APIRouter, Depends, File, Query, UploadFile, Form +from fastapi import APIRouter, Depends, File, Query, UploadFile, Form, Body +import json from pydantic import BaseModel, Field from sqlmodel.ext.asyncio.session import AsyncSession from rag.file_item_utils import to_file_entity @@ -13,6 +14,7 @@ from db.models.knowledgebase.knowledgebase import ( KbEntity, KnowledgebaseCreate, + ChunkConfig, ) from db.db_context import get_db_session from pairag.file.store.file_store_helper import file_store @@ -208,6 +210,13 @@ async def start_parse_task( if not kb_entity: raise ValueError(f"知识库 {kb_id} 不存在。") + # Validate chunk_config if provided + if parse_request.chunk_config: + try: + ChunkConfig.model_validate(parse_request.chunk_config) + except Exception as e: + raise ApiException(code=400, message=f"chunk_config 格式错误: {e}") + file_items = await upload_file_names_async(kb_id=kb_id, parse_tasks=parse_request.files, tenant_id=tenant_id) file_version = int(time.time()) @@ -228,13 +237,23 @@ async def start_parse_task( else: file_entity = to_file_entity(file_item=file_item) + # 
Update chunk_config if provided + if parse_request.chunk_config: + file_entity.chunk_config = parse_request.chunk_config + file_entity.file_version = file_version background_worker.enqueue_file_tasks.delay(file_entity.id, file_entity.file_version, is_attachment=False, tenant_id=tenant_id) session.add(file_entity) file_entities.append(file_entity) + await session.commit() + for file_entity in file_entities: + await session.refresh(file_entity) + logger.info(f"Uploaded {len(file_entities)} files successfully.") return success_response(data=file_entities, message="启动解析任务成功") + except ApiException: + raise except ValueError as e: logger.error(f"启动解析任务失败。\nValueError:{traceback.format_exc()}") raise ApiException(code=400, message=str(e)) @@ -250,15 +269,39 @@ async def upload_files( auto_parse: bool = Query(default=True), files: Optional[List[UploadFile]] = File(...), file_sources: Optional[List[str]] = Form(None), + chunk_config: Optional[str] = Form(None, description="JSON string of chunk_config, shared by all files in this upload"), tenant_id: str = Depends(get_tenant_id), session: AsyncSession = Depends(get_db_session), rag_service: RagService = Depends(get_rag_service), file_service: FileService = Depends(get_file_service), + knowledgebase_service: KnowledgebaseService = Depends(get_knowledgebase_service), ): try: file_version = int(time.time()) if not files: raise ApiException(code=400, message="没有上传任何文件。") + + + knowledgebase = await knowledgebase_service.get_knowledgebase(kb_id=kb_id, tenant_id=tenant_id) + if not knowledgebase: + raise ApiException.not_found(kb_id, "知识库") + + kb_chunk_config = knowledgebase.chunk_config + + + parsed_chunk_config = None + if chunk_config: + try: + parsed_chunk_config = json.loads(chunk_config) + if not isinstance(parsed_chunk_config, dict): + raise ValueError("chunk_config must be a JSON object") + # Validate chunk_config + ChunkConfig.model_validate(parsed_chunk_config) + except json.JSONDecodeError as e: + raise 
ApiException(code=400, message=f"chunk_config 格式错误: {e}") + except Exception as e: + raise ApiException(code=400, message=f"chunk_config 验证失败: {e}") + file_items = await upload_form_files_async(kb_id=kb_id, files=files, tenant_id=tenant_id) file_names = [file_item.file_name for file_item in file_items] @@ -281,10 +324,15 @@ async def upload_files( if file_sources: assert len(file_sources) == len(new_file_entities), "文件来源列表长度与文件列表长度不一致" - for i,file_entity in enumerate(new_file_entities): + # Apply chunk_config to all files if provided (shared by all files in this upload) + for i, file_entity in enumerate(new_file_entities): if file_sources: file_entity.file_source = file_sources[i] + # All files share the same chunk_config if provided + if parsed_chunk_config: + file_entity.chunk_config = parsed_chunk_config + if auto_parse: import app.worker as background_worker background_worker.enqueue_file_tasks.delay(file_entity.id, file_entity.file_version, is_attachment=False, tenant_id=tenant_id) @@ -292,8 +340,22 @@ async def upload_files( session.add(file_entity) + await session.commit() + + + for file_entity in new_file_entities: + await session.refresh(file_entity) + + + response_entities = [] + for file_entity in new_file_entities: + file_dict = file_entity.model_dump() + if not file_entity.chunk_config: + file_dict["chunk_config"] = kb_chunk_config + response_entities.append(file_dict) + logger.info(f"Uploaded {len(new_file_entities)} files successfully.") - return success_response(data=new_file_entities, message="上传文件成功") + return success_response(data=response_entities, message="上传文件成功") except ValueError as e: logger.error(f"上传文件失败。\nValueError:{e}") raise ApiException(code=400, message=str(e)) @@ -327,21 +389,44 @@ async def get_kb_file( raise ApiException(code=400, message=f"查询文件失败: {e}.") +class ReprocessFileRequest(BaseModel): + chunk_config: Optional[dict] = Field(default=None, description="Optional chunk configuration for the file") + + 
class BatchOperationRequest(BaseModel):
    """Request body for batch file operations on a knowledgebase."""

    operation: str = Field(..., description="操作类型: 'delete' 或 'reprocess'")
    file_id_list: List[str] = Field(..., description="要操作的文件ID列表")
    # Only meaningful for the 'reprocess' operation; applied to every listed file.
    chunk_config: Optional[dict] = Field(default=None, description="Optional chunk configuration for reprocess operation, shared by all files")
try: - reprocessed_count = await _batch_reprocess_files(kb_id=kb_id, file_entities=file_entities, session=session, tenant_id=tenant_id) + chunk_config = None + if request.chunk_config: + try: + ChunkConfig.model_validate(request.chunk_config) + chunk_config = request.chunk_config + except Exception as e: + raise ApiException(code=400, message=f"chunk_config 格式错误: {e}") + + reprocessed_count = await _batch_reprocess_files( + kb_id=kb_id, + file_entities=file_entities, + session=session, + tenant_id=tenant_id, + chunk_config=chunk_config + ) return success_response(data=reprocessed_count, message=f"成功将 {reprocessed_count} 个文件加入重新处理队列。") + except ApiException: + raise except ValueError as e: logger.error(f"重新处理文件失败。\nValueError:{e}") raise ApiException(code=400, message=str(e)) @@ -437,9 +538,11 @@ async def _batch_reprocess_files( file_entities: List[KbFileEntity], session: AsyncSession, tenant_id: str, + chunk_config: Optional[dict] = None, ) -> ResponseModel[dict]: """ 批量重新处理文件的内部实现 + 如果提供了 chunk_config,会在重新解析之前更新所有文件的 chunk_config """ import app.worker as background_worker @@ -450,6 +553,12 @@ async def _batch_reprocess_files( file_entity.status = FileStatus.pending file_entity.file_version = file_version file_entity.updated_at = datetime.now(timezone.utc).replace(tzinfo=None) + + # 如果提供了 chunk_config,更新文件的 chunk_config + if chunk_config: + file_entity.chunk_config = chunk_config + logger.info(f"Updated chunk_config for file {file_entity.id} before reprocessing.") + session.add(file_entity) reprocessed_count += 1 @@ -474,7 +583,6 @@ class FileSourceParam(BaseModel): file_source: str = Field(default=None) - @knowledgebase_router.post("/{kb_id}/files/{file_id}/source", response_model=ResponseModel[KbFileEntity]) async def set_file_source( kb_id: str, diff --git a/backend/api/v1/faq_retrieval.py b/backend/api/v1/faq_retrieval.py new file mode 100644 index 000000000..c00c089e3 --- /dev/null +++ b/backend/api/v1/faq_retrieval.py @@ -0,0 +1,124 @@ +from fastapi import 
class FAQRetrievalRequest(BaseModel):
    """Request payload for retrieving FAQ entries bound to a chat application."""

    chatapp_id: str  # chatbot.app_id identifying the chat application
    query: str  # natural-language query to match against FAQ entries
    user_id: Optional[str] = None
    retrieval_setting: Optional[RetrievalSetting] = None
    # Accepted for API symmetry with /v1/retrieval; FAQ retrieval currently
    # does not forward it (see NOTE in faq_retrieval below).
    metadata_condition: Optional[MetadataFilteringCondition] = None


def _faq_config_get(faq_config, key, default=None):
    """Read one field from a chatbot's FAQ config.

    ``ChatBotEntity.faq_config`` is persisted as a JSON dict, but a caller may
    also hand us an already-validated config object, so support both access
    styles. ``None`` values fall back to ``default``.
    """
    if isinstance(faq_config, dict):
        value = faq_config.get(key, default)
    else:
        value = getattr(faq_config, key, default)
    return default if value is None else value


@faq_retrieval_router.post(
    "", response_model=ResponseModel[NewRetrievalResponse]
)
async def faq_retrieval(
    retrieval_request: FAQRetrievalRequest,
    session: AsyncSession = Depends(get_db_session),
    tenant_id: str = Depends(get_tenant_id),
    rag_service: RagService = Depends(get_rag_service),
    chatapp_service: ChatappService = Depends(get_chatapp_service),
    faq_config_service: FAQConfigService = Depends(get_faq_config_service),
):
    """Retrieve FAQ entries for a chat application.

    Resolves the chatbot by ``chatapp_id``, locates its FAQ knowledgebase via
    the chatbot's FAQ config, then runs a (default: pure vector, top-1) query
    and returns the matching records.

    Raises:
        ApiException: 404 when the app, its FAQ config or the FAQ
            knowledgebase is missing; 400 on invalid input; 500 otherwise.
    """
    logger.info(
        f"FAQ Retrieval request: chatapp_id={retrieval_request.chatapp_id}, "
        f"query={retrieval_request.query}, tenant_id={tenant_id}"
    )
    try:
        chatbot = await chatapp_service.get_chatapp_by_app_id(
            app_id=retrieval_request.chatapp_id,
            tenant_id=tenant_id,
        )
        if not chatbot:
            raise ApiException(code=404, message=f"应用 '{retrieval_request.chatapp_id}' 不存在。")

        # Get FAQ config to get kb_id and similarity_threshold
        faq_config = chatbot.faq_config
        if not faq_config:
            raise ApiException(code=404, message=f"FAQ配置 '{retrieval_request.chatapp_id}' 不存在。")

        # BUG FIX: faq_config is stored as a JSON dict on ChatBotEntity, so
        # plain attribute access (faq_config.kb_id) raised AttributeError and
        # surfaced as a 500. Use dict/attribute-agnostic access instead.
        kb_id = _faq_config_get(faq_config, "kb_id")
        knowledgebase_service = KnowledgebaseService(session)
        kb = await knowledgebase_service.get_knowledgebase(kb_id, tenant_id=tenant_id)
        if not kb:
            raise ApiException(code=404, message=f"FAQ知识库 '{kb_id}' 不存在。")

        default_similarity_threshold = _faq_config_get(
            faq_config, "similarity_threshold", DEFAULT_FAQ_SIMILARITY_THRESHOLD
        )

        # Set default retrieval_setting if not provided, or merge with defaults
        user_setting = retrieval_request.retrieval_setting
        if user_setting is None:
            retrieval_setting = RetrievalSetting(
                retrieval_mode=VectorIndexRetrievalType.vector,
                top_k=1,
                enable_rerank=False,
                rerank_top_k=None,
                vector_weight=1.0,
                similarity_threshold=default_similarity_threshold,
            )
        else:
            # Merge user-provided settings with FAQ defaults
            # (pure vector search, top_k=1, no rerank).
            retrieval_setting = RetrievalSetting(
                retrieval_mode=user_setting.retrieval_mode or VectorIndexRetrievalType.vector,
                top_k=user_setting.top_k if user_setting.top_k is not None else 1,
                enable_rerank=user_setting.enable_rerank if user_setting.enable_rerank is not None else False,
                rerank_top_k=user_setting.rerank_top_k,
                rerank_model=user_setting.rerank_model,
                rerank_provider_name=user_setting.rerank_provider_name,
                vector_weight=user_setting.vector_weight if user_setting.vector_weight is not None else 1.0,
                similarity_threshold=(
                    user_setting.similarity_threshold
                    if user_setting.similarity_threshold is not None
                    else default_similarity_threshold
                ),
                score_threshold=user_setting.score_threshold,
            )

        # NOTE(review): metadata_condition from the request is intentionally
        # not forwarded here — confirm whether FAQ retrieval should honour it.
        search_results: List[SearchResult] = await rag_service.aquery(
            query=retrieval_request.query,
            user_id=retrieval_request.user_id,
            kb_id=kb.id,
            kb_id_list=None,
            retrieval_setting=retrieval_setting,
            metadata_condition=None,
            tenant_id=tenant_id,
        )

        logger.info(
            f"Retrieved {len(search_results)} FAQ results for query "
            f"'{retrieval_request.query}' from knowledgebase {kb.id}."
        )

        records = [
            DocRecord(
                content=node.content,
                score=node.score,
                title=node.title,
                metadata=node.metadata,
            )
            for node in search_results
        ]

        # 使用统一的响应格式
        retrieval_response = NewRetrievalResponse(records=records)
        return success_response(data=retrieval_response, message="FAQ检索成功")
    except ApiException:
        raise
    except ValueError as e:
        logger.error(f"Failed to retrieve FAQ: {traceback.format_exc()}")
        raise ApiException(code=400, message=f"FAQ检索失败: {e}")
    except Exception as e:
        logger.error(f"Failed to retrieve FAQ: {traceback.format_exc()}")
        raise ApiException(code=500, message=f"FAQ检索失败: {e}")
prefix="/v1/faq-retrieval") app.include_router(retrieval_tool_router, prefix="/v1/tools/retrieval") app.include_router(embedding_router, prefix="/v1/embeddings") diff --git a/backend/common/chat/models.py b/backend/common/chat/models.py index e6d4ee918..e0920f5d7 100644 --- a/backend/common/chat/models.py +++ b/backend/common/chat/models.py @@ -94,6 +94,7 @@ class ChatAgentRequest(BaseModel): mcp_ids: Optional[List[str]] = [] kb_ids: Optional[List[str]] = [] + faq_config: Optional[dict] = None enable_search: Optional[bool] = False enable_agent: Optional[bool] = False enable_chatdb: Optional[bool] = False diff --git a/backend/common/knowledgebase/constants.py b/backend/common/knowledgebase/constants.py index 90b023bf8..be0482dca 100644 --- a/backend/common/knowledgebase/constants.py +++ b/backend/common/knowledgebase/constants.py @@ -1,7 +1,7 @@ DEFAULT_CHUNK_SIZE = 1024 DEFAULT_CHUNK_OVERLAP = 50 DEFAULT_PARSER_TYPE = "structure" -DEFAULT_SENTENCE_SEPARATOR = "\n\n" +DEFAULT_PARAGRAPH_SEPARATOR = "\n\n" DEFAULT_EMBEDDING_MODEL = "BAAI/bge-m3" DEFAULT_RERANK_MODEL = "BAAI/bge-reranker-v2-m3" @@ -14,10 +14,13 @@ DEFAULT_VECTOR_WEIGHT = 0.5 +DEFAULT_FAQ_SIMILARITY_THRESHOLD = 0.8 + DEFAULT_KNOWLEDGEBASE_PATH = "localdata/knowledgebases" ATTACHMENT_KNOWLEDGEBASE_NAME = "default_attachments" +FAQ_KNOWLEDGEBASE_NAME = "default_faqs" DEFAULT_VECTOR_ID = "default_vectordb" diff --git a/backend/db/models/__init__.py b/backend/db/models/__init__.py index 67b5578d7..eca10be6e 100644 --- a/backend/db/models/__init__.py +++ b/backend/db/models/__init__.py @@ -14,6 +14,7 @@ from db.models.knowledgebase.metadata import KbMetadataEntity, FileMetadataEntity from db.models.prompt import PromptModelEntity from db.models.chatbot import ChatBotEntity +from db.models.faq_item import FAQItemEntity from db.models.guardrail import GuardrailConfigEntity from db.models.code_sandbox import CodeSandboxConfigEntity from db.models.evaluation.dataset import DatasetEntity, DatasetSampleEntity diff 
class FAQConfigCreate(SQLModel):
    """FAQ feature configuration attached to a chatbot.

    Persisted as JSON on ``ChatBotEntity.faq_config``; mirrors the fields the
    FAQ retrieval path reads (kb_id, similarity_threshold, ...).
    """

    active: bool = Field(
        default=True
    )
    # FAQ configuration fields
    kb_id: Optional[str] = Field(default=None, description="FAQ知识库ID")
    similarity_threshold: Optional[float] = Field(default=DEFAULT_FAQ_SIMILARITY_THRESHOLD, description="相似度阈值,范围0.8-1.0")
    embedding_model: Optional[str] = Field(default="BAAI/bge-m3", description="Embedding模型ID")
    enable_question_in_retrieval: Optional[bool] = Field(default=True, description="问题是否参与检索")
    enable_question_in_response: Optional[bool] = Field(default=True, description="问题是否参与回答")
    enable_answer_in_retrieval: Optional[bool] = Field(default=False, description="答案是否参与检索")
    enable_answer_in_response: Optional[bool] = Field(default=True, description="答案是否参与回答")
    return_direct: Optional[bool] = Field(default=False, description="是否直接返回工具结果,不经过LLM加工")


class FAQItemCreate(SQLModel):
    """Mutable fields of a single FAQ question/answer pair."""

    # NOTE(review): annotated `str` but defaulted to None — presumably callers
    # always supply question/answer/chatbot_id; confirm or relax the annotation.
    question: str = Field(default=None, sa_column=Column(Text))
    answer: str = Field(default=None, sa_column=Column(Text))
    chatbot_id: str = Field(default=None)
    file_id: Optional[str] = Field(default=None)
    active: bool = Field(default=True)


class FAQItemEntity(FAQItemCreate, table=True):
    """Database row for one FAQ item (table ``pai_chatbot_faq``)."""

    __tablename__ = "pai_chatbot_faq"

    id: str = Field(primary_key=True, default_factory=lambda: str(uuid.uuid4().hex))
    tenant_id: Optional[str] = Field(default=DEFAULT_TENANT_ID, index=True)
    # Cascade-deleted together with the owning chatbot.
    chatbot_id: str = Field(default=None, foreign_key="pai_chatbot_model.app_id", ondelete="CASCADE", index=True)

    # Naive UTC timestamps (tzinfo stripped before storage).
    created_at: datetime = Field(
        default_factory=lambda: datetime.now(timezone.utc).replace(tzinfo=None),
        sa_column=Column(DateTime),
    )
    updated_at: datetime = Field(
        default_factory=lambda: datetime.now(timezone.utc).replace(tzinfo=None),
        sa_column=Column(DateTime),
    )
class TableParserConfig(SQLModel):
    """Configuration for table parser (CSV/Excel). Only used when parser_type == 'table'."""

    concat_rows: bool = Field(default=False, description="Whether to concatenate all rows into one document")
    row_joiner: str = Field(default="\n", description="Separator to use for joining each row")
    header_index_max: Optional[int] = Field(default=0, description="Maximum row index to use as header")
    format_sheet_data_to_json: bool = Field(default=False, description="Whether to format sheet data as JSON")
    sheet_column_filters: Optional[List[str]] = Field(default=None, description="List of column names to filter")
    question_column_index: Optional[int] = Field(default=0, description="Index of question column")
    answer_column_index: Optional[int] = Field(default=1, description="Index of answer column")


class ChunkConfig(SQLModel):
    """Document chunking settings, stored per knowledgebase and optionally
    overridden per file via ``KbFileEntity.chunk_config``."""

    chunk_size: int = Field(default=DEFAULT_CHUNK_SIZE)
    chunk_overlap: int = Field(default=DEFAULT_CHUNK_OVERLAP)
    parser_type: str = Field(default=DEFAULT_PARSER_TYPE)
    separator: str = Field(default=DEFAULT_PARAGRAPH_SEPARATOR)
    # Optional multimodal model used to caption images found in documents.
    image_caption_model: Optional[str] = Field(default=None)
    image_caption_provider_name: str = Field(default="openai_like")
    table_config: Optional[TableParserConfig] = Field(default=None, description="Table parser configuration (only used when parser_type == 'table')")
Optional[ImageCaptionTool] = None): - chunk_config = ChunkConfig.model_validate(knowledgebase.chunk_config) + async def create_file_parser(self, knowledgebase: KbEntity, file_entity: Optional[KbFileEntity] = None, image_caption_tool: Optional[ImageCaptionTool] = None): + # Prioritize file's chunk_config if available, otherwise use knowledgebase's chunk_config + if file_entity and file_entity.chunk_config: + chunk_config = ChunkConfig.model_validate(file_entity.chunk_config) + else: + chunk_config = ChunkConfig.model_validate(knowledgebase.chunk_config) image_caption_tool = None if chunk_config.image_caption_model: @@ -48,7 +52,7 @@ async def create_file_parser(self, knowledgebase: KbEntity, image_caption_tool: image_caption_tool = ImageCaptionTool(multimodal_llm=multimodal_llm) if not chunk_config.separator: - chunk_config.separator = DEFAULT_SENTENCE_SEPARATOR + chunk_config.separator = DEFAULT_PARAGRAPH_SEPARATOR file_parser = FileParser( file_store=file_store, @@ -151,7 +155,7 @@ async def process_file_async( return # parsing file logger.info(f"Parsing file {file_item.file_name}.") - file_parser = await self.create_file_parser(knowledgebase) + file_parser = await self.create_file_parser(knowledgebase, file_entity=file_entity) documents, nodes = file_parser.parse(file_item, is_attachment=is_attachment) await update_file_content_async(file_id=file_item.id, is_attachment=is_attachment, documents=documents, tenant_id=tenant_id) for node in nodes: diff --git a/backend/rag/parse_utils.py b/backend/rag/parse_utils.py index 5bed6eb18..b0ca4e7f1 100644 --- a/backend/rag/parse_utils.py +++ b/backend/rag/parse_utils.py @@ -28,8 +28,11 @@ def sanitize_text(text: str) -> str: def get_node_texts_for_embedding(nodes) -> list[str]: texts = [] for node in nodes: - base_text = f"filename: {node.metadata['file_name']}" + base_text = "" + file_name = node.metadata.get('file_name', '').strip() chapter_name = node.metadata.get('chapter_name', '').strip() + if file_name: + base_text 
+= f"file_name: {file_name}" if chapter_name: base_text += f"\n\nchapter_name: {chapter_name}" diff --git a/backend/service/agent/agent_service.py b/backend/service/agent/agent_service.py index fb1b9b4a1..3c7ba0b9f 100644 --- a/backend/service/agent/agent_service.py +++ b/backend/service/agent/agent_service.py @@ -1,6 +1,7 @@ from common.chat.models import ChatAgentRequest from service.factory.model_factory import create_llm from tools.knowledgebase.knowledgebase_tool import aget_knowledgebase_tool +from tools.knowledgebase.faq_tool import aget_faq_tool from service.factory.tools import create_search_tools, create_chatdb_tools, create_codesandbox_tools from service.factory.mcp_factory import create_mcp_tools_async from tools.attachments.file_searcher import aget_file_searcher @@ -42,10 +43,12 @@ def __init__( chatdb_service_getter: Callable[[], Awaitable], rag_service_getter: Callable[[], Awaitable], file_service_getter: Callable[[], Awaitable], + faq_config_service_getter: Callable[[], Awaitable], ): self.session = session self._get_llm_service = llm_service_getter self._get_chatapp_service = chatapp_service_getter + self._get_faq_config_service = faq_config_service_getter self._get_websearch_service = websearch_service_getter self._get_codesandbox_service = codesandbox_service_getter self._get_chatdb_service = chatdb_service_getter @@ -59,6 +62,7 @@ async def create_agent(self, chat_request: ChatAgentRequest, tenant_id: str) -> llm_model = await llm_service.get_llm_by_model_id(chat_request.model, tenant_id=tenant_id) prompt_set = PlanAgentPromptSet() + chatapp_id = None if llm_model: llm = create_llm(llm_model) @@ -68,8 +72,10 @@ async def create_agent(self, chat_request: ChatAgentRequest, tenant_id: str) -> if not chatapp: raise ValueError(f"Model `{chat_request.model}` not found.") + chatapp_id = chatapp.app_id chat_request.model = chatapp.model_id chat_request.mcp_ids = chatapp.mcp_ids + chat_request.faq_config = chatapp.faq_config chat_request.kb_ids = 
chatapp.kb_ids chat_request.enable_search = chatapp.enable_search chat_request.enable_chatdb = chatapp.enable_chatdb @@ -96,7 +102,9 @@ async def create_agent(self, chat_request: ChatAgentRequest, tenant_id: str) -> enable_chatdb=chat_request.enable_chatdb, mcp_ids=chat_request.mcp_ids, kb_ids=chat_request.kb_ids, + faq_config=chat_request.faq_config, user_id=chat_request.user_id, + chatapp_id=chatapp_id, metadata_condition=chat_request.metadata_condition, tenant_id=tenant_id, ) @@ -125,15 +133,24 @@ async def aget_tools( mcp_ids: List[str] = [], kb_ids: List[str] = [], tenant_id: str = None, + chatapp_id: Optional[str] = None, + faq_config: Optional[dict] = None, ) -> tuple[List[FunctionTool], Callable | None]: tools = [] # 知识库工具 rag_service = await self._get_rag_service() + chatapp_service = await self._get_chatapp_service() + faq_config_service = await self._get_faq_config_service() for kb_id in kb_ids: tools.append(await aget_knowledgebase_tool(kb_id=kb_id, user_id=user_id, rag_service=rag_service, tenant_id=tenant_id, metadata_condition=metadata_condition)) logger.info(f"Resolved {len(kb_ids)} knowledgebase tools.") + # FAQ工具 + if faq_config and faq_config.get("active"): + tools.append(await aget_faq_tool(chatapp_id=chatapp_id, user_id=user_id, rag_service=rag_service, chatapp_service=chatapp_service, faq_config_service=faq_config_service, tenant_id=tenant_id)) + logger.info("Resolved FAQ tool.") + # 搜索工具 if enable_search: # Add search web tool diff --git a/backend/service/factory/tools.py b/backend/service/factory/tools.py index 739f124bd..0a0778d1c 100644 --- a/backend/service/factory/tools.py +++ b/backend/service/factory/tools.py @@ -53,12 +53,14 @@ async def aget_search_result(query: str) -> str: async_fn=aget_search_result, name="tavily-websearch", description="从 Tavily 搜索引擎中搜索给定查询的最新内容。", + return_direct=False, ) else: search_tool = FunctionTool.from_defaults( async_fn=aget_search_result, name="aliyun-websearch", description="从阿里云搜索引擎中搜索给定查询的最新内容。", + 
async def get_faq_config_service(
    session: AsyncSession = Depends(get_db_session),
) -> FAQConfigService:
    """FastAPI dependency provider.

    Builds a FAQConfigService bound to the request-scoped database session.
    """
    return FAQConfigService(session)


async def get_faq_item_service(
    session: AsyncSession = Depends(get_db_session),
) -> FAQItemService:
    """FastAPI dependency provider.

    Builds a FAQItemService bound to the request-scoped database session.
    """
    return FAQItemService(session)
await cache_manager.get_cache().get(cache_key) - if kb_data: - logger.info(f"Get knowledgebase entity from cache: {kb_id}") - kb_entity = KbEntity.model_validate(kb_data) - return kb_entity + try: + kb_data = await cache_manager.get_cache().get(cache_key) + if kb_data: + logger.info(f"Get knowledgebase entity from cache: {kb_id}") + kb_entity = KbEntity.model_validate(kb_data) + return kb_entity + except Exception as e: + logger.warning(f"Cache get operation failed for {cache_key}: {e}") result = await self.session.exec(select(KbEntity).where(KbEntity.id == kb_id, KbEntity.tenant_id == tenant_id)) kb_entity = result.first() if kb_entity: - await cache_manager.get_cache().set(cache_key, kb_entity.model_dump(mode="json")) + try: + await cache_manager.get_cache().set(cache_key, kb_entity.model_dump(mode="json")) + except Exception as e: + logger.warning(f"Cache set operation failed for {cache_key}: {e}") return kb_entity async def get_knowledgebase_by_name(self, name: str, tenant_id: str) -> Optional[KbEntity]: @@ -67,17 +74,23 @@ async def get_knowledgebase_by_name(self, name: str, tenant_id: str) -> Optional KbEntity if found, None otherwise """ cache_key = kb_name_key(tenant_id, name) - kb_data = await cache_manager.get_cache().get(cache_key) - if kb_data: - logger.info(f"Get knowledgebase entity from cache: {name}") - kb_entity = KbEntity.model_validate(kb_data) - return kb_entity + try: + kb_data = await cache_manager.get_cache().get(cache_key) + if kb_data: + logger.info(f"Get knowledgebase entity from cache: {name}") + kb_entity = KbEntity.model_validate(kb_data) + return kb_entity + except Exception as e: + logger.warning(f"Cache get operation failed for {cache_key}: {e}, falling back to database") statement = select(KbEntity).where(KbEntity.name == name, KbEntity.tenant_id == tenant_id) result = await self.session.exec(statement) kb_entity = result.first() if kb_entity: - await cache_manager.get_cache().set(cache_key, kb_entity.model_dump(mode="json")) + try: 
+ await cache_manager.get_cache().set(cache_key, kb_entity.model_dump(mode="json")) + except Exception as e: + logger.warning(f"Cache set operation failed for {cache_key}: {e}") return kb_entity async def get_knowledgebases_by_ids(self, tenant_id: str, kb_ids: List[str]) -> List[KbEntity]: @@ -111,11 +124,14 @@ async def list_knowledgebases( Returns: PagedResult containing list of KbEntity with file_count and pagination metadata """ - # Build base query condition + conditions = [KbEntity.tenant_id == tenant_id] + if exclude_default_attachments: - base_condition = and_(KbEntity.name != "default_attachments", KbEntity.tenant_id == tenant_id) - else: - base_condition = KbEntity.tenant_id == tenant_id + conditions.append(KbEntity.name != "default_attachments") + + conditions.append(~KbEntity.name.like(f"%_{FAQ_KNOWLEDGEBASE_NAME}")) + + base_condition = and_(*conditions) # Add search condition if provided if query: query_lower = query.lower() @@ -254,7 +270,10 @@ async def update_knowledgebase( ValueError: If Knowledgebase entity not found """ cache_key = kb_key(tenant_id, kb_id) - await cache_manager.get_cache().delete(cache_key) + try: + await cache_manager.get_cache().delete(cache_key) + except Exception as e: + logger.warning(f"Cache delete operation failed for {cache_key}: {e}") result = await self.session.exec(select(KbEntity).where(KbEntity.id == kb_id, KbEntity.tenant_id == tenant_id)) knowledgebase = result.first() @@ -262,7 +281,10 @@ async def update_knowledgebase( raise ValueError(f"知识库 '{kb_id}' 不存在。") cache_name_key = kb_name_key(tenant_id, knowledgebase.name) - await cache_manager.get_cache().delete(cache_name_key) + try: + await cache_manager.get_cache().delete(cache_name_key) + except Exception as e: + logger.warning(f"Cache delete operation failed for {cache_name_key}: {e}") try: @@ -329,8 +351,14 @@ async def delete_knowledgebase(self, kb_id: str, tenant_id: str) -> None: # Delete both ID-based and name-based cache entries cache_key = 
kb_key(tenant_id, kb_id) cache_name_key = kb_name_key(tenant_id, knowledgebase.name) - await cache_manager.get_cache().delete(cache_key) - await cache_manager.get_cache().delete(cache_name_key) + try: + await cache_manager.get_cache().delete(cache_key) + except Exception as e: + logger.warning(f"Cache delete operation failed for {cache_key}: {e}") + try: + await cache_manager.get_cache().delete(cache_name_key) + except Exception as e: + logger.warning(f"Cache delete operation failed for {cache_name_key}: {e}") # Delete knowledgebase entity only await self.session.delete(knowledgebase) @@ -362,8 +390,14 @@ async def write_cache_after_commit(self, kb_entity: KbEntity, tenant_id: str) -> """ cache_key = kb_key(tenant_id, kb_entity.id) cache_name_key = kb_name_key(tenant_id, kb_entity.name) - await cache_manager.get_cache().set(cache_key, kb_entity.model_dump(mode="json")) - await cache_manager.get_cache().set(cache_name_key, kb_entity.model_dump(mode="json")) + try: + await cache_manager.get_cache().set(cache_key, kb_entity.model_dump(mode="json")) + except Exception as e: + logger.warning(f"Cache set operation failed for {cache_key}: {e}") + try: + await cache_manager.get_cache().set(cache_name_key, kb_entity.model_dump(mode="json")) + except Exception as e: + logger.warning(f"Cache set operation failed for {cache_name_key}: {e}") logger.info(f"Written cache for knowledgebase {kb_entity.id} (name: {kb_entity.name}) after commit") async def delete_cache_on_rollback(self, kb_id: str, tenant_id: str, kb_name: Optional[str] = None) -> None: @@ -377,8 +411,14 @@ async def delete_cache_on_rollback(self, kb_id: str, tenant_id: str, kb_name: Op kb_name: Optional knowledgebase name (if known) """ cache_key = kb_key(tenant_id, kb_id) - await cache_manager.get_cache().delete(cache_key) + try: + await cache_manager.get_cache().delete(cache_key) + except Exception as e: + logger.warning(f"Cache delete operation failed for {cache_key}: {e}") if kb_name: cache_name_key = 
kb_name_key(tenant_id, kb_name) - await cache_manager.get_cache().delete(cache_name_key) + try: + await cache_manager.get_cache().delete(cache_name_key) + except Exception as e: + logger.warning(f"Cache delete operation failed for {cache_name_key}: {e}") logger.info(f"Deleted cache for knowledgebase {kb_id} on rollback") diff --git a/backend/service/knowledgebase/vector_table_mapping_service.py b/backend/service/knowledgebase/vector_table_mapping_service.py index 1decfe0de..0924f8ed2 100644 --- a/backend/service/knowledgebase/vector_table_mapping_service.py +++ b/backend/service/knowledgebase/vector_table_mapping_service.py @@ -39,26 +39,49 @@ async def get_vector_table_name(self, tenant_id: str, kb_id: str) -> str: The vector table name """ cache_key = vector_table_name_key(tenant_id, kb_id) - table_name = await cache_manager.get_cache().get(cache_key) - if table_name: - logger.debug(f"Found vector table name in cache for tenant {tenant_id} and kb {kb_id}: {table_name}") - return table_name + try: + table_name = await cache_manager.get_cache().get(cache_key) + if table_name: + logger.debug(f"Found vector table name in cache for tenant {tenant_id} and kb {kb_id}: {table_name}") + return table_name + except Exception as e: + logger.warning(f"Cache get operation failed for {cache_key}: {e}, falling back to database") # Try to find existing mapping mapping = await self._get_mapping(tenant_id, kb_id) if mapping: logger.debug(f"Found existing vector table mapping: {mapping.table_name}") - await cache_manager.get_cache().set(cache_key, mapping.table_name) + try: + await cache_manager.get_cache().set(cache_key, mapping.table_name) + except Exception as e: + logger.warning(f"Cache set operation failed for {cache_key}: {e}") return mapping.table_name # Generate new table name table_name = generate_vector_table_name(tenant_id, kb_id) logger.debug(f"Generated new vector table name: {table_name}") - # Store the mapping - await self._create_mapping(tenant_id, kb_id, table_name) 
- await cache_manager.get_cache().set(cache_key, table_name) + # Store the mapping (with retry logic for race conditions) + try: + mapping = await self._create_mapping(tenant_id, kb_id, table_name) + # Use the actual table_name from the mapping (in case we got an existing one) + table_name = mapping.table_name + except Exception as create_ex: + # If creation failed, try one more time to get existing mapping + # (another concurrent task might have created it) + logger.warning(f"Failed to create mapping, retrying to get existing: {create_ex}") + existing_mapping = await self._get_mapping(tenant_id, kb_id) + if existing_mapping: + logger.info(f"Found existing mapping after creation failure for tenant={tenant_id}, kb={kb_id}") + table_name = existing_mapping.table_name + else: + raise + + try: + await cache_manager.get_cache().set(cache_key, table_name) + except Exception as e: + logger.warning(f"Cache set operation failed for {cache_key}: {e}") return table_name async def _get_mapping( @@ -86,6 +109,7 @@ async def _create_mapping( ) -> VectorTableMappingEntity: """ Create a new vector table mapping. + Note: This method does not commit the transaction. The caller is responsible for committing. 
Args: tenant_id: The tenant ID @@ -95,6 +119,12 @@ async def _create_mapping( Returns: The created VectorTableMappingEntity """ + # First check if mapping already exists (race condition protection) + existing_mapping = await self._get_mapping(tenant_id, kb_id) + if existing_mapping: + logger.debug(f"Mapping already exists for tenant={tenant_id}, kb={kb_id}, returning existing") + return existing_mapping + mapping = VectorTableMappingEntity( tenant_id=tenant_id, kb_id=kb_id, @@ -102,17 +132,44 @@ async def _create_mapping( ) try: self.session.add(mapping) - await self.session.commit() - await self.session.refresh(mapping) - logger.info(f"Created vector table mapping: tenant={tenant_id}, kb={kb_id}, table={table_name}") - return mapping + try: + await self.session.flush() + await self.session.refresh(mapping) + logger.info(f"Created vector table mapping: tenant={tenant_id}, kb={kb_id}, table={table_name}") + return mapping + except Exception as flush_ex: + # Check if it's a "Session is already flushing" error + error_str = str(flush_ex).lower() + if "already flushing" in error_str or "invalidrequesterror" in error_str: + logger.warning(f"Session flush conflict detected, trying to get existing mapping for tenant={tenant_id}, kb={kb_id}") + # Remove the failed mapping from session to avoid conflicts + try: + self.session.expunge(mapping) + except Exception: + pass + # Try to get existing mapping (another concurrent task may have created it) + existing_mapping = await self._get_mapping(tenant_id, kb_id) + if existing_mapping: + logger.info(f"Found existing vector table mapping after flush conflict for tenant={tenant_id}, kb={kb_id}") + return existing_mapping + # If no existing mapping, log and re-raise + logger.error("No existing mapping found after flush conflict, re-raising error") + raise + raise except Exception as ex: logger.error(f"Failed to create vector table mapping: {traceback.format_exc()}") - await self.session.rollback() - if "UniqueViolationError" in 
str(ex.orig) or "Duplicate entry" in str(ex.orig): - pass - else: - raise ValueError(f"Failed to create vector table mapping: {ex}") from ex + # Check if it's a unique constraint violation + error_msg = str(ex) + if hasattr(ex, 'orig'): + error_msg = str(ex.orig) + + if "UniqueViolationError" in error_msg or "Duplicate entry" in error_msg or "UNIQUE constraint" in error_msg: + # If duplicate, try to get the existing mapping + existing_mapping = await self._get_mapping(tenant_id, kb_id) + if existing_mapping: + logger.info(f"Found existing vector table mapping after unique constraint violation for tenant={tenant_id}, kb={kb_id}") + return existing_mapping + raise ValueError(f"Failed to create vector table mapping: {ex}") from ex async def delete_mapping(self, tenant_id: str, kb_id: str) -> bool: """ @@ -128,7 +185,10 @@ async def delete_mapping(self, tenant_id: str, kb_id: str) -> bool: mapping = await self._get_mapping(tenant_id, kb_id) if mapping: cache_key = vector_table_name_key(tenant_id, kb_id) - await cache_manager.get_cache().delete(cache_key) + try: + await cache_manager.get_cache().delete(cache_key) + except Exception as e: + logger.warning(f"Cache delete operation failed for {cache_key}: {e}") await self.session.delete(mapping) await self.session.commit() logger.info(f"Deleted vector table mapping: tenant={tenant_id}, kb={kb_id}") @@ -147,13 +207,19 @@ async def get_table_name_if_exists(self, tenant_id: str, kb_id: str) -> Optional The table name if mapping exists, None otherwise """ cache_key = vector_table_name_key(tenant_id, kb_id) - table_name = await cache_manager.get_cache().get(cache_key) - if table_name: - logger.debug(f"Found vector table name in cache for tenant {tenant_id} and kb {kb_id}: {table_name}") - return table_name + try: + table_name = await cache_manager.get_cache().get(cache_key) + if table_name: + logger.debug(f"Found vector table name in cache for tenant {tenant_id} and kb {kb_id}: {table_name}") + return table_name + except 
Exception as e: + logger.warning(f"Cache get operation failed for {cache_key}: {e}, falling back to database") mapping = await self._get_mapping(tenant_id, kb_id) if mapping: - await cache_manager.get_cache().set(cache_key, mapping.table_name) + try: + await cache_manager.get_cache().set(cache_key, mapping.table_name) + except Exception as e: + logger.warning(f"Cache set operation failed for {cache_key}: {e}") return mapping.table_name return None diff --git a/backend/service/tool/chatapp_service.py b/backend/service/tool/chatapp_service.py index 79940a994..e9deb8590 100644 --- a/backend/service/tool/chatapp_service.py +++ b/backend/service/tool/chatapp_service.py @@ -8,7 +8,16 @@ from loguru import logger from db.models.chatbot import ChatBotCreate, ChatBotEntity +from db.models.knowledgebase.knowledgebase import KnowledgebaseCreate, RetrievalConfig, ChunkConfig, TableParserConfig, KbEntity from common.chat.response_model import PagedResult +from common.knowledgebase.constants import FAQ_KNOWLEDGEBASE_NAME, DEFAULT_FAQ_SIMILARITY_THRESHOLD +from common.knowledgebase.types import VectorIndexRetrievalType +from service.knowledgebase.knowledgebase_service import KnowledgebaseService +from service.model.embedding_service import EmbeddingService +from service.tool.faq_config_service import FAQConfigService +from db.models.faq_config import FAQConfigCreate +from db.models.faq_item import FAQItemEntity +from service.knowledgebase.rag_service import RagService class ChatappService: @@ -23,6 +32,79 @@ def __init__(self, session: AsyncSession): """ self.session = session + async def _ensure_faq_knowledgebase(self, chatbot_id: str, app_id: str, tenant_id: str) -> KbEntity: + """ + Ensure FAQ knowledgebase exists for the given chatbot_id and app_id. + Creates it if it doesn't exist. + Uses embedding_model from faq_config if available, otherwise uses default. 
+ + Args: + chatbot_id: ChatApp chatbot_id + app_id: ChatApp app_id + tenant_id: Tenant ID + + Returns: + KbEntity representing the FAQ knowledgebase + """ + kb_name = f"{app_id}_{FAQ_KNOWLEDGEBASE_NAME}" + knowledgebase_service = KnowledgebaseService(self.session) + embedding_service = EmbeddingService(self.session) + faq_config_service = FAQConfigService(self.session) + + knowledgebase = await knowledgebase_service.get_knowledgebase_by_name(kb_name, tenant_id=tenant_id) + + if not knowledgebase: + logger.info(f"Creating FAQ knowledgebase {kb_name} for app_id {app_id} and tenant {tenant_id}") + + # Get FAQ config to get embedding_model + faq_config = await faq_config_service.get_faq_config_by_chatbot_id( + chatbot_id=chatbot_id, tenant_id=tenant_id + ) + + # Use embedding_model from faq_config if available, otherwise use default + if faq_config and faq_config.embedding_model: + embedding_model = faq_config.embedding_model + logger.info(f"Using embedding_model {embedding_model} from FAQ config for knowledgebase {kb_name}") + else: + default_embedding_config = await embedding_service.get_default_embedding(tenant_id=tenant_id) + embedding_model = default_embedding_config.model_id + logger.info(f"Using default embedding_model {embedding_model} for knowledgebase {kb_name}") + + # Set default retrieval_config + default_similarity_threshold = faq_config.similarity_threshold if faq_config else DEFAULT_FAQ_SIMILARITY_THRESHOLD + + retrieval_config = RetrievalConfig( + retrieval_mode=VectorIndexRetrievalType.vector, + top_k=1, + enable_rerank=False, + rerank_top_k=None, + vector_weight=1.0, + similarity_threshold=default_similarity_threshold, + ) + + chunk_config = ChunkConfig( + table_config=TableParserConfig( + header_index_max=0, + question_column_index=0, + answer_column_index=1, + ), + parser_type="faq", + ) + + kb_create = KnowledgebaseCreate( + name=kb_name, + description="faq知识库", + embedding_model=embedding_model, + retrieval_config=retrieval_config, + 
chunk_config=chunk_config, + ) + knowledgebase = await knowledgebase_service.create_knowledgebase(kb_data=kb_create, tenant_id=tenant_id) + await self.session.flush() + await self.session.refresh(knowledgebase) + logger.info(f"Created FAQ knowledgebase {knowledgebase.id} (name: {kb_name}) for app_id {app_id}") + + return knowledgebase + async def get_chatapp(self, id: str, tenant_id: str) -> Optional[ChatBotEntity]: """ Get a single ChatApp entity by ID. @@ -104,13 +186,19 @@ async def create_chatapp(self, app_data: ChatBotCreate, tenant_id: str) -> ChatB Args: app_data: ChatApp creation data + tenant_id: Tenant ID Returns: Created ChatBotEntity (not yet committed) Raises: - ValueError: If app_id already exists (IntegrityError converted) + ValueError: If app_id already exists """ + # Check if app_id already exists + existing_chatbot = await self.get_chatapp_by_app_id(app_id=app_data.app_id, tenant_id=tenant_id) + if existing_chatbot: + raise ValueError(f"应用ID '{app_data.app_id}' 已经存在,无法创建。") + chatbot = ChatBotEntity.model_validate(app_data, update={"tenant_id": tenant_id}) self.session.add(chatbot) @@ -119,6 +207,33 @@ async def create_chatapp(self, app_data: ChatBotCreate, tenant_id: str) -> ChatB await self.session.flush() await self.session.refresh(chatbot) + # If enable_faq is True, create FAQ config + if app_data.enable_faq: + # Ensure FAQ knowledgebase exists first (to get kb_id) + knowledgebase = await self._ensure_faq_knowledgebase(chatbot.id, chatbot.app_id, tenant_id) + + # Initialize FAQ config with default values and set kb_id + faq_config_service = FAQConfigService(self.session) + faq_config = await faq_config_service.get_or_create_faq_config( + chatbot_id=chatbot.id, tenant_id=tenant_id + ) + + # Update faq_config with kb_id + if not faq_config.kb_id: + faq_config.kb_id = knowledgebase.id + await faq_config_service.update_faq_config( + chatbot_id=chatbot.id, + update_data=faq_config, + tenant_id=tenant_id + ) + + await self.session.flush() + await 
self.session.refresh(chatbot) + + logger.info( + f"Created FAQ config for ChatApp: {chatbot.id} (app_id: {chatbot.app_id})" + ) + logger.info( f"Created ChatApp entity: {chatbot.id} (app_id: {chatbot.app_id})" ) @@ -144,12 +259,13 @@ async def update_chatapp( Args: id: ChatApp entity ID update_data: Updated ChatApp data + tenant_id: Tenant ID Returns: Updated ChatBotEntity (not yet committed) Raises: - ValueError: If ChatApp entity not found + ValueError: If ChatApp entity not found or app_id already exists """ chatbot = await self.get_chatapp(id=id, tenant_id=tenant_id) if not chatbot: @@ -157,6 +273,54 @@ async def update_chatapp( logger.info(f"Updating ChatApp {id} with data: {update_data}") + # Check if app_id is being updated and if it conflicts with existing records + if update_data.app_id is not None and update_data.app_id != chatbot.app_id: + existing_chatbot = await self.get_chatapp_by_app_id(app_id=update_data.app_id, tenant_id=tenant_id) + if existing_chatbot and existing_chatbot.id != id: + raise ValueError(f"应用ID '{update_data.app_id}' 已经存在,无法更新。") + + faq_config_service = FAQConfigService(self.session) + if update_data.enable_faq: + if not chatbot.faq_config: + knowledgebase = await self._ensure_faq_knowledgebase(chatbot.id, chatbot.app_id, tenant_id) + + faq_config = await faq_config_service.get_or_create_faq_config( + chatbot_id=chatbot.id, tenant_id=tenant_id + ) + + # Update faq_config with kb_id + if not faq_config.kb_id: + faq_config.kb_id = knowledgebase.id + await faq_config_service.update_faq_config( + chatbot_id=chatbot.id, + update_data=faq_config, + tenant_id=tenant_id + ) + + logger.info( + f"Created FAQ config for ChatApp: {chatbot.id}" + ) + else: + current_config = FAQConfigCreate.model_validate(chatbot.faq_config) + if not current_config.active: + current_config.active = True + await faq_config_service.update_faq_config( + chatbot_id=chatbot.id, + update_data=current_config, + tenant_id=tenant_id + ) + logger.info(f"Updated FAQ config 
active to True for ChatApp: {chatbot.id}") + else: + current_config = FAQConfigCreate.model_validate(chatbot.faq_config) + + current_config.active = False + await faq_config_service.update_faq_config( + chatbot_id=chatbot.id, + update_data=current_config, + tenant_id=tenant_id + ) + logger.info(f"Disabled FAQ for ChatApp: {chatbot.id}") + # Update fields if update_data.app_id is not None: chatbot.app_id = update_data.app_id @@ -184,6 +348,8 @@ async def update_chatapp( chatbot.guardrail_hint = update_data.guardrail_hint if update_data.prompts is not None: chatbot.prompts = update_data.prompts + if update_data.enable_faq is not None: + chatbot.enable_faq = update_data.enable_faq chatbot.updated_at = datetime.now(timezone.utc).replace(tzinfo=None) self.session.add(chatbot) @@ -195,13 +361,15 @@ async def update_chatapp( logger.info(f"Updated ChatApp entity: {chatbot.id} (app_id: {chatbot.app_id})") return chatbot - async def delete_chatapp(self, id: str, tenant_id: str) -> None: + async def delete_chatapp(self, id: str, tenant_id: str, rag_service: Optional[RagService] = None) -> None: """ Delete a ChatApp entity. Note: Caller is responsible for committing the session. 
Args: id: ChatApp entity ID + tenant_id: Tenant ID + rag_service: Optional RagService for deleting FAQ knowledgebase Raises: ValueError: If ChatApp entity not found @@ -210,7 +378,38 @@ async def delete_chatapp(self, id: str, tenant_id: str) -> None: if not chatbot: raise ValueError(f"应用 '{id}' 不存在。") + # Delete FAQ knowledgebase if exists + if chatbot.faq_config: + try: + faq_config = FAQConfigCreate.model_validate(chatbot.faq_config) + if faq_config.kb_id and rag_service: + try: + await rag_service.delete_knowledgebase(kb_id=faq_config.kb_id, tenant_id=tenant_id) + logger.info(f"Deleted FAQ knowledgebase {faq_config.kb_id} for ChatApp: {id}") + except Exception as e: + logger.warning(f"Failed to delete FAQ knowledgebase {faq_config.kb_id}: {e}") + # Continue with chatbot deletion even if KB deletion fails + except Exception as e: + logger.warning(f"Failed to parse FAQ config for chatbot {id}: {e}") + # Continue with chatbot deletion even if FAQ config parsing fails + + try: + faq_items = await self.session.exec( + select(FAQItemEntity).where( + FAQItemEntity.chatbot_id == chatbot.app_id, + FAQItemEntity.tenant_id == tenant_id + ) + ) + faq_items_list = list(faq_items.all()) + if faq_items_list: + for faq_item in faq_items_list: + await self.session.delete(faq_item) + logger.info(f"Deleted {len(faq_items_list)} FAQ items for ChatApp: {id}") + except Exception as e: + logger.warning(f"Failed to delete FAQ items for chatbot {id}: {e}") + # Delete from database (staged, not committed) + # FAQ items should be automatically deleted via CASCADE foreign key constraint if it exists await self.session.delete(chatbot) # Flush to ensure deletion is staged diff --git a/backend/service/tool/faq_config_service.py b/backend/service/tool/faq_config_service.py new file mode 100644 index 000000000..b4667f446 --- /dev/null +++ b/backend/service/tool/faq_config_service.py @@ -0,0 +1,265 @@ +"""FAQ Config Service layer for database operations.""" + +from datetime import datetime, 
timezone +from typing import Optional +from sqlmodel import select +from sqlmodel.ext.asyncio.session import AsyncSession +from common.knowledgebase.constants import DEFAULT_EMBEDDING_MODEL, DEFAULT_FAQ_SIMILARITY_THRESHOLD, FAQ_KNOWLEDGEBASE_NAME +from common.knowledgebase.types import VectorIndexRetrievalType +from loguru import logger + +from db.models.faq_config import FAQConfigCreate +from db.models.chatbot import ChatBotEntity +from db.models.knowledgebase.knowledgebase import KnowledgebaseCreate, RetrievalConfig +from service.knowledgebase.knowledgebase_service import KnowledgebaseService + + +class FAQConfigService: + """Service layer for FAQ Config operations using dependency injection.""" + + def __init__(self, session: AsyncSession): + """ + Initialize FAQConfigService with a database session. + + Args: + session: Database session (injected dependency) + """ + self.session = session + + def _get_default_faq_config(self) -> dict: + """Get default FAQ config values.""" + return { + "active": True, + "similarity_threshold": DEFAULT_FAQ_SIMILARITY_THRESHOLD, + "embedding_model": DEFAULT_EMBEDDING_MODEL, + "enable_question_in_retrieval": True, + "enable_question_in_response": True, + "enable_answer_in_retrieval": False, + "enable_answer_in_response": True, + "return_direct": False, + "kb_id": None, + } + + async def get_faq_config_by_chatbot_id( + self, chatbot_id: str, tenant_id: str + ) -> Optional[FAQConfigCreate]: + """ + Get FAQ Config by chatbot_id. 
+ + Args: + chatbot_id: Chatbot ID + tenant_id: Tenant ID + + Returns: + FAQConfigCreate if found, None otherwise + """ + chatbot = await self.session.exec( + select(ChatBotEntity).where( + ChatBotEntity.id == chatbot_id, + ChatBotEntity.tenant_id == tenant_id, + ) + ) + chatbot = chatbot.first() + if not chatbot or not chatbot.faq_config: + return None + + # Convert dict to FAQConfigCreate + return FAQConfigCreate.model_validate(chatbot.faq_config) + + async def get_or_create_faq_config( + self, chatbot_id: str, tenant_id: str + ) -> FAQConfigCreate: + """ + Get or create a FAQ config for a chatbot. + + Args: + chatbot_id: Chatbot ID + tenant_id: Tenant ID + + Returns: + FAQConfigCreate representing the FAQ config + """ + chatbot = await self.session.exec( + select(ChatBotEntity).where( + ChatBotEntity.id == chatbot_id, + ChatBotEntity.tenant_id == tenant_id, + ) + ) + chatbot = chatbot.first() + + if not chatbot: + raise ValueError(f"Chatbot '{chatbot_id}' 不存在。") + + # If faq_config exists and is not empty, return it + if chatbot.faq_config: + logger.info( + f"Found existing FAQ config for chatbot_id: {chatbot_id}" + ) + return FAQConfigCreate.model_validate(chatbot.faq_config) + + # Create new FAQ config with default values + default_config = self._get_default_faq_config() + chatbot.faq_config = default_config + self.session.add(chatbot) + + await self.session.flush() + await self.session.refresh(chatbot) + logger.info( + f"Created FAQ config for chatbot_id: {chatbot_id}" + ) + return FAQConfigCreate.model_validate(default_config) + + async def update_faq_config( + self, chatbot_id: str, update_data: FAQConfigCreate, tenant_id: str + ) -> FAQConfigCreate: + """ + Update FAQ config for a chatbot. + Note: Caller is responsible for committing the session. 
+ + Args: + chatbot_id: Chatbot ID + update_data: Updated FAQ Config data + tenant_id: Tenant ID + + Returns: + Updated FAQConfigCreate + + Raises: + ValueError: If Chatbot not found + """ + chatbot = await self.session.exec( + select(ChatBotEntity).where( + ChatBotEntity.id == chatbot_id, + ChatBotEntity.tenant_id == tenant_id, + ) + ) + chatbot = chatbot.first() + + if not chatbot: + raise ValueError(f"Chatbot '{chatbot_id}' 不存在。") + + logger.info(f"Updating FAQ Config for chatbot {chatbot_id} with data: {update_data}") + + # Get current config or use defaults + current_config = chatbot.faq_config.copy() if chatbot.faq_config else self._get_default_faq_config() + + # Update fields from update_data + update_dict = update_data.model_dump(exclude_unset=True) + current_config.update(update_dict) + + # Update chatbot's faq_config + chatbot.faq_config = current_config + chatbot.updated_at = datetime.now(timezone.utc).replace(tzinfo=None) + self.session.add(chatbot) + + # Flush to ensure changes are staged + await self.session.flush() + await self.session.refresh(chatbot) + + logger.info(f"Updated FAQ Config for chatbot: {chatbot_id}") + return FAQConfigCreate.model_validate(chatbot.faq_config) + + async def update_faq_config_with_sync( + self, + app_id: str, + chatbot_id: str, + update_data: FAQConfigCreate, + tenant_id: str, + knowledgebase_service: Optional[KnowledgebaseService] = None + ) -> FAQConfigCreate: + """ + Update FAQ config with full synchronization logic: + - Get or create FAQ config + - Sync chatbot.enable_faq with faq_config.active + - Update FAQ config + - Update corresponding knowledgebase if embedding_model or similarity_threshold changed + + Note: Caller is responsible for committing the session. 
+ + Args: + app_id: Chatbot app_id (used for knowledgebase name) + chatbot_id: Chatbot ID + update_data: Updated FAQ Config data + tenant_id: Tenant ID + knowledgebase_service: Optional KnowledgebaseService for updating knowledgebase + + Returns: + Updated FAQConfigCreate + + Raises: + ValueError: If Chatbot not found + """ + # Get chatbot entity + chatbot = await self.session.exec( + select(ChatBotEntity).where( + ChatBotEntity.id == chatbot_id, + ChatBotEntity.tenant_id == tenant_id, + ) + ) + chatbot = chatbot.first() + + if not chatbot: + raise ValueError(f"Chatbot '{chatbot_id}' 不存在。") + + # Get or create FAQ config (this will use the same chatbot entity if it exists) + await self.get_or_create_faq_config( + chatbot_id=chatbot_id, tenant_id=tenant_id + ) + + # Refresh chatbot to get latest state + await self.session.refresh(chatbot) + + # Sync chatbot.enable_faq with faq_config.active + if update_data.active is not None: + if chatbot.enable_faq != update_data.active: + chatbot.enable_faq = update_data.active + logger.info(f"Synced chatbot.enable_faq to {update_data.active} for chatbot {chatbot_id}") + + # Update FAQ config + updated_faq_config = await self.update_faq_config( + chatbot_id=chatbot_id, + update_data=update_data, + tenant_id=tenant_id + ) + + # Update corresponding knowledgebase if embedding_model or similarity_threshold changed + if knowledgebase_service and (update_data.embedding_model is not None or update_data.similarity_threshold is not None): + kb_name = f"{app_id}_{FAQ_KNOWLEDGEBASE_NAME}" + kb = await knowledgebase_service.get_knowledgebase_by_name(kb_name, tenant_id=tenant_id) + + if kb: + # Prepare update data for knowledgebase + kb_update_data = KnowledgebaseCreate() + update_fields = [] + + # Update embedding_model if provided + if update_data.embedding_model is not None: + kb_update_data.embedding_model = update_data.embedding_model + update_fields.append(f"embedding_model={update_data.embedding_model}") + + # Update 
retrieval_config.similarity_threshold if provided + if update_data.similarity_threshold is not None: + # Get current retrieval_config or create default + current_retrieval_config = RetrievalConfig.model_validate(kb.retrieval_config) if kb.retrieval_config else RetrievalConfig( + retrieval_mode=VectorIndexRetrievalType.vector, + top_k=1, + enable_rerank=False, + rerank_top_k=None, + vector_weight=1.0, + similarity_threshold=update_data.similarity_threshold, + ) + # Update similarity_threshold + current_retrieval_config.similarity_threshold = update_data.similarity_threshold + kb_update_data.retrieval_config = current_retrieval_config + update_fields.append(f"similarity_threshold={update_data.similarity_threshold}") + + # Update knowledgebase only if there are fields to update + if kb_update_data.embedding_model is not None or kb_update_data.retrieval_config is not None: + await knowledgebase_service.update_knowledgebase( + kb_id=kb.id, + update_data=kb_update_data, + tenant_id=tenant_id + ) + logger.info(f"Updated FAQ knowledgebase {kb_name} with {', '.join(update_fields)}") + + return updated_faq_config diff --git a/backend/service/tool/faq_item_service.py b/backend/service/tool/faq_item_service.py new file mode 100644 index 000000000..2dc6b16d0 --- /dev/null +++ b/backend/service/tool/faq_item_service.py @@ -0,0 +1,359 @@ +"""FAQ Item Service layer for database operations.""" + +from datetime import datetime, timezone +from typing import Optional, List +from sqlmodel import select, func +from sqlmodel.ext.asyncio.session import AsyncSession +from loguru import logger + +from db.models.faq_item import FAQItemCreate, FAQItemEntity +from db.models.faq_config import FAQConfigCreate +from db.models.chatbot import ChatBotEntity +from common.chat.response_model import PagedResult +from service.knowledgebase.knowledgebase_service import KnowledgebaseService +from service.knowledgebase.rag_service import RagService +from pairag.file.utils.tokenization import 
estimate_tokens_in_text +from llama_index.core.schema import TextNode + + +class FAQItemService: + """Service layer for FAQ Item entity CRUD operations using dependency injection.""" + + def __init__(self, session: AsyncSession): + """ + Initialize FAQItemService with a database session. + + Args: + session: Database session (injected dependency) + """ + self.session = session + + async def get_faq_knowledgebase(self, chatbot_id: str, tenant_id: str): + """ + Get FAQ knowledgebase for the given chatbot. + + Args: + chatbot_id: Chatbot ID + tenant_id: Tenant ID + + Returns: + Knowledgebase entity if found, None otherwise + """ + # Get chatbot to get app_id + chatbot = await self.session.exec( + select(ChatBotEntity).where( + ChatBotEntity.app_id == chatbot_id, ChatBotEntity.tenant_id == tenant_id + ) + ) + chatbot = chatbot.first() + if not chatbot: + return None + + # Convert dict to FAQConfigCreate object + if not chatbot.faq_config: + return None + + try: + faq_config = FAQConfigCreate.model_validate(chatbot.faq_config) + except Exception as e: + logger.warning(f"Failed to validate FAQ config for chatbot {chatbot_id}: {e}") + return None + + if not faq_config.kb_id: + return None + + knowledgebase_service = KnowledgebaseService(self.session) + return await knowledgebase_service.get_knowledgebase(faq_config.kb_id, tenant_id=tenant_id) + + async def save_faq_to_knowledgebase( + self, faq_item: FAQItemEntity, tenant_id: str, rag_service: RagService + ) -> None: + """ + Save FAQ item to knowledgebase. 
+ + Args: + faq_item: FAQ Item entity + tenant_id: Tenant ID + """ + try: + if not faq_item.question or not faq_item.answer: + logger.warning( + f"FAQ item {faq_item.id} has no question or answer, skipping save to KB" + ) + return + + # Get FAQ knowledgebase + kb = await self.get_faq_knowledgebase(faq_item.chatbot_id, tenant_id) + if not kb: + logger.warning( + f"FAQ knowledgebase not found for chatbot {faq_item.chatbot_id}, skipping save to KB" + ) + return + + # Get FAQ config from chatbot to determine what to include in chunk_text + chatbot = await self.session.exec( + select(ChatBotEntity).where( + ChatBotEntity.app_id == faq_item.chatbot_id, + ChatBotEntity.tenant_id == tenant_id, + ) + ) + chatbot = chatbot.first() + + faq_config = None + if chatbot and chatbot.faq_config: + faq_config = FAQConfigCreate.model_validate(chatbot.faq_config) + + # Build chunk_text based on faq_config settings + chunk_parts = [] + if faq_config: + if faq_config.enable_question_in_retrieval: + chunk_parts.append(f"{faq_item.question}") + if faq_config.enable_answer_in_retrieval: + chunk_parts.append(f"{faq_item.answer}") + else: + chunk_parts.append(f"{faq_item.question}") + + chunk_text = "\n".join(chunk_parts) if chunk_parts else "" + + # Create metadata for TextNode + node_metadata = { + "faq_item_id": faq_item.id, + "chatbot_id": faq_item.chatbot_id, + "question": faq_item.question, + "answer": faq_item.answer, + "token_count": estimate_tokens_in_text(chunk_text), + } + + # Create TextNode directly (no KbChunkEntity needed for FAQ items) + kb_node = TextNode( + id_=faq_item.id, + text=chunk_text, + metadata=node_metadata, + ) + + + if faq_item.active: + await rag_service.ainsert(kb_id=kb.id, nodes=[kb_node], tenant_id=tenant_id) + logger.info( + f"Inserted FAQ item {faq_item.id} into knowledgebase {kb.id}" + ) + else: + logger.info( + f"FAQ item {faq_item.id} is inactive, skipping vector store insertion" + ) + + except Exception as e: + logger.error(f"Failed to save FAQ item to 
knowledgebase: {e}") + + async def delete_faq_from_knowledgebase( + self, faq_item: FAQItemEntity, tenant_id: str, rag_service: RagService + ) -> None: + """ + Delete FAQ item from knowledgebase. + + Args: + faq_item: FAQ Item entity + tenant_id: Tenant ID + """ + try: + # Get FAQ knowledgebase + kb = await self.get_faq_knowledgebase(faq_item.chatbot_id, tenant_id) + if not kb: + logger.warning( + f"FAQ knowledgebase not found for chatbot {faq_item.chatbot_id}, skipping delete from KB" + ) + return + + # Delete from vector store using faq_item.id as node_id + await rag_service.adelete(kb_id=kb.id, node_ids=[faq_item.id], tenant_id=tenant_id) + logger.info( + f"Deleted FAQ item {faq_item.id} from knowledgebase {kb.id}" + ) + + except Exception as e: + logger.error(f"Failed to delete FAQ item from knowledgebase: {e}") + # Don't raise exception, just log the error + + async def get_faq_item(self, id: str, tenant_id: str) -> Optional[FAQItemEntity]: + """ + Get a single FAQ Item entity by ID. + + Args: + id: FAQ Item entity ID + tenant_id: Tenant ID + + Returns: + FAQItemEntity if found, None otherwise + """ + faq_items = await self.session.exec( + select(FAQItemEntity).where( + FAQItemEntity.id == id, FAQItemEntity.tenant_id == tenant_id + ) + ) + return faq_items.first() + + async def list_faq_items( + self, + chatbot_id: str, + tenant_id: str = None, + page: int = 1, + size: int = 100, + ) -> PagedResult[List[FAQItemEntity]]: + """ + List FAQ Item entities with pagination. 
+
+        Args:
+            chatbot_id: Chatbot ID
+            tenant_id: Tenant ID
+            page: Page number (1-indexed)
+            size: Page size
+
+        Returns:
+            PagedResult containing list of FAQItemEntity and pagination metadata
+        """
+        # Build base query
+        base_query = select(FAQItemEntity).where(
+            FAQItemEntity.chatbot_id == chatbot_id,
+            FAQItemEntity.tenant_id == tenant_id,
+        )
+
+        # Get total count
+        count_query = select(func.count()).select_from(base_query.subquery())
+        total_result = await self.session.exec(count_query)
+        total = total_result.one_or_none() or 0
+
+        # Get paginated results
+        offset = (page - 1) * size
+        paginated_query = (
+            base_query.offset(offset).limit(size).order_by(FAQItemEntity.created_at.desc())
+        )
+        results = await self.session.exec(paginated_query)
+        faq_items = list(results.all())
+
+        # Calculate pages
+        pages = (total + size - 1) // size if total > 0 else 0
+
+        return PagedResult(
+            items=faq_items,
+            total=total,
+            pages=pages,
+            page=page,
+            size=size,
+        )
+
+    async def create_faq_item(
+        self,
+        chatbot_id: str,
+        faq_item_data: FAQItemCreate,
+        tenant_id: str,
+    ) -> FAQItemEntity:
+        """
+        Create a new FAQ Item entity.
+        Note: Caller is responsible for committing the session.
+ + Args: + chatbot_id: Chatbot ID + faq_item_data: FAQ Item creation data + tenant_id: Tenant ID + + Returns: + Created FAQItemEntity (not yet committed) + """ + faq_item = FAQItemEntity.model_validate( + faq_item_data, + update={"chatbot_id": chatbot_id, "tenant_id": tenant_id}, + ) + self.session.add(faq_item) + + try: + # Flush to get the ID, but don't commit + await self.session.flush() + await self.session.refresh(faq_item) + + logger.info( + f"Created FAQ Item entity: {faq_item.id} (chatbot_id: {chatbot_id})" + ) + + + return faq_item + except Exception as e: + logger.error(f"Error creating FAQ Item: {e}") + raise ValueError(f"创建FAQ条目失败: {e}") from e + + async def update_faq_item( + self, id: str, update_data: FAQItemCreate, tenant_id: str, rag_service: Optional[RagService] = None + ) -> FAQItemEntity: + """ + Update an existing FAQ Item entity. + Note: Caller is responsible for committing the session. + + Args: + id: FAQ Item entity ID + update_data: Updated FAQ Item data + tenant_id: Tenant ID + + Returns: + Updated FAQItemEntity (not yet committed) + + Raises: + ValueError: If FAQ Item entity not found + """ + faq_item = await self.get_faq_item(id=id, tenant_id=tenant_id) + if not faq_item: + raise ValueError(f"FAQ条目 '{id}' 不存在。") + + logger.info(f"Updating FAQ Item {id} with data: {update_data}") + + # Update fields + if update_data.question is not None: + faq_item.question = update_data.question + if update_data.answer is not None: + faq_item.answer = update_data.answer + if update_data.chatbot_id is not None: + faq_item.chatbot_id = update_data.chatbot_id + if update_data.file_id is not None: + faq_item.file_id = update_data.file_id + if update_data.active is not None: + faq_item.active = update_data.active + + faq_item.updated_at = datetime.now(timezone.utc).replace(tzinfo=None) + self.session.add(faq_item) + + # Flush to ensure changes are staged + await self.session.flush() + await self.session.refresh(faq_item) + + logger.info(f"Updated FAQ Item 
entity: {faq_item.id}") + + # Update FAQ in knowledgebase (delete old, insert new if active) + await self.delete_faq_from_knowledgebase(faq_item, tenant_id, rag_service) + await self.save_faq_to_knowledgebase(faq_item, tenant_id, rag_service) + + return faq_item + + async def delete_faq_item(self, id: str, tenant_id: str, rag_service: Optional[RagService] = None) -> None: + """ + Delete a FAQ Item entity. + Note: Caller is responsible for committing the session. + + Args: + id: FAQ Item entity ID + tenant_id: Tenant ID + + Raises: + ValueError: If FAQ Item entity not found + """ + faq_item = await self.get_faq_item(id=id, tenant_id=tenant_id) + if not faq_item: + raise ValueError(f"FAQ条目 '{id}' 不存在。") + + # Delete from knowledgebase first + await self.delete_faq_from_knowledgebase(faq_item, tenant_id, rag_service) + + # Delete from database (staged, not committed) + await self.session.delete(faq_item) + + # Flush to ensure deletion is staged + await self.session.flush() + + logger.info(f"Deleted FAQ Item entity: {id}") diff --git a/backend/tools/attachments/file_reader.py b/backend/tools/attachments/file_reader.py index 5abe0964a..34166c611 100644 --- a/backend/tools/attachments/file_reader.py +++ b/backend/tools/attachments/file_reader.py @@ -40,5 +40,6 @@ async def aread_file_content( async_fn=aread_file_content, name="read-file", description="根据提供的附件ID读取文件的内容。\n参数:\n- file_id (str, 必需): 要读取的文件的ID。", + return_direct=False, ) return read_file_tool diff --git a/backend/tools/attachments/file_searcher.py b/backend/tools/attachments/file_searcher.py index 65f04dae8..f8f9441ae 100644 --- a/backend/tools/attachments/file_searcher.py +++ b/backend/tools/attachments/file_searcher.py @@ -67,5 +67,6 @@ async def file_retrieve_handler( - doc_ids (List[str]): The IDs of the documents to search. - kwargs (dict, optional): Additional arguments for the tool. 
""", + return_direct=False, ) return search_tool diff --git a/backend/tools/attachments/image_parser.py b/backend/tools/attachments/image_parser.py index 3d419f3dc..d1e6ee485 100644 --- a/backend/tools/attachments/image_parser.py +++ b/backend/tools/attachments/image_parser.py @@ -101,7 +101,8 @@ async def aget_image_analysis_func( name="image-parser", description="""解析上传的图片内容。适用于用户提问涉及图片中的信息(如图表、文字、产品图等)。 参数: -- question: 可选,用户想问的具体问题,例如“图中智能床的价格是多少?”、“请提取表格数据”等。 +- question: 可选,用户想问的具体问题,例如"图中智能床的价格是多少?"、"请提取表格数据"等。 返回:包含图片分析结果的 JSON 对象。""", + return_direct=False, ) return image_parser_tool diff --git a/backend/tools/code/code_sandbox_tool.py b/backend/tools/code/code_sandbox_tool.py index 834bc53a9..662625b2c 100644 --- a/backend/tools/code/code_sandbox_tool.py +++ b/backend/tools/code/code_sandbox_tool.py @@ -678,6 +678,7 @@ async def _wrapped_list_files(file_dir_path: str, sandbox_id: str = None): async_fn=_wrapped_list_files, name="list-sandbox-files", description=description, + return_direct=False, ) async def aupload_files_to_code_sandbox(self, file_ids: List[str], sandbox_id: str = None): diff --git a/backend/tools/knowledgebase/faq_tool.py b/backend/tools/knowledgebase/faq_tool.py new file mode 100644 index 000000000..2bf6379fa --- /dev/null +++ b/backend/tools/knowledgebase/faq_tool.py @@ -0,0 +1,145 @@ +from service.knowledgebase.rag_service import RagService +from service.tool.chatapp_service import ChatappService +from service.tool.faq_config_service import FAQConfigService +from db.models.faq_config import FAQConfigCreate +from typing import Annotated, Optional +from functools import partial +from llama_index.core.tools import FunctionTool +import json +from loguru import logger + + +async def aget_faq_result( + query: str, + chatapp_id: str, + user_id: str | None = None, + rag_service: RagService | None = None, + chatapp_service: ChatappService | None = None, + faq_config_service: FAQConfigService | None = None, + tenant_id: str = None, +) -> str: + 
"""Get FAQ search result from FAQ knowledgebase""" + logger.info(f"Searching FAQ with chatapp_id {chatapp_id} and user {user_id}.") + + chatbot = await chatapp_service.get_chatapp_by_app_id( + app_id=chatapp_id, + tenant_id=tenant_id + ) + if not chatbot: + raise ValueError(f"应用 '{chatapp_id}' 不存在。") + + # Convert dict to FAQConfigCreate object + kb_id = None + if chatbot.faq_config: + try: + faq_config = FAQConfigCreate.model_validate(chatbot.faq_config) + kb_id = faq_config.kb_id + except Exception as e: + logger.warning(f"Failed to validate FAQ config for chatbot {chatapp_id}: {e}") + + kb = await rag_service.get_knowledgebase(kb_id=kb_id, tenant_id=tenant_id) + + if not kb: + raise ValueError(f"FAQ知识库 '{kb_id}' 不存在。") + + + records = await rag_service.aquery( + query=query, + user_id=user_id, + kb_id=kb.id, + tenant_id=tenant_id, + ) + + logger.info( + f"Retrieved {len(records)} FAQ results for query '{query}' from knowledgebase {kb.id}." + ) + + faq_config = None + try: + faq_config = await faq_config_service.get_faq_config_by_chatbot_id( + chatbot_id=chatbot.id, tenant_id=tenant_id + ) + except Exception as e: + logger.warning(f"Failed to get FAQ config: {e}, using defaults") + + question_in_response = faq_config.enable_question_in_response if faq_config else True + answer_in_response = faq_config.enable_answer_in_response if faq_config else True + + records_dict = [] + for record in records: + record_dict = record.model_dump() + metadata = record_dict.get('metadata', {}) or {} + + question = metadata.get('question', '') or '' + answer = metadata.get('answer', '') or '' + + content_parts = [] + if not faq_config.return_direct: + if question_in_response and question: + content_parts.append(f"问题:{question}") + if answer_in_response and answer: + content_parts.append(f"答案:{answer}") + + if content_parts: + record_dict['content'] = '\n'.join(content_parts) + else: + record_dict['content'] = answer + + records_dict.append(record_dict) + + return 
json.dumps({"result": records_dict}, ensure_ascii=False) + + +async def aget_faq_tool( + chatapp_id: str, + tenant_id: str, + user_id: Optional[str] = None, + rag_service: RagService = None, + chatapp_service: ChatappService = None, + faq_config_service: FAQConfigService = None, +): + """Create a FAQ search tool for the given chatapp_id.""" + # Get faq_config to determine return_direct value + return_direct = False + try: + chatbot = await chatapp_service.get_chatapp_by_app_id( + app_id=chatapp_id, + tenant_id=tenant_id + ) + if chatbot: + faq_config = await faq_config_service.get_faq_config_by_chatbot_id( + chatbot_id=chatbot.id, tenant_id=tenant_id + ) + if faq_config: + return_direct = faq_config.return_direct if faq_config.return_direct is not None else False + except Exception as e: + logger.warning(f"Failed to get FAQ config for return_direct: {e}, using default False") + + aquery_faq_func = partial( + aget_faq_result, + chatapp_id=chatapp_id, + user_id=user_id, + rag_service=rag_service, + chatapp_service=chatapp_service, + faq_config_service=faq_config_service, + tenant_id=tenant_id, + ) + + + async def query_faq_handler( + query: Annotated[ + str, + "根据上下文添加必要的背景信息,改写一个新的独立问题,使问题更完整,注意指代消解、完善主语等", + ] = "", + ): + return await aquery_faq_func( + query=query, + ) + + search_faq_tool = FunctionTool.from_defaults( + async_fn=query_faq_handler, + name=f"search-faq-{chatapp_id}", + description="根据上下文从FAQ知识库中搜索和用户查询相关的内容。", + return_direct=return_direct, + ) + return search_faq_tool diff --git a/backend/tools/knowledgebase/knowledgebase_tool.py b/backend/tools/knowledgebase/knowledgebase_tool.py index 22fb7fdb6..1e8c8bcc2 100644 --- a/backend/tools/knowledgebase/knowledgebase_tool.py +++ b/backend/tools/knowledgebase/knowledgebase_tool.py @@ -55,5 +55,6 @@ async def query_knowledgebase_handler( async_fn=query_knowledgebase_handler, name=f"search-knowledgebase-{kb_id}", description=f"根据上下文从知识库中搜索和用户查询相关的内容。\n知识库名称: {knowledgebase.name}\n知识库描述: 
{knowledgebase.description}\n", + return_direct=False, ) return search_knowledgebase_tool diff --git a/backend/tools/plan/plan_tool.py b/backend/tools/plan/plan_tool.py index 01d75172d..17371355d 100644 --- a/backend/tools/plan/plan_tool.py +++ b/backend/tools/plan/plan_tool.py @@ -32,6 +32,7 @@ async def plan_func( async_fn=plan_func, name="planning-tool", description=PLAN_TOOL_DESCRIPTION, + return_direct=False, ) return plan_tool @@ -53,6 +54,7 @@ async def response_func(): async_fn=response_func, name="respond-tool", description=RESPONSE_TOOL_DESCRIPTION, + return_direct=False, ) return response_tool diff --git a/backend/tools/search/visit_webpage.py b/backend/tools/search/visit_webpage.py index b789b82b7..7cf829c90 100644 --- a/backend/tools/search/visit_webpage.py +++ b/backend/tools/search/visit_webpage.py @@ -179,6 +179,7 @@ async def visit_webpage_handler( ] } """, + return_direct=False, ) return visit_tool diff --git a/backend/tools/think/simple_think_tool.py b/backend/tools/think/simple_think_tool.py index 864968f49..1c7fc83ac 100644 --- a/backend/tools/think/simple_think_tool.py +++ b/backend/tools/think/simple_think_tool.py @@ -48,6 +48,7 @@ async def simple_think_handler(thought: str): async_fn=simple_think_handler, name="think", description="记录思考内容。用于复杂推理或缓存记忆。", + return_direct=False, ) openai_tools = [] tools_name_to_fn = {} diff --git a/backend/tools/think/think_and_planning_tool.py b/backend/tools/think/think_and_planning_tool.py index 151c4651c..3c3dbc615 100644 --- a/backend/tools/think/think_and_planning_tool.py +++ b/backend/tools/think/think_and_planning_tool.py @@ -75,6 +75,7 @@ async def simple_think_handler( async_fn=simple_think_handler, name="think-and-planning", description="这是用于系统化思考与规划的工具,支持用户在面对复杂问题或任务时,分阶段梳理思考、规划和行动步骤。工具强调思考(thought)、计划(plan)与实际行动(action)的结合,通过编号(thoughtNumber)追踪过程。该工具不会获取新信息或更改数据库,只会将想法附加到记忆中。当需要复杂推理或某种缓存记忆时,可以使用它。", + return_direct=False, ) return think_tool diff --git a/backend/utils/upload_file_utils.py 
b/backend/utils/upload_file_utils.py index d86f2e7b2..e71070393 100644 --- a/backend/utils/upload_file_utils.py +++ b/backend/utils/upload_file_utils.py @@ -1,4 +1,4 @@ -from typing import List +from typing import List, Optional from fastapi import UploadFile from pairag.file.models.file_item import FileItem from pairag.file.store.file_store_helper import file_store @@ -50,6 +50,7 @@ class ParseFileTask(BaseModel): class StartParseTaskRequest(BaseModel): files: List[ParseFileTask] + chunk_config: Optional[dict] = None async def upload_file_names_async( diff --git a/frontend/app/api/config/apps/[app_id]/faq-config/route.ts b/frontend/app/api/config/apps/[app_id]/faq-config/route.ts new file mode 100644 index 000000000..2139ae416 --- /dev/null +++ b/frontend/app/api/config/apps/[app_id]/faq-config/route.ts @@ -0,0 +1,12 @@ +// app/api/proxy/route.js +import { NextRequest } from 'next/server'; +import { proxyRequest } from '@/app/api/proxy'; + +export async function GET(request: NextRequest) { + return proxyRequest(request); +} + +export async function PUT(request: NextRequest) { + return proxyRequest(request); +} + diff --git a/frontend/app/api/config/apps/[app_id]/faq-files/route.ts b/frontend/app/api/config/apps/[app_id]/faq-files/route.ts new file mode 100644 index 000000000..077e4acd9 --- /dev/null +++ b/frontend/app/api/config/apps/[app_id]/faq-files/route.ts @@ -0,0 +1,8 @@ +// app/api/proxy/route.js +import { NextRequest } from 'next/server'; +import { proxyRequest } from '@/app/api/proxy'; + +export async function POST(request: NextRequest) { + return proxyRequest(request); +} + diff --git a/frontend/app/api/config/apps/[app_id]/faqs/[faq_id]/route.ts b/frontend/app/api/config/apps/[app_id]/faqs/[faq_id]/route.ts new file mode 100644 index 000000000..7f08ff7a0 --- /dev/null +++ b/frontend/app/api/config/apps/[app_id]/faqs/[faq_id]/route.ts @@ -0,0 +1,16 @@ +// app/api/proxy/route.js +import { NextRequest } from 'next/server'; +import { proxyRequest } from 
'@/app/api/proxy'; + +export async function GET(request: NextRequest) { + return proxyRequest(request); +} + +export async function PUT(request: NextRequest) { + return proxyRequest(request); +} + +export async function DELETE(request: NextRequest) { + return proxyRequest(request); +} + diff --git a/frontend/app/api/config/apps/[app_id]/faqs/route.ts b/frontend/app/api/config/apps/[app_id]/faqs/route.ts new file mode 100644 index 000000000..602a9149e --- /dev/null +++ b/frontend/app/api/config/apps/[app_id]/faqs/route.ts @@ -0,0 +1,20 @@ +// app/api/proxy/route.js +import { NextRequest } from 'next/server'; +import { proxyRequest } from '@/app/api/proxy'; + +export async function GET(request: NextRequest) { + return proxyRequest(request); +} + +export async function POST(request: NextRequest) { + return proxyRequest(request); +} + +export async function PUT(request: NextRequest) { + return proxyRequest(request); +} + +export async function DELETE(request: NextRequest) { + return proxyRequest(request); +} + diff --git a/frontend/app/api/config/knowledgebases/[kb_id]/files/[file_id]/chunk_config/route.ts b/frontend/app/api/config/knowledgebases/[kb_id]/files/[file_id]/chunk_config/route.ts new file mode 100644 index 000000000..602a9149e --- /dev/null +++ b/frontend/app/api/config/knowledgebases/[kb_id]/files/[file_id]/chunk_config/route.ts @@ -0,0 +1,20 @@ +// app/api/proxy/route.js +import { NextRequest } from 'next/server'; +import { proxyRequest } from '@/app/api/proxy'; + +export async function GET(request: NextRequest) { + return proxyRequest(request); +} + +export async function POST(request: NextRequest) { + return proxyRequest(request); +} + +export async function PUT(request: NextRequest) { + return proxyRequest(request); +} + +export async function DELETE(request: NextRequest) { + return proxyRequest(request); +} + diff --git a/frontend/app/api/proxy.ts b/frontend/app/api/proxy.ts index 5203e6c08..968d2072b 100644 --- a/frontend/app/api/proxy.ts +++ 
b/frontend/app/api/proxy.ts @@ -68,23 +68,73 @@ export async function proxyRequest(request: NextRequest) { } // 创建 AbortController 用于超时控制 - const timeoutMs = parseInt(process.env.PROXY_TIMEOUT_MS || '60000', 10); // 默认 60 秒 + // 对于可能返回流式响应或需要LLM调用的请求,使用更长的超时时间 + const defaultTimeoutMs = parseInt(process.env.PROXY_TIMEOUT_MS || '60000', 10); // 默认 60 秒 + const streamingTimeoutMs = parseInt(process.env.PROXY_STREAMING_TIMEOUT_MS || '300000', 10); // 流式响应默认 5 分钟 + + // 判断是否是可能返回流式响应或需要LLM调用的请求路径 + // 包括: + // - /threads/* 下的所有路径(可能涉及LLM调用,如生成标题、消息等) + // - /chat/completions 和 /chat(流式响应) + const isPotentialStreamingPath = pathname.includes('/threads/') || + pathname.includes('/chat/completions') || + pathname.includes('/chat'); + + // 对于可能返回流式响应或需要LLM调用的请求,使用更长的超时时间 + const initialTimeoutMs = isPotentialStreamingPath ? streamingTimeoutMs : defaultTimeoutMs; + const controller = new AbortController(); let timeoutId: NodeJS.Timeout | null = null; try { - timeoutId = setTimeout(() => controller.abort(), timeoutMs); + // 根据请求路径设置初始超时时间 + timeoutId = setTimeout(() => controller.abort(), initialTimeoutMs); const res = await fetch(upstreamUrl.toString(), { method, headers, body, signal: controller.signal, + // 添加 keepalive 选项,保持连接活跃 + keepalive: true, }); + // 检查是否是流式响应 + const contentType = res.headers.get('content-type') || ''; + const isStreaming = contentType.includes('text/event-stream') || + contentType.includes('stream') || + res.headers.get('transfer-encoding') === 'chunked'; + + if (isStreaming && res.body) { + // 流式响应:清除当前超时,使用更长的超时时间 + if (timeoutId) clearTimeout(timeoutId); + + // 对于流式响应,创建一个新的超时控制器,使用更长的超时时间 + // 注意:这里我们不能直接修改signal,但可以在流式传输过程中监控 + // 实际上,对于流式响应,我们应该让客户端控制超时,而不是在代理层强制超时 + // 流式响应:直接传递流,不设置超时限制(由客户端或Next.js处理) + return new NextResponse(res.body, { + status: res.status, + statusText: res.statusText, + headers: res.headers, + }); + } + + // 非流式响应:清除超时(响应已完全接收) if (timeoutId) clearTimeout(timeoutId); - // 读取响应数据 + // 检查响应是否正常 + if (!res.ok && 
!res.body) { + return NextResponse.json( + { + error: 'Proxy request failed', + message: `Backend returned status ${res.status} without body`, + }, + { status: res.status } + ); + } + + // 非流式响应:读取完整数据 const responseData = await res.blob(); // 通用处理(支持 JSON、text、binary) const responseHeaders = new Headers(res.headers); responseHeaders.set('content-length', responseData.size.toString()); @@ -99,25 +149,57 @@ export async function proxyRequest(request: NextRequest) { }); } catch (error: any) { if (timeoutId) clearTimeout(timeoutId); - console.log("Proxy request failed: ", error); - // 处理超时错误 - if (error.name === 'AbortError' || error.code === 'UND_ERR_HEADERS_TIMEOUT') { + // 记录错误详情用于调试 + console.error("Proxy request failed: ", { + name: error.name, + message: error.message, + code: error.code, + cause: error.cause, + stack: error.stack + }); + + // 处理连接关闭错误 + if (error.cause?.code === 'UND_ERR_SOCKET' || + error.message?.includes('other side closed') || + error.message?.includes('fetch failed') || + error.message?.includes('ECONNREFUSED') || + error.message?.includes('ENOTFOUND')) { + return NextResponse.json( + { + error: 'Proxy connection closed', + message: 'Backend connection was closed unexpectedly. This may happen if the request takes too long or the backend service restarted.', + details: error.cause?.message || error.message, + code: error.cause?.code || 'CONNECTION_CLOSED' + }, + { status: 502 } // Bad Gateway - 后端服务问题 + ); + } + + // 处理超时错误(包括AbortError) + if (error.name === 'AbortError' || + error.code === 'UND_ERR_HEADERS_TIMEOUT' || + error.code === 20 || // DOMException.ABORT_ERR + error.message?.includes('aborted') || + error.message?.includes('This operation was aborted')) { return NextResponse.json( { error: 'Proxy request timeout', - message: `Request exceeded timeout of ${timeoutMs}ms`, - details: error.message + message: `Request exceeded timeout of ${initialTimeoutMs}ms. ${isPotentialStreamingPath ? 
'This is a streaming endpoint, which may take longer to respond.' : 'Please try again or contact support if the issue persists.'}`, + details: error.message, + code: 'TIMEOUT' }, { status: 504 } ); } + // 处理其他错误 return NextResponse.json( { error: 'Proxy request failed', message: error.message || String(error), - details: error.cause?.message || error.stack + details: error.cause?.message || error.stack, + code: error.code || 'UNKNOWN_ERROR' }, { status: 500 } ); diff --git a/frontend/app/apps/[appId]/page.tsx b/frontend/app/apps/[appId]/page.tsx index c8b8ce71e..856432290 100644 --- a/frontend/app/apps/[appId]/page.tsx +++ b/frontend/app/apps/[appId]/page.tsx @@ -1,14 +1,107 @@ 'use client'; -import { use } from "react"; +import { use, useState, useEffect } from "react"; import { ChatbotConfigCard } from "../chatbot_config"; - +import { FAQManagement } from "../faq_management"; +import { Tabs, TabsContent, TabsList, TabsTrigger } from "@/components/ui/tabs"; +import { Button } from "@/components/ui/button"; +import { Badge } from "@/components/ui/badge"; +import { + Breadcrumb, + BreadcrumbItem, + BreadcrumbLink, + BreadcrumbList, + BreadcrumbPage, + BreadcrumbSeparator, +} from '@/components/ui/breadcrumb'; +import { useRouter } from "next/navigation"; +import { useTenantFetch } from "@/hooks/use-tenant-fetch"; +import { Chatbot } from "../chatbot_config"; +import { toast } from "sonner"; export default function ViewChatApp( { params } : { params: Promise<{ appId: string }> } ) { const { appId } = use(params); + const router = useRouter(); + const { tenantFetch } = useTenantFetch(); + const [botConfig, setBotConfig] = useState(null); + const [loading, setLoading] = useState(true); + + useEffect(() => { + fetchAppConfig(); + }, [appId]); + + const fetchAppConfig = async () => { + try { + setLoading(true); + const res = await tenantFetch(`/api/config/apps?app_id=${appId}`); + if (res.ok) { + const data = await res.json(); + setBotConfig(data.data); + } + } catch 
(error: any) { + console.error('获取应用配置失败:', error); + toast.error('获取应用配置失败'); + } finally { + setLoading(false); + } + }; + + if (loading) { + return
加载中...
; + } + return ( - - - ) +
+
+ + + + + + + + + + {botConfig?.app_id || '应用编辑'} + + + +
+ + ID: {botConfig?.id || ''} + + {botConfig?.description && ( + + {botConfig.description} + + )} +
+
+
+ + + + 应用设置 + + + FAQ管理 + + + + + + + {botConfig && } + + +
+
+ ); } \ No newline at end of file diff --git a/frontend/app/apps/chatbot_config.tsx b/frontend/app/apps/chatbot_config.tsx index 8161455cf..f8aff17cf 100644 --- a/frontend/app/apps/chatbot_config.tsx +++ b/frontend/app/apps/chatbot_config.tsx @@ -53,8 +53,17 @@ interface PromptConfig { act: string; act_with_plan: string; summary: string; -}; +} +interface FAQConfig { + active?: boolean; + similarity_threshold?: number; + embedding_model?: string; + enable_question_in_retrieval?: boolean; + enable_question_in_response?: boolean; + enable_answer_in_retrieval?: boolean; + enable_answer_in_response?: boolean; +} export interface Chatbot { id: string; @@ -63,6 +72,8 @@ export interface Chatbot { enable_search: boolean; enable_agent: boolean; enable_chatdb: boolean; + enable_faq?: boolean; + faq_config?: FAQConfig | null; mcp_ids: string[]; kb_ids: string[]; model_id: string; @@ -90,6 +101,8 @@ const default_chat_config = { updated_at: "", enable_agent: false, enable_chatdb: false, + enable_faq: false, + faq_config: null, enable_input_guardrail: false, enable_output_guardrail: false, guardrail_hint: "作为人工智能助手,我无法回应包含不当或敏感信息的内容。", @@ -502,6 +515,21 @@ export const ChatbotConfigCard: FC = ({ }} /> +
+ + { + setBotConfig({ + ...botConfig, + enable_faq: checked, + }); + }} + /> +