Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
5 changes: 5 additions & 0 deletions PROMPT.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
重构backend文件夹中的内容,将rag_system修改为一个通用的rag系统,输入改为任意的md文件,保持各文件名不变;
不再需要使用大模型接口,不再需要ai_generator.py文件、session_manager.py文件;
rag_system对外提供两个接口:
1. 初始化接口,输入为文件夹路径,输出为初始化完成的rag系统;
2. 查询接口,输入为查询语句,输出为查询结果;
172 changes: 0 additions & 172 deletions backend/ai_generator.py

This file was deleted.

107 changes: 45 additions & 62 deletions backend/app.py
Original file line number Diff line number Diff line change
@@ -1,20 +1,21 @@
import os
import warnings
from pathlib import Path
from typing import List, Optional

warnings.filterwarnings("ignore", message="resource_tracker: There appear to be.*")

import os
from typing import List, Optional

from config import config
from fastapi import FastAPI, HTTPException
from fastapi.middleware.cors import CORSMiddleware
from fastapi.middleware.trustedhost import TrustedHostMiddleware
from fastapi.responses import FileResponse
from fastapi.staticfiles import StaticFiles
from pydantic import BaseModel
from rag_system import RAGSystem

# Initialize FastAPI app
app = FastAPI(title="Course Materials RAG System", root_path="")
app = FastAPI(title="Markdown RAG System", root_path="")

# Add trusted host middleware for proxy
app.add_middleware(TrustedHostMiddleware, allowed_hosts=["*"])
Expand All @@ -29,38 +30,27 @@
expose_headers=["*"],
)

# Initialize RAG system
rag_system = RAGSystem(config)


# Pydantic models for request/response
class QueryRequest(BaseModel):
"""Request model for course queries"""
"""Request model for queries"""

query: str
session_id: Optional[str] = None
limit: Optional[int] = 5


class QueryResponse(BaseModel):
"""Response model for course queries"""
"""Response model for queries"""

answer: str
sources: List[str]
source_links: List[Optional[str]]
session_id: str


class CourseStats(BaseModel):
"""Response model for course statistics"""

total_courses: int
course_titles: List[str]

class DocumentStats(BaseModel):
"""Response model for document statistics"""

class ClearSessionRequest(BaseModel):
"""Request model for clearing a session"""

session_id: str
total_documents: int
file_names: List[str]


# API Endpoints
Expand All @@ -70,69 +60,62 @@ class ClearSessionRequest(BaseModel):
async def query_documents(request: QueryRequest):
"""Process a query and return response with sources"""
try:
# Create session if not provided
session_id = request.session_id
if not session_id:
session_id = rag_system.session_manager.create_session()

# Process query using RAG system
answer, sources, source_links = rag_system.query(request.query, session_id)
result = rag_system.query(request.query, request.limit or 5)

return QueryResponse(
answer=answer,
sources=sources,
source_links=source_links,
session_id=session_id,
)
return QueryResponse(answer=result["answer"], sources=result["sources"])
except Exception as e:
raise HTTPException(status_code=500, detail=str(e))


@app.get("/api/courses", response_model=CourseStats)
async def get_course_stats():
"""Get course analytics and statistics"""
@app.get("/api/documents", response_model=DocumentStats)
async def get_document_stats():
"""Get document analytics and statistics"""
try:
analytics = rag_system.get_course_analytics()
return CourseStats(
total_courses=analytics["total_courses"],
course_titles=analytics["course_titles"],
stats = rag_system.get_document_stats()
return DocumentStats(
total_documents=stats["total_documents"],
file_names=stats["file_names"],
)
except Exception as e:
raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/clear-session")
async def clear_session(request: ClearSessionRequest):
"""Clear a conversation session"""
try:
rag_system.session_manager.clear_session(request.session_id)
return {"status": "success", "message": "Session cleared successfully"}
except Exception as e:
raise HTTPException(status_code=500, detail=str(e))


@app.on_event("startup")
async def startup_event():
"""Load initial documents on startup"""
# Initialize RAG system with docs folder
docs_path = "../docs"
rag = None

if os.path.exists(docs_path):
print("Loading initial documents...")
try:
courses, chunks = rag_system.add_course_folder(
docs_path, clear_existing=False
)
print(f"Loaded {courses} courses with {chunks} chunks")
# Initialize and load documents
rag = RAGSystem(docs_path, chroma_path=config.CHROMA_PATH)
print(f"RAG system initialized with documents from: {docs_path}")

# Store globally for use in endpoints
globals()["rag_system"] = rag
except Exception as e:
print(f"Error loading documents: {e}")
# Initialize empty system
rag = RAGSystem.__new__(RAGSystem)
rag.md_processor = None
rag.vector_store = None
rag.folder_path = docs_path
globals()["rag_system"] = rag
else:
print(f"Docs folder not found: {docs_path}")
# Initialize empty system
rag = RAGSystem.__new__(RAGSystem)
rag.md_processor = None
rag.vector_store = None
rag.folder_path = docs_path
globals()["rag_system"] = rag


import os
from pathlib import Path

from fastapi.responses import FileResponse

# Custom static file handler with no-cache headers for development
from fastapi.staticfiles import StaticFiles


class DevStaticFiles(StaticFiles):
Expand All @@ -147,4 +130,4 @@ async def get_response(self, path: str, scope):


# Serve static files for the frontend
app.mount("/", StaticFiles(directory="../frontend", html=True), name="static")
app.mount("/", DevStaticFiles(directory="../frontend", html=True), name="static")
5 changes: 0 additions & 5 deletions backend/config.py
Original file line number Diff line number Diff line change
Expand Up @@ -11,18 +11,13 @@
class Config:
"""Configuration settings for the RAG system"""

# Anthropic API settings
ANTHROPIC_API_KEY: str = os.getenv("ANTHROPIC_API_KEY", "")
ANTHROPIC_MODEL: str = "claude-sonnet-4-20250514"

# Embedding model settings
EMBEDDING_MODEL: str = "all-MiniLM-L6-v2"

# Document processing settings
CHUNK_SIZE: int = 800 # Size of text chunks for vector storage
CHUNK_OVERLAP: int = 100 # Characters to overlap between chunks
MAX_RESULTS: int = 5 # Maximum search results to return
MAX_HISTORY: int = 2 # Number of conversation messages to remember

# Database paths
CHROMA_PATH: str = "./chroma_db" # ChromaDB storage location
Expand Down
Loading