diff --git a/.claude/settings.local.json b/.claude/settings.local.json
new file mode 100644
index 000000000..1d3fa4e21
--- /dev/null
+++ b/.claude/settings.local.json
@@ -0,0 +1,13 @@
+{
+  "permissions": {
+    "allow": [
+      "Bash(git add:*)",
+      "Bash(git push:*)",
+      "Bash(git pull:*)",
+      "Bash(echo:*)",
+      "Bash(uv run -m pytest:*)",
+      "Bash(git commit:*)",
+      "Bash(git merge:*)"
+    ]
+  }
+}
diff --git a/.github/workflows/claude-code-review.yml b/.github/workflows/claude-code-review.yml
new file mode 100644
index 000000000..4f6145beb
--- /dev/null
+++ b/.github/workflows/claude-code-review.yml
@@ -0,0 +1,44 @@
+name: Claude Code Review
+
+on:
+  pull_request:
+    types: [opened, synchronize, ready_for_review, reopened]
+    # Optional: Only run on specific file changes
+    # paths:
+    #   - "src/**/*.ts"
+    #   - "src/**/*.tsx"
+    #   - "src/**/*.js"
+    #   - "src/**/*.jsx"
+
+jobs:
+  claude-review:
+    # Optional: Filter by PR author
+    # if: |
+    #   github.event.pull_request.user.login == 'external-contributor' ||
+    #   github.event.pull_request.user.login == 'new-developer' ||
+    #   github.event.pull_request.author_association == 'FIRST_TIME_CONTRIBUTOR'
+
+    runs-on: ubuntu-latest
+    permissions:
+      contents: read
+      pull-requests: read
+      issues: read
+      id-token: write
+
+    steps:
+      - name: Checkout repository
+        uses: actions/checkout@v4
+        with:
+          fetch-depth: 1
+
+      - name: Run Claude Code Review
+        id: claude-review
+        uses: anthropics/claude-code-action@v1
+        with:
+          anthropic_api_key: ${{ secrets.ANTHROPIC_API_KEY }}
+          plugin_marketplaces: 'https://github.com/anthropics/claude-code.git'
+          plugins: 'code-review@claude-code-plugins'
+          prompt: '/code-review:code-review ${{ github.repository }}/pull/${{ github.event.pull_request.number }}'
+          # See https://github.com/anthropics/claude-code-action/blob/main/docs/usage.md
+          # or https://code.claude.com/docs/en/cli-reference for available options
+
diff --git a/.github/workflows/claude.yml b/.github/workflows/claude.yml
new file mode 100644
index 000000000..79fe05647
--- /dev/null
+++ b/.github/workflows/claude.yml
@@ -0,0 +1,50 @@
+name: Claude Code
+
+on:
+  issue_comment:
+    types: [created]
+  pull_request_review_comment:
+    types: [created]
+  issues:
+    types: [opened, assigned]
+  pull_request_review:
+    types: [submitted]
+
+jobs:
+  claude:
+    if: |
+      (github.event_name == 'issue_comment' && contains(github.event.comment.body, '@claude')) ||
+      (github.event_name == 'pull_request_review_comment' && contains(github.event.comment.body, '@claude')) ||
+      (github.event_name == 'pull_request_review' && contains(github.event.review.body, '@claude')) ||
+      (github.event_name == 'issues' && (contains(github.event.issue.body, '@claude') || contains(github.event.issue.title, '@claude')))
+    runs-on: ubuntu-latest
+    permissions:
+      contents: read
+      pull-requests: read
+      issues: read
+      id-token: write
+      actions: read # Required for Claude to read CI results on PRs
+    steps:
+      - name: Checkout repository
+        uses: actions/checkout@v4
+        with:
+          fetch-depth: 1
+
+      - name: Run Claude Code
+        id: claude
+        uses: anthropics/claude-code-action@v1
+        with:
+          anthropic_api_key: ${{ secrets.ANTHROPIC_API_KEY }}
+
+          # This is an optional setting that allows Claude to read CI results on PRs
+          additional_permissions: |
+            actions: read
+
+          # Optional: Give a custom prompt to Claude. If this is not specified, Claude will perform the instructions specified in the comment that tagged it.
+          # prompt: 'Update the pull request description to include a summary of changes.'
+
+          # Optional: Add claude_args to customize behavior and configuration
+          # See https://github.com/anthropics/claude-code-action/blob/main/docs/usage.md
+          # or https://code.claude.com/docs/en/cli-reference for available options
+          # claude_args: '--allowed-tools Bash(gh pr:*)'
+
diff --git a/CLAUDE.md b/CLAUDE.md
new file mode 100644
index 000000000..7162cce15
--- /dev/null
+++ b/CLAUDE.md
@@ -0,0 +1,203 @@
+# CLAUDE.md
+
+This file provides guidance to Claude Code (claude.ai/code) when working with code in this repository.
+
+## Project Overview
+
+This is a Retrieval-Augmented Generation (RAG) chatbot system that answers questions about DeepLearning.AI course materials. It uses ChromaDB for vector storage, Anthropic's Claude API with tool calling, and provides a web interface for conversational queries.
+
+## Development Commands
+
+### Setup
+```bash
+# Install dependencies (uses uv package manager)
+uv sync
+
+# Set up environment variables
+cp .env.example .env
+# Edit .env and add your ANTHROPIC_API_KEY
+```
+
+### Running the Application
+```bash
+# Quick start (recommended)
+./run.sh
+
+# Manual start (from project root)
+cd backend && uv run uvicorn app:app --reload --port 8000
+
+# Access points
+# - Web UI: http://localhost:8000
+# - API docs: http://localhost:8000/docs
+```
+
+### Adding Course Documents
+Place text files in the `docs/` folder. Files are automatically loaded on server startup. See "Document Format Requirements" below.
+
+## Architecture
+
+### RAG Pipeline Flow
+
+The system implements a **tool-based RAG architecture** where Claude decides when to search:
+
+```
+User Query → FastAPI → RAGSystem → AIGenerator → Claude API
+                                                      ↓
+                                            (Claude calls tool)
+                                                      ↓
+                                    SearchTool → VectorStore → ChromaDB
+                                                      ↓
+                                         (search results returned)
+                                                      ↓
+                                            Claude synthesizes response
+                                                      ↓
+                                          SessionManager stores history
+                                                      ↓
+                                            Return answer + sources
+```
+
+**Key architectural decision**: Claude has search as a *callable tool*, not an always-on feature. The system prompt instructs Claude to call `search_course_content` when needed, making searches contextual rather than automatic.
+
+### Dual Collection Strategy
+
+ChromaDB uses **two separate collections** with different purposes:
+
+1. **`course_catalog`** (vector_store.py:51)
+   - Purpose: Fuzzy matching of course names for search filtering
+   - Documents: Course titles only
+   - Metadata: Full course info (instructor, links, lesson metadata)
+   - IDs: Course title (serves as unique identifier)
+   - Usage: When user specifies a course name, semantic search finds the best match
+
+2. **`course_content`** (vector_store.py:52)
+   - Purpose: Actual semantic search of course material
+   - Documents: Text chunks with enriched context
+   - Metadata: `{course_title, lesson_number, chunk_index}`
+   - IDs: `"{course_title_snake_case}_{chunk_index}"`
+   - Usage: Primary search collection for answering queries
+
+This separation enables fuzzy course name matching (e.g., "MCP" → "MCP: Build Rich-Context AI Apps") before searching content.
+
+### Component Relationships
+
+**rag_system.py** is the orchestration layer that:
+- Coordinates all components (VectorStore, AIGenerator, SearchTool, SessionManager)
+- Manages document ingestion and deduplication
+- Handles query flow from input to response
+
+**ai_generator.py** handles Claude API interactions:
+- Builds API requests with system prompt, history, and tool definitions
+- Processes tool calls from Claude
+- Extracts responses and sources from Claude's output
+- Uses temperature=0 for deterministic responses
+
+**session_manager.py** maintains conversation state:
+- Thread-safe, dict-based in-memory session storage
+- Automatically trims history to last `MAX_HISTORY` exchanges (default: 2)
+- Each session tracks conversation context for multi-turn queries
+
+### Text Chunking Strategy
+
+**document_processor.py:25-91** implements sentence-aware chunking:
+
+1. **Sentence splitting** using regex that handles abbreviations (Mr., Dr., etc.)
+2. **Chunk building** up to 800 characters per chunk
+3. **Overlap calculation** - 100 characters shared between consecutive chunks by counting backwards from chunk end
+4. **Context enrichment** - The first chunk of each lesson is prefixed with `"Lesson N content: ..."`; chunks of the last lesson include the course title
+
+This preserves semantic boundaries and context across chunk boundaries.
+
+## Document Format Requirements
+
+Course documents must follow this structure:
+
+```
+Course Title: [title]
+Course Link: [url]
+Course Instructor: [name]
+
+Lesson 0: [title]
+Lesson Link: [url]
+[content...]
+
+Lesson 1: [title]
+Lesson Link: [url]
+[content...]
+```
+
+**Processing behavior**:
+- Lines 1-3: Metadata extraction with regex matching
+- Remaining lines: Parsed for `^Lesson\s+(\d+):\s*(.+)$` markers
+- Content between lesson markers becomes lesson content
+- Lesson links (optional) must appear immediately after lesson headers
+- If no lesson markers found, entire file treated as single document
+
+## Configuration
+
+All configuration in **backend/config.py** as a dataclass:
+
+- `CHUNK_SIZE`: 800 characters (sentence-aware, not hard cutoff)
+- `CHUNK_OVERLAP`: 100 characters between chunks
+- `MAX_RESULTS`: 5 search results per query
+- `MAX_HISTORY`: 2 conversation exchanges retained
+- `EMBEDDING_MODEL`: "all-MiniLM-L6-v2" (384-dimensional embeddings)
+- `ANTHROPIC_MODEL`: "claude-sonnet-4-20250514"
+- `CHROMA_PATH`: "./chroma_db" (persistent vector storage)
+
+## Important Patterns
+
+### Document Deduplication
+**rag_system.py:76** checks existing course titles before processing. If a course with the same title already exists in the vector store, it's skipped. To reload a course, clear the vector store first.
+
+### Tool Definition
+**search_tools.py** defines the `search_course_content` tool with three parameters:
+- `query` (required): What to search for
+- `course_name` (optional): Fuzzy-matched against course_catalog
+- `lesson_number` (optional): Filter to specific lesson
+
+The system prompt instructs Claude to use this tool strategically, not for every query.
+
+### Search Filtering
+**vector_store.py:118-133** builds ChromaDB filters:
+- Both course + lesson: `{"$and": [{"course_title": "..."}, {"lesson_number": N}]}`
+- Course only: `{"course_title": "..."}`
+- Lesson only: `{"lesson_number": N}`
+- Neither: No filter (search all content)
+
+### Session Management
+Sessions are created implicitly if no `session_id` is provided. Frontend passes `session_id` back to maintain conversation context. Sessions are stored in-memory (lost on restart).
+
+## Key Files
+
+- **app.py**: FastAPI application, startup document loading, API endpoints
+- **rag_system.py**: Main orchestration, coordinates all components
+- **vector_store.py**: ChromaDB wrapper, dual collection management, search logic
+- **ai_generator.py**: Claude API integration, tool call handling
+- **document_processor.py**: Metadata extraction, chunking algorithm
+- **search_tools.py**: Tool definitions for Claude function calling
+- **session_manager.py**: Conversation history management
+- **config.py**: Centralized configuration
+- **models.py**: Pydantic data models (Course, Lesson, CourseChunk)
+
+## Frontend
+
+Vanilla JavaScript application (frontend/) with no framework dependencies:
+- **index.html**: Chat UI structure
+- **script.js**: API communication, message handling
+- **style.css**: Responsive styling
+
+Frontend communicates with backend via `/api/query` POST endpoint, receives responses with `{answer, sources, session_id}`.
+
+## Extending the System
+
+### Adding New Course Sources
+Place files in `docs/` folder matching the required format. Supported extensions: `.txt`, `.pdf`, `.docx`. Server automatically loads on startup.
+
+### Modifying Chunking Behavior
+Edit `CHUNK_SIZE` and `CHUNK_OVERLAP` in config.py. Larger chunks provide more context but reduce granularity. More overlap improves context preservation but increases storage.
+
+### Changing Search Results
+Modify `MAX_RESULTS` in config.py to return more/fewer chunks per search. More results give Claude more context but increase token usage.
+
+### Adjusting Conversation Memory
+Change `MAX_HISTORY` in config.py. Higher values retain more context but increase token costs. Each exchange = 2 messages (user + assistant).
diff --git a/backend-tool-refactor.md b/backend-tool-refactor.md
new file mode 100644
index 000000000..de23ae5c7
--- /dev/null
+++ b/backend-tool-refactor.md
@@ -0,0 +1,28 @@
+Refactor @backend/ai_generator.py to support sequential tool calling where Claude can make up to 2 tool calls in separate API rounds.
+
+Current behavior:
+- Claude makes 1 tool call → tools are removed from API params → final response
+- If Claude wants another tool call after seeing results, it can't (gets empty response)
+
+Desired behavior:
+- Each tool call should be a separate API request where Claude can reason about previous results
+- Support for complex queries requiring multiple searches for comparisons, multi-part questions, or when information from different courses/lessons is needed
+
+Example flow:
+1. User: "Search for a course that discusses the same topic as lesson 4 of course X"
+2. Claude: get course outline for course X → gets title of lesson 4
+3. Claude: uses the title to search for a course that discusses the same topic → returns course information
+4. Claude: provides complete answer
+
+Requirements:
+- Maximum 2 sequential rounds per user query
+- Terminate when: (a) 2 rounds completed, (b) Claude's response has no tool_use blocks, or (c) tool call fails
+- Preserve conversation context between rounds
+- Handle tool execution errors gracefully
+
+Notes: 
+- Update the system prompt in @backend/ai_generator.py 
+- Update the test @backend/tests/test_ai_generator.py
+- Write tests that verify the external behavior (API calls made, tools executed, results returned) rather than internal state details. 
+
+Use two parallel subagents to brainstorm possible plans. Do not implement any code.
diff --git a/backend/ai_generator.py b/backend/ai_generator.py
index 0363ca90c..88a4b59cc 100644
--- a/backend/ai_generator.py
+++ b/backend/ai_generator.py
@@ -1,25 +1,43 @@
+from typing import Any, Dict, List, Optional
+
 import anthropic
-from typing import List, Optional, Dict, Any
+
 
 class AIGenerator:
     """Handles interactions with Anthropic's Claude API for generating responses"""
-    
+
+    MAX_TOOL_ROUNDS = 2
+    DIRECT_RETURN_TOOLS = frozenset({"get_course_outline"})
+
     # Static system prompt to avoid rebuilding on each call
-    SYSTEM_PROMPT = """ You are an AI assistant specialized in course materials and educational content with access to a comprehensive search tool for course information.
+    SYSTEM_PROMPT = """ You are an AI assistant specialized in course materials and educational content with access to comprehensive tools for course information.
+
+Available Tools:
+- **search_course_content**: Search within course materials for specific content
+- **get_course_outline**: Get complete course outline with all lessons
+
+Tool Usage Guidelines:
+- Use search_course_content for detailed questions about specific topics or lessons
+- Use get_course_outline for questions about course structure, lesson lists, or "what's in this course"
+- **You can make up to 2 rounds of tool calls to gather comprehensive information**
+  - Round 1: Initial search to gather relevant information
+  - Round 2: Refine or search additional context (different course, narrower lesson, related term)
+  - Most queries need only 1 tool call. Use a second only when the first result is insufficient.
+- Synthesize tool results into accurate, fact-based responses
+- If tools yield no results, state this clearly without offering alternatives
 
-Search Tool Usage:
-- Use the search tool **only** for questions about specific course content or detailed educational materials
-- **One search per query maximum**
-- Synthesize search results into accurate, fact-based responses
-- If search yields no results, state this clearly without offering alternatives
+Course Outline Responses:
+When using get_course_outline:
+- Return the tool output EXACTLY as formatted - do not add summaries, context, or additional information
+- Present the complete structured list without modification
 
 Response Protocol:
-- **General knowledge questions**: Answer using existing knowledge without searching
-- **Course-specific questions**: Search first, then answer
+- **General knowledge questions**: Answer using existing knowledge without tools
+- **Course outline questions**: Use get_course_outline first
+- **Course-specific content questions**: Use search_course_content first, then synthesize
 - **No meta-commentary**:
- - Provide direct answers only — no reasoning process, search explanations, or question-type analysis
- - Do not mention "based on the search results"
-
+  - Provide direct answers only — no reasoning process, tool explanations, or question-type analysis
+  - Do not mention "based on the tool results"
 
 All responses must be:
 1. **Brief, Concise and focused** - Get to the point quickly
@@ -28,108 +46,171 @@ class AIGenerator:
 4. **Example-supported** - Include relevant examples when they aid understanding
 Provide only the direct answer to what was asked.
 """
-    
+
     def __init__(self, api_key: str, model: str):
         self.client = anthropic.Anthropic(api_key=api_key)
         self.model = model
-        
+
         # Pre-build base API parameters
-        self.base_params = {
-            "model": self.model,
-            "temperature": 0,
-            "max_tokens": 800
-        }
-    
-    def generate_response(self, query: str,
-                         conversation_history: Optional[str] = None,
-                         tools: Optional[List] = None,
-                         tool_manager=None) -> str:
+        self.base_params = {"model": self.model, "temperature": 0, "max_tokens": 800}
+
+    def _call_api(self, **params):
+        """Make an Anthropic API call with standardized error handling."""
+        try:
+            return self.client.messages.create(**params)
+        except anthropic.AuthenticationError as e:
+            raise RuntimeError(f"Anthropic API authentication failed: {e}") from e
+        except anthropic.APIError as e:
+            raise RuntimeError(f"Anthropic API error: {e}") from e
+
+    def generate_response(
+        self,
+        query: str,
+        conversation_history: Optional[str] = None,
+        tools: Optional[List] = None,
+        tool_manager=None,
+    ) -> str:
         """
         Generate AI response with optional tool usage and conversation context.
-        
+        Supports up to MAX_TOOL_ROUNDS sequential rounds of tool calling.
+
         Args:
             query: The user's question or request
             conversation_history: Previous messages for context
             tools: Available tools the AI can use
             tool_manager: Manager to execute tools
-            
+
         Returns:
             Generated response as string
         """
-        
+
         # Build system content efficiently - avoid string ops when possible
         system_content = (
             f"{self.SYSTEM_PROMPT}\n\nPrevious conversation:\n{conversation_history}"
-            if conversation_history 
+            if conversation_history
             else self.SYSTEM_PROMPT
         )
-        
-        # Prepare API call parameters efficiently
-        api_params = {
+
+        # Start with initial messages
+        messages = [{"role": "user", "content": query}]
+
+        # Execute up to MAX_TOOL_ROUNDS rounds of tool calling
+        for round_num in range(self.MAX_TOOL_ROUNDS):
+            # Prepare API call parameters
+            api_params = {
+                **self.base_params,
+                "messages": messages,
+                "system": system_content,
+            }
+
+            # Add tools if available
+            if tools:
+                api_params["tools"] = tools
+                api_params["tool_choice"] = {"type": "auto"}
+
+            response = self._call_api(**api_params)
+
+            # Handle tool execution if needed
+            if response.stop_reason == "tool_use" and tool_manager:
+                messages, should_continue, direct_result = self._handle_tool_execution(
+                    response, messages, tool_manager
+                )
+                if direct_result is not None:
+                    return direct_result
+                if not should_continue:
+                    break
+            else:
+                # No tool use, return direct response
+                return self._extract_text(response)
+
+        # After max rounds, make final call without tools to get response
+        final_params = {
             **self.base_params,
-            "messages": [{"role": "user", "content": query}],
-            "system": system_content
+            "messages": messages,
+            "system": system_content,
         }
-        
-        # Add tools if available
-        if tools:
-            api_params["tools"] = tools
-            api_params["tool_choice"] = {"type": "auto"}
-        
-        # Get response from Claude
-        response = self.client.messages.create(**api_params)
-        
-        # Handle tool execution if needed
-        if response.stop_reason == "tool_use" and tool_manager:
-            return self._handle_tool_execution(response, api_params, tool_manager)
-        
-        # Return direct response
-        return response.content[0].text
-    
-    def _handle_tool_execution(self, initial_response, base_params: Dict[str, Any], tool_manager):
+
+        final_response = self._call_api(**final_params)
+        return self._extract_text(final_response)
+
+    @staticmethod
+    def _extract_text(response) -> str:
+        """Safely extract text from an API response, handling empty content."""
+        if not response.content:
+            return "I'm sorry, I wasn't able to generate a response. Please try again."
+        for block in response.content:
+            if hasattr(block, "text"):
+                return block.text
+        return "I'm sorry, I wasn't able to generate a response. Please try again."
+
+    def _handle_tool_execution(self, initial_response, messages: List, tool_manager):
         """
-        Handle execution of tool calls and get follow-up response.
-        
+        Handle execution of tool calls and update message history.
+
+        Executes ALL tool calls before deciding flow control. This ensures the
+        Anthropic API receives tool_result blocks for every tool_use block, even
+        if some tools fail.
+
         Args:
             initial_response: The response containing tool use requests
-            base_params: Base API parameters
+            messages: Current message history
             tool_manager: Manager to execute tools
-            
+
         Returns:
-            Final response text after tool execution
+            Tuple of (updated_messages, should_continue, direct_result)
+            direct_result is non-None when the tool output should be returned as-is
         """
-        # Start with existing messages
-        messages = base_params["messages"].copy()
-        
         # Add AI's tool use response
         messages.append({"role": "assistant", "content": initial_response.content})
-        
-        # Execute all tool calls and collect results
+
+        # Execute ALL tool calls and collect results
         tool_results = []
+        direct_return_result = None
+        has_error = False
+
         for content_block in initial_response.content:
-            if content_block.type == "tool_use":
+            if content_block.type != "tool_use":
+                continue
+
+            try:
                 tool_result = tool_manager.execute_tool(
-                    content_block.name, 
-                    **content_block.input
+                    content_block.name, **content_block.input
+                )
+
+                tool_results.append(
+                    {
+                        "type": "tool_result",
+                        "tool_use_id": content_block.id,
+                        "content": tool_result,
+                    }
                 )
-                
-                tool_results.append({
-                    "type": "tool_result",
-                    "tool_use_id": content_block.id,
-                    "content": tool_result
-                })
-        
-        # Add tool results as single message
+
+                # Mark outline results for direct return (but keep executing remaining tools)
+                if content_block.name in self.DIRECT_RETURN_TOOLS:
+                    direct_return_result = tool_result
+
+            except Exception as e:
+                has_error = True
+                tool_results.append(
+                    {
+                        "type": "tool_result",
+                        "tool_use_id": content_block.id,
+                        "content": f"Error: Tool execution failed - {str(e)}",
+                        "is_error": True,
+                    }
+                )
+
+        # Add all tool results as single message
         if tool_results:
             messages.append({"role": "user", "content": tool_results})
-        
-        # Prepare final API call without tools
-        final_params = {
-            **self.base_params,
-            "messages": messages,
-            "system": base_params["system"]
-        }
-        
-        # Get final response
-        final_response = self.client.messages.create(**final_params)
-        return final_response.content[0].text
\ No newline at end of file
+
+        # Direct return takes priority (e.g. course outline)
+        if direct_return_result is not None:
+            return messages, False, direct_return_result
+
+        # Stop rounds if any tool failed
+        if has_error:
+            return messages, False, None
+
+        # Continue with next round
+        return messages, True, None
diff --git a/backend/app.py b/backend/app.py
index 5a69d741d..352ee097c 100644
--- a/backend/app.py
+++ b/backend/app.py
@@ -1,4 +1,5 @@
 import warnings
+
 warnings.filterwarnings("ignore", message="resource_tracker: There appear to be.*")
 
 from fastapi import FastAPI, HTTPException
@@ -6,7 +7,7 @@
 from fastapi.staticfiles import StaticFiles
 from fastapi.middleware.trustedhost import TrustedHostMiddleware
 from pydantic import BaseModel
-from typing import List, Optional
+from typing import List, Optional, Dict, Union
 import os
 
 from config import config
@@ -16,10 +17,7 @@
 app = FastAPI(title="Course Materials RAG System", root_path="")
 
 # Add trusted host middleware for proxy
-app.add_middleware(
-    TrustedHostMiddleware,
-    allowed_hosts=["*"]
-)
+app.add_middleware(TrustedHostMiddleware, allowed_hosts=["*"])
 
 # Enable CORS with proper settings for proxy
 app.add_middleware(
@@ -34,25 +32,39 @@
 # Initialize RAG system
 rag_system = RAGSystem(config)
 
+
 # Pydantic models for request/response
 class QueryRequest(BaseModel):
     """Request model for course queries"""
+
     query: str
     session_id: Optional[str] = None
 
+
 class QueryResponse(BaseModel):
     """Response model for course queries"""
+
     answer: str
-    sources: List[str]
+    sources: List[Union[str, Dict[str, str]]]  # Support both strings and dicts
     session_id: str
 
+
 class CourseStats(BaseModel):
     """Response model for course statistics"""
+
     total_courses: int
     course_titles: List[str]
 
+
+class ClearSessionRequest(BaseModel):
+    """Request model for clearing a session"""
+
+    session_id: str
+
+
 # API Endpoints
 
+
 @app.post("/api/query", response_model=QueryResponse)
 async def query_documents(request: QueryRequest):
     """Process a query and return response with sources"""
@@ -61,18 +73,15 @@ async def query_documents(request: QueryRequest):
         session_id = request.session_id
         if not session_id:
             session_id = rag_system.session_manager.create_session()
-        
+
         # Process query using RAG system
-        answer, sources = rag_system.query(request.query, session_id)
-        
-        return QueryResponse(
-            answer=answer,
-            sources=sources,
-            session_id=session_id
-        )
+        answer, sources, source_links = rag_system.query(request.query, session_id)
+
+        return QueryResponse(answer=answer, sources=sources, session_id=session_id)
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))
 
+
 @app.get("/api/courses", response_model=CourseStats)
 async def get_course_stats():
     """Get course analytics and statistics"""
@@ -80,11 +89,22 @@ async def get_course_stats():
         analytics = rag_system.get_course_analytics()
         return CourseStats(
             total_courses=analytics["total_courses"],
-            course_titles=analytics["course_titles"]
+            course_titles=analytics["course_titles"],
         )
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))
 
+
+@app.post("/api/session/clear")
+async def clear_session(request: ClearSessionRequest):
+    """Clear a conversation session"""
+    try:
+        rag_system.session_manager.clear_session(request.session_id)
+        return {"status": "success", "message": f"Session {request.session_id} cleared"}
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
+
+
 @app.on_event("startup")
 async def startup_event():
     """Load initial documents on startup"""
@@ -92,11 +112,14 @@ async def startup_event():
     if os.path.exists(docs_path):
         print("Loading initial documents...")
         try:
-            courses, chunks = rag_system.add_course_folder(docs_path, clear_existing=False)
+            courses, chunks = rag_system.add_course_folder(
+                docs_path, clear_existing=False
+            )
             print(f"Loaded {courses} courses with {chunks} chunks")
         except Exception as e:
             print(f"Error loading documents: {e}")
 
+
 # Custom static file handler with no-cache headers for development
 from fastapi.staticfiles import StaticFiles
 from fastapi.responses import FileResponse
@@ -113,7 +136,7 @@ async def get_response(self, path: str, scope):
             response.headers["Pragma"] = "no-cache"
             response.headers["Expires"] = "0"
         return response
-    
-    
+
+
 # Serve static files for the frontend
-app.mount("/", StaticFiles(directory="../frontend", html=True), name="static")
\ No newline at end of file
+app.mount("/", DevStaticFiles(directory="../frontend", html=True), name="static")
diff --git a/backend/config.py b/backend/config.py
index d9f6392ef..7379e7133 100644
--- a/backend/config.py
+++ b/backend/config.py
@@ -5,25 +5,26 @@
 # Load environment variables from .env file
 load_dotenv()
 
+
 @dataclass
 class Config:
     """Configuration settings for the RAG system"""
+
     # Anthropic API settings
     ANTHROPIC_API_KEY: str = os.getenv("ANTHROPIC_API_KEY", "")
     ANTHROPIC_MODEL: str = "claude-sonnet-4-20250514"
-    
+
     # Embedding model settings
     EMBEDDING_MODEL: str = "all-MiniLM-L6-v2"
-    
+
     # Document processing settings
-    CHUNK_SIZE: int = 800       # Size of text chunks for vector storage
-    CHUNK_OVERLAP: int = 100     # Characters to overlap between chunks
-    MAX_RESULTS: int = 5         # Maximum search results to return
-    MAX_HISTORY: int = 2         # Number of conversation messages to remember
-    
+    CHUNK_SIZE: int = 800  # Size of text chunks for vector storage
+    CHUNK_OVERLAP: int = 100  # Characters to overlap between chunks
+    MAX_RESULTS: int = 5  # Maximum search results to return
+    MAX_HISTORY: int = 2  # Number of conversation messages to remember
+
     # Database paths
     CHROMA_PATH: str = "./chroma_db"  # ChromaDB storage location
 
-config = Config()
-
 
+config = Config()
diff --git a/backend/document_processor.py b/backend/document_processor.py
index 266e85904..32c6648ae 100644
--- a/backend/document_processor.py
+++ b/backend/document_processor.py
@@ -3,81 +3,84 @@
 from typing import List, Tuple
 from models import Course, Lesson, CourseChunk
 
+
 class DocumentProcessor:
     """Processes course documents and extracts structured information"""
-    
+
     def __init__(self, chunk_size: int, chunk_overlap: int):
         self.chunk_size = chunk_size
         self.chunk_overlap = chunk_overlap
-    
+
     def read_file(self, file_path: str) -> str:
         """Read content from file with UTF-8 encoding"""
         try:
-            with open(file_path, 'r', encoding='utf-8') as file:
+            with open(file_path, "r", encoding="utf-8") as file:
                 return file.read()
         except UnicodeDecodeError:
             # If UTF-8 fails, try with error handling
-            with open(file_path, 'r', encoding='utf-8', errors='ignore') as file:
+            with open(file_path, "r", encoding="utf-8", errors="ignore") as file:
                 return file.read()
-    
-
 
     def chunk_text(self, text: str) -> List[str]:
         """Split text into sentence-based chunks with overlap using config settings"""
-        
+
         # Clean up the text
-        text = re.sub(r'\s+', ' ', text.strip())  # Normalize whitespace
-        
+        text = re.sub(r"\s+", " ", text.strip())  # Normalize whitespace
+
         # Better sentence splitting that handles abbreviations
         # This regex looks for periods followed by whitespace and capital letters
         # but ignores common abbreviations
-        sentence_endings = re.compile(r'(?<!\w\.\w.)(?<![A-Z][a-z]\.)(?<=\.|\!|\?)\s+(?=[A-Z])')
+        sentence_endings = re.compile(
+            r"(?<!\w\.\w.)(?<![A-Z][a-z]\.)(?<=\.|\!|\?)\s+(?=[A-Z])"
+        )
         sentences = sentence_endings.split(text)
-        
+
         # Clean sentences
         sentences = [s.strip() for s in sentences if s.strip()]
-        
+
         chunks = []
         i = 0
-        
+
         while i < len(sentences):
             current_chunk = []
             current_size = 0
-            
+
             # Build chunk starting from sentence i
             for j in range(i, len(sentences)):
                 sentence = sentences[j]
-                
+
                 # Calculate size with space
                 space_size = 1 if current_chunk else 0
                 total_addition = len(sentence) + space_size
-                
+
                 # Check if adding this sentence would exceed chunk size
                 if current_size + total_addition > self.chunk_size and current_chunk:
                     break
-                
+
                 current_chunk.append(sentence)
                 current_size += total_addition
-            
+
             # Add chunk if we have content
             if current_chunk:
-                chunks.append(' '.join(current_chunk))
-                
+                chunks.append(" ".join(current_chunk))
+
                 # Calculate overlap for next chunk
-                if hasattr(self, 'chunk_overlap') and self.chunk_overlap > 0:
+                if hasattr(self, "chunk_overlap") and self.chunk_overlap > 0:
                     # Find how many sentences to overlap
                     overlap_size = 0
                     overlap_sentences = 0
-                    
+
                     # Count backwards from end of current chunk
                     for k in range(len(current_chunk) - 1, -1, -1):
-                        sentence_len = len(current_chunk[k]) + (1 if k < len(current_chunk) - 1 else 0)
+                        sentence_len = len(current_chunk[k]) + (
+                            1 if k < len(current_chunk) - 1 else 0
+                        )
                         if overlap_size + sentence_len <= self.chunk_overlap:
                             overlap_size += sentence_len
                             overlap_sentences += 1
                         else:
                             break
-                    
+
                     # Move start position considering overlap
                     next_start = i + len(current_chunk) - overlap_sentences
                     i = max(next_start, i + 1)  # Ensure we make progress
@@ -87,14 +90,12 @@ def chunk_text(self, text: str) -> List[str]:
             else:
                 # No sentences fit, move to next
                 i += 1
-        
-        return chunks
-
-
 
+        return chunks
 
-    
-    def process_course_document(self, file_path: str) -> Tuple[Course, List[CourseChunk]]:
+    def process_course_document(
+        self, file_path: str
+    ) -> Tuple[Course, List[CourseChunk]]:
         """
         Process a course document with expected format:
         Line 1: Course Title: [title]
@@ -104,47 +105,51 @@ def process_course_document(self, file_path: str) -> Tuple[Course, List[CourseCh
         """
         content = self.read_file(file_path)
         filename = os.path.basename(file_path)
-        
-        lines = content.strip().split('\n')
-        
+
+        lines = content.strip().split("\n")
+
         # Extract course metadata from first three lines
         course_title = filename  # Default fallback
         course_link = None
         instructor_name = "Unknown"
-        
+
         # Parse course title from first line
         if len(lines) >= 1 and lines[0].strip():
-            title_match = re.match(r'^Course Title:\s*(.+)$', lines[0].strip(), re.IGNORECASE)
+            title_match = re.match(
+                r"^Course Title:\s*(.+)$", lines[0].strip(), re.IGNORECASE
+            )
             if title_match:
                 course_title = title_match.group(1).strip()
             else:
                 course_title = lines[0].strip()
-        
+
         # Parse remaining lines for course metadata
         for i in range(1, min(len(lines), 4)):  # Check first 4 lines for metadata
             line = lines[i].strip()
             if not line:
                 continue
-                
+
             # Try to match course link
-            link_match = re.match(r'^Course Link:\s*(.+)$', line, re.IGNORECASE)
+            link_match = re.match(r"^Course Link:\s*(.+)$", line, re.IGNORECASE)
             if link_match:
                 course_link = link_match.group(1).strip()
                 continue
-                
+
             # Try to match instructor
-            instructor_match = re.match(r'^Course Instructor:\s*(.+)$', line, re.IGNORECASE)
+            instructor_match = re.match(
+                r"^Course Instructor:\s*(.+)$", line, re.IGNORECASE
+            )
             if instructor_match:
                 instructor_name = instructor_match.group(1).strip()
                 continue
-        
+
         # Create course object with title as ID
         course = Course(
             title=course_title,
             course_link=course_link,
-            instructor=instructor_name if instructor_name != "Unknown" else None
+            instructor=instructor_name if instructor_name != "Unknown" else None,
         )
-        
+
         # Process lessons and create chunks
         course_chunks = []
         current_lesson = None
@@ -152,108 +157,114 @@ def process_course_document(self, file_path: str) -> Tuple[Course, List[CourseCh
         lesson_link = None
         lesson_content = []
         chunk_counter = 0
-        
+
         # Start processing from line 4 (after metadata)
         start_index = 3
         if len(lines) > 3 and not lines[3].strip():
             start_index = 4  # Skip empty line after instructor
-        
+
         i = start_index
         while i < len(lines):
             line = lines[i]
-            
+
             # Check for lesson markers (e.g., "Lesson 0: Introduction")
-            lesson_match = re.match(r'^Lesson\s+(\d+):\s*(.+)$', line.strip(), re.IGNORECASE)
-            
+            lesson_match = re.match(
+                r"^Lesson\s+(\d+):\s*(.+)$", line.strip(), re.IGNORECASE
+            )
+
             if lesson_match:
                 # Process previous lesson if it exists
                 if current_lesson is not None and lesson_content:
-                    lesson_text = '\n'.join(lesson_content).strip()
+                    lesson_text = "\n".join(lesson_content).strip()
                     if lesson_text:
                         # Add lesson to course
                         lesson = Lesson(
                             lesson_number=current_lesson,
                             title=lesson_title,
-                            lesson_link=lesson_link
+                            lesson_link=lesson_link,
                         )
                         course.lessons.append(lesson)
-                        
+
                         # Create chunks for this lesson
                         chunks = self.chunk_text(lesson_text)
                         for idx, chunk in enumerate(chunks):
                             # For the first chunk of each lesson, add lesson context
                             if idx == 0:
-                                chunk_with_context = f"Lesson {current_lesson} content: {chunk}"
+                                chunk_with_context = (
+                                    f"Lesson {current_lesson} content: {chunk}"
+                                )
                             else:
                                 chunk_with_context = chunk
-                            
+
                             course_chunk = CourseChunk(
                                 content=chunk_with_context,
                                 course_title=course.title,
                                 lesson_number=current_lesson,
-                                chunk_index=chunk_counter
+                                chunk_index=chunk_counter,
                             )
                             course_chunks.append(course_chunk)
                             chunk_counter += 1
-                
+
                 # Start new lesson
                 current_lesson = int(lesson_match.group(1))
                 lesson_title = lesson_match.group(2).strip()
                 lesson_link = None
-                
+
                 # Check if next line is a lesson link
                 if i + 1 < len(lines):
                     next_line = lines[i + 1].strip()
-                    link_match = re.match(r'^Lesson Link:\s*(.+)$', next_line, re.IGNORECASE)
+                    link_match = re.match(
+                        r"^Lesson Link:\s*(.+)$", next_line, re.IGNORECASE
+                    )
                     if link_match:
                         lesson_link = link_match.group(1).strip()
                         i += 1  # Skip the link line so it's not added to content
-                
+
                 lesson_content = []
             else:
                 # Add line to current lesson content
                 lesson_content.append(line)
-                
+
             i += 1
-        
+
         # Process the last lesson
         if current_lesson is not None and lesson_content:
-            lesson_text = '\n'.join(lesson_content).strip()
+            lesson_text = "\n".join(lesson_content).strip()
             if lesson_text:
                 lesson = Lesson(
                     lesson_number=current_lesson,
                     title=lesson_title,
-                    lesson_link=lesson_link
+                    lesson_link=lesson_link,
                 )
                 course.lessons.append(lesson)
-                
+
                 chunks = self.chunk_text(lesson_text)
                 for idx, chunk in enumerate(chunks):
                     # For any chunk of each lesson, add lesson context & course title
-                  
+
                     chunk_with_context = f"Course {course_title} Lesson {current_lesson} content: {chunk}"
-                    
+
                     course_chunk = CourseChunk(
                         content=chunk_with_context,
                         course_title=course.title,
                         lesson_number=current_lesson,
-                        chunk_index=chunk_counter
+                        chunk_index=chunk_counter,
                     )
                     course_chunks.append(course_chunk)
                     chunk_counter += 1
-        
+
         # If no lessons found, treat entire content as one document
         if not course_chunks and len(lines) > 2:
-            remaining_content = '\n'.join(lines[start_index:]).strip()
+            remaining_content = "\n".join(lines[start_index:]).strip()
             if remaining_content:
                 chunks = self.chunk_text(remaining_content)
                 for chunk in chunks:
                     course_chunk = CourseChunk(
                         content=chunk,
                         course_title=course.title,
-                        chunk_index=chunk_counter
+                        chunk_index=chunk_counter,
                     )
                     course_chunks.append(course_chunk)
                     chunk_counter += 1
-        
+
         return course, course_chunks
diff --git a/backend/models.py b/backend/models.py
index 7f7126fa3..12ae8113e 100644
--- a/backend/models.py
+++ b/backend/models.py
@@ -1,22 +1,28 @@
 from typing import List, Dict, Optional
 from pydantic import BaseModel
 
+
 class Lesson(BaseModel):
     """Represents a lesson within a course"""
+
     lesson_number: int  # Sequential lesson number (1, 2, 3, etc.)
-    title: str         # Lesson title
+    title: str  # Lesson title
     lesson_link: Optional[str] = None  # URL link to the lesson
 
+
 class Course(BaseModel):
     """Represents a complete course with its lessons"""
-    title: str                 # Full course title (used as unique identifier)
+
+    title: str  # Full course title (used as unique identifier)
     course_link: Optional[str] = None  # URL link to the course
     instructor: Optional[str] = None  # Course instructor name (optional metadata)
-    lessons: List[Lesson] = [] # List of lessons in this course
+    lessons: List[Lesson] = []  # List of lessons in this course
+
 
 class CourseChunk(BaseModel):
     """Represents a text chunk from a course for vector storage"""
-    content: str                        # The actual text content
-    course_title: str                   # Which course this chunk belongs to
-    lesson_number: Optional[int] = None # Which lesson this chunk is from
-    chunk_index: int                    # Position of this chunk in the document
\ No newline at end of file
+
+    content: str  # The actual text content
+    course_title: str  # Which course this chunk belongs to
+    lesson_number: Optional[int] = None  # Which lesson this chunk is from
+    chunk_index: int  # Position of this chunk in the document
diff --git a/backend/rag_system.py b/backend/rag_system.py
index 50d848c8e..c1322a9f2 100644
--- a/backend/rag_system.py
+++ b/backend/rag_system.py
@@ -1,147 +1,170 @@
 from typing import List, Tuple, Optional, Dict
 import os
+import re
 from document_processor import DocumentProcessor
 from vector_store import VectorStore
 from ai_generator import AIGenerator
 from session_manager import SessionManager
-from search_tools import ToolManager, CourseSearchTool
+from search_tools import ToolManager, CourseSearchTool, CourseOutlineTool
 from models import Course, Lesson, CourseChunk
 
+
 class RAGSystem:
     """Main orchestrator for the Retrieval-Augmented Generation system"""
-    
+
     def __init__(self, config):
         self.config = config
-        
+
         # Initialize core components
-        self.document_processor = DocumentProcessor(config.CHUNK_SIZE, config.CHUNK_OVERLAP)
-        self.vector_store = VectorStore(config.CHROMA_PATH, config.EMBEDDING_MODEL, config.MAX_RESULTS)
-        self.ai_generator = AIGenerator(config.ANTHROPIC_API_KEY, config.ANTHROPIC_MODEL)
+        self.document_processor = DocumentProcessor(
+            config.CHUNK_SIZE, config.CHUNK_OVERLAP
+        )
+        self.vector_store = VectorStore(
+            config.CHROMA_PATH, config.EMBEDDING_MODEL, config.MAX_RESULTS
+        )
+        self.ai_generator = AIGenerator(
+            config.ANTHROPIC_API_KEY, config.ANTHROPIC_MODEL
+        )
         self.session_manager = SessionManager(config.MAX_HISTORY)
-        
+
         # Initialize search tools
         self.tool_manager = ToolManager()
         self.search_tool = CourseSearchTool(self.vector_store)
+        self.outline_tool = CourseOutlineTool(self.vector_store)
         self.tool_manager.register_tool(self.search_tool)
-    
+        self.tool_manager.register_tool(self.outline_tool)
+
     def add_course_document(self, file_path: str) -> Tuple[Course, int]:
         """
         Add a single course document to the knowledge base.
-        
+
         Args:
             file_path: Path to the course document
-            
+
         Returns:
             Tuple of (Course object, number of chunks created)
         """
         try:
             # Process the document
-            course, course_chunks = self.document_processor.process_course_document(file_path)
-            
+            course, course_chunks = self.document_processor.process_course_document(
+                file_path
+            )
+
             # Add course metadata to vector store for semantic search
             self.vector_store.add_course_metadata(course)
-            
+
             # Add course content chunks to vector store
             self.vector_store.add_course_content(course_chunks)
-            
+
             return course, len(course_chunks)
         except Exception as e:
             print(f"Error processing course document {file_path}: {e}")
             return None, 0
-    
-    def add_course_folder(self, folder_path: str, clear_existing: bool = False) -> Tuple[int, int]:
+
+    def add_course_folder(
+        self, folder_path: str, clear_existing: bool = False
+    ) -> Tuple[int, int]:
         """
         Add all course documents from a folder.
-        
+
         Args:
             folder_path: Path to folder containing course documents
             clear_existing: Whether to clear existing data first
-            
+
         Returns:
             Tuple of (total courses added, total chunks created)
         """
         total_courses = 0
         total_chunks = 0
-        
+
         # Clear existing data if requested
         if clear_existing:
             print("Clearing existing data for fresh rebuild...")
             self.vector_store.clear_all_data()
-        
+
         if not os.path.exists(folder_path):
             print(f"Folder {folder_path} does not exist")
             return 0, 0
-        
+
         # Get existing course titles to avoid re-processing
         existing_course_titles = set(self.vector_store.get_existing_course_titles())
-        
+
         # Process each file in the folder
         for file_name in os.listdir(folder_path):
             file_path = os.path.join(folder_path, file_name)
-            if os.path.isfile(file_path) and file_name.lower().endswith(('.pdf', '.docx', '.txt')):
+            if os.path.isfile(file_path) and file_name.lower().endswith(
+                (".pdf", ".docx", ".txt")
+            ):
                 try:
                     # Check if this course might already exist
                     # We'll process the document to get the course ID, but only add if new
-                    course, course_chunks = self.document_processor.process_course_document(file_path)
-                    
+                    course, course_chunks = (
+                        self.document_processor.process_course_document(file_path)
+                    )
+
                     if course and course.title not in existing_course_titles:
                         # This is a new course - add it to the vector store
                         self.vector_store.add_course_metadata(course)
                         self.vector_store.add_course_content(course_chunks)
                         total_courses += 1
                         total_chunks += len(course_chunks)
-                        print(f"Added new course: {course.title} ({len(course_chunks)} chunks)")
+                        print(
+                            f"Added new course: {course.title} ({len(course_chunks)} chunks)"
+                        )
                         existing_course_titles.add(course.title)
                     elif course:
                         print(f"Course already exists: {course.title} - skipping")
                 except Exception as e:
                     print(f"Error processing {file_name}: {e}")
-        
+
         return total_courses, total_chunks
-    
-    def query(self, query: str, session_id: Optional[str] = None) -> Tuple[str, List[str]]:
+
+    def query(
+        self, query: str, session_id: Optional[str] = None
+    ) -> Tuple[str, List[str], List[Optional[str]]]:
         """
         Process a user query using the RAG system with tool-based search.
-        
+
         Args:
             query: User's question
             session_id: Optional session ID for conversation context
-            
+
         Returns:
-            Tuple of (response, sources list - empty for tool-based approach)
+            Tuple of (response, sources list, source_links list)
         """
         # Create prompt for the AI with clear instructions
         prompt = f"""Answer this question about course materials: {query}"""
-        
+
         # Get conversation history if session exists
         history = None
         if session_id:
             history = self.session_manager.get_conversation_history(session_id)
-        
+
         # Generate response using AI with tools
         response = self.ai_generator.generate_response(
             query=prompt,
             conversation_history=history,
             tools=self.tool_manager.get_tool_definitions(),
-            tool_manager=self.tool_manager
+            tool_manager=self.tool_manager,
         )
-        
-        # Get sources from the search tool
+
+        # Get sources and source links from the search tool
         sources = self.tool_manager.get_last_sources()
+        source_links = self.tool_manager.get_last_source_links()
 
         # Reset sources after retrieving them
         self.tool_manager.reset_sources()
-        
+
         # Update conversation history
         if session_id:
             self.session_manager.add_exchange(session_id, query, response)
-        
-        # Return response with sources from tool searches
-        return response, sources
-    
+
+        # Return response with sources and links from tool searches
+        return response, sources, source_links
+
     def get_course_analytics(self) -> Dict:
         """Get analytics about the course catalog"""
         return {
             "total_courses": self.vector_store.get_course_count(),
-            "course_titles": self.vector_store.get_existing_course_titles()
-        }
\ No newline at end of file
+            "course_titles": self.vector_store.get_existing_course_titles(),
+        }
diff --git a/backend/search_tools.py b/backend/search_tools.py
index adfe82352..d1a606eae 100644
--- a/backend/search_tools.py
+++ b/backend/search_tools.py
@@ -5,12 +5,12 @@
 
 class Tool(ABC):
     """Abstract base class for all tools"""
-    
+
     @abstractmethod
     def get_tool_definition(self) -> Dict[str, Any]:
         """Return Anthropic tool definition for this tool"""
         pass
-    
+
     @abstractmethod
     def execute(self, **kwargs) -> str:
         """Execute the tool with given parameters"""
@@ -19,11 +19,11 @@ def execute(self, **kwargs) -> str:
 
 class CourseSearchTool(Tool):
     """Tool for searching course content with semantic course name matching"""
-    
+
     def __init__(self, vector_store: VectorStore):
         self.store = vector_store
         self.last_sources = []  # Track sources from last search
-    
+
     def get_tool_definition(self) -> Dict[str, Any]:
         """Return Anthropic tool definition for this tool"""
         return {
@@ -33,46 +33,49 @@ def get_tool_definition(self) -> Dict[str, Any]:
                 "type": "object",
                 "properties": {
                     "query": {
-                        "type": "string", 
-                        "description": "What to search for in the course content"
+                        "type": "string",
+                        "description": "What to search for in the course content",
                     },
                     "course_name": {
                         "type": "string",
-                        "description": "Course title (partial matches work, e.g. 'MCP', 'Introduction')"
+                        "description": "Course title (partial matches work, e.g. 'MCP', 'Introduction')",
                     },
                     "lesson_number": {
                         "type": "integer",
-                        "description": "Specific lesson number to search within (e.g. 1, 2, 3)"
-                    }
+                        "description": "Specific lesson number to search within (e.g. 1, 2, 3)",
+                    },
                 },
-                "required": ["query"]
-            }
+                "required": ["query"],
+            },
         }
-    
-    def execute(self, query: str, course_name: Optional[str] = None, lesson_number: Optional[int] = None) -> str:
+
+    def execute(
+        self,
+        query: str,
+        course_name: Optional[str] = None,
+        lesson_number: Optional[int] = None,
+    ) -> str:
         """
         Execute the search tool with given parameters.
-        
+
         Args:
             query: What to search for
             course_name: Optional course filter
             lesson_number: Optional lesson filter
-            
+
         Returns:
             Formatted search results or error message
         """
-        
+
         # Use the vector store's unified search interface
         results = self.store.search(
-            query=query,
-            course_name=course_name,
-            lesson_number=lesson_number
+            query=query, course_name=course_name, lesson_number=lesson_number
         )
-        
+
         # Handle errors
         if results.error:
             return results.error
-        
+
         # Handle empty results
         if results.is_empty():
             filter_info = ""
@@ -81,44 +84,128 @@ def execute(self, query: str, course_name: Optional[str] = None, lesson_number:
             if lesson_number:
                 filter_info += f" in lesson {lesson_number}"
             return f"No relevant content found{filter_info}."
-        
+
         # Format and return results
         return self._format_results(results)
-    
+
     def _format_results(self, results: SearchResults) -> str:
         """Format search results with course and lesson context"""
         formatted = []
         sources = []  # Track sources for the UI
-        
+        source_links = []  # Track lesson links for the UI
+
         for doc, meta in zip(results.documents, results.metadata):
-            course_title = meta.get('course_title', 'unknown')
-            lesson_num = meta.get('lesson_number')
-            
+            course_title = meta.get("course_title", "unknown")
+            lesson_num = meta.get("lesson_number")
+
             # Build context header
             header = f"[{course_title}"
             if lesson_num is not None:
                 header += f" - Lesson {lesson_num}"
             header += "]"
-            
+
             # Track source for the UI
             source = course_title
             if lesson_num is not None:
                 source += f" - Lesson {lesson_num}"
             sources.append(source)
-            
+
+            # Get lesson link if available
+            lesson_link = None
+            if lesson_num is not None:
+                lesson_link = self.store.get_lesson_link(course_title, lesson_num)
+            source_links.append(lesson_link)
+
             formatted.append(f"{header}\n{doc}")
-        
+
         # Store sources for retrieval
         self.last_sources = sources
-        
+        self.last_source_links = source_links
+
         return "\n\n".join(formatted)
 
+
+class CourseOutlineTool(Tool):
+    """Tool for retrieving complete course outlines and lesson lists"""
+
+    def __init__(self, vector_store: VectorStore):
+        self.store = vector_store
+
+    def get_tool_definition(self) -> Dict[str, Any]:
+        """Return Anthropic tool definition for this tool"""
+        return {
+            "name": "get_course_outline",
+            "description": "Get the complete outline of a course including title, link, and all lessons with their numbers and titles",
+            "input_schema": {
+                "type": "object",
+                "properties": {
+                    "course_name": {
+                        "type": "string",
+                        "description": "Course title (partial matches work, e.g. 'MCP', 'Introduction')",
+                    }
+                },
+                "required": ["course_name"],
+            },
+        }
+
+    def execute(self, course_name: str) -> str:
+        """
+        Execute the outline retrieval tool.
+
+        Args:
+            course_name: Course name to get outline for
+
+        Returns:
+            Formatted course outline or error message
+        """
+        # Resolve course name using vector store's existing method
+        course_title = self.store._resolve_course_name(course_name)
+        if not course_title:
+            return f"No course found matching '{course_name}'"
+
+        # Get course metadata
+        try:
+            results = self.store.course_catalog.get(ids=[course_title])
+            if not results or not results["metadatas"]:
+                return f"Course metadata not found for '{course_title}'"
+
+            metadata = results["metadatas"][0]
+
+            # Parse lessons from JSON
+            import json
+
+            lessons_json = metadata.get("lessons_json")
+            if not lessons_json:
+                return f"No lesson information available for '{course_title}'"
+
+            lessons = json.loads(lessons_json)
+
+            # Format the outline with proper markdown
+            header = (
+                f"**Course Title:** {metadata.get('title', course_title)}\n\n"
+                f"**Course Link:** {metadata.get('course_link', 'N/A')}\n\n"
+                f"**Total Lessons:** {len(lessons)}\n\n"
+                f"**Lesson Outline:**\n"
+            )
+
+            lesson_lines = []
+            for lesson in lessons:
+                lesson_num = lesson.get("lesson_number", "N/A")
+                lesson_title = lesson.get("lesson_title", "N/A")
+                lesson_lines.append(f"- **Lesson {lesson_num}:** {lesson_title}")
+
+            return header + "\n".join(lesson_lines)
+
+        except Exception as e:
+            return f"Error retrieving course outline: {str(e)}"
+
+
 class ToolManager:
     """Manages available tools for the AI"""
-    
+
     def __init__(self):
         self.tools = {}
-    
+
     def register_tool(self, tool: Tool):
         """Register any tool that implements the Tool interface"""
         tool_def = tool.get_tool_definition()
@@ -127,28 +214,37 @@ def register_tool(self, tool: Tool):
             raise ValueError("Tool must have a 'name' in its definition")
         self.tools[tool_name] = tool
 
-    
     def get_tool_definitions(self) -> list:
         """Get all tool definitions for Anthropic tool calling"""
         return [tool.get_tool_definition() for tool in self.tools.values()]
-    
+
     def execute_tool(self, tool_name: str, **kwargs) -> str:
         """Execute a tool by name with given parameters"""
         if tool_name not in self.tools:
             return f"Tool '{tool_name}' not found"
-        
+
         return self.tools[tool_name].execute(**kwargs)
-    
+
     def get_last_sources(self) -> list:
         """Get sources from the last search operation"""
         # Check all tools for last_sources attribute
         for tool in self.tools.values():
-            if hasattr(tool, 'last_sources') and tool.last_sources:
+            if hasattr(tool, "last_sources") and tool.last_sources:
                 return tool.last_sources
         return []
 
+    def get_last_source_links(self) -> list:
+        """Return the first non-empty last_source_links found on a registered tool, or []."""
+        for registered in self.tools.values():
+            links = getattr(registered, "last_source_links", None)
+            if links:
+                return links
+        return []
+
     def reset_sources(self):
         """Reset sources from all tools that track sources"""
         for tool in self.tools.values():
-            if hasattr(tool, 'last_sources'):
-                tool.last_sources = []
\ No newline at end of file
+            if hasattr(tool, "last_sources"):
+                tool.last_sources = []
+            if hasattr(tool, "last_source_links"):
+                tool.last_source_links = []
diff --git a/backend/session_manager.py b/backend/session_manager.py
index a5a96b1a1..9e17f346b 100644
--- a/backend/session_manager.py
+++ b/backend/session_manager.py
@@ -1,61 +1,66 @@
 from typing import Dict, List, Optional
 from dataclasses import dataclass
 
+
 @dataclass
 class Message:
     """Represents a single message in a conversation"""
-    role: str     # "user" or "assistant"
+
+    role: str  # "user" or "assistant"
     content: str  # The message content
 
+
 class SessionManager:
     """Manages conversation sessions and message history"""
-    
+
     def __init__(self, max_history: int = 5):
         self.max_history = max_history
         self.sessions: Dict[str, List[Message]] = {}
         self.session_counter = 0
-    
+
     def create_session(self) -> str:
         """Create a new conversation session"""
         self.session_counter += 1
         session_id = f"session_{self.session_counter}"
         self.sessions[session_id] = []
         return session_id
-    
+
     def add_message(self, session_id: str, role: str, content: str):
         """Add a message to the conversation history"""
         if session_id not in self.sessions:
             self.sessions[session_id] = []
-        
+
         message = Message(role=role, content=content)
         self.sessions[session_id].append(message)
-        
+
         # Keep conversation history within limits
         if len(self.sessions[session_id]) > self.max_history * 2:
-            self.sessions[session_id] = self.sessions[session_id][-self.max_history * 2:]
-    
+            self.sessions[session_id] = self.sessions[session_id][
+                -self.max_history * 2 :
+            ]
+
     def add_exchange(self, session_id: str, user_message: str, assistant_message: str):
         """Add a complete question-answer exchange"""
         self.add_message(session_id, "user", user_message)
         self.add_message(session_id, "assistant", assistant_message)
-    
+
     def get_conversation_history(self, session_id: Optional[str]) -> Optional[str]:
         """Get formatted conversation history for a session"""
         if not session_id or session_id not in self.sessions:
             return None
-        
+
         messages = self.sessions[session_id]
         if not messages:
             return None
-        
+
         # Format messages for context
         formatted_messages = []
         for msg in messages:
             formatted_messages.append(f"{msg.role.title()}: {msg.content}")
-        
+
         return "\n".join(formatted_messages)
-    
+
     def clear_session(self, session_id: str):
         """Clear all messages from a session"""
         if session_id in self.sessions:
-            self.sessions[session_id] = []
\ No newline at end of file
+            self.sessions[session_id] = []
diff --git a/backend/tests/__init__.py b/backend/tests/__init__.py
new file mode 100644
index 000000000..e69de29bb
diff --git a/backend/tests/conftest.py b/backend/tests/conftest.py
new file mode 100644
index 000000000..1cdf8ab3c
--- /dev/null
+++ b/backend/tests/conftest.py
@@ -0,0 +1,43 @@
+import sys
+import os
+
+# Add backend and tests directories to path so imports work
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), ".."))
+sys.path.insert(0, os.path.dirname(__file__))
+
+import pytest
+from unittest.mock import MagicMock, patch
+from helpers import MockConfig, make_valid_search_results
+
+
+@pytest.fixture
+def mock_config():
+    """Return a new MockConfig populated with its default test values."""
+    return MockConfig()
+
+
+@pytest.fixture
+def mock_rag_system():
+    """MagicMock RAGSystem: canned session id, (answer, sources, links) query tuple, and analytics dict."""
+    rag = MagicMock()
+    rag.session_manager.create_session.return_value = "test-session-123"
+    rag.query.return_value = (
+        "This is a test answer.",
+        ["Source A", "Source B"],
+        ["http://example.com/a", "http://example.com/b"],
+    )
+    rag.get_course_analytics.return_value = {
+        "total_courses": 2,
+        "course_titles": ["Course A", "Course B"],
+    }
+    return rag
+
+
+@pytest.fixture
+def mock_vector_store():
+    """MagicMock VectorStore: reports two courses and returns two hits from search()."""
+    store = MagicMock()
+    store.get_course_count.return_value = 2
+    store.get_existing_course_titles.return_value = ["Course A", "Course B"]
+    store.search.return_value = make_valid_search_results(2)
+    return store
diff --git a/backend/tests/helpers.py b/backend/tests/helpers.py
new file mode 100644
index 000000000..9e3e9dcfa
--- /dev/null
+++ b/backend/tests/helpers.py
@@ -0,0 +1,67 @@
+"""Shared test helpers and factories."""
+
+import sys
+import os
+from dataclasses import dataclass
+from unittest.mock import MagicMock
+
+# Add backend to path so imports work
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), ".."))
+
+from vector_store import SearchResults
+
+
+@dataclass
+class MockConfig:  # fixed-value config stand-in for tests
+    ANTHROPIC_API_KEY: str = "test-key"  # placeholder, not a real credential
+    ANTHROPIC_MODEL: str = "claude-sonnet-4-20250514"
+    EMBEDDING_MODEL: str = "all-MiniLM-L6-v2"
+    CHUNK_SIZE: int = 800
+    CHUNK_OVERLAP: int = 100
+    MAX_RESULTS: int = 5
+    MAX_HISTORY: int = 2
+    CHROMA_PATH: str = "./test_chroma_db"  # relative path, distinct from any non-test default
+
+
+def make_search_results(documents=None, metadata=None, distances=None, error=None):
+    """Build a SearchResults; a truthy error short-circuits to SearchResults.empty(error)."""
+    if error:
+        return SearchResults.empty(error)
+    return SearchResults(
+        documents=documents or [],
+        metadata=metadata or [],
+        distances=distances or [],
+        error=None,
+    )
+
+
+def make_valid_search_results(n=2):
+    """Create n results; item i has course 'Course i', lesson_number i + 1 and distance 0.1 * (i + 1)."""
+    docs = [f"Content about topic {i}" for i in range(n)]
+    meta = [
+        {"course_title": f"Course {i}", "lesson_number": i + 1, "chunk_index": i}
+        for i in range(n)
+    ]
+    dists = [0.1 * (i + 1) for i in range(n)]
+    return SearchResults(documents=docs, metadata=meta, distances=dists)
+
+
+def make_anthropic_response(content_blocks, stop_reason="end_turn"):
+    """Build a MagicMock response whose content mirrors the given block dicts."""
+    response = MagicMock()
+    response.stop_reason = stop_reason
+    response.content = []
+
+    for spec in content_blocks:
+        kind = spec["type"]
+        item = MagicMock()
+        item.type = kind
+        # Only text and tool_use blocks get explicit fields; any other type
+        # keeps MagicMock's auto-created attributes.
+        if kind == "text":
+            item.text = spec["text"]
+        elif kind == "tool_use":
+            item.id, item.name, item.input = spec["id"], spec["name"], spec["input"]
+        response.content.append(item)
+
+    return response
diff --git a/backend/tests/test_ai_generator.py b/backend/tests/test_ai_generator.py
new file mode 100644
index 000000000..1769c71ab
--- /dev/null
+++ b/backend/tests/test_ai_generator.py
@@ -0,0 +1,421 @@
+"""Tests for AIGenerator tool calling and response handling."""
+
+import pytest
+import anthropic
+from unittest.mock import MagicMock, patch, call
+from helpers import make_anthropic_response
+from ai_generator import AIGenerator
+
+
+@pytest.fixture
+def generator():
+    # Construct while the Anthropic client class is patched; tests then stub gen.client.
+    with patch("ai_generator.anthropic.Anthropic"):
+        return AIGenerator(api_key="test-key", model="claude-sonnet-4-20250514")
+
+
+@pytest.fixture
+def tool_manager():
+    # Mock tool manager whose execute_tool returns one canned string by default.
+    canned = {"execute_tool.return_value": "Tool result: content about topic"}
+    return MagicMock(**canned)
+
+
+@pytest.fixture
+def sample_tools():  # one tool schema: search_course_content with a required "query" string
+    return [
+        {
+            "name": "search_course_content",
+            "description": "Search course materials",
+            "input_schema": {
+                "type": "object",
+                "properties": {"query": {"type": "string"}},
+                "required": ["query"],
+            },
+        }
+    ]
+
+
+class TestNoToolUsage:
+    def test_direct_text_response(self, generator, sample_tools):
+        """A text-only end_turn response is returned as its text, unchanged."""
+        response = make_anthropic_response(
+            [{"type": "text", "text": "Hello, I can help!"}],
+            stop_reason="end_turn",
+        )
+        generator.client.messages.create.return_value = response
+
+        result = generator.generate_response(query="hi", tools=sample_tools)
+
+        assert result == "Hello, I can help!"
+
+    def test_empty_content_returns_fallback(self, generator, sample_tools):
+        """When response.content is empty, returns a fallback message instead of crashing."""
+        response = make_anthropic_response([], stop_reason="end_turn")
+        response.content = []  # already [] from the factory; restated to make the precondition obvious
+        generator.client.messages.create.return_value = response
+
+        result = generator.generate_response(query="test", tools=sample_tools)
+
+        assert "able to generate a response" in result.lower()
+
+
+class TestSingleToolRound:
+    def test_tool_use_calls_tool_manager(self, generator, tool_manager, sample_tools):
+        """A tool_use block is dispatched to execute_tool(name, **input) exactly once."""
+        tool_response = make_anthropic_response(
+            [
+                {
+                    "type": "tool_use",
+                    "id": "t1",
+                    "name": "search_course_content",
+                    "input": {"query": "neural networks"},
+                }
+            ],
+            stop_reason="tool_use",
+        )
+        text_response = make_anthropic_response(
+            [{"type": "text", "text": "Neural networks are..."}],
+            stop_reason="end_turn",
+        )
+        generator.client.messages.create.side_effect = [
+            tool_response,
+            text_response,
+        ]
+
+        generator.generate_response(
+            query="what are neural networks",
+            tools=sample_tools,
+            tool_manager=tool_manager,
+        )
+
+        tool_manager.execute_tool.assert_called_once_with(
+            "search_course_content", query="neural networks"
+        )
+
+    def test_tool_use_then_synthesis(self, generator, tool_manager, sample_tools):
+        """A tool_use response followed by a text response yields that text after exactly 2 API calls."""
+        tool_response = make_anthropic_response(
+            [
+                {
+                    "type": "tool_use",
+                    "id": "t1",
+                    "name": "search_course_content",
+                    "input": {"query": "transformers"},
+                }
+            ],
+            stop_reason="tool_use",
+        )
+        synthesis_response = make_anthropic_response(
+            [{"type": "text", "text": "Transformers use attention mechanisms."}],
+            stop_reason="end_turn",
+        )
+        generator.client.messages.create.side_effect = [
+            tool_response,
+            synthesis_response,
+        ]
+
+        result = generator.generate_response(
+            query="explain transformers",
+            tools=sample_tools,
+            tool_manager=tool_manager,
+        )
+
+        assert result == "Transformers use attention mechanisms."
+        assert generator.client.messages.create.call_count == 2
+
+    def test_course_outline_returns_directly(
+        self, generator, tool_manager, sample_tools
+    ):
+        """get_course_outline tool result is returned directly without synthesis."""
+        outline_result = "**Course Title:** MCP\n- Lesson 1: Intro"
+        tool_manager.execute_tool.return_value = outline_result
+
+        tool_response = make_anthropic_response(
+            [
+                {
+                    "type": "tool_use",
+                    "id": "t1",
+                    "name": "get_course_outline",
+                    "input": {"course_name": "MCP"},
+                }
+            ],
+            stop_reason="tool_use",
+        )
+        generator.client.messages.create.return_value = tool_response
+
+        result = generator.generate_response(
+            query="outline of MCP",
+            tools=sample_tools,
+            tool_manager=tool_manager,
+        )
+
+        assert result == outline_result
+        # return_value (not side_effect) never runs out, so only this count catches an extra call
+        assert generator.client.messages.create.call_count == 1
+
+
+class TestMultiRoundToolCalling:
+    def test_two_rounds_of_tool_calls(self, generator, tool_manager, sample_tools):
+        """Two consecutive tool_use responses are both executed before the final text response."""
+        tool_response_1 = make_anthropic_response(
+            [
+                {
+                    "type": "tool_use",
+                    "id": "t1",
+                    "name": "search_course_content",
+                    "input": {"query": "round 1"},
+                }
+            ],
+            stop_reason="tool_use",
+        )
+        tool_response_2 = make_anthropic_response(
+            [
+                {
+                    "type": "tool_use",
+                    "id": "t2",
+                    "name": "search_course_content",
+                    "input": {"query": "round 2"},
+                }
+            ],
+            stop_reason="tool_use",
+        )
+        final_response = make_anthropic_response(
+            [{"type": "text", "text": "Final answer after 2 rounds."}],
+            stop_reason="end_turn",
+        )
+        generator.client.messages.create.side_effect = [
+            tool_response_1,
+            tool_response_2,
+            final_response,
+        ]
+
+        result = generator.generate_response(
+            query="complex question",
+            tools=sample_tools,
+            tool_manager=tool_manager,
+        )
+
+        assert result == "Final answer after 2 rounds."
+        # 2 tool rounds + 1 final synthesis = 3 API calls
+        assert generator.client.messages.create.call_count == 3
+        assert tool_manager.execute_tool.call_count == 2
+
+    def test_messages_accumulate_across_rounds(
+        self, generator, tool_manager, sample_tools
+    ):
+        """2nd API call's messages kwarg contains tool results from round 1."""
+        tool_manager.execute_tool.return_value = "Result from round 1"
+
+        tool_response_1 = make_anthropic_response(
+            [
+                {
+                    "type": "tool_use",
+                    "id": "t1",
+                    "name": "search_course_content",
+                    "input": {"query": "round 1"},
+                }
+            ],
+            stop_reason="tool_use",
+        )
+        text_response = make_anthropic_response(
+            [{"type": "text", "text": "Synthesized answer."}],
+            stop_reason="end_turn",
+        )
+        generator.client.messages.create.side_effect = [
+            tool_response_1,
+            text_response,
+        ]
+
+        generator.generate_response(
+            query="test query",
+            tools=sample_tools,
+            tool_manager=tool_manager,
+        )
+
+        # call_args_list[1] is the 2nd create() call; its [1] element is that call's kwargs dict
+        second_call_kwargs = generator.client.messages.create.call_args_list[1][1]
+        msgs = second_call_kwargs["messages"]
+
+        # Should be: user query, assistant tool_use, user tool_result
+        assert len(msgs) == 3
+        assert msgs[0] == {"role": "user", "content": "test query"}
+        assert msgs[1]["role"] == "assistant"
+        assert msgs[2]["role"] == "user"
+        # The tool_result content should contain our result
+        tool_result_content = msgs[2]["content"]
+        assert len(tool_result_content) == 1
+        assert tool_result_content[0]["type"] == "tool_result"
+        assert tool_result_content[0]["content"] == "Result from round 1"
+
+    def test_parallel_tool_calls_all_executed(
+        self, generator, tool_manager, sample_tools
+    ):
+        """When Claude calls 2 tools in one response, both execute."""
+        tool_manager.execute_tool.side_effect = ["Result A", "Result B"]
+
+        parallel_response = make_anthropic_response(
+            [
+                {
+                    "type": "tool_use",
+                    "id": "t1",
+                    "name": "search_course_content",
+                    "input": {"query": "topic A"},
+                },
+                {
+                    "type": "tool_use",
+                    "id": "t2",
+                    "name": "search_course_content",
+                    "input": {"query": "topic B"},
+                },
+            ],
+            stop_reason="tool_use",
+        )
+        synthesis_response = make_anthropic_response(
+            [{"type": "text", "text": "Combined answer."}],
+            stop_reason="end_turn",
+        )
+        generator.client.messages.create.side_effect = [
+            parallel_response,
+            synthesis_response,
+        ]
+
+        result = generator.generate_response(
+            query="compare topics",
+            tools=sample_tools,
+            tool_manager=tool_manager,
+        )
+
+        assert result == "Combined answer."
+        assert tool_manager.execute_tool.call_count == 2
+        tool_manager.execute_tool.assert_any_call(
+            "search_course_content", query="topic A"
+        )
+        tool_manager.execute_tool.assert_any_call(
+            "search_course_content", query="topic B"
+        )
+
+        # Both results must arrive, in tool-call order, in the last message of the 2nd request
+        second_call_msgs = generator.client.messages.create.call_args_list[1][1][
+            "messages"
+        ]
+        tool_results_msg = second_call_msgs[-1]["content"]
+        assert len(tool_results_msg) == 2
+        assert tool_results_msg[0]["content"] == "Result A"
+        assert tool_results_msg[1]["content"] == "Result B"
+
+    def test_parallel_tools_one_fails_still_returns_all_results(
+        self, generator, tool_manager, sample_tools
+    ):
+        """One tool fails -> error sent for that tool, successful result still included."""
+        tool_manager.execute_tool.side_effect = [
+            "Success result",
+            RuntimeError("Tool B crashed"),
+        ]
+
+        parallel_response = make_anthropic_response(
+            [
+                {
+                    "type": "tool_use",
+                    "id": "t1",
+                    "name": "search_course_content",
+                    "input": {"query": "good query"},
+                },
+                {
+                    "type": "tool_use",
+                    "id": "t2",
+                    "name": "search_course_content",
+                    "input": {"query": "bad query"},
+                },
+            ],
+            stop_reason="tool_use",
+        )
+        final_response = make_anthropic_response(
+            [{"type": "text", "text": "Partial answer with error context."}],
+            stop_reason="end_turn",
+        )
+        generator.client.messages.create.side_effect = [
+            parallel_response,
+            final_response,
+        ]
+
+        result = generator.generate_response(
+            query="multi tool query",
+            tools=sample_tools,
+            tool_manager=tool_manager,
+        )
+
+        assert isinstance(result, str)
+        # Both tools were attempted
+        assert tool_manager.execute_tool.call_count == 2
+
+        # The 2nd request's last message must carry one entry per tool: the success and the error
+        second_call_msgs = generator.client.messages.create.call_args_list[1][1][
+            "messages"
+        ]
+        tool_results_msg = second_call_msgs[-1]["content"]
+        assert len(tool_results_msg) == 2
+        # First tool succeeded
+        assert tool_results_msg[0]["content"] == "Success result"
+        assert "is_error" not in tool_results_msg[0]
+        # Second tool has error
+        assert "Error" in tool_results_msg[1]["content"]
+        assert tool_results_msg[1]["is_error"] is True
+
+
+class TestErrorHandling:
+    def test_tool_execution_exception_handled(
+        self, generator, tool_manager, sample_tools
+    ):
+        """When execute_tool raises, generate_response does not propagate it and still returns a str."""
+        tool_manager.execute_tool.side_effect = RuntimeError("Tool crashed")
+
+        tool_response = make_anthropic_response(
+            [
+                {
+                    "type": "tool_use",
+                    "id": "t1",
+                    "name": "search_course_content",
+                    "input": {"query": "test"},
+                }
+            ],
+            stop_reason="tool_use",
+        )
+        # Queued so that a follow-up create() call after the tool failure has a response to return
+        final_response = make_anthropic_response(
+            [{"type": "text", "text": "I encountered an error."}],
+            stop_reason="end_turn",
+        )
+        generator.client.messages.create.side_effect = [
+            tool_response,
+            final_response,
+        ]
+
+        result = generator.generate_response(
+            query="test", tools=sample_tools, tool_manager=tool_manager
+        )
+
+        # Only checks that the exception did not escape; the exact reply text is not pinned here
+        assert isinstance(result, str)
+
+    def test_api_exception_wrapped_as_runtime_error(self, generator, sample_tools):
+        """When client.messages.create() raises APIError, it's wrapped as RuntimeError with context."""
+        generator.client.messages.create.side_effect = anthropic.APIError(
+            message="rate limit exceeded",
+            request=MagicMock(),
+            body=None,
+        )
+
+        with pytest.raises(RuntimeError, match="Anthropic API error"):
+            generator.generate_response(query="test", tools=sample_tools)
+
+    def test_auth_exception_wrapped_with_context(self, generator, sample_tools):
+        """When client.messages.create() raises AuthenticationError, it's wrapped with auth context."""
+        generator.client.messages.create.side_effect = anthropic.AuthenticationError(
+            message="invalid api key",
+            response=MagicMock(status_code=401, headers={}),
+            body=None,
+        )
+
+        with pytest.raises(RuntimeError, match="authentication failed"):
+            generator.generate_response(query="test", tools=sample_tools)
diff --git a/backend/tests/test_api_endpoints.py b/backend/tests/test_api_endpoints.py
new file mode 100644
index 000000000..f7259a47b
--- /dev/null
+++ b/backend/tests/test_api_endpoints.py
@@ -0,0 +1,172 @@
+"""Tests for FastAPI API endpoints.
+
+Because the production app.py mounts static files from ../frontend (which
+doesn't exist in the test environment), we define a lightweight test app that
+mirrors the endpoint logic and wires in a mock RAGSystem.
+"""
+
+import pytest
+from unittest.mock import MagicMock
+from fastapi import FastAPI, HTTPException
+from fastapi.testclient import TestClient
+from pydantic import BaseModel
+from typing import List, Optional, Dict, Union
+
+
+# ---------------------------------------------------------------------------
+# Pydantic models (duplicated from app.py to avoid import side-effects)
+# ---------------------------------------------------------------------------
+
+class QueryRequest(BaseModel):  # request body for POST /api/query
+    query: str
+    session_id: Optional[str] = None  # when falsy, the query endpoint creates a session
+
+
+class QueryResponse(BaseModel):  # response body for POST /api/query
+    answer: str
+    sources: List[Union[str, Dict[str, str]]]  # plain strings or str-to-str dicts (e.g. title/link)
+    session_id: str
+
+
+class CourseStats(BaseModel):  # response body for GET /api/courses
+    total_courses: int
+    course_titles: List[str]
+
+
+class ClearSessionRequest(BaseModel):  # request body for POST /api/session/clear
+    session_id: str
+
+
+# ---------------------------------------------------------------------------
+# Test app factory
+# ---------------------------------------------------------------------------
+
+def _create_test_app(rag_system: MagicMock) -> FastAPI:
+    """Build a FastAPI app exposing /api/query, /api/courses and /api/session/clear backed by rag_system."""
+    test_app = FastAPI()
+
+    @test_app.post("/api/query", response_model=QueryResponse)
+    async def query_documents(request: QueryRequest):
+        try:
+            session_id = request.session_id
+            if not session_id:
+                session_id = rag_system.session_manager.create_session()
+            answer, sources, _links = rag_system.query(request.query, session_id)  # links are not returned
+            return QueryResponse(answer=answer, sources=sources, session_id=session_id)
+        except Exception as e:
+            raise HTTPException(status_code=500, detail=str(e))
+
+    @test_app.get("/api/courses", response_model=CourseStats)
+    async def get_course_stats():
+        try:
+            analytics = rag_system.get_course_analytics()
+            return CourseStats(
+                total_courses=analytics["total_courses"],
+                course_titles=analytics["course_titles"],
+            )
+        except Exception as e:
+            raise HTTPException(status_code=500, detail=str(e))
+
+    @test_app.post("/api/session/clear")
+    async def clear_session(request: ClearSessionRequest):
+        try:
+            rag_system.session_manager.clear_session(request.session_id)
+            return {"status": "success", "message": f"Session {request.session_id} cleared"}
+        except Exception as e:
+            raise HTTPException(status_code=500, detail=str(e))
+
+    return test_app
+
+
+# ---------------------------------------------------------------------------
+# Fixtures
+# ---------------------------------------------------------------------------
+
+@pytest.fixture
+def client(mock_rag_system):
+    """TestClient for a test app built around the mock_rag_system fixture."""
+    app = _create_test_app(mock_rag_system)
+    return TestClient(app)
+
+
+# ---------------------------------------------------------------------------
+# /api/query
+# ---------------------------------------------------------------------------
+
+class TestQueryEndpoint:
+    def test_query_with_session_id(self, client, mock_rag_system):
+        resp = client.post("/api/query", json={"query": "What is RAG?", "session_id": "s1"})
+        assert resp.status_code == 200
+        data = resp.json()  # answer and sources come from the mock_rag_system query stub
+        assert data["answer"] == "This is a test answer."
+        assert data["sources"] == ["Source A", "Source B"]
+        assert data["session_id"] == "s1"
+        mock_rag_system.query.assert_called_once_with("What is RAG?", "s1")
+
+    def test_query_creates_session_when_missing(self, client, mock_rag_system):
+        resp = client.post("/api/query", json={"query": "Hello"})
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["session_id"] == "test-session-123"  # id stubbed on create_session
+        mock_rag_system.session_manager.create_session.assert_called_once()
+
+    def test_query_returns_dict_sources(self, client, mock_rag_system):
+        mock_rag_system.query.return_value = (
+            "Answer",
+            [{"title": "Lesson 1", "link": "http://example.com"}],
+            [],
+        )
+        resp = client.post("/api/query", json={"query": "test"})
+        assert resp.status_code == 200
+        assert resp.json()["sources"] == [{"title": "Lesson 1", "link": "http://example.com"}]
+
+    def test_query_missing_body_returns_422(self, client):
+        resp = client.post("/api/query", json={})  # body is present, but the required "query" is absent
+        assert resp.status_code == 422
+
+    def test_query_rag_error_returns_500(self, client, mock_rag_system):
+        mock_rag_system.query.side_effect = RuntimeError("boom")
+        resp = client.post("/api/query", json={"query": "fail", "session_id": "s1"})
+        assert resp.status_code == 500
+        assert "boom" in resp.json()["detail"]  # detail is str(e) of the raised error
+
+
+# ---------------------------------------------------------------------------
+# /api/courses
+# ---------------------------------------------------------------------------
+
+class TestCoursesEndpoint:
+    def test_get_courses(self, client):
+        resp = client.get("/api/courses")
+        assert resp.status_code == 200
+        data = resp.json()  # values come from the get_course_analytics stub on mock_rag_system
+        assert data["total_courses"] == 2
+        assert data["course_titles"] == ["Course A", "Course B"]
+
+    def test_courses_error_returns_500(self, client, mock_rag_system):
+        mock_rag_system.get_course_analytics.side_effect = RuntimeError("db down")
+        resp = client.get("/api/courses")
+        assert resp.status_code == 500
+        assert "db down" in resp.json()["detail"]  # detail is str(e) of the raised error
+
+
+# ---------------------------------------------------------------------------
+# /api/session/clear
+# ---------------------------------------------------------------------------
+
+class TestClearSessionEndpoint:
+    def test_clear_session_success(self, client, mock_rag_system):
+        resp = client.post("/api/session/clear", json={"session_id": "s1"})
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["status"] == "success"
+        mock_rag_system.session_manager.clear_session.assert_called_once_with("s1")
+
+    def test_clear_session_missing_id_returns_422(self, client):
+        resp = client.post("/api/session/clear", json={})  # required "session_id" is absent
+        assert resp.status_code == 422
+
+    def test_clear_session_error_returns_500(self, client, mock_rag_system):
+        mock_rag_system.session_manager.clear_session.side_effect = KeyError("no session")
+        resp = client.post("/api/session/clear", json={"session_id": "bad"})
+        assert resp.status_code == 500  # the endpoint maps any exception from clear_session to HTTP 500
diff --git a/backend/tests/test_rag_integration.py b/backend/tests/test_rag_integration.py
new file mode 100644
index 000000000..41ad8463d
--- /dev/null
+++ b/backend/tests/test_rag_integration.py
@@ -0,0 +1,108 @@
+"""Tests for RAG system query pipeline with mocked dependencies."""
+
+import pytest
+from unittest.mock import MagicMock, patch
+
+
+class TestRAGQueryPipeline:
+    """Test the full query pipeline with mocked external dependencies."""
+
+    @pytest.fixture
+    def mock_deps(self):
+        """Set up mocked RAG system with all dependencies mocked."""
+        with (
+            patch("rag_system.DocumentProcessor"),
+            patch("rag_system.VectorStore"),
+            patch("rag_system.AIGenerator"),
+            patch("rag_system.SessionManager"),
+            patch("rag_system.CourseSearchTool"),
+            patch("rag_system.CourseOutlineTool"),
+            patch("rag_system.ToolManager") as mock_tm_cls,
+        ):
+            from rag_system import RAGSystem
+            from helpers import MockConfig
+
+            config = MockConfig()
+            rag = RAGSystem(config)
+
+            # rag.tool_manager is now a MagicMock instance
+            rag.ai_generator.generate_response.return_value = "This is the answer."
+            rag.tool_manager.get_last_sources.return_value = ["Course A - Lesson 1"]
+            rag.tool_manager.get_last_source_links.return_value = [
+                "https://example.com/1"
+            ]
+            rag.session_manager.get_conversation_history.return_value = None
+
+            yield rag
+
+    def test_query_returns_response_and_sources(self, mock_deps):
+        """Happy path: returns (answer, sources, source_links) tuple."""
+        rag = mock_deps
+
+        response, sources, source_links = rag.query("What is MCP?")
+
+        assert response == "This is the answer."
+        assert sources == ["Course A - Lesson 1"]
+        assert source_links == ["https://example.com/1"]
+
+    def test_query_passes_tools_to_generator(self, mock_deps):
+        """get_tool_definitions() is passed to ai_generator.generate_response()."""
+        rag = mock_deps
+        rag.tool_manager.get_tool_definitions.return_value = [
+            {"name": "search_course_content"}
+        ]
+
+        rag.query("test question")
+
+        call_kwargs = rag.ai_generator.generate_response.call_args
+        assert call_kwargs.kwargs["tools"] == [{"name": "search_course_content"}]
+
+    def test_query_passes_tool_manager(self, mock_deps):
+        """tool_manager instance is passed to generator for tool dispatch."""
+        rag = mock_deps
+
+        rag.query("test question")
+
+        call_kwargs = rag.ai_generator.generate_response.call_args
+        assert call_kwargs.kwargs["tool_manager"] is rag.tool_manager
+
+    def test_query_collects_sources_after_response(self, mock_deps):
+        """Sources retrieved via get_last_sources() after generation."""
+        rag = mock_deps
+
+        rag.query("test")
+
+        gen_call_order = rag.ai_generator.generate_response.call_args_list
+        src_call_order = rag.tool_manager.get_last_sources.call_args_list
+        assert len(gen_call_order) == 1
+        assert len(src_call_order) == 1
+
+    def test_query_resets_sources(self, mock_deps):
+        """reset_sources() called after source collection."""
+        rag = mock_deps
+
+        rag.query("test")
+
+        rag.tool_manager.reset_sources.assert_called_once()
+
+    def test_query_exception_propagates_to_caller(self, mock_deps):
+        """When generator raises, exception propagates (no try/except in query())."""
+        rag = mock_deps
+        rag.ai_generator.generate_response.side_effect = Exception("API auth failed")
+
+        with pytest.raises(Exception, match="API auth failed"):
+            rag.query("test question")
+
+    def test_query_with_session_passes_history(self, mock_deps):
+        """Session history is passed as conversation_history parameter."""
+        rag = mock_deps
+        rag.session_manager.get_conversation_history.return_value = (
+            "User: hi\nAssistant: hello"
+        )
+
+        rag.query("follow up question", session_id="session_1")
+
+        call_kwargs = rag.ai_generator.generate_response.call_args
+        assert (
+            call_kwargs.kwargs["conversation_history"] == "User: hi\nAssistant: hello"
+        )
diff --git a/backend/tests/test_search_tools.py b/backend/tests/test_search_tools.py
new file mode 100644
index 000000000..ce6da52a6
--- /dev/null
+++ b/backend/tests/test_search_tools.py
@@ -0,0 +1,114 @@
+"""Tests for CourseSearchTool.execute() and ToolManager dispatch."""
+
+import pytest
+from unittest.mock import MagicMock, patch
+from helpers import make_search_results, make_valid_search_results
+from search_tools import CourseSearchTool, ToolManager
+from vector_store import SearchResults
+
+
+@pytest.fixture
+def mock_store():
+    store = MagicMock()
+    store.get_lesson_link = MagicMock(return_value="https://example.com/lesson")
+    return store
+
+
+@pytest.fixture
+def search_tool(mock_store):
+    return CourseSearchTool(mock_store)
+
+
+@pytest.fixture
+def tool_manager(search_tool):
+    tm = ToolManager()
+    tm.register_tool(search_tool)
+    return tm
+
+
+class TestCourseSearchToolExecute:
+    def test_execute_returns_formatted_results(self, search_tool, mock_store):
+        """Valid search results are formatted as [Course - Lesson N]\\ncontent."""
+        results = make_valid_search_results(2)
+        mock_store.search.return_value = results
+
+        output = search_tool.execute(query="test query")
+
+        assert "[Course 0 - Lesson 1]" in output
+        assert "Content about topic 0" in output
+        assert "[Course 1 - Lesson 2]" in output
+        assert "Content about topic 1" in output
+
+    def test_execute_populates_sources(self, search_tool, mock_store):
+        """last_sources and last_source_links are populated after execution."""
+        results = make_valid_search_results(2)
+        mock_store.search.return_value = results
+
+        search_tool.execute(query="test query")
+
+        assert len(search_tool.last_sources) == 2
+        assert "Course 0 - Lesson 1" in search_tool.last_sources
+        assert len(search_tool.last_source_links) == 2
+
+    def test_execute_error_from_search(self, search_tool, mock_store):
+        """When SearchResults.error is set, execute returns the error string."""
+        mock_store.search.return_value = make_search_results(
+            error="No course found matching 'xyz'"
+        )
+
+        output = search_tool.execute(query="test", course_name="xyz")
+
+        assert "No course found matching 'xyz'" in output
+
+    def test_execute_empty_results(self, search_tool, mock_store):
+        """When no documents found, returns 'No relevant content found'."""
+        mock_store.search.return_value = make_search_results()
+
+        output = search_tool.execute(query="nonexistent topic")
+
+        assert "No relevant content found" in output
+
+    def test_execute_empty_with_filters(self, search_tool, mock_store):
+        """Empty results with course_name/lesson filters include filter info."""
+        mock_store.search.return_value = make_search_results()
+
+        output = search_tool.execute(query="topic", course_name="MCP", lesson_number=3)
+
+        assert "in course 'MCP'" in output
+        assert "in lesson 3" in output
+
+    def test_execute_exception_propagates(self, search_tool, mock_store):
+        """When store.search() raises, exception propagates (not caught)."""
+        mock_store.search.side_effect = RuntimeError("DB connection failed")
+
+        with pytest.raises(RuntimeError, match="DB connection failed"):
+            search_tool.execute(query="test")
+
+    def test_tool_definition_schema(self, search_tool):
+        """Tool definition has correct name, required params, schema."""
+        defn = search_tool.get_tool_definition()
+
+        assert defn["name"] == "search_course_content"
+        assert defn["input_schema"]["required"] == ["query"]
+        assert "query" in defn["input_schema"]["properties"]
+        assert "course_name" in defn["input_schema"]["properties"]
+        assert "lesson_number" in defn["input_schema"]["properties"]
+
+
+class TestToolManager:
+    def test_dispatches_correctly(self, tool_manager, mock_store):
+        """ToolManager.execute_tool dispatches to the right tool."""
+        mock_store.search.return_value = make_valid_search_results(1)
+
+        result = tool_manager.execute_tool("search_course_content", query="test query")
+
+        mock_store.search.assert_called_once_with(
+            query="test query", course_name=None, lesson_number=None
+        )
+        assert "[Course 0 - Lesson 1]" in result
+
+    def test_unknown_tool_returns_error(self, tool_manager):
+        """Unknown tool name returns error string, not exception."""
+        result = tool_manager.execute_tool("nonexistent_tool", query="test")
+
+        assert "not found" in result.lower()
diff --git a/backend/vector_store.py b/backend/vector_store.py
index 390abe71c..c14e2f03c 100644
--- a/backend/vector_store.py
+++ b/backend/vector_store.py
@@ -5,73 +5,88 @@
 from models import Course, CourseChunk
 from sentence_transformers import SentenceTransformer
 
+
 @dataclass
 class SearchResults:
     """Container for search results with metadata"""
+
     documents: List[str]
     metadata: List[Dict[str, Any]]
     distances: List[float]
     error: Optional[str] = None
-    
+
     @classmethod
-    def from_chroma(cls, chroma_results: Dict) -> 'SearchResults':
+    def from_chroma(cls, chroma_results: Dict) -> "SearchResults":
         """Create SearchResults from ChromaDB query results"""
         return cls(
-            documents=chroma_results['documents'][0] if chroma_results['documents'] else [],
-            metadata=chroma_results['metadatas'][0] if chroma_results['metadatas'] else [],
-            distances=chroma_results['distances'][0] if chroma_results['distances'] else []
+            documents=(
+                chroma_results["documents"][0] if chroma_results["documents"] else []
+            ),
+            metadata=(
+                chroma_results["metadatas"][0] if chroma_results["metadatas"] else []
+            ),
+            distances=(
+                chroma_results["distances"][0] if chroma_results["distances"] else []
+            ),
         )
-    
+
     @classmethod
-    def empty(cls, error_msg: str) -> 'SearchResults':
+    def empty(cls, error_msg: str) -> "SearchResults":
         """Create empty results with error message"""
         return cls(documents=[], metadata=[], distances=[], error=error_msg)
-    
+
     def is_empty(self) -> bool:
         """Check if results are empty"""
         return len(self.documents) == 0
 
+
 class VectorStore:
     """Vector storage using ChromaDB for course content and metadata"""
-    
+
     def __init__(self, chroma_path: str, embedding_model: str, max_results: int = 5):
         self.max_results = max_results
         # Initialize ChromaDB client
         self.client = chromadb.PersistentClient(
-            path=chroma_path,
-            settings=Settings(anonymized_telemetry=False)
+            path=chroma_path, settings=Settings(anonymized_telemetry=False)
         )
-        
+
         # Set up sentence transformer embedding function
-        self.embedding_function = chromadb.utils.embedding_functions.SentenceTransformerEmbeddingFunction(
-            model_name=embedding_model
+        self.embedding_function = (
+            chromadb.utils.embedding_functions.SentenceTransformerEmbeddingFunction(
+                model_name=embedding_model
+            )
         )
-        
+
         # Create collections for different types of data
-        self.course_catalog = self._create_collection("course_catalog")  # Course titles/instructors
-        self.course_content = self._create_collection("course_content")  # Actual course material
-    
+        self.course_catalog = self._create_collection(
+            "course_catalog"
+        )  # Course titles/instructors
+        self.course_content = self._create_collection(
+            "course_content"
+        )  # Actual course material
+
     def _create_collection(self, name: str):
         """Create or get a ChromaDB collection"""
         return self.client.get_or_create_collection(
-            name=name,
-            embedding_function=self.embedding_function
+            name=name, embedding_function=self.embedding_function
         )
-    
-    def search(self, 
-               query: str,
-               course_name: Optional[str] = None,
-               lesson_number: Optional[int] = None,
-               limit: Optional[int] = None) -> SearchResults:
+
+    def search(
+        self,
+        query: str,
+        course_name: Optional[str] = None,
+        lesson_number: Optional[int] = None,
+        limit: Optional[int] = None,
+    ) -> SearchResults:
         """
         Main search interface that handles course resolution and content search.
-        
+
         Args:
             query: What to search for in course content
             course_name: Optional course name/title to filter by
             lesson_number: Optional lesson number to filter by
             limit: Maximum results to return
-            
+
         Returns:
             SearchResults object with documents and metadata
         """
@@ -81,104 +96,111 @@ def search(self,
             course_title = self._resolve_course_name(course_name)
             if not course_title:
                 return SearchResults.empty(f"No course found matching '{course_name}'")
-        
+
         # Step 2: Build filter for content search
         filter_dict = self._build_filter(course_title, lesson_number)
-        
+
         # Step 3: Search course content
         # Use provided limit or fall back to configured max_results
         search_limit = limit if limit is not None else self.max_results
-        
+
         try:
             results = self.course_content.query(
-                query_texts=[query],
-                n_results=search_limit,
-                where=filter_dict
+                query_texts=[query], n_results=search_limit, where=filter_dict
             )
             return SearchResults.from_chroma(results)
         except Exception as e:
             return SearchResults.empty(f"Search error: {str(e)}")
-    
+
     def _resolve_course_name(self, course_name: str) -> Optional[str]:
         """Use vector search to find best matching course by name"""
         try:
-            results = self.course_catalog.query(
-                query_texts=[course_name],
-                n_results=1
-            )
-            
-            if results['documents'][0] and results['metadatas'][0]:
+            results = self.course_catalog.query(query_texts=[course_name], n_results=1)
+
+            if results["documents"][0] and results["metadatas"][0]:
                 # Return the title (which is now the ID)
-                return results['metadatas'][0][0]['title']
+                return results["metadatas"][0][0]["title"]
         except Exception as e:
             print(f"Error resolving course name: {e}")
-        
+
         return None
-    
-    def _build_filter(self, course_title: Optional[str], lesson_number: Optional[int]) -> Optional[Dict]:
+
+    def _build_filter(
+        self, course_title: Optional[str], lesson_number: Optional[int]
+    ) -> Optional[Dict]:
         """Build ChromaDB filter from search parameters"""
         if not course_title and lesson_number is None:
             return None
-            
+
         # Handle different filter combinations
         if course_title and lesson_number is not None:
-            return {"$and": [
-                {"course_title": course_title},
-                {"lesson_number": lesson_number}
-            ]}
-        
+            return {
+                "$and": [
+                    {"course_title": course_title},
+                    {"lesson_number": lesson_number},
+                ]
+            }
+
         if course_title:
             return {"course_title": course_title}
-            
+
         return {"lesson_number": lesson_number}
-    
+
     def add_course_metadata(self, course: Course):
         """Add course information to the catalog for semantic search"""
         import json
 
         course_text = course.title
-        
+
         # Build lessons metadata and serialize as JSON string
         lessons_metadata = []
         for lesson in course.lessons:
-            lessons_metadata.append({
-                "lesson_number": lesson.lesson_number,
-                "lesson_title": lesson.title,
-                "lesson_link": lesson.lesson_link
-            })
-        
+            lessons_metadata.append(
+                {
+                    "lesson_number": lesson.lesson_number,
+                    "lesson_title": lesson.title,
+                    "lesson_link": lesson.lesson_link,
+                }
+            )
+
         self.course_catalog.add(
             documents=[course_text],
-            metadatas=[{
-                "title": course.title,
-                "instructor": course.instructor,
-                "course_link": course.course_link,
-                "lessons_json": json.dumps(lessons_metadata),  # Serialize as JSON string
-                "lesson_count": len(course.lessons)
-            }],
-            ids=[course.title]
+            metadatas=[
+                {
+                    "title": course.title,
+                    "instructor": course.instructor,
+                    "course_link": course.course_link,
+                    "lessons_json": json.dumps(
+                        lessons_metadata
+                    ),  # Serialize as JSON string
+                    "lesson_count": len(course.lessons),
+                }
+            ],
+            ids=[course.title],
         )
-    
+
     def add_course_content(self, chunks: List[CourseChunk]):
         """Add course content chunks to the vector store"""
         if not chunks:
             return
-        
+
         documents = [chunk.content for chunk in chunks]
-        metadatas = [{
-            "course_title": chunk.course_title,
-            "lesson_number": chunk.lesson_number,
-            "chunk_index": chunk.chunk_index
-        } for chunk in chunks]
+        metadatas = [
+            {
+                "course_title": chunk.course_title,
+                "lesson_number": chunk.lesson_number,
+                "chunk_index": chunk.chunk_index,
+            }
+            for chunk in chunks
+        ]
         # Use title with chunk index for unique IDs
-        ids = [f"{chunk.course_title.replace(' ', '_')}_{chunk.chunk_index}" for chunk in chunks]
-        
-        self.course_content.add(
-            documents=documents,
-            metadatas=metadatas,
-            ids=ids
-        )
-    
+        ids = [
+            f"{chunk.course_title.replace(' ', '_')}_{chunk.chunk_index}"
+            for chunk in chunks
+        ]
+
+        self.course_content.add(documents=documents, metadatas=metadatas, ids=ids)
+
     def clear_all_data(self):
         """Clear all data from both collections"""
         try:
@@ -189,43 +211,46 @@ def clear_all_data(self):
             self.course_content = self._create_collection("course_content")
         except Exception as e:
             print(f"Error clearing data: {e}")
-    
+
     def get_existing_course_titles(self) -> List[str]:
         """Get all existing course titles from the vector store"""
         try:
             # Get all documents from the catalog
             results = self.course_catalog.get()
-            if results and 'ids' in results:
-                return results['ids']
+            if results and "ids" in results:
+                return results["ids"]
             return []
         except Exception as e:
             print(f"Error getting existing course titles: {e}")
             return []
-    
+
     def get_course_count(self) -> int:
         """Get the total number of courses in the vector store"""
         try:
             results = self.course_catalog.get()
-            if results and 'ids' in results:
-                return len(results['ids'])
+            if results and "ids" in results:
+                return len(results["ids"])
             return 0
         except Exception as e:
             print(f"Error getting course count: {e}")
             return 0
-    
+
     def get_all_courses_metadata(self) -> List[Dict[str, Any]]:
         """Get metadata for all courses in the vector store"""
         import json
+
         try:
             results = self.course_catalog.get()
-            if results and 'metadatas' in results:
+            if results and "metadatas" in results:
                 # Parse lessons JSON for each course
                 parsed_metadata = []
-                for metadata in results['metadatas']:
+                for metadata in results["metadatas"]:
                     course_meta = metadata.copy()
-                    if 'lessons_json' in course_meta:
-                        course_meta['lessons'] = json.loads(course_meta['lessons_json'])
-                        del course_meta['lessons_json']  # Remove the JSON string version
+                    if "lessons_json" in course_meta:
+                        course_meta["lessons"] = json.loads(course_meta["lessons_json"])
+                        del course_meta[
+                            "lessons_json"
+                        ]  # Remove the JSON string version
                     parsed_metadata.append(course_meta)
                 return parsed_metadata
             return []
@@ -238,30 +263,67 @@ def get_course_link(self, course_title: str) -> Optional[str]:
         try:
             # Get course by ID (title is the ID)
             results = self.course_catalog.get(ids=[course_title])
-            if results and 'metadatas' in results and results['metadatas']:
-                metadata = results['metadatas'][0]
-                return metadata.get('course_link')
+            if results and "metadatas" in results and results["metadatas"]:
+                metadata = results["metadatas"][0]
+                return metadata.get("course_link")
             return None
         except Exception as e:
             print(f"Error getting course link: {e}")
             return None
-    
+
     def get_lesson_link(self, course_title: str, lesson_number: int) -> Optional[str]:
         """Get lesson link for a given course title and lesson number"""
         import json
+
         try:
             # Get course by ID (title is the ID)
             results = self.course_catalog.get(ids=[course_title])
-            if results and 'metadatas' in results and results['metadatas']:
-                metadata = results['metadatas'][0]
-                lessons_json = metadata.get('lessons_json')
+            if results and "metadatas" in results and results["metadatas"]:
+                metadata = results["metadatas"][0]
+                lessons_json = metadata.get("lessons_json")
                 if lessons_json:
                     lessons = json.loads(lessons_json)
                     # Find the lesson with matching number
                     for lesson in lessons:
-                        if lesson.get('lesson_number') == lesson_number:
-                            return lesson.get('lesson_link')
+                        if lesson.get("lesson_number") == lesson_number:
+                            return lesson.get("lesson_link")
             return None
         except Exception as e:
             print(f"Error getting lesson link: {e}")
-    
\ No newline at end of file
+            return None
+
+    def get_course_outline(self, course_name: str) -> Optional[Dict[str, Any]]:
+        """
+        Get the complete outline of a course including all lessons.
+
+        Args:
+            course_name: Course name or partial name (fuzzy matching supported)
+
+        Returns:
+            Dictionary with course_title, course_link, and lessons list, or None if not found
+        """
+        import json
+
+        # Resolve course name using fuzzy matching
+        course_title = self._resolve_course_name(course_name)
+        if not course_title:
+            return None
+
+        try:
+            # Get course metadata by ID (title is the ID)
+            results = self.course_catalog.get(ids=[course_title])
+            if results and "metadatas" in results and results["metadatas"]:
+                metadata = results["metadatas"][0]
+                lessons_json = metadata.get("lessons_json")
+
+                if lessons_json:
+                    lessons = json.loads(lessons_json)
+                    return {
+                        "course_title": metadata.get("title"),
+                        "course_link": metadata.get("course_link"),
+                        "lessons": lessons,
+                    }
+            return None
+        except Exception as e:
+            print(f"Error getting course outline: {e}")
+            return None
diff --git a/frontend-changes.md b/frontend-changes.md
new file mode 100644
index 000000000..3371786fd
--- /dev/null
+++ b/frontend-changes.md
@@ -0,0 +1,165 @@
+# Frontend Changes
+
+## Change 1: Dark/Light Theme Toggle Button
+
+### Summary
+Added a theme toggle button (sun/moon icons) in the top-right corner that switches between dark and light modes with smooth CSS transitions. User preference is persisted via `localStorage`.
+
+### Files Changed
+
+#### `frontend/index.html`
+- Added a `<button id="themeToggle">` with inline SVG sun and moon icons, positioned before the `<header>` element inside `.container`
+- Includes `aria-label` and `title` for accessibility
+
+### Design Details
+- **Position**: Fixed top-right (`top: 1rem; right: 1rem; z-index: 100`)
+- **Icons**: Sun icon shown in light mode, moon icon shown in dark mode; swap uses opacity + rotation animation
+- **Default**: Dark mode (matches existing design)
+
+---
+
+## Change 2: Light Theme CSS Variables (Accessibility & Contrast Improvements)
+
+### Summary
+Improved the light theme color palette for proper contrast, readability, and WCAG AA compliance. Added new CSS variables to replace all hardcoded color values, ensuring every UI element adapts correctly across both themes.
+
+### Files Changed
+
+#### `frontend/style.css`
+
+**New CSS variables added to `:root` (dark theme defaults):**
+- `--user-message-text` — user bubble text color (`#ffffff`)
+- `--welcome-shadow` — shadow for the welcome message card
+- `--error-bg`, `--error-text`, `--error-border` — error message theming
+- `--success-bg`, `--success-text`, `--success-border` — success message theming
+- `--source-link-bg`, `--source-link-border` — source link chip background/border
+- `--source-visited`, `--source-visited-bg`, `--source-visited-border` — visited source link colors
+
+**Light theme `[data-theme="light"]` variable improvements:**
+- `--primary-color`: `#2563eb` → `#1d4ed8` (darker blue for better contrast on white)
+- `--primary-hover`: `#1d4ed8` → `#1e40af` (deeper hover state)
+- `--text-primary`: `#1e293b` → `#0f172a` (near-black, ~17.9:1 contrast ratio on white)
+- `--text-secondary`: `#64748b` → `#475569` (darkened from ~4.6:1 to ~7:1 contrast ratio, comfortably passes WCAG AA)
+- `--border-color`: `#e2e8f0` → `#cbd5e1` (more visible borders)
+- `--welcome-border`: `#2563eb` → `#93bbfd` (softer accent for light bg)
+- `--welcome-shadow`: lighter shadow appropriate for light backgrounds
+- `--error-text`: `#f87171` → `#dc2626` (high-contrast red for light backgrounds)
+- `--success-text`: `#4ade80` → `#16a34a` (high-contrast green for light backgrounds)
+- `--error-bg`/`--success-bg`: solid light tints instead of low-opacity dark overlays
+
+**Bug fix:**
+- `.message-content blockquote` — `var(--primary)` (undefined) → `var(--primary-color)`
+
+### Accessibility Notes
+- Light-theme contrast ratios, computed with the WCAG relative-luminance formula (AA requires 4.5:1 for normal text, 3:1 for large text):
+  - `--text-primary` (#0f172a) on `--background` (#f8fafc): **17.1:1**
+  - `--text-secondary` (#475569) on `--background` (#f8fafc): **7.2:1**
+  - `--text-secondary` (#475569) on `--surface` (#ffffff): **7.6:1**
+  - `--error-text` (#dc2626) on `--error-bg` (#fef2f2): **4.4:1** (just below AA for normal text)
+  - `--success-text` (#16a34a) on `--success-bg` (#f0fdf4): **3.1:1** (meets AA only for large text)
+  - `--user-message-text` (#ffffff) on `--user-message` (#2563eb): **5.2:1**
+
+---
+
+## Change 3: JavaScript Toggle Functionality & Smooth Transitions
+
+### Summary
+Rewrote the theme toggle JavaScript for production-quality behavior: eliminated the flash of wrong theme on page load (FOUC), added OS color scheme detection, dynamic aria-labels, a keyboard shortcut, and expanded the CSS transition coverage to all themed elements.
+
+### Files Changed
+
+#### `frontend/index.html`
+- Added an inline `<script>` in `<head>` (before CSS renders) that applies the saved theme **before first paint**, preventing any flash of the wrong theme
+- The inline script also adds a `.no-transitions` class to `<html>` to suppress CSS transition animations during initial load
+- Falls back to `prefers-color-scheme` OS preference when no saved theme exists
+
+#### `frontend/script.js`
+
+**Refactored theme system into 5 focused functions:**
+
+| Function | Purpose |
+|---|---|
+| `initTheme()` | Removes `.no-transitions` class after paint (double-`requestAnimationFrame`), sets initial aria-label, registers OS preference listener and keyboard shortcut |
+| `getCurrentTheme()` | Reads current theme from `data-theme` attribute (returns `'light'` or `'dark'`) |
+| `applyTheme(theme, save)` | Sets/removes `data-theme` attribute, updates `<meta name="color-scheme">`, and optionally persists to `localStorage` |
+| `toggleTheme()` | Flips the current theme and saves |
+| `updateToggleLabel()` | Dynamically sets `aria-label` and `title` on the toggle button to reflect the *action* it will perform (e.g., "Switch to light mode") |
+
+**Key behaviors:**
+
+1. **No FOUC**: Theme is applied by inline `<script>` in `<head>` before the browser paints
+2. **No transition on load**: `.no-transitions` class suppresses all CSS transitions during initial render
+3. **OS preference detection**: Respects `prefers-color-scheme` when no saved preference exists; live listener updates in real time
+4. **Dynamic aria-label**: Describes the *action* (e.g., "Switch to dark mode (Ctrl+Shift+L)")
+5. **Keyboard shortcut**: `Ctrl+Shift+L` toggles the theme from anywhere
+
+#### `frontend/style.css`
+
+**Added `.no-transitions` suppression rule and expanded transition coverage to all themed elements.**
+
+---
+
+## Change 4: Full CSS Variable Coverage & Cross-Browser Theme Support
+
+### Summary
+Eliminated all remaining hardcoded `[data-theme="light"]`-specific CSS overrides by moving them into the CSS variable system. Added `color-scheme` support for browser-native elements, Firefox scrollbar theming, text selection styling, and a `<meta name="color-scheme">` tag for browser chrome adaptation.
+
+### Files Changed
+
+#### `frontend/index.html`
+- Added `<meta name="color-scheme" content="dark light">` in `<head>` — tells the browser to render native UI (scrollbars, form controls, autofill) in the matching theme
+- Inline `<script>` now also updates this meta tag to match the resolved theme before first paint
+- Bumped cache-busting versions to CSS `v=14`, JS `v=12`
+
+#### `frontend/script.js`
+- `applyTheme()` now updates `<meta name="color-scheme">` content to `'light'` or `'dark'` whenever the theme changes, keeping browser chrome in sync
+
+#### `frontend/style.css`
+
+**New CSS variables added to both `:root` and `[data-theme="light"]`:**
+
+| Variable | Dark Value | Light Value | Purpose |
+|---|---|---|---|
+| `--surface-alt` | `#0f172a` | `#f1f5f9` | Alternate surface for cards inside surfaces (stat items) |
+| `--assistant-message-bg` | `#1e293b` | `#f1f5f9` | Assistant message bubble background |
+| `--assistant-message-border` | `transparent` | `#cbd5e1` | Assistant message bubble border (visible in light theme) |
+| `--sidebar-shadow` | `none` | `2px 0 8px rgba(0,0,0,0.04)` | Depth shadow for sidebar |
+| `--input-bg` | `#1e293b` | `#ffffff` | Chat input field background |
+| `--scrollbar-thumb` | `#334155` | `#cbd5e1` | Scrollbar thumb color |
+| `--scrollbar-thumb-hover` | `#94a3b8` | `#94a3b8` | Scrollbar thumb hover |
+| `--scrollbar-track` | `#1e293b` | `#f1f5f9` | Scrollbar track background |
+| `--selection-bg` | `rgba(37,99,235,0.4)` | `rgba(37,99,235,0.25)` | Text selection highlight |
+| `--selection-text` | `#ffffff` | `#0f172a` | Text selection color |
+
+**Removed: the entire `[data-theme="light"]`-specific override block** (6 rules for assistant messages, sidebar shadow, chat input, stat items, suggested items). These are now handled purely by CSS variables, eliminating the maintenance burden of having both a variable system and hardcoded overrides.
+
+**Added `color-scheme` property:**
+- `:root` sets `color-scheme: dark`
+- `[data-theme="light"]` sets `color-scheme: light`
+- This makes browser-rendered elements (scrollbars in Firefox/Edge, form control outlines, autofill backgrounds) match the active theme automatically
+
+**Added `::selection` styling:**
+```css
+::selection {
+    background: var(--selection-bg);
+    color: var(--selection-text);
+}
+```
+
+**Added Firefox scrollbar support:**
+- `.sidebar` and `.chat-messages` now include `scrollbar-color: var(--scrollbar-thumb) var(--scrollbar-track)`
+- WebKit scrollbar pseudo-elements updated to use `--scrollbar-thumb`, `--scrollbar-thumb-hover`, and `--scrollbar-track` variables
+- Responsive media query scrollbar rules also updated to use the same variables
+
+**Updated element selectors to use new variables:**
+- `.message.assistant .message-content` — uses `var(--assistant-message-bg)` and `var(--assistant-message-border)`
+- `.sidebar` — uses `var(--sidebar-shadow)` for box-shadow
+- `#chatInput` — uses `var(--input-bg)` for background
+- `.stat-item` — uses `var(--surface-alt)` for background
+
+### Design Hierarchy Preserved
+The visual hierarchy between surfaces is maintained in both themes:
+- **Background** (page) < **Surface** (sidebar, toggle) < **Surface-alt** (cards inside sidebar)
+- In dark: `#0f172a` < `#1e293b` < `#0f172a` (cards recede)
+- In light: `#f8fafc` < `#ffffff` < `#f1f5f9` (cards subtly distinguished)
+- Assistant messages are distinguished from the page background in both themes via background color + optional border
diff --git a/frontend/index.html b/frontend/index.html
index f8e25a62f..699d955fc 100644
--- a/frontend/index.html
+++ b/frontend/index.html
@@ -7,10 +7,42 @@
     <meta http-equiv="Pragma" content="no-cache">
     <meta http-equiv="Expires" content="0">
     <title>Course Materials Assistant</title>
-    <link rel="stylesheet" href="style.css?v=9">
+    <meta name="color-scheme" content="dark light">
+    <link rel="stylesheet" href="style.css?v=14">
+    <script>
+        // Apply theme before first paint to prevent flash of wrong theme
+        (function() {
+            var saved = null;
+            // Storage access can throw when the browser blocks it; fall back to the OS preference
+            try { saved = localStorage.getItem('theme'); } catch (e) {}
+            var theme = saved || (window.matchMedia('(prefers-color-scheme: light)').matches ? 'light' : 'dark');
+            if (theme === 'light') document.documentElement.setAttribute('data-theme', 'light');
+            // Update color-scheme meta to match resolved theme
+            var meta = document.querySelector('meta[name="color-scheme"]');
+            if (meta) meta.content = theme === 'light' ? 'light' : 'dark';
+            // Mark that we haven't finished loading yet (suppress transitions)
+            document.documentElement.classList.add('no-transitions');
+        })();
+    </script>
 </head>
 <body>
     <div class="container">
+        <button id="themeToggle" class="theme-toggle" aria-label="Toggle dark mode" title="Toggle theme">
+            <svg class="theme-icon sun-icon" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round">
+                <circle cx="12" cy="12" r="5"></circle>
+                <line x1="12" y1="1" x2="12" y2="3"></line>
+                <line x1="12" y1="21" x2="12" y2="23"></line>
+                <line x1="4.22" y1="4.22" x2="5.64" y2="5.64"></line>
+                <line x1="18.36" y1="18.36" x2="19.78" y2="19.78"></line>
+                <line x1="1" y1="12" x2="3" y2="12"></line>
+                <line x1="21" y1="12" x2="23" y2="12"></line>
+                <line x1="4.22" y1="19.78" x2="5.64" y2="18.36"></line>
+                <line x1="18.36" y1="5.64" x2="19.78" y2="4.22"></line>
+            </svg>
+            <svg class="theme-icon moon-icon" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round">
+                <path d="M21 12.79A9 9 0 1 1 11.21 3 7 7 0 0 0 21 12.79z"></path>
+            </svg>
+        </button>
         <header>
             <h1>Course Materials Assistant</h1>
             <p class="subtitle">Ask questions about courses, instructors, and content</p>
@@ -19,6 +51,14 @@ <h1>Course Materials Assistant</h1>
         <div class="main-content">
             <!-- Left Sidebar -->
             <aside class="sidebar">
+                <!-- New Chat Button -->
+                <div class="sidebar-section">
+                    <button id="newChatButton" class="new-chat-button">
+                        <span class="new-chat-icon">+</span>
+                        <span class="new-chat-text">NEW CHAT</span>
+                    </button>
+                </div>
+
                 <!-- Course Stats -->
                 <div class="sidebar-section">
                     <details class="stats-collapsible">
@@ -76,6 +116,6 @@ <h1>Course Materials Assistant</h1>
 
 
     <script src="https://cdn.jsdelivr.net/npm/marked/marked.min.js"></script>
-    <script src="script.js?v=9"></script>
+    <script src="script.js?v=12"></script>
 </body>
 </html>
\ No newline at end of file
diff --git a/frontend/script.js b/frontend/script.js
index 562a8a363..ce410f51c 100644
--- a/frontend/script.js
+++ b/frontend/script.js
@@ -15,7 +15,8 @@ document.addEventListener('DOMContentLoaded', () => {
     sendButton = document.getElementById('sendButton');
     totalCourses = document.getElementById('totalCourses');
     courseTitles = document.getElementById('courseTitles');
-    
+
+    initTheme();
     setupEventListeners();
     createNewSession();
     loadCourseStats();
@@ -38,6 +39,20 @@ function setupEventListeners() {
             sendMessage();
         });
     });
+
+    // Theme toggle
+    const themeToggle = document.getElementById('themeToggle');
+    if (themeToggle) {
+        themeToggle.addEventListener('click', toggleTheme);
+    }
+
+    // New chat button
+    const newChatButton = document.getElementById('newChatButton');
+    if (newChatButton) {
+        newChatButton.addEventListener('click', () => {
+            createNewSession();
+        });
+    }
 }
 
 
@@ -122,10 +137,28 @@ function addMessage(content, type, sources = null, isWelcome = false) {
     let html = `<div class="message-content">${displayContent}</div>`;
     
     if (sources && sources.length > 0) {
+        // Format sources - handle both string and object formats
+        const formattedSources = sources.map(source => {
+            // Handle legacy string format (backward compatibility)
+            if (typeof source === 'string') {
+                return escapeHtml(source);
+            }
+            // Handle new object format; `source &&` guards null, since typeof null === 'object'
+            if (source && typeof source === 'object' && source.text) {
+                const text = escapeHtml(source.text);
+                // Link only http(s) URLs (never javascript:/data:); anything else renders as plain text
+                if (typeof source.link === 'string' && /^https?:\/\//i.test(source.link)) {
+                    return `<a href="${escapeHtml(source.link).replace(/"/g, '&quot;')}" target="_blank" rel="noopener noreferrer" class="source-link">${text}</a>`;
+                }
+                return text;
+            }
+            return '';
+        }).filter(s => s); // Remove empty strings
+
         html += `
             <details class="sources-collapsible">
                 <summary class="sources-header">Sources</summary>
-                <div class="sources-content">${sources.join(', ')}</div>
+                <div class="sources-content">${formattedSources.join(', ')}</div>
             </details>
         `;
     }
@@ -147,9 +180,111 @@ function escapeHtml(text) {
 // Removed removeMessage function - no longer needed since we handle loading differently
 
 async function createNewSession() {
+    // Capture the current session ID before it is reset, so the backend copy can be cleared below
+    const oldSessionId = currentSessionId;
+
+    // Reset session state
     currentSessionId = null;
+
+    // Clear UI
     chatMessages.innerHTML = '';
+
+    // Add welcome message
     addMessage('Welcome to the Course Materials Assistant! I can help you with questions about courses, lessons and specific content. What would you like to know?', 'assistant', null, true);
+
+    // Focus input for immediate use
+    if (chatInput) {
+        chatInput.focus();
+    }
+
+    // Clear the old backend session, if any. Not awaited: clearBackendSession logs its own errors
+    if (oldSessionId) {
+        clearBackendSession(oldSessionId);
+    }
+}
+
+async function clearBackendSession(sessionId) {
+    // Best-effort: asks the backend to drop the given session; failures are logged, never thrown
+    if (!sessionId) return;
+
+    try {
+        const response = await fetch(`${API_URL}/session/clear`, {
+            method: 'POST',
+            headers: { 'Content-Type': 'application/json' },
+            body: JSON.stringify({ session_id: sessionId })
+        });
+        // fetch() only rejects on network errors, so report HTTP error statuses explicitly
+        if (!response.ok) console.warn('Failed to clear backend session: HTTP', response.status);
+    } catch (error) {
+        console.warn('Failed to clear backend session:', error);
+    }
+}
+
+// Theme Toggle
+function initTheme() {
+    // Theme was already applied by the inline <script> in index.html to prevent FOUC.
+    // Here we just enable transitions now that the page has loaded,
+    // update the toggle button's aria-label, and listen for OS changes.
+
+    // Remove transition suppression after a frame so the browser has painted
+    requestAnimationFrame(() => {
+        requestAnimationFrame(() => {
+            document.documentElement.classList.remove('no-transitions');
+        });
+    });
+
+    updateToggleLabel();
+
+    // Listen for OS-level theme changes (only applies when no saved preference)
+    window.matchMedia('(prefers-color-scheme: light)').addEventListener('change', (e) => {
+        if (!localStorage.getItem('theme')) {
+            applyTheme(e.matches ? 'light' : 'dark', false);
+        }
+    });
+
+    // Keyboard shortcut: Ctrl+Shift+L. Compared case-insensitively: with Caps Lock on, Shift+L reports 'l'
+    document.addEventListener('keydown', (e) => {
+        if (e.ctrlKey && e.shiftKey && typeof e.key === 'string' && e.key.toLowerCase() === 'l') {
+            e.preventDefault();
+            toggleTheme();
+        }
+    });
+}
+
+function getCurrentTheme() { // 'light' only when <html data-theme="light">; any other state is 'dark'
+    return document.documentElement.dataset.theme === 'light' ? 'light' : 'dark';
+}
+
+function applyTheme(theme, save) { // theme: 'light', anything else means dark; save: persist to localStorage
+    if (theme === 'light') {
+        document.documentElement.setAttribute('data-theme', 'light');
+    } else {
+        document.documentElement.removeAttribute('data-theme');
+    }
+    // Keep color-scheme meta in sync for browser chrome (scrollbars, form controls)
+    var meta = document.querySelector('meta[name="color-scheme"]');
+    if (meta) meta.content = theme === 'light' ? 'light' : 'dark';
+    // Refresh the label before persisting so a throwing setItem (storage blocked/full) cannot leave it stale
+    updateToggleLabel();
+    if (!save) return;
+    try { localStorage.setItem('theme', theme); } catch (err) { console.warn('Failed to save theme:', err); }
+}
+
+function toggleTheme() {
+    // Flip to the opposite theme; `true` asks applyTheme to save it as the user's choice
+    applyTheme(getCurrentTheme() === 'light' ? 'dark' : 'light', true);
+}
+
+function updateToggleLabel() {
+    // Label the toggle with the action it performs, i.e. the theme it will switch to
+    const button = document.getElementById('themeToggle');
+    if (!button) return;
+
+    const isDark = getCurrentTheme() === 'dark';
+    const label = isDark ? 'Switch to light mode' : 'Switch to dark mode';
+    const tooltip = isDark ? 'Switch to light mode (Ctrl+Shift+L)' : 'Switch to dark mode (Ctrl+Shift+L)';
+    button.setAttribute('aria-label', label);
+    button.setAttribute('title', tooltip);
 }
 
 // Load course statistics
diff --git a/frontend/style.css b/frontend/style.css
index 825d03675..27d75845a 100644
--- a/frontend/style.css
+++ b/frontend/style.css
@@ -5,23 +5,95 @@
     padding: 0;
 }
 
-/* CSS Variables */
+/* CSS Variables - Dark Theme (default) */
 :root {
+    color-scheme: dark;
     --primary-color: #2563eb;
     --primary-hover: #1d4ed8;
     --background: #0f172a;
     --surface: #1e293b;
     --surface-hover: #334155;
+    --surface-alt: #0f172a;
     --text-primary: #f1f5f9;
     --text-secondary: #94a3b8;
     --border-color: #334155;
     --user-message: #2563eb;
-    --assistant-message: #374151;
+    --user-message-text: #ffffff;
+    --assistant-message-bg: #1e293b;
+    --assistant-message-border: transparent;
     --shadow: 0 4px 6px -1px rgba(0, 0, 0, 0.3);
+    --sidebar-shadow: none;
     --radius: 12px;
     --focus-ring: rgba(37, 99, 235, 0.2);
     --welcome-bg: #1e3a5f;
     --welcome-border: #2563eb;
+    --welcome-shadow: 0 4px 16px rgba(0, 0, 0, 0.2);
+    --code-bg: rgba(0, 0, 0, 0.2);
+    --error-bg: rgba(239, 68, 68, 0.1);
+    --error-text: #f87171;
+    --error-border: rgba(239, 68, 68, 0.2);
+    --success-bg: rgba(34, 197, 94, 0.1);
+    --success-text: #4ade80;
+    --success-border: rgba(34, 197, 94, 0.2);
+    --source-link-bg: rgba(59, 130, 246, 0.08);
+    --source-link-border: rgba(59, 130, 246, 0.2);
+    --source-visited: #8b5cf6;
+    --source-visited-bg: rgba(139, 92, 246, 0.08);
+    --source-visited-border: rgba(139, 92, 246, 0.2);
+    --selection-bg: rgba(37, 99, 235, 0.4);
+    --selection-text: #ffffff;
+    --scrollbar-thumb: #334155;
+    --scrollbar-thumb-hover: #94a3b8;
+    --scrollbar-track: #1e293b;
+    --input-bg: #1e293b;
+}
+
+/* Light Theme */
+[data-theme="light"] {
+    color-scheme: light;
+    --primary-color: #1d4ed8;
+    --primary-hover: #1e40af;
+    --background: #f8fafc;
+    --surface: #ffffff;
+    --surface-hover: #f1f5f9;
+    --surface-alt: #f1f5f9;
+    --text-primary: #0f172a;
+    --text-secondary: #475569;
+    --border-color: #cbd5e1;
+    --user-message: #2563eb;
+    --user-message-text: #ffffff;
+    --assistant-message-bg: #f1f5f9;
+    --assistant-message-border: #cbd5e1;
+    --shadow: 0 4px 6px -1px rgba(0, 0, 0, 0.08);
+    --sidebar-shadow: 2px 0 8px rgba(0, 0, 0, 0.04);
+    --focus-ring: rgba(37, 99, 235, 0.2);
+    --welcome-bg: #eff6ff;
+    --welcome-border: #93bbfd;
+    --welcome-shadow: 0 4px 16px rgba(0, 0, 0, 0.06);
+    --code-bg: rgba(0, 0, 0, 0.05);
+    --error-bg: #fef2f2;
+    --error-text: #dc2626;
+    --error-border: #fecaca;
+    --success-bg: #f0fdf4;
+    --success-text: #16a34a;
+    --success-border: #bbf7d0;
+    --source-link-bg: rgba(37, 99, 235, 0.06);
+    --source-link-border: rgba(37, 99, 235, 0.2);
+    --source-visited: #7c3aed;
+    --source-visited-bg: rgba(124, 58, 237, 0.06);
+    --source-visited-border: rgba(124, 58, 237, 0.2);
+    --selection-bg: rgba(37, 99, 235, 0.25);
+    --selection-text: #0f172a;
+    --scrollbar-thumb: #cbd5e1;
+    --scrollbar-thumb-hover: #94a3b8;
+    --scrollbar-track: #f1f5f9;
+    --input-bg: #ffffff;
+}
+
+/* Text Selection */
+::selection {
+    background: var(--selection-bg);
+    color: var(--selection-text);
 }
 
 /* Base Styles */
@@ -80,9 +152,11 @@ header h1 {
     width: 320px;
     background: var(--surface);
     border-right: 1px solid var(--border-color);
+    box-shadow: var(--sidebar-shadow);
     padding: 1.5rem;
     overflow-y: auto;
     flex-shrink: 0;
+    scrollbar-color: var(--scrollbar-thumb) var(--scrollbar-track);
 }
 
 /* Custom Scrollbar for Sidebar */
@@ -91,16 +165,16 @@ header h1 {
 }
 
 .sidebar::-webkit-scrollbar-track {
-    background: var(--surface);
+    background: var(--scrollbar-track);
 }
 
 .sidebar::-webkit-scrollbar-thumb {
-    background: var(--border-color);
+    background: var(--scrollbar-thumb);
     border-radius: 4px;
 }
 
 .sidebar::-webkit-scrollbar-thumb:hover {
-    background: var(--text-secondary);
+    background: var(--scrollbar-thumb-hover);
 }
 
 .sidebar-section {
@@ -142,6 +216,7 @@ header h1 {
     flex-direction: column;
     gap: 1rem;
     background: var(--background);
+    scrollbar-color: var(--scrollbar-thumb) var(--scrollbar-track);
 }
 
 /* Custom Scrollbar */
@@ -150,16 +225,16 @@ header h1 {
 }
 
 .chat-messages::-webkit-scrollbar-track {
-    background: var(--surface);
+    background: var(--scrollbar-track);
 }
 
 .chat-messages::-webkit-scrollbar-thumb {
-    background: var(--border-color);
+    background: var(--scrollbar-thumb);
     border-radius: 4px;
 }
 
 .chat-messages::-webkit-scrollbar-thumb:hover {
-    background: var(--text-secondary);
+    background: var(--scrollbar-thumb-hover);
 }
 
 /* Message Styles */
@@ -196,13 +271,14 @@ header h1 {
 
 .message.user .message-content {
     background: var(--user-message);
-    color: white;
+    color: var(--user-message-text);
     border-bottom-right-radius: 4px;
 }
 
 .message.assistant .message-content {
-    background: var(--surface);
+    background: var(--assistant-message-bg);
     color: var(--text-primary);
+    border: 1px solid var(--assistant-message-border);
     border-bottom-left-radius: 4px;
 }
 
@@ -245,6 +321,50 @@ header h1 {
     color: var(--text-secondary);
 }
 
+/* Source link styling */
+.sources-content .source-link {
+    color: var(--primary-color);
+    text-decoration: none;
+    transition: all 0.2s ease;
+    padding: 0.25rem 0.5rem;
+    border-radius: 4px;
+    background: var(--source-link-bg);
+    border: 1px solid var(--source-link-border);
+    display: inline-block;
+    margin: 0.15rem 0.2rem;
+    font-weight: 500;
+}
+
+.sources-content .source-link:hover {
+    color: #ffffff;
+    background: var(--primary-color);
+    border-color: var(--primary-color);
+    transform: translateY(-1px);
+    box-shadow: 0 2px 8px rgba(59, 130, 246, 0.3);
+}
+
+.sources-content .source-link:focus {
+    outline: 2px solid var(--primary-color);
+    outline-offset: 2px;
+    border-radius: 4px;
+}
+
+.sources-content .source-link:visited {
+    color: var(--source-visited);
+    background: var(--source-visited-bg);
+    border-color: var(--source-visited-border);
+}
+
+.sources-content .source-link:visited:hover {
+    color: #ffffff;
+    background: var(--source-visited);
+    border-color: var(--source-visited);
+}
+
+.sources-content .source-link:active {
+    transform: translateY(0);
+}
+
 /* Markdown formatting styles */
 .message-content h1,
 .message-content h2,
@@ -277,7 +397,7 @@ header h1 {
 }
 
 .message-content code {
-    background-color: rgba(0, 0, 0, 0.2);
+    background-color: var(--code-bg);
     padding: 0.125rem 0.25rem;
     border-radius: 3px;
     font-family: 'Fira Code', 'Consolas', monospace;
@@ -285,7 +405,7 @@ header h1 {
 }
 
 .message-content pre {
-    background-color: rgba(0, 0, 0, 0.2);
+    background-color: var(--code-bg);
     padding: 0.75rem;
     border-radius: 4px;
     overflow-x: auto;
@@ -298,7 +418,7 @@ header h1 {
 }
 
 .message-content blockquote {
-    border-left: 3px solid var(--primary);
+    border-left: 3px solid var(--primary-color);
     padding-left: 1rem;
     margin: 0.5rem 0;
     color: var(--text-secondary);
@@ -306,9 +426,9 @@ header h1 {
 
 /* Welcome message special styling */
 .message.welcome-message .message-content {
-    background: var(--surface);
-    border: 2px solid var(--border-color);
-    box-shadow: 0 4px 16px rgba(0, 0, 0, 0.2);
+    background: var(--welcome-bg);
+    border: 2px solid var(--welcome-border);
+    box-shadow: var(--welcome-shadow);
     position: relative;
 }
 
@@ -340,7 +460,7 @@ header h1 {
 #chatInput {
     flex: 1;
     padding: 0.875rem 1.25rem;
-    background: var(--surface);
+    background: var(--input-bg);
     border: 1px solid var(--border-color);
     border-radius: 24px;
     color: var(--text-primary);
@@ -427,21 +547,21 @@ header h1 {
 
 /* Error Message */
 .error-message {
-    background: rgba(239, 68, 68, 0.1);
-    color: #f87171;
+    background: var(--error-bg);
+    color: var(--error-text);
     padding: 0.75rem 1.25rem;
     border-radius: 8px;
-    border: 1px solid rgba(239, 68, 68, 0.2);
+    border: 1px solid var(--error-border);
     margin: 0.5rem 0;
 }
 
 /* Success Message */
 .success-message {
-    background: rgba(34, 197, 94, 0.1);
-    color: #4ade80;
+    background: var(--success-bg);
+    color: var(--success-text);
     padding: 0.75rem 1.25rem;
     border-radius: 8px;
-    border: 1px solid rgba(34, 197, 94, 0.2);
+    border: 1px solid var(--success-border);
     margin: 0.5rem 0;
 }
 
@@ -504,7 +624,7 @@ details[open] .suggested-header::before {
 .stat-item {
     text-align: left;
     padding: 0.75rem;
-    background: var(--background);
+    background: var(--surface-alt);
     border-radius: 8px;
     border: 1px solid var(--border-color);
     margin-bottom: 0.75rem;
@@ -601,6 +721,48 @@ details[open] .suggested-header::before {
     text-transform: none;
 }
 
+/* New Chat Button */
+.new-chat-button {
+    width: 100%;
+    padding: 0.5rem 0;
+    background: none;
+    border: none;
+    color: var(--text-secondary);
+    font-size: 0.875rem;
+    font-weight: 600;
+    cursor: pointer;
+    transition: color 0.2s ease;
+    text-align: left;
+    display: flex;
+    align-items: center;
+    gap: 0.5rem;
+    text-transform: uppercase;
+    letter-spacing: 0.5px;
+}
+
+.new-chat-icon {
+    font-size: 1.25rem;
+    font-weight: 400;
+    color: var(--text-secondary);
+}
+
+.new-chat-text {
+    flex: 1;
+}
+
+.new-chat-button:hover {
+    color: var(--primary-color);
+}
+
+.new-chat-button:focus {
+    outline: none;
+    color: var(--primary-color);
+}
+
+.new-chat-button:active {
+    color: var(--primary-color);
+}
+
 /* Suggested Questions in Sidebar */
 .suggested-items {
     display: flex;
@@ -634,6 +796,102 @@ details[open] .suggested-header::before {
     transform: translateX(2px);
 }
 
+/* Theme Toggle Button */
+.theme-toggle {
+    position: fixed;
+    top: 1rem;
+    right: 1rem;
+    z-index: 100;
+    width: 44px;
+    height: 44px;
+    border-radius: 50%;
+    border: 1px solid var(--border-color);
+    background: var(--surface);
+    color: var(--text-secondary);
+    cursor: pointer;
+    display: flex;
+    align-items: center;
+    justify-content: center;
+    transition: background 0.3s ease, color 0.3s ease, border-color 0.3s ease, box-shadow 0.3s ease;
+    box-shadow: var(--shadow);
+}
+
+.theme-toggle:hover {
+    color: var(--primary-color);
+    border-color: var(--primary-color);
+    box-shadow: 0 4px 12px rgba(37, 99, 235, 0.2);
+}
+
+.theme-toggle:focus {
+    outline: none;
+    box-shadow: 0 0 0 3px var(--focus-ring);
+}
+
+.theme-toggle:active {
+    transform: scale(0.92);
+}
+
+/* Sun/Moon icon visibility */
+.theme-icon {
+    position: absolute;
+    transition: opacity 0.3s ease, transform 0.3s ease;
+}
+
+.sun-icon {
+    opacity: 0;
+    transform: rotate(-90deg) scale(0.5);
+}
+
+.moon-icon {
+    opacity: 1;
+    transform: rotate(0deg) scale(1);
+}
+
+[data-theme="light"] .sun-icon {
+    opacity: 1;
+    transform: rotate(0deg) scale(1);
+}
+
+[data-theme="light"] .moon-icon {
+    opacity: 0;
+    transform: rotate(90deg) scale(0.5);
+}
+
+/* Smooth theme transition on all themed elements */
+body,
+.container,
+.sidebar,
+.chat-main,
+.chat-container,
+.chat-messages,
+.chat-input-container,
+#chatInput,
+#sendButton,
+.stat-item,
+.suggested-item,
+.message-content,
+.new-chat-button,
+.theme-toggle,
+.sources-collapsible,
+.sources-content,
+.course-title-item,
+.stat-label,
+.stat-value,
+.new-chat-icon,
+.stats-header,
+.suggested-header,
+.loading span {
+    transition: background-color 0.3s ease, color 0.3s ease, border-color 0.3s ease, box-shadow 0.3s ease;
+}
+
+/* Suppress all transitions during initial page load to prevent flash */
+.no-transitions,
+.no-transitions *,
+.no-transitions *::before,
+.no-transitions *::after {
+    transition: none !important;
+}
+
 /* Responsive Design */
 @media (max-width: 768px) {
     .main-content {
@@ -652,18 +910,18 @@ details[open] .suggested-header::before {
     .sidebar::-webkit-scrollbar {
         width: 8px;
     }
-    
+
     .sidebar::-webkit-scrollbar-track {
-        background: var(--surface);
+        background: var(--scrollbar-track);
     }
-    
+
     .sidebar::-webkit-scrollbar-thumb {
-        background: var(--border-color);
+        background: var(--scrollbar-thumb);
         border-radius: 4px;
     }
-    
+
     .sidebar::-webkit-scrollbar-thumb:hover {
-        background: var(--text-secondary);
+        background: var(--scrollbar-thumb-hover);
     }
     
     .chat-main {
diff --git a/pyproject.toml b/pyproject.toml
index 3f05e2de0..5a5d555a7 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -12,4 +12,23 @@ dependencies = [
     "uvicorn==0.35.0",
     "python-multipart==0.0.20",
     "python-dotenv==1.1.1",
+    "pytest>=8.0",
+    "httpx>=0.27.0",
 ]
+
+[tool.pytest.ini_options]
+testpaths = ["backend/tests"]
+pythonpath = ["backend"]
+filterwarnings = [
+    "ignore::DeprecationWarning",
+    "ignore:resource_tracker:UserWarning",
+]
+
+[dependency-groups]
+dev = [
+    "black>=24.0",
+]
+
+[tool.black]
+line-length = 88
+target-version = ["py313"]
diff --git a/scripts/quality.sh b/scripts/quality.sh
new file mode 100644
index 000000000..50a32db7b
--- /dev/null
+++ b/scripts/quality.sh
@@ -0,0 +1,68 @@
+#!/bin/bash
+# Run code quality checks (black formatting, pytest) from the project root
+
+set -euo pipefail
+
+PROJECT_ROOT="$(cd "$(dirname "$0")/.." && pwd)"
+cd "$PROJECT_ROOT"
+
+# Colors for output
+GREEN='\033[0;32m'
+RED='\033[0;31m'
+YELLOW='\033[1;33m'
+NC='\033[0m' # No Color
+
+usage() {
+    echo "Usage: $0 [command]"
+    echo ""
+    echo "Commands:"
+    echo "  format    Run black to format all Python files"
+    echo "  check     Run black in check mode (no changes, exit 1 if unformatted)"
+    echo "  test      Run pytest"
+    echo "  all       Run all checks (check + test)"
+    echo ""
+    echo "If no command is given, 'all' is used."
+}
+
+run_format() {
+    echo -e "${YELLOW}Formatting code with black...${NC}"
+    uv run --group dev black backend/ main.py
+    echo -e "${GREEN}Formatting complete.${NC}"
+}
+
+run_check() {
+    echo -e "${YELLOW}Checking formatting with black...${NC}"
+    if uv run --group dev black --check backend/ main.py; then
+        echo -e "${GREEN}All files are properly formatted.${NC}"
+    else
+        echo -e "${RED}Some files need formatting. Run '$0 format' to fix.${NC}" >&2
+        return 1
+    fi
+}
+
+run_test() {
+    echo -e "${YELLOW}Running tests...${NC}"
+    uv run pytest backend/tests/ -v
+    echo -e "${GREEN}Tests passed.${NC}"
+}
+
+run_all() {
+    run_check
+    run_test
+    echo -e "${GREEN}All quality checks passed.${NC}"
+}
+
+COMMAND="${1:-all}"
+
+case "$COMMAND" in
+    format) run_format ;;
+    check)  run_check ;;
+    test)   run_test ;;
+    all)    run_all ;;
+    -h|--help) usage ;;
+    *)
+        echo -e "${RED}Unknown command: $COMMAND${NC}" >&2
+        usage >&2
+        exit 1
+        ;;
+esac
diff --git a/uv.lock b/uv.lock
index 9ae65c557..d9ebe985f 100644
--- a/uv.lock
+++ b/uv.lock
@@ -1,5 +1,5 @@
 version = 1
-revision = 2
+revision = 3
 requires-python = ">=3.13"
 
 [[package]]
@@ -110,6 +110,33 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/a9/cf/45fb5261ece3e6b9817d3d82b2f343a505fd58674a92577923bc500bd1aa/bcrypt-4.3.0-cp39-abi3-win_amd64.whl", hash = "sha256:e53e074b120f2877a35cc6c736b8eb161377caae8925c17688bd46ba56daaa5b", size = 152799, upload-time = "2025-02-28T01:23:53.139Z" },
 ]
 
+[[package]]
+name = "black"
+version = "26.1.0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "click" },
+    { name = "mypy-extensions" },
+    { name = "packaging" },
+    { name = "pathspec" },
+    { name = "platformdirs" },
+    { name = "pytokens" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/13/88/560b11e521c522440af991d46848a2bde64b5f7202ec14e1f46f9509d328/black-26.1.0.tar.gz", hash = "sha256:d294ac3340eef9c9eb5d29288e96dc719ff269a88e27b396340459dd85da4c58", size = 658785, upload-time = "2026-01-18T04:50:11.993Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/79/04/fa2f4784f7237279332aa735cdfd5ae2e7730db0072fb2041dadda9ae551/black-26.1.0-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:ba1d768fbfb6930fc93b0ecc32a43d8861ded16f47a40f14afa9bb04ab93d304", size = 1877781, upload-time = "2026-01-18T04:59:39.054Z" },
+    { url = "https://files.pythonhosted.org/packages/cf/ad/5a131b01acc0e5336740a039628c0ab69d60cf09a2c87a4ec49f5826acda/black-26.1.0-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:2b807c240b64609cb0e80d2200a35b23c7df82259f80bef1b2c96eb422b4aac9", size = 1699670, upload-time = "2026-01-18T04:59:41.005Z" },
+    { url = "https://files.pythonhosted.org/packages/da/7c/b05f22964316a52ab6b4265bcd52c0ad2c30d7ca6bd3d0637e438fc32d6e/black-26.1.0-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:1de0f7d01cc894066a1153b738145b194414cc6eeaad8ef4397ac9abacf40f6b", size = 1775212, upload-time = "2026-01-18T04:59:42.545Z" },
+    { url = "https://files.pythonhosted.org/packages/a6/a3/e8d1526bea0446e040193185353920a9506eab60a7d8beb062029129c7d2/black-26.1.0-cp313-cp313-win_amd64.whl", hash = "sha256:91a68ae46bf07868963671e4d05611b179c2313301bd756a89ad4e3b3db2325b", size = 1409953, upload-time = "2026-01-18T04:59:44.357Z" },
+    { url = "https://files.pythonhosted.org/packages/c7/5a/d62ebf4d8f5e3a1daa54adaab94c107b57be1b1a2f115a0249b41931e188/black-26.1.0-cp313-cp313-win_arm64.whl", hash = "sha256:be5e2fe860b9bd9edbf676d5b60a9282994c03fbbd40fe8f5e75d194f96064ca", size = 1217707, upload-time = "2026-01-18T04:59:45.719Z" },
+    { url = "https://files.pythonhosted.org/packages/6a/83/be35a175aacfce4b05584ac415fd317dd6c24e93a0af2dcedce0f686f5d8/black-26.1.0-cp314-cp314-macosx_10_15_x86_64.whl", hash = "sha256:9dc8c71656a79ca49b8d3e2ce8103210c9481c57798b48deeb3a8bb02db5f115", size = 1871864, upload-time = "2026-01-18T04:59:47.586Z" },
+    { url = "https://files.pythonhosted.org/packages/a5/f5/d33696c099450b1274d925a42b7a030cd3ea1f56d72e5ca8bbed5f52759c/black-26.1.0-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:b22b3810451abe359a964cc88121d57f7bce482b53a066de0f1584988ca36e79", size = 1701009, upload-time = "2026-01-18T04:59:49.443Z" },
+    { url = "https://files.pythonhosted.org/packages/1b/87/670dd888c537acb53a863bc15abbd85b22b429237d9de1b77c0ed6b79c42/black-26.1.0-cp314-cp314-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:53c62883b3f999f14e5d30b5a79bd437236658ad45b2f853906c7cbe79de00af", size = 1767806, upload-time = "2026-01-18T04:59:50.769Z" },
+    { url = "https://files.pythonhosted.org/packages/fe/9c/cd3deb79bfec5bcf30f9d2100ffeec63eecce826eb63e3961708b9431ff1/black-26.1.0-cp314-cp314-win_amd64.whl", hash = "sha256:f016baaadc423dc960cdddf9acae679e71ee02c4c341f78f3179d7e4819c095f", size = 1433217, upload-time = "2026-01-18T04:59:52.218Z" },
+    { url = "https://files.pythonhosted.org/packages/4e/29/f3be41a1cf502a283506f40f5d27203249d181f7a1a2abce1c6ce188035a/black-26.1.0-cp314-cp314-win_arm64.whl", hash = "sha256:66912475200b67ef5a0ab665011964bf924745103f51977a78b4fb92a9fc1bf0", size = 1245773, upload-time = "2026-01-18T04:59:54.457Z" },
+    { url = "https://files.pythonhosted.org/packages/e4/3d/51bdb3ecbfadfaf825ec0c75e1de6077422b4afa2091c6c9ba34fbfc0c2d/black-26.1.0-py3-none-any.whl", hash = "sha256:1054e8e47ebd686e078c0bb0eaf31e6ce69c966058d122f2c0c950311f9f3ede", size = 204010, upload-time = "2026-01-18T04:50:09.978Z" },
+]
+
 [[package]]
 name = "build"
 version = "1.2.2.post1"
@@ -470,6 +497,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/a4/ed/1f1afb2e9e7f38a545d628f864d562a5ae64fe6f7a10e28ffb9b185b4e89/importlib_resources-6.5.2-py3-none-any.whl", hash = "sha256:789cfdc3ed28c78b67a06acb8126751ced69a3d5f79c095a98298cd8a760ccec", size = 37461, upload-time = "2025-01-03T18:51:54.306Z" },
 ]
 
+[[package]]
+name = "iniconfig"
+version = "2.3.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/72/34/14ca021ce8e5dfedc35312d08ba8bf51fdd999c576889fc2c24cb97f4f10/iniconfig-2.3.0.tar.gz", hash = "sha256:c76315c77db068650d49c5b56314774a7804df16fee4402c1f19d6d15d8c4730", size = 20503, upload-time = "2025-10-18T21:55:43.219Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/cb/b1/3846dd7f199d53cb17f49cba7e651e9ce294d8497c8c150530ed11865bb8/iniconfig-2.3.0-py3-none-any.whl", hash = "sha256:f631c04d2c48c52b84d0d0549c99ff3859c98df65b3101406327ecc7d53fbf12", size = 7484, upload-time = "2025-10-18T21:55:41.639Z" },
+]
+
 [[package]]
 name = "jinja2"
 version = "3.1.6"
@@ -658,6 +694,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/43/e3/7d92a15f894aa0c9c4b49b8ee9ac9850d6e63b03c9c32c0367a13ae62209/mpmath-1.3.0-py3-none-any.whl", hash = "sha256:a0b2b9fe80bbcd81a6647ff13108738cfb482d481d826cc0e02f5b35e5c88d2c", size = 536198, upload-time = "2023-03-07T16:47:09.197Z" },
 ]
 
+[[package]]
+name = "mypy-extensions"
+version = "1.1.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/a2/6e/371856a3fb9d31ca8dac321cda606860fa4548858c0cc45d9d1d4ca2628b/mypy_extensions-1.1.0.tar.gz", hash = "sha256:52e68efc3284861e772bbcd66823fde5ae21fd2fdb51c62a211403730b916558", size = 6343, upload-time = "2025-04-22T14:54:24.164Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/79/7b/2c79738432f5c924bef5071f933bcc9efd0473bac3b4aa584a6f7c1c8df8/mypy_extensions-1.1.0-py3-none-any.whl", hash = "sha256:1be4cccdb0f2482337c4743e60421de3a356cd97508abadd57d47403e94f5505", size = 4963, upload-time = "2025-04-22T14:54:22.983Z" },
+]
+
 [[package]]
 name = "networkx"
 version = "3.5"
@@ -983,6 +1028,15 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/20/12/38679034af332785aac8774540895e234f4d07f7545804097de4b666afd8/packaging-25.0-py3-none-any.whl", hash = "sha256:29572ef2b1f17581046b3a2227d5c611fb25ec70ca1ba8554b24b0e69331a484", size = 66469, upload-time = "2025-04-19T11:48:57.875Z" },
 ]
 
+[[package]]
+name = "pathspec"
+version = "1.0.4"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/fa/36/e27608899f9b8d4dff0617b2d9ab17ca5608956ca44461ac14ac48b44015/pathspec-1.0.4.tar.gz", hash = "sha256:0210e2ae8a21a9137c0d470578cb0e595af87edaa6ebf12ff176f14a02e0e645", size = 131200, upload-time = "2026-01-27T03:59:46.938Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/ef/3c/2c197d226f9ea224a9ab8d197933f9da0ae0aac5b6e0f884e2b8d9c8e9f7/pathspec-1.0.4-py3-none-any.whl", hash = "sha256:fb6ae2fd4e7c921a165808a552060e722767cfa526f99ca5156ed2ce45a5c723", size = 55206, upload-time = "2026-01-27T03:59:45.137Z" },
+]
+
 [[package]]
 name = "pillow"
 version = "11.3.0"
@@ -1038,6 +1092,24 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/89/c7/5572fa4a3f45740eaab6ae86fcdf7195b55beac1371ac8c619d880cfe948/pillow-11.3.0-cp314-cp314t-win_arm64.whl", hash = "sha256:79ea0d14d3ebad43ec77ad5272e6ff9bba5b679ef73375ea760261207fa8e0aa", size = 2512835, upload-time = "2025-07-01T09:15:50.399Z" },
 ]
 
+[[package]]
+name = "platformdirs"
+version = "4.9.2"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/1b/04/fea538adf7dbbd6d186f551d595961e564a3b6715bdf276b477460858672/platformdirs-4.9.2.tar.gz", hash = "sha256:9a33809944b9db043ad67ca0db94b14bf452cc6aeaac46a88ea55b26e2e9d291", size = 28394, upload-time = "2026-02-16T03:56:10.574Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/48/31/05e764397056194206169869b50cf2fee4dbbbc71b344705b9c0d878d4d8/platformdirs-4.9.2-py3-none-any.whl", hash = "sha256:9170634f126f8efdae22fb58ae8a0eaa86f38365bc57897a6c4f781d1f5875bd", size = 21168, upload-time = "2026-02-16T03:56:08.891Z" },
+]
+
+[[package]]
+name = "pluggy"
+version = "1.6.0"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/f9/e2/3e91f31a7d2b083fe6ef3fa267035b518369d9511ffab804f839851d2779/pluggy-1.6.0.tar.gz", hash = "sha256:7dcc130b76258d33b90f61b658791dede3486c3e6bfb003ee5c9bfb396dd22f3", size = 69412, upload-time = "2025-05-15T12:30:07.975Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/54/20/4d324d65cc6d9205fabedc306948156824eb9f0ee1633355a8f7ec5c66bf/pluggy-1.6.0-py3-none-any.whl", hash = "sha256:e920276dd6813095e9377c0bc5566d94c932c33b27a3e3945d8389c374dd4746", size = 20538, upload-time = "2025-05-15T12:30:06.134Z" },
+]
+
 [[package]]
 name = "posthog"
 version = "5.4.0"
@@ -1207,6 +1279,22 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/5a/dc/491b7661614ab97483abf2056be1deee4dc2490ecbf7bff9ab5cdbac86e1/pyreadline3-3.5.4-py3-none-any.whl", hash = "sha256:eaf8e6cc3c49bcccf145fc6067ba8643d1df34d604a1ec0eccbf7a18e6d3fae6", size = 83178, upload-time = "2024-09-19T02:40:08.598Z" },
 ]
 
+[[package]]
+name = "pytest"
+version = "9.0.2"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "colorama", marker = "sys_platform == 'win32'" },
+    { name = "iniconfig" },
+    { name = "packaging" },
+    { name = "pluggy" },
+    { name = "pygments" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/d1/db/7ef3487e0fb0049ddb5ce41d3a49c235bf9ad299b6a25d5780a89f19230f/pytest-9.0.2.tar.gz", hash = "sha256:75186651a92bd89611d1d9fc20f0b4345fd827c41ccd5c299a868a05d70edf11", size = 1568901, upload-time = "2025-12-06T21:30:51.014Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/3b/ab/b3226f0bd7cdcf710fbede2b3548584366da3b19b5021e74f5bde2a8fa3f/pytest-9.0.2-py3-none-any.whl", hash = "sha256:711ffd45bf766d5264d487b917733b453d917afd2b0ad65223959f59089f875b", size = 374801, upload-time = "2025-12-06T21:30:49.154Z" },
+]
+
 [[package]]
 name = "python-dateutil"
 version = "2.9.0.post0"
@@ -1237,6 +1325,30 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/45/58/38b5afbc1a800eeea951b9285d3912613f2603bdf897a4ab0f4bd7f405fc/python_multipart-0.0.20-py3-none-any.whl", hash = "sha256:8a62d3a8335e06589fe01f2a3e178cdcc632f3fbe0d492ad9ee0ec35aab1f104", size = 24546, upload-time = "2024-12-16T19:45:44.423Z" },
 ]
 
+[[package]]
+name = "pytokens"
+version = "0.4.1"
+source = { registry = "https://pypi.org/simple" }
+sdist = { url = "https://files.pythonhosted.org/packages/b6/34/b4e015b99031667a7b960f888889c5bd34ef585c85e1cb56a594b92836ac/pytokens-0.4.1.tar.gz", hash = "sha256:292052fe80923aae2260c073f822ceba21f3872ced9a68bb7953b348e561179a", size = 23015, upload-time = "2026-01-30T01:03:45.924Z" }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/cb/dc/08b1a080372afda3cceb4f3c0a7ba2bde9d6a5241f1edb02a22a019ee147/pytokens-0.4.1-cp313-cp313-macosx_11_0_arm64.whl", hash = "sha256:8bdb9d0ce90cbf99c525e75a2fa415144fd570a1ba987380190e8b786bc6ef9b", size = 160720, upload-time = "2026-01-30T01:03:13.843Z" },
+    { url = "https://files.pythonhosted.org/packages/64/0c/41ea22205da480837a700e395507e6a24425151dfb7ead73343d6e2d7ffe/pytokens-0.4.1-cp313-cp313-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:5502408cab1cb18e128570f8d598981c68a50d0cbd7c61312a90507cd3a1276f", size = 254204, upload-time = "2026-01-30T01:03:14.886Z" },
+    { url = "https://files.pythonhosted.org/packages/e0/d2/afe5c7f8607018beb99971489dbb846508f1b8f351fcefc225fcf4b2adc0/pytokens-0.4.1-cp313-cp313-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:29d1d8fb1030af4d231789959f21821ab6325e463f0503a61d204343c9b355d1", size = 268423, upload-time = "2026-01-30T01:03:15.936Z" },
+    { url = "https://files.pythonhosted.org/packages/68/d4/00ffdbd370410c04e9591da9220a68dc1693ef7499173eb3e30d06e05ed1/pytokens-0.4.1-cp313-cp313-musllinux_1_2_x86_64.whl", hash = "sha256:970b08dd6b86058b6dc07efe9e98414f5102974716232d10f32ff39701e841c4", size = 266859, upload-time = "2026-01-30T01:03:17.458Z" },
+    { url = "https://files.pythonhosted.org/packages/a7/c9/c3161313b4ca0c601eeefabd3d3b576edaa9afdefd32da97210700e47652/pytokens-0.4.1-cp313-cp313-win_amd64.whl", hash = "sha256:9bd7d7f544d362576be74f9d5901a22f317efc20046efe2034dced238cbbfe78", size = 103520, upload-time = "2026-01-30T01:03:18.652Z" },
+    { url = "https://files.pythonhosted.org/packages/8f/a7/b470f672e6fc5fee0a01d9e75005a0e617e162381974213a945fcd274843/pytokens-0.4.1-cp314-cp314-macosx_11_0_arm64.whl", hash = "sha256:4a14d5f5fc78ce85e426aa159489e2d5961acf0e47575e08f35584009178e321", size = 160821, upload-time = "2026-01-30T01:03:19.684Z" },
+    { url = "https://files.pythonhosted.org/packages/80/98/e83a36fe8d170c911f864bfded690d2542bfcfacb9c649d11a9e6eb9dc41/pytokens-0.4.1-cp314-cp314-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:97f50fd18543be72da51dd505e2ed20d2228c74e0464e4262e4899797803d7fa", size = 254263, upload-time = "2026-01-30T01:03:20.834Z" },
+    { url = "https://files.pythonhosted.org/packages/0f/95/70d7041273890f9f97a24234c00b746e8da86df462620194cef1d411ddeb/pytokens-0.4.1-cp314-cp314-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:dc74c035f9bfca0255c1af77ddd2d6ae8419012805453e4b0e7513e17904545d", size = 268071, upload-time = "2026-01-30T01:03:21.888Z" },
+    { url = "https://files.pythonhosted.org/packages/da/79/76e6d09ae19c99404656d7db9c35dfd20f2086f3eb6ecb496b5b31163bad/pytokens-0.4.1-cp314-cp314-musllinux_1_2_x86_64.whl", hash = "sha256:f66a6bbe741bd431f6d741e617e0f39ec7257ca1f89089593479347cc4d13324", size = 271716, upload-time = "2026-01-30T01:03:23.633Z" },
+    { url = "https://files.pythonhosted.org/packages/79/37/482e55fa1602e0a7ff012661d8c946bafdc05e480ea5a32f4f7e336d4aa9/pytokens-0.4.1-cp314-cp314-win_amd64.whl", hash = "sha256:b35d7e5ad269804f6697727702da3c517bb8a5228afa450ab0fa787732055fc9", size = 104539, upload-time = "2026-01-30T01:03:24.788Z" },
+    { url = "https://files.pythonhosted.org/packages/30/e8/20e7db907c23f3d63b0be3b8a4fd1927f6da2395f5bcc7f72242bb963dfe/pytokens-0.4.1-cp314-cp314t-macosx_11_0_arm64.whl", hash = "sha256:8fcb9ba3709ff77e77f1c7022ff11d13553f3c30299a9fe246a166903e9091eb", size = 168474, upload-time = "2026-01-30T01:03:26.428Z" },
+    { url = "https://files.pythonhosted.org/packages/d6/81/88a95ee9fafdd8f5f3452107748fd04c24930d500b9aba9738f3ade642cc/pytokens-0.4.1-cp314-cp314t-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:79fc6b8699564e1f9b521582c35435f1bd32dd06822322ec44afdeba666d8cb3", size = 290473, upload-time = "2026-01-30T01:03:27.415Z" },
+    { url = "https://files.pythonhosted.org/packages/cf/35/3aa899645e29b6375b4aed9f8d21df219e7c958c4c186b465e42ee0a06bf/pytokens-0.4.1-cp314-cp314t-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:d31b97b3de0f61571a124a00ffe9a81fb9939146c122c11060725bd5aea79975", size = 303485, upload-time = "2026-01-30T01:03:28.558Z" },
+    { url = "https://files.pythonhosted.org/packages/52/a0/07907b6ff512674d9b201859f7d212298c44933633c946703a20c25e9d81/pytokens-0.4.1-cp314-cp314t-musllinux_1_2_x86_64.whl", hash = "sha256:967cf6e3fd4adf7de8fc73cd3043754ae79c36475c1c11d514fc72cf5490094a", size = 306698, upload-time = "2026-01-30T01:03:29.653Z" },
+    { url = "https://files.pythonhosted.org/packages/39/2a/cbbf9250020a4a8dd53ba83a46c097b69e5eb49dd14e708f496f548c6612/pytokens-0.4.1-cp314-cp314t-win_amd64.whl", hash = "sha256:584c80c24b078eec1e227079d56dc22ff755e0ba8654d8383b2c549107528918", size = 116287, upload-time = "2026-01-30T01:03:30.912Z" },
+    { url = "https://files.pythonhosted.org/packages/c6/78/397db326746f0a342855b81216ae1f0a32965deccfd7c830a2dbc66d2483/pytokens-0.4.1-py3-none-any.whl", hash = "sha256:26cef14744a8385f35d0e095dc8b3a7583f6c953c2e3d269c7f82484bf5ad2de", size = 13729, upload-time = "2026-01-30T01:03:45.029Z" },
+]
+
 [[package]]
 name = "pyyaml"
 version = "6.0.2"
@@ -1555,23 +1667,35 @@ dependencies = [
     { name = "anthropic" },
     { name = "chromadb" },
     { name = "fastapi" },
+    { name = "httpx" },
+    { name = "pytest" },
     { name = "python-dotenv" },
     { name = "python-multipart" },
     { name = "sentence-transformers" },
     { name = "uvicorn" },
 ]
 
+[package.dev-dependencies]
+dev = [
+    { name = "black" },
+]
+
 [package.metadata]
 requires-dist = [
     { name = "anthropic", specifier = "==0.58.2" },
     { name = "chromadb", specifier = "==1.0.15" },
     { name = "fastapi", specifier = "==0.116.1" },
+    { name = "httpx", specifier = ">=0.27.0" },
+    { name = "pytest", specifier = ">=8.0" },
     { name = "python-dotenv", specifier = "==1.1.1" },
     { name = "python-multipart", specifier = "==0.0.20" },
     { name = "sentence-transformers", specifier = "==5.0.0" },
     { name = "uvicorn", specifier = "==0.35.0" },
 ]
 
+[package.metadata.requires-dev]
+dev = [{ name = "black", specifier = ">=24.0" }]
+
 [[package]]
 name = "sympy"
 version = "1.14.0"