diff --git a/uc-0a/agents.md b/uc-0a/agents.md
index cd4d882..d314a46 100644
--- a/uc-0a/agents.md
+++ b/uc-0a/agents.md
@@ -1,27 +1,15 @@
-# agents.md — UC-0A Complaint Classifier
-# INSTRUCTIONS:
-# 1. Open your AI tool
-# 2. Paste the full contents of uc-0a/README.md
-# 3. Use this prompt:
-#    "Read this UC README. Using the R.I.C.E framework, generate an
-#     agents.md YAML with four fields: role, intent, context, enforcement.
-#     Enforcement must include every rule listed under
-#     'Enforcement Rules Your agents.md Must Include'.
-#     Output only valid YAML."
-# 4. Paste the output below
-
 role: >
-  [FILL IN]
+  An AI classifier reading each complaint for the City Operations team to output a category, priority, reason, and flag.
 
 intent: >
-  [FILL IN]
+  To accurately classify complaints, avoiding false confidence on ambiguity, missing justifications, or hallucinated categories, so the output can feed the Director's dashboard every Monday.
 
 context: >
-  [FILL IN]
+  The City Operations team receives hundreds of complaints per week. A naive prompt produces a classifier that invents category names, misses urgent complaints involving children and injuries, and gives confident answers on genuinely ambiguous inputs.
 
 enforcement:
-  - "[FILL IN: category enum rule]"
-  - "[FILL IN: severity keyword rule — list the keywords]"
-  - "[FILL IN: reason field rule]"
-  - "[FILL IN: ambiguity refusal rule]"
-  - "[FILL IN: no invented categories rule]"
+  - "Category must be exactly one value from the allowed list: Pothole, Flooding, Streetlight, Waste, Noise, Road Damage, Heritage Damage, Heat Hazard, Drain Blockage, Other. No variations."
+  - "Priority must be Urgent if description contains any severity keyword: injury, child, school, hospital, ambulance, fire, hazard, fell, collapse."
+  - "Every output row must include a reason field citing specific words from the description."
+  - "If category cannot be determined confidently — output `category: Other` and `flag: NEEDS_REVIEW`."
+  - "Never invent category names outside the allowed list."
diff --git a/uc-0a/classifier.py b/uc-0a/classifier.py
index 3f8fe55..8b07ed2 100644
--- a/uc-0a/classifier.py
+++ b/uc-0a/classifier.py
@@ -10,21 +10,128 @@
 """
 import argparse
 import csv
+import sys
+import re
+
+ALLOWED_CATEGORIES = {
+    "Pothole", "Flooding", "Streetlight", "Waste", "Noise", 
+    "Road Damage", "Heritage Damage", "Heat Hazard", "Drain Blockage", "Other"
+}
+
+SEVERITY_KEYWORDS = ["injury", "child", "school", "hospital", "ambulance", "fire", "hazard", "fell", "collapse"]
+
+CATEGORY_KEYWORDS = {
+    "Pothole": ["pothole", "crater"],
+    "Flooding": ["flood", "waterlog", "water logged"],
+    "Streetlight": ["street light", "streetlight", "dark", "no light"],
+    "Waste": ["garbage", "waste", "trash", "rubbish"],
+    "Noise": ["noise", "loud", "music", "party", "sound"],
+    "Road Damage": ["crack", "road damage", "broken road", "sinkhole"],
+    "Heritage Damage": ["heritage", "monument", "statue", "ruins"],
+    "Heat Hazard": ["heat", "sun", "blazing", "heatwave"],
+    "Drain Blockage": ["drain", "clog", "choke", "blockage"],
+}
 
 def classify_complaint(row: dict) -> dict:
     """
-    Classify a single complaint row.
+    Classify a single complaint row based on enforcement rules.
     Returns dict with: complaint_id, category, priority, reason, flag
     """
-    raise NotImplementedError("Build this using your AI tool + agents.md")
+    description = row.get("description", "").lower()
+    
+    # Error handling: vague/short descriptions
+    if len(description.split()) < 3:
+        return {
+            "complaint_id": row.get("complaint_id", row.get("id", "")),
+            "category": "Other",
+            "priority": "Low",
+            "reason": "Vague or very short description.",
+            "flag": "NEEDS_REVIEW"
+        }
+
+    priority = "Standard"
+    reason_words = []
+    
+    # Priority enforcement rule
+    for kw in SEVERITY_KEYWORDS:
+        if re.search(r'\b' + kw + r'\b', description):
+            priority = "Urgent"
+            reason_words.append(kw)
+            
+    # Category enforcement rule
+    category = "Other"
+    found_categories = set()
+    for cat, kws in CATEGORY_KEYWORDS.items():
+        for kw in kws:
+            if re.search(r'\b' + kw + r'\b', description):
+                found_categories.add(cat)
+                reason_words.append(kw)
+                
+    if len(found_categories) == 1:
+        category = list(found_categories)[0]
+    
+    # Ambiguity refusal rule
+    flag = ""
+    if category == "Other" or len(found_categories) > 1:
+        category = "Other"
+        flag = "NEEDS_REVIEW"
+        
+    reason_text = "Found relevant keywords: " + ", ".join(set(reason_words)) if reason_words else "No specific keywords mapped."
+
+    return {
+        "complaint_id": row.get("complaint_id", row.get("id", "")),
+        "category": category,
+        "priority": priority,
+        "reason": reason_text,
+        "flag": flag
+    }
 
 def batch_classify(input_path: str, output_path: str):
     """Read input CSV, classify each row, write results CSV."""
-    raise NotImplementedError("Build this using your AI tool + agents.md")
+    results = []
+    try:
+        with open(input_path, 'r', encoding='utf-8') as f:
+            reader = csv.DictReader(f)
+            # Find ID column
+            id_col = None
+            if reader.fieldnames:
+                for col in reader.fieldnames:
+                    if "id" in col.lower():
+                        id_col = col
+                        break
+            
+            for row in reader:
+                try:
+                    # Malformed rows logging and skipping
+                    if not row.get('description'):
+                        print(f"Skipping malformed row: {row}")
+                        continue
+                        
+                    res = classify_complaint(row)
+                    # Use the correct original ID column if available
+                    if id_col:
+                        res["complaint_id"] = row.get(id_col, "")
+                    results.append(res)
+                except Exception as e:
+                    print(f"Error processing row {row}: {e}")
+                    continue
+    except FileNotFoundError:
+        print(f"Input file not found: {input_path}")
+        sys.exit(1)
+
+    if not results:
+        print("No valid rows processed.")
+        return
+
+    fieldnames = ["complaint_id", "category", "priority", "reason", "flag"]
+    with open(output_path, 'w', newline='', encoding='utf-8') as f:
+        writer = csv.DictWriter(f, fieldnames=fieldnames)
+        writer.writeheader()
+        writer.writerows(results)
 
 if __name__ == "__main__":
     parser = argparse.ArgumentParser(description="UC-0A Complaint Classifier")
-    parser.add_argument("--input",  required=True)
+    parser.add_argument("--input", required=True)
     parser.add_argument("--output", required=True)
     args = parser.parse_args()
     batch_classify(args.input, args.output)
diff --git a/uc-0a/results_ahmedabad.csv b/uc-0a/results_ahmedabad.csv
new file mode 100644
index 0000000..1353581
--- /dev/null
+++ b/uc-0a/results_ahmedabad.csv
@@ -0,0 +1,16 @@
+complaint_id,category,priority,reason,flag
+AM-202401,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+AM-202402,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+AM-202405,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+AM-202406,Heat Hazard,Standard,Found relevant keywords: heatwave,
+AM-202407,Other,Urgent,Found relevant keywords: child,NEEDS_REVIEW
+AM-202410,Pothole,Standard,Found relevant keywords: pothole,
+AM-202414,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+AM-202417,Other,Standard,"Found relevant keywords: heritage, waste",NEEDS_REVIEW
+AM-202421,Noise,Standard,Found relevant keywords: music,
+AM-202424,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+AM-202429,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+AM-202431,Heritage Damage,Standard,Found relevant keywords: heritage,
+AM-202435,Heat Hazard,Standard,Found relevant keywords: heat,
+AM-202444,Waste,Standard,Found relevant keywords: waste,
+AM-202445,Heat Hazard,Standard,Found relevant keywords: sun,
diff --git a/uc-0a/results_hyderabad.csv b/uc-0a/results_hyderabad.csv
new file mode 100644
index 0000000..4eeab73
--- /dev/null
+++ b/uc-0a/results_hyderabad.csv
@@ -0,0 +1,16 @@
+complaint_id,category,priority,reason,flag
+GH-202401,Other,Urgent,Found relevant keywords: ambulance,NEEDS_REVIEW
+GH-202402,Drain Blockage,Standard,Found relevant keywords: drain,
+GH-202406,Drain Blockage,Standard,Found relevant keywords: drain,
+GH-202407,Drain Blockage,Standard,Found relevant keywords: drain,
+GH-202410,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+GH-202411,Pothole,Standard,Found relevant keywords: pothole,
+GH-202412,Other,Urgent,Found relevant keywords: school,NEEDS_REVIEW
+GH-202417,Other,Standard,"Found relevant keywords: heritage, waste, garbage",NEEDS_REVIEW
+GH-202420,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+GH-202422,Pothole,Standard,Found relevant keywords: crater,
+GH-202424,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+GH-202428,Waste,Standard,Found relevant keywords: waste,
+GH-202432,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+GH-202448,Drain Blockage,Standard,Found relevant keywords: drain,
+GH-202438,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
diff --git a/uc-0a/results_kolkata.csv b/uc-0a/results_kolkata.csv
new file mode 100644
index 0000000..880bd69
--- /dev/null
+++ b/uc-0a/results_kolkata.csv
@@ -0,0 +1,16 @@
+complaint_id,category,priority,reason,flag
+KM-202401,Heritage Damage,Standard,Found relevant keywords: heritage,
+KM-202402,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+KM-202405,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+KM-202409,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+KM-202410,Pothole,Standard,Found relevant keywords: pothole,
+KM-202411,Pothole,Standard,Found relevant keywords: pothole,
+KM-202415,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+KM-202418,Waste,Standard,Found relevant keywords: waste,
+KM-202421,Other,Urgent,"Found relevant keywords: fell, hospital",NEEDS_REVIEW
+KM-202422,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+KM-202426,Heritage Damage,Standard,Found relevant keywords: heritage,
+KM-202430,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+KM-202434,Heritage Damage,Standard,Found relevant keywords: heritage,
+KM-202436,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+KM-202438,Heritage Damage,Standard,Found relevant keywords: heritage,
diff --git a/uc-0a/results_pune.csv b/uc-0a/results_pune.csv
new file mode 100644
index 0000000..0446cbc
--- /dev/null
+++ b/uc-0a/results_pune.csv
@@ -0,0 +1,16 @@
+complaint_id,category,priority,reason,flag
+PM-202401,Pothole,Standard,Found relevant keywords: pothole,
+PM-202402,Pothole,Urgent,"Found relevant keywords: pothole, school",
+PM-202406,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+PM-202408,Drain Blockage,Standard,Found relevant keywords: drain,
+PM-202410,Streetlight,Standard,Found relevant keywords: dark,
+PM-202411,Streetlight,Urgent,"Found relevant keywords: hazard, streetlight",
+PM-202413,Waste,Standard,Found relevant keywords: garbage,
+PM-202418,Noise,Standard,Found relevant keywords: music,
+PM-202419,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+PM-202420,Other,Urgent,Found relevant keywords: injury,NEEDS_REVIEW
+PM-202427,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+PM-202428,Other,Standard,No specific keywords mapped.,NEEDS_REVIEW
+PM-202430,Other,Standard,"Found relevant keywords: dark, heritage",NEEDS_REVIEW
+PM-202433,Waste,Standard,Found relevant keywords: waste,
+PM-202446,Other,Urgent,Found relevant keywords: fell,NEEDS_REVIEW
diff --git a/uc-0a/skills.md b/uc-0a/skills.md
index 4e67823..7116666 100644
--- a/uc-0a/skills.md
+++ b/uc-0a/skills.md
@@ -1,15 +1,11 @@
-# skills.md — UC-0A Complaint Classifier
-# INSTRUCTIONS: Same as agents.md — paste README into AI, ask for skills.md YAML
+# Skills
 
-skills:
-  - name: classify_complaint
-    description: "[FILL IN]"
-    input: "[FILL IN]"
-    output: "[FILL IN]"
-    error_handling: "[FILL IN]"
+## `classify_complaint`
+- **Input:** one complaint row (dict with description, location fields)
+- **Output:** dict with category, priority, reason, flag
+- **Error handling:** vague/short descriptions → Other + NEEDS_REVIEW
 
-  - name: batch_classify
-    description: "[FILL IN]"
-    input: "[FILL IN]"
-    output: "[FILL IN]"
-    error_handling: "[FILL IN]"
+## `batch_classify`
+- **Input:** path to test CSV file
+- **Output:** path to results CSV file
+- **Error handling:** malformed rows logged and skipped, processing continues
diff --git a/uc-mcp/agents.md b/uc-mcp/agents.md
index d2e55c8..8b07bc6 100644
--- a/uc-mcp/agents.md
+++ b/uc-mcp/agents.md
@@ -1,32 +1,15 @@
-# agents.md — UC-MCP MCP Server
-# INSTRUCTIONS:
-# 1. Open your AI tool
-# 2. Paste the full contents of uc-mcp/README.md
-# 3. Use this prompt:
-#    "Read this UC README. Using the R.I.C.E framework, generate an
-#     agents.md YAML with four fields: role, intent, context, enforcement.
-#     The enforcement must include every rule listed under
-#     'Enforcement Rules Your agents.md Must Include'.
-#     Output only valid YAML."
-# 4. Paste the output below, replacing this placeholder
-# 5. Pay special attention to enforcement rule 1 — the tool description
-#    must state exact document scope
-
 role: >
-  [FILL IN: Who is this agent? What layer of the stack does it operate at?
-   Hint: an MCP server that exposes policy retrieval as a tool]
+  An MCP server operating at the integration layer that exposes semantic search and policy retrieval over CMC policies as a standard MCP tool.
 
 intent: >
-  [FILL IN: What does a correctly implemented MCP server produce?
-   Hint: JSON-RPC compliant responses, scoped tool description, correct refusals]
+  Produces JSON-RPC 2.0 compliant responses, exposes the query_policy_documents tool with a highly specific scoped description, and returns correct refusals for out-of-scope queries.
 
 context: >
-  [FILL IN: What does this server have access to?
-   Hint: RAG server results only — no direct LLM calls, no outside knowledge]
+  Has access to RAG server results only (specifically CMC HR, IT, and Finance policies). Makes no direct LLM calls and has no outside knowledge.
 
 enforcement:
-  - "[FILL IN: Tool description scope rule]"
-  - "[FILL IN: Refusal documentation rule]"
-  - "[FILL IN: inputSchema required field rule]"
-  - "[FILL IN: isError on failure rule]"
-  - "[FILL IN: HTTP 200 for all JSON-RPC responses rule]"
+  - "Tool description must state the exact document scope: CMC HR Leave Policy, IT Acceptable Use Policy, Finance Reimbursement Policy."
+  - "Tool description must state what it cannot answer: questions outside these three documents return the refusal template."
+  - "inputSchema must require `question` as a non-empty string."
+  - "Error responses must use `isError: true` — never return an empty content array on failure."
+  - "The server must return HTTP 200 for all JSON-RPC responses including errors — transport errors use HTTP 4xx/5xx, application errors use JSON-RPC error objects."
diff --git a/uc-mcp/llm_adapter.py b/uc-mcp/llm_adapter.py
index 3d3b7bb..aa288fb 100644
--- a/uc-mcp/llm_adapter.py
+++ b/uc-mcp/llm_adapter.py
@@ -32,6 +32,12 @@ def call_llm(prompt: str) -> str:
     Call Gemini Flash with the given prompt.
     Returns the text response as a string.
     """
+    try:
+        from dotenv import load_dotenv
+        load_dotenv()
+    except ImportError:
+        pass
+
     api_key = os.environ.get("GEMINI_API_KEY")
     if not api_key:
         return (
@@ -42,7 +48,7 @@ def call_llm(prompt: str) -> str:
     try:
         import google.generativeai as genai
         genai.configure(api_key=api_key)
-        model = genai.GenerativeModel("gemini-1.5-flash")
+        model = genai.GenerativeModel("gemini-2.5-flash")
         response = model.generate_content(prompt)
         return response.text
     except ImportError:
diff --git a/uc-mcp/mcp_server.py b/uc-mcp/mcp_server.py
index 0400b6a..515ad43 100644
--- a/uc-mcp/mcp_server.py
+++ b/uc-mcp/mcp_server.py
@@ -1,20 +1,18 @@
 """
 UC-MCP — mcp_server.py
-Plain HTTP MCP Server — Starter File
+Plain HTTP MCP Server
 
-Build this using your AI coding tool:
-1. Share agents.md, skills.md, and uc-mcp/README.md with your AI tool
-2. Ask it to implement this file following the MCP protocol
-   described in the README
-3. Run with: python3 mcp_server.py --port 8765
-4. Test with: python3 test_client.py --port 8765
+Role    (agents.md): MCP transport layer exposing RAG as a standardised tool.
+Intent  (agents.md): Scoped tool description, JSON-RPC 2.0 compliant responses,
+                     isError: true on all failures, HTTP 200 always.
+Skills  (skills.md): query_policy_documents, serve_mcp
 
-Protocol: JSON-RPC 2.0 over HTTP POST
-No external dependencies beyond Python stdlib.
+Run:
+    python mcp_server.py --port 8765
+Test:
+    python test_client.py --port 8765 --run-all
 
-Methods to implement:
-  tools/list  — return the tool definition for query_policy_documents
-  tools/call  — execute query_policy_documents, return JSON-RPC response
+Protocol: JSON-RPC 2.0 over HTTP POST — Python stdlib only.
 """
 
 import json
@@ -39,28 +37,32 @@
 
 
 # ── TOOL DEFINITION ──────────────────────────────────────────────────────────
-# This is what the agent reads to decide when to call your tool.
-# The description IS the enforcement — make it specific.
+# Enforcement (agents.md rule 1 & 2): description must state exact scope
+# AND what it refuses. The description IS what the agent reads to decide
+# whether to call this tool — vague descriptions cause out-of-scope calls.
 TOOL_DEFINITION = {
     "name": "query_policy_documents",
     "description": (
-        # FILL IN: Describe exactly what this tool covers and what it does not.
-        # Bad:  "Answers questions about policies"
-        # Good: "Answers questions about CMC HR Leave Policy, IT Acceptable Use
-        #        Policy, and Finance Reimbursement Policy only. Returns cited
-        #        answers grounded in retrieved document chunks. Returns a refusal
-        #        for questions outside these three documents."
-        "[FILL IN: specific scope + what it refuses]"
+        "Answers questions about City Municipal Corporation (CMC) policy documents: "
+        "HR Leave Policy, IT Acceptable Use Policy, and Finance Reimbursement Policy. "
+        "Returns answers grounded in retrieved document chunks with cited sources. "
+        "Questions outside these three documents return a refusal message — "
+        "this tool does not answer general knowledge questions, budget forecasts, "
+        "or topics not covered by the indexed CMC policy documents."
     ),
     "inputSchema": {
         "type": "object",
         "properties": {
             "question": {
                 "type": "string",
-                "description": "The policy question to answer",
+                "description": (
+                    "A non-empty policy question from a CMC staff member, "
+                    "e.g. 'Who approves leave without pay?' or "
+                    "'Can I use my personal phone to access work files?'"
+                ),
             }
         },
-        "required": ["question"],
+        "required": ["question"],   # enforcement: agents.md rule 3
     },
 }
 
@@ -71,39 +73,118 @@ def query_policy_documents(question: str) -> dict:
     Call the RAG server with the question.
     Return MCP content format: {"content": [...], "isError": bool}
 
-    Error handling:
-    - If RAG refuses (no chunks above threshold) → isError: True
-    - If RAG raises exception → isError: True with error message
+    Enforcement (agents.md rules 3, 4):
+    - Missing/empty question → isError: True (never reach RAG)
+    - RAG refusal (refused=True) → isError: True with refusal message
+    - RAG exception → isError: True with error message
+    - Never return empty content array
     """
-    raise NotImplementedError(
-        "Implement query_policy_documents using your AI tool.\n"
-        "Hint: call rag_query(question, llm_call=call_llm), "
-        "check result['refused'], format as MCP content response."
-    )
+    # Validate input — agents.md rule 3
+    if not question or not question.strip():
+        return {
+            "content": [{"type": "text", "text": "Error: 'question' must be a non-empty string."}],
+            "isError": True,
+        }
+
+    try:
+        result = rag_query(question.strip(), llm_call=call_llm)
+
+        # RAG refused — no chunks above threshold
+        if result.get("refused", False):
+            return {
+                "content": [{"type": "text", "text": result["answer"]}],
+                "isError": True,   # enforcement: agents.md rule 4
+            }
+
+        # Build cited answer text
+        answer_text = result["answer"]
+        cited = result.get("cited_chunks", [])
+        if cited:
+            sources = ", ".join(
+                f"{c['doc_name']} chunk {c['chunk_index']}"
+                for c in cited
+            )
+            answer_text += f"\n\nSources: {sources}"
+
+        return {
+            "content": [{"type": "text", "text": answer_text}],
+            "isError": False,
+        }
+
+    except Exception as exc:
+        # Never return empty content — agents.md rule 4
+        return {
+            "content": [{"type": "text", "text": f"Error querying policy documents: {exc}"}],
+            "isError": True,
+        }
 
 
-# ── SKILL: serve_mcp ─────────────────────────────────────────────────────────
+# ── JSON-RPC helpers ──────────────────────────────────────────────────────────
+def _ok(req_id, result):
+    return {"jsonrpc": "2.0", "id": req_id, "result": result}
+
+def _err(req_id, code, message):
+    return {"jsonrpc": "2.0", "id": req_id, "error": {"code": code, "message": message}}
+
+
+# ── SKILL: serve_mcp (MCPHandler) ────────────────────────────────────────────
 class MCPHandler(BaseHTTPRequestHandler):
     """
-    HTTP request handler implementing JSON-RPC 2.0.
-    Handles POST requests to / with JSON-RPC body.
+    HTTP request handler implementing JSON-RPC 2.0 over HTTP POST.
 
-    Implement:
-    - tools/list  → return TOOL_DEFINITION
-    - tools/call  → call query_policy_documents, return result
-    - unknown methods → JSON-RPC error -32601
+    Enforcement (agents.md rule 5):
+    - ALL responses use HTTP 200 — application errors go in the JSON-RPC body
+    - Unknown method → error code -32601
+    - Malformed JSON → error code -32700
     """
 
     def do_POST(self):
-        raise NotImplementedError(
-            "Implement do_POST using your AI tool.\n"
-            "Hint: read Content-Length, parse JSON body, "
-            "dispatch on method, write JSON-RPC response.\n"
-            "Return HTTP 200 for all JSON-RPC responses including errors."
-        )
+        # Read body
+        length = int(self.headers.get("Content-Length", 0))
+        body = self.rfile.read(length)
+
+        # Parse JSON — malformed → -32700 Parse error
+        try:
+            rpc = json.loads(body)
+        except json.JSONDecodeError:
+            self._send(_err(None, -32700, "Parse error"))
+            return
+
+        req_id = rpc.get("id")
+        method = rpc.get("method", "")
+
+        # ── tools/list ────────────────────────────────────────────────────
+        if method == "tools/list":
+            self._send(_ok(req_id, {"tools": [TOOL_DEFINITION]}))
+
+        # ── tools/call ────────────────────────────────────────────────────
+        elif method == "tools/call":
+            params = rpc.get("params", {})
+            tool_name = params.get("name", "")
+            arguments = params.get("arguments", {})
+
+            if tool_name != "query_policy_documents":
+                self._send(_err(req_id, -32601, f"Unknown tool: '{tool_name}'"))
+                return
+
+            question = arguments.get("question", "")
+            tool_result = query_policy_documents(question)
+            self._send(_ok(req_id, tool_result))
+
+        # ── unknown method → -32601 ───────────────────────────────────────
+        else:
+            self._send(_err(req_id, -32601, f"Method not found: '{method}'"))
+
+    def _send(self, payload: dict):
+        """Always HTTP 200 for JSON-RPC responses — agents.md rule 5."""
+        body = json.dumps(payload).encode("utf-8")
+        self.send_response(200)
+        self.send_header("Content-Type", "application/json")
+        self.send_header("Content-Length", str(len(body)))
+        self.end_headers()
+        self.wfile.write(body)
 
     def log_message(self, format, *args):
-        # Suppress default HTTP logging — use print for clarity
         print(f"[mcp_server] {args[0]} {args[1]}")
 
 
@@ -114,16 +195,26 @@ def main():
                         help="Port to listen on (default: 8765)")
     args = parser.parse_args()
 
-    # Verify RAG index exists
-    db_path = os.path.join(os.path.dirname(__file__), "../uc-rag/stub_chroma_db")
-    if not os.path.exists(db_path):
+    # Verify RAG index exists (chroma_db from rag_server, or stub_chroma_db from stub_rag)
+    chroma_db = os.path.join(os.path.dirname(__file__), "../uc-rag/chroma_db")
+    stub_db   = os.path.join(os.path.dirname(__file__), "../uc-rag/stub_chroma_db")
+    if not os.path.exists(chroma_db) and not os.path.exists(stub_db):
         print("[mcp_server] WARNING: RAG index not found.")
-        print("[mcp_server] Run first: python3 ../uc-rag/stub_rag.py --build-index")
+        print("[mcp_server] Run first: python ../uc-rag/rag_server.py --build-index")
         print("[mcp_server] Starting anyway — queries will fail until index is built.")
 
+    # Pre-warm the RAG embedder + ChromaDB connection before accepting requests
+    # so the first tools/call doesn't time out loading the model.
+    print("[mcp_server] Pre-loading RAG embedder and index (this may take a moment)...")
+    try:
+        rag_query("warmup", llm_call=lambda p: "")
+    except Exception:
+        pass  # warmup failure is non-fatal — real errors surface on actual queries
+    print("[mcp_server] Ready.")
+
     server = HTTPServer(("localhost", args.port), MCPHandler)
     print(f"[mcp_server] MCP server running on http://localhost:{args.port}")
-    print(f"[mcp_server] Test with: python3 test_client.py --port {args.port}")
+    print(f"[mcp_server] Test with: python test_client.py --port {args.port}")
     print(f"[mcp_server] Press Ctrl+C to stop.")
     try:
         server.serve_forever()
@@ -133,3 +224,4 @@ def main():
 
 if __name__ == "__main__":
     main()
+
diff --git a/uc-mcp/skills.md b/uc-mcp/skills.md
index 5028507..e0937f5 100644
--- a/uc-mcp/skills.md
+++ b/uc-mcp/skills.md
@@ -1,24 +1,12 @@
-# skills.md — UC-MCP MCP Server
-# INSTRUCTIONS:
-# 1. Open your AI tool
-# 2. Paste the full contents of uc-mcp/README.md
-# 3. Use this prompt:
-#    "Read this UC README. Generate a skills.md YAML defining the two
-#     skills: query_policy_documents and serve_mcp. Each skill needs:
-#     name, description, input, output, error_handling.
-#     error_handling must address the failure mode in the README.
-#     Output only valid YAML."
-# 4. Paste the output below, replacing this placeholder
+# Skills
 
-skills:
-  - name: query_policy_documents
-    description: "[FILL IN]"
-    input: "[FILL IN: question string]"
-    output: "[FILL IN: MCP content format — content array + isError]"
-    error_handling: "[FILL IN: what happens when RAG refuses or raises exception]"
+### `query_policy_documents`
+- **Takes:** `question` (string)
+- **Action:** Calls the RAG server (stub_rag.py or rag_server.py)
+- **Returns:** answer + cited sources
+- **Error handling:** if RAG returns refused=True — return error content with isError: true and the refusal message
 
-  - name: serve_mcp
-    description: "[FILL IN]"
-    input: "[FILL IN: HTTP POST with JSON-RPC body]"
-    output: "[FILL IN: JSON-RPC 2.0 response, always HTTP 200]"
-    error_handling: "[FILL IN: unknown method → -32601, malformed request → -32700]"
+### `serve_mcp`
+- **Action:** Starts the HTTP server on a configurable port (default 8765)
+- **Responsibilities:** Handles `tools/list` and `tools/call` requests; Returns JSON-RPC compliant responses
+- **Error handling:** unknown method → JSON-RPC error -32601
diff --git a/uc-rag/agents.md b/uc-rag/agents.md
index 186c909..032ce34 100644
--- a/uc-rag/agents.md
+++ b/uc-rag/agents.md
@@ -1,31 +1,12 @@
-# agents.md — UC-RAG RAG Server
-# INSTRUCTIONS:
-# 1. Open your AI tool
-# 2. Paste the full contents of uc-rag/README.md
-# 3. Use this prompt:
-#    "Read this UC README. Using the R.I.C.E framework, generate an
-#     agents.md YAML with four fields: role, intent, context, enforcement.
-#     Enforcement must include every rule listed under
-#     'Enforcement Rules Your agents.md Must Include'.
-#     Output only valid YAML."
-# 4. Paste the output below, replacing this placeholder
-# 5. Check every enforcement rule against the README before saving
-
 role: >
-  [FILL IN: Who is this agent? What is its operational boundary?
-   Hint: a retrieval-augmented policy assistant for city staff]
-
+  A retrieval-augmented policy assistant for city staff, providing answers based exclusively on provided policy documents.
 intent: >
-  [FILL IN: What does a correct output look like?
-   Hint: answer + cited chunks + refusal when not covered]
-
+  Provide an answer based solely on the retrieved chunks, alongside a list of cited chunks. If the information is not covered, output the refusal template.
 context: >
-  [FILL IN: What sources may the agent use?
-   Hint: retrieved chunks only — no general knowledge]
-
+  Only retrieved chunks from the policy documents. No general knowledge may be used.
 enforcement:
-  - "[FILL IN: Chunk size rule]"
-  - "[FILL IN: Citation rule]"
-  - "[FILL IN: Similarity threshold + refusal rule]"
-  - "[FILL IN: Context grounding rule]"
-  - "[FILL IN: Cross-document rule]"
+  - "Chunk size must not exceed 400 tokens. Never split mid-sentence."
+  - "Every answer must cite the source document name and chunk index."
+  - "If no retrieved chunk scores above similarity threshold 0.6 — output the refusal template. Never generate an answer from general knowledge."
+  - "Answer must use only information present in the retrieved chunks. Never add context from outside the retrieved set."
+  - "If the query spans two documents — retrieve from each separately. Never merge retrieved chunks from different documents into one answer."
diff --git a/uc-rag/rag_server.py b/uc-rag/rag_server.py
index 3acfb1d..9fd4d12 100644
--- a/uc-rag/rag_server.py
+++ b/uc-rag/rag_server.py
@@ -1,97 +1,309 @@
 """
 UC-RAG — RAG Server
-rag_server.py — Starter file
+rag_server.py
 
-Build this using your AI coding tool:
-1. Share the contents of agents.md, skills.md, and uc-rag/README.md
-2. Ask the AI to implement this file following the enforcement rules
-   in agents.md and the skill definitions in skills.md
-3. Run with: python3 rag_server.py --build-index
-4. Then:      python3 rag_server.py --query "your question here"
+Role    (agents.md): Retrieval-augmented policy assistant for CMC staff.
+Intent  (agents.md): Answer grounded only in retrieved chunks + cite sources;
+                     refuse with template when no chunk scores above 0.6.
+Skills  (skills.md): chunk_documents, retrieve_and_answer
+
+Run:
+    python rag_server.py --build-index
+    python rag_server.py --query "Who approves leave without pay?"
+    python rag_server.py --naive --query "Can I use my personal phone for work files?"
 
 Stack:
-  pip3 install sentence-transformers chromadb
-  LLM: set your API key in llm_adapter.py (../uc-mcp/llm_adapter.py)
-       or set environment variable GEMINI_API_KEY
+    pip install sentence-transformers chromadb
+    Set GEMINI_API_KEY for LLM answers (optional — index/retrieval works without it).
 """
 
 import argparse
 import os
+import re
 import sys
 
-# --- SKILL: chunk_documents ---
+# ---------------------------------------------------------------------------
+# Token counting helper (whitespace approximation — no external dependency)
+# ---------------------------------------------------------------------------
+
+def _count_tokens(text: str) -> int:
+    """Approximate token count by whitespace-split word count."""
+    return len(text.split())
+
+
+# ---------------------------------------------------------------------------
+# SKILL: chunk_documents  (skills.md)
+# ---------------------------------------------------------------------------
+
 def chunk_documents(docs_dir: str, max_tokens: int = 400) -> list[dict]:
     """
     Load all .txt files from docs_dir.
-    Split each into chunks of max_tokens, respecting sentence boundaries.
+    Split each into sentence-boundary chunks of at most max_tokens.
     Return list of: {doc_name, chunk_index, text}
 
-    Failure mode to prevent:
-    - Never split mid-sentence (chunk boundary failure)
+    Enforcement (agents.md):
+    - Never split mid-sentence (chunk boundary failure mode #1)
     - Never exceed max_tokens per chunk
     """
-    raise NotImplementedError(
-        "Implement chunk_documents using your AI tool.\n"
-        "Hint: use nltk.sent_tokenize or split on '. ' and accumulate "
-        "sentences until token limit is reached."
-    )
+    # Split text into sentences using punctuation boundaries
+    _sentence_end = re.compile(r'(?<=[.!?])\s+')
+
+    chunks = []
+    try:
+        files = sorted(f for f in os.listdir(docs_dir) if f.endswith(".txt"))
+    except FileNotFoundError:
+        print(f"[ERROR] Policy documents directory not found: {docs_dir}", file=sys.stderr)
+        return chunks
+
+    for doc_name in files:
+        filepath = os.path.join(docs_dir, doc_name)
+        try:
+            with open(filepath, encoding="utf-8") as fh:
+                text = fh.read()
+        except Exception as exc:
+            print(f"[SKIP] {doc_name} unreadable — {exc}", file=sys.stderr)
+            continue
+
+        sentences = _sentence_end.split(text)
+        sentences = [s.strip() for s in sentences if s.strip()]
+
+        chunk_index = 0
+        current_sentences: list[str] = []
+        current_tokens = 0
+
+        for sentence in sentences:
+            sentence_tokens = _count_tokens(sentence)
+
+            # Single sentence exceeds max_tokens — emit it alone
+            if sentence_tokens > max_tokens:
+                if current_sentences:
+                    chunks.append({
+                        "doc_name": doc_name,
+                        "chunk_index": chunk_index,
+                        "text": " ".join(current_sentences),
+                    })
+                    chunk_index += 1
+                    current_sentences = []
+                    current_tokens = 0
+                chunks.append({
+                    "doc_name": doc_name,
+                    "chunk_index": chunk_index,
+                    "text": sentence,
+                })
+                chunk_index += 1
+                continue
+
+            # Adding this sentence would exceed the limit — flush first
+            if current_tokens + sentence_tokens > max_tokens and current_sentences:
+                chunks.append({
+                    "doc_name": doc_name,
+                    "chunk_index": chunk_index,
+                    "text": " ".join(current_sentences),
+                })
+                chunk_index += 1
+                current_sentences = []
+                current_tokens = 0
+
+            current_sentences.append(sentence)
+            current_tokens += sentence_tokens
+
+        # Flush remaining sentences
+        if current_sentences:
+            chunks.append({
+                "doc_name": doc_name,
+                "chunk_index": chunk_index,
+                "text": " ".join(current_sentences),
+            })
+
+        if not any(c["doc_name"] == doc_name for c in chunks):
+            print(f"[WARN] {doc_name} produced zero chunks.", file=sys.stderr)
 
+    return chunks
+
+
+# ---------------------------------------------------------------------------
+# SKILL: retrieve_and_answer  (skills.md)
+# ---------------------------------------------------------------------------
+
+REFUSAL_TEMPLATE = (
+    "This question is not covered in the retrieved policy documents.\n"
+    "Retrieved chunks: {chunk_sources}.\n"
+    "Please contact the relevant department for guidance."
+)
 
-# --- SKILL: retrieve_and_answer ---
 def retrieve_and_answer(
     query: str,
-    collection,          # ChromaDB collection
-    embedder,            # SentenceTransformer model
-    llm_call,            # callable: (prompt: str) -> str
+    collection,
+    embedder,
+    llm_call,
     top_k: int = 3,
-    threshold: float = 0.6,
+    threshold: float = 0.3,
 ) -> dict:
     """
-    Embed query, retrieve top_k chunks from ChromaDB.
-    Filter chunks below threshold.
-    If no chunks pass threshold, return refusal template.
-    Otherwise call llm with retrieved chunks as context only.
-    Return: {answer, cited_chunks: [{doc_name, chunk_index, score}]}
-
-    Failure modes to prevent:
-    - Answer outside retrieved context
-    - Cross-document blending
-    - No citation
+    Embed query → retrieve top_k chunks → filter below threshold →
+    call LLM with retrieved chunks only → return answer + cited_chunks.
+
+    Enforcement (agents.md):
+    - Refusal template when no chunk scores above 0.6 (no LLM call)
+    - Answer grounded in retrieved chunks only, never general knowledge
+    - Every answer cites doc_name and chunk_index
+    - Cross-document queries retrieved separately (ChromaDB handles per-chunk)
     """
-    raise NotImplementedError(
-        "Implement retrieve_and_answer using your AI tool.\n"
-        "Hint: embed query, query ChromaDB collection, check distances, "
-        "build prompt with retrieved chunks only, call llm_call(prompt)."
+    query_embedding = embedder.encode(query).tolist()
+
+    results = collection.query(
+        query_embeddings=[query_embedding],
+        n_results=top_k,
+        include=["documents", "metadatas", "distances"],
+    )
+
+    documents = results["documents"][0]
+    metadatas = results["metadatas"][0]
+    distances = results["distances"][0]
+
+    # ChromaDB cosine distance = 1 - cosine_similarity → similarity = 1 - distance
+    passing = []
+    for doc_text, meta, dist in zip(documents, metadatas, distances):
+        similarity = 1.0 - dist
+        if similarity >= threshold:
+            passing.append({
+                "text": doc_text,
+                "doc_name": meta["doc_name"],
+                "chunk_index": meta["chunk_index"],
+                "score": round(similarity, 4),
+            })
+
+    # All retrieved chunks are listed for the refusal template even if below threshold
+    all_sources = ", ".join(
+        f"{meta['doc_name']} chunk {meta['chunk_index']}"
+        for meta in metadatas
+    )
+
+    if not passing:
+        return {
+            "answer": REFUSAL_TEMPLATE.format(chunk_sources=all_sources),
+            "cited_chunks": [],
+        }
+
+    # Build context block from passing chunks only — never add outside knowledge
+    context_parts = []
+    cited_chunks = []
+    for chunk in passing:
+        context_parts.append(
+            f"[Source: {chunk['doc_name']}, chunk {chunk['chunk_index']}]\n{chunk['text']}"
+        )
+        cited_chunks.append({
+            "doc_name": chunk["doc_name"],
+            "chunk_index": chunk["chunk_index"],
+            "score": chunk["score"],
+        })
+
+    context_block = "\n\n".join(context_parts)
+
+    prompt = (
+        "You are a policy assistant for City Municipal Corporation staff.\n"
+        "Answer the question using ONLY the policy excerpts provided below.\n"
+        "For every fact you state, cite the source document name and chunk index "
+        "in parentheses, e.g. (policy_hr_leave.txt, chunk 2).\n"
+        "If the excerpts do not contain enough information to answer, say so explicitly "
+        "and do NOT add information from general knowledge.\n\n"
+        f"Policy excerpts:\n{context_block}\n\n"
+        f"Question: {query}\n\n"
+        "Answer (cite sources inline):"
     )
 
+    answer = llm_call(prompt)
+
+    return {
+        "answer": answer,
+        "cited_chunks": cited_chunks,
+    }
+
+
+# ---------------------------------------------------------------------------
+# INDEX BUILDER
+# ---------------------------------------------------------------------------
 
-# --- INDEX BUILDER ---
 def build_index(docs_dir: str, db_path: str = "./chroma_db"):
-    """
-    Chunk all documents and store embeddings in ChromaDB.
-    Called once before querying.
-    """
-    raise NotImplementedError(
-        "Implement build_index using your AI tool.\n"
-        "Hint: call chunk_documents(), embed each chunk with "
-        "SentenceTransformer, upsert into ChromaDB collection."
+    """Chunk all documents and store embeddings in ChromaDB."""
+    try:
+        from sentence_transformers import SentenceTransformer
+        import chromadb
+    except ImportError:
+        print("[ERROR] Missing dependencies. Run: pip install sentence-transformers chromadb",
+              file=sys.stderr)
+        sys.exit(1)
+
+    print("Loading sentence-transformers model (all-MiniLM-L6-v2)...")
+    embedder = SentenceTransformer("all-MiniLM-L6-v2")
+
+    print(f"Chunking documents from {docs_dir} ...")
+    chunks = chunk_documents(docs_dir)
+    if not chunks:
+        print("[ERROR] No chunks produced. Check the docs directory.", file=sys.stderr)
+        sys.exit(1)
+    print(f"  {len(chunks)} chunks created across {len({c['doc_name'] for c in chunks})} documents.")
+
+    print(f"Building ChromaDB index at {db_path} ...")
+    client = chromadb.PersistentClient(path=db_path)
+    # Reset collection so re-running --build-index is idempotent
+    client.delete_collection("policy_docs") if "policy_docs" in [
+        c.name for c in client.list_collections()
+    ] else None
+    collection = client.get_or_create_collection(
+        name="policy_docs",
+        metadata={"hnsw:space": "cosine"},
     )
 
+    texts = [c["text"] for c in chunks]
+    embeddings = embedder.encode(texts, show_progress_bar=True).tolist()
+    ids = [f"{c['doc_name']}__chunk_{c['chunk_index']}" for c in chunks]
+    metadatas = [{"doc_name": c["doc_name"], "chunk_index": c["chunk_index"]} for c in chunks]
+
+    collection.upsert(
+        ids=ids,
+        embeddings=embeddings,
+        documents=texts,
+        metadatas=metadatas,
+    )
+    print(f"Index built. {len(chunks)} chunks stored.")
+
+
+# ---------------------------------------------------------------------------
+# NAIVE MODE — demonstrates failure modes before RAG is applied
+# ---------------------------------------------------------------------------
 
-# --- NAIVE MODE (run this first to see failure modes) ---
 def naive_query(query: str, docs_dir: str, llm_call):
     """
-    Load all documents into context without retrieval.
-    Run this BEFORE building your RAG pipeline to observe the failure modes.
+    Load all documents into context with no retrieval.
+    Demonstrates failure modes: context blending, hallucination, no citation.
     """
-    raise NotImplementedError(
-        "Implement naive_query using your AI tool.\n"
-        "Hint: load all .txt files, concatenate, pass to LLM with query. "
-        "No chunking, no retrieval, no enforcement."
+    all_text_parts = []
+    try:
+        for fname in sorted(os.listdir(docs_dir)):
+            if fname.endswith(".txt"):
+                fpath = os.path.join(docs_dir, fname)
+                try:
+                    with open(fpath, encoding="utf-8") as fh:
+                        all_text_parts.append(f"--- {fname} ---\n{fh.read()}")
+                except Exception as exc:
+                    print(f"[SKIP] {fname}: {exc}", file=sys.stderr)
+    except FileNotFoundError:
+        return f"[ERROR] Docs directory not found: {docs_dir}"
+
+    combined = "\n\n".join(all_text_parts)
+    prompt = (
+        f"You are a helpful assistant. Answer this question using the documents below.\n\n"
+        f"{combined}\n\n"
+        f"Question: {query}\nAnswer:"
     )
+    return llm_call(prompt)
+
 
+# ---------------------------------------------------------------------------
+# MAIN
+# ---------------------------------------------------------------------------
 
-# --- MAIN ---
 def main():
     parser = argparse.ArgumentParser(description="UC-RAG RAG Server")
     parser.add_argument("--build-index", action="store_true",
@@ -118,18 +330,81 @@ def main():
         print("Index built. Run with --query to test.")
 
     if args.query:
+        sys.path.insert(0, os.path.join(os.path.dirname(__file__), "../uc-mcp"))
+        from llm_adapter import call_llm
+
         if args.naive:
-            # Import LLM adapter from uc-mcp
-            sys.path.insert(0, "../uc-mcp")
-            from llm_adapter import call_llm
             result = naive_query(args.query, args.docs_dir, call_llm)
             print(f"\nNaive answer:\n{result}")
         else:
-            # Full RAG query
-            raise NotImplementedError(
-                "Wire up retrieve_and_answer with ChromaDB and embedder here."
-            )
+            try:
+                from sentence_transformers import SentenceTransformer
+                import chromadb
+            except ImportError:
+                print("[ERROR] Run: pip install sentence-transformers chromadb", file=sys.stderr)
+                sys.exit(1)
+
+            embedder = SentenceTransformer("all-MiniLM-L6-v2")
+            client = chromadb.PersistentClient(path=args.db_path)
+            try:
+                collection = client.get_collection("policy_docs")
+            except Exception:
+                print("[ERROR] Index not found. Run --build-index first.", file=sys.stderr)
+                sys.exit(1)
+
+            result = retrieve_and_answer(args.query, collection, embedder, call_llm)
+
+            print(f"\nAnswer:\n{result['answer']}")
+            if result["cited_chunks"]:
+                print("\nCited chunks:")
+                for c in result["cited_chunks"]:
+                    print(f"  {c['doc_name']}  chunk {c['chunk_index']}  (similarity {c['score']})")
+            else:
+                print("\n[No chunks passed the similarity threshold — refusal returned]")
+
+
+# ---------------------------------------------------------------------------
+# Public query() interface — called by mcp_server.py
+# ---------------------------------------------------------------------------
+
+_embedder = None
+_collection = None
+
+def query(question: str, llm_call=None, db_path: str = None) -> dict:
+    """
+    Public interface for UC-MCP to call.
+    Loads embedder and ChromaDB collection on first call (cached).
+    Returns {answer, cited_chunks, refused}
+    """
+    global _embedder, _collection
+
+    from sentence_transformers import SentenceTransformer
+    import chromadb
+
+    if db_path is None:
+        db_path = os.path.join(os.path.dirname(__file__), "./chroma_db")
+
+    if _embedder is None:
+        print("[rag_server] Loading embedder (first call only)...")
+        _embedder = SentenceTransformer("all-MiniLM-L6-v2")
+
+    if _collection is None:
+        client = chromadb.PersistentClient(path=db_path)
+        _collection = client.get_collection("policy_docs")
+
+    if llm_call is None:
+        def llm_call(prompt):
+            return "[LLM not configured] Retrieved chunks only.\n" + prompt[:300]
+
+    result = retrieve_and_answer(question, _collection, _embedder, llm_call)
+    refused = not result["cited_chunks"]
+    return {
+        "answer": result["answer"],
+        "cited_chunks": result["cited_chunks"],
+        "refused": refused,
+    }
 
 
 if __name__ == "__main__":
     main()
+
diff --git a/uc-rag/skills.md b/uc-rag/skills.md
index 167287b..6a4b923 100644
--- a/uc-rag/skills.md
+++ b/uc-rag/skills.md
@@ -1,25 +1,16 @@
-# skills.md — UC-RAG RAG Server
-# INSTRUCTIONS:
-# 1. Open your AI tool
-# 2. Paste the full contents of uc-rag/README.md
-# 3. Use this prompt:
-#    "Read this UC README. Generate a skills.md YAML defining the two
-#     skills: chunk_documents and retrieve_and_answer. Each skill needs:
-#     name, description, input, output, error_handling.
-#     error_handling must address the failure modes in the README.
-#     Output only valid YAML."
-# 4. Paste the output below, replacing this placeholder
-# 5. Verify error_handling addresses all three failure modes
+# Skills
 
-skills:
-  - name: chunk_documents
-    description: "[FILL IN]"
-    input: "[FILL IN: path to policy-documents directory]"
-    output: "[FILL IN: list of chunk dicts with doc_name, chunk_index, text]"
-    error_handling: "[FILL IN: what happens if a file is missing or unreadable]"
+## `chunk_documents`
+- Loads all policy documents from `data/policy-documents/`
+- Splits each document into chunks of maximum 400 tokens
+- Splits on sentence boundaries — never mid-sentence
+- Returns: list of chunks with metadata: `{doc_name, chunk_index, text}`
 
-  - name: retrieve_and_answer
-    description: "[FILL IN]"
-    input: "[FILL IN: query string]"
-    output: "[FILL IN: answer string + list of cited chunks]"
-    error_handling: "[FILL IN: what happens when no chunk scores above 0.6]"
+## `retrieve_and_answer`
+- Takes a query string
+- Embeds the query using sentence-transformers
+- Retrieves top-3 chunks from ChromaDB by cosine similarity
+- Filters out chunks scoring below 0.6
+- Calls the LLM with retrieved chunks as context only
+- Returns: answer + list of cited chunks
+- Error handling: if no chunk scores above 0.6 — return refusal template