diff --git a/.env.example b/.env.example
index fc19d62..40cb0fc 100644
--- a/.env.example
+++ b/.env.example
@@ -23,6 +23,8 @@ REDIS_DECODE_RESPONSES=true

# Security
SECRET_KEY=change-me-in-production-use-strong-random-key
+# Fernet encryption key for OAuth tokens (must be 32+ characters)
+ENCRYPTION_KEY=change-me-must-be-32-chars-padded!
ALGORITHM=HS256
ACCESS_TOKEN_EXPIRE_MINUTES=30
REFRESH_TOKEN_EXPIRE_DAYS=7
@@ -40,6 +42,8 @@ YOUTUBE_REDIRECT_URI=http://localhost:8000/api/v1/youtube/auth/callback
# Rate Limiting
RATE_LIMIT_PER_MINUTE=60
RATE_LIMIT_BURST=10
+# Toggle rate limiting on/off
+RATE_LIMIT_ENABLED=true

# Quota Limits
DEFAULT_DAILY_ANSWER_LIMIT=100
@@ -51,6 +55,13 @@ QUEUE_CLASSIFICATION=classification
QUEUE_EMBEDDING=embedding
QUEUE_CLUSTERING=clustering
QUEUE_ANSWER_GENERATION=answer_generation
+QUEUE_YOUTUBE_POSTING=youtube_posting
+
+# Worker Thresholds
+# Minimum confidence to forward a classified question to embedding
+CLASSIFICATION_CONFIDENCE_THRESHOLD=0.4
+# Minimum cosine similarity to join an existing cluster
+CLUSTERING_SIMILARITY_THRESHOLD=0.65

# Logging
LOG_LEVEL=INFO
@@ -68,5 +79,27 @@ WEBSOCKET_TIMEOUT=300
WORKERS=classification,embeddings,clustering,answer_generation,trigger_monitor

GEMINI_API_KEY=your-gemini-api-key
+# Gemini model for classification, answers, and summarization
+GEMINI_MODEL=gemini-2.5-flash
+# Gemini model for generating text embeddings
+GEMINI_EMBEDDING_MODEL=gemini-embedding-001
+# Number of questions needed before triggering cluster answer generation
+CLUSTERING_THRESHOLD=5
+
+# Mock / Testing
+# Enable mock YouTube polling (no real API calls)
+MOCK_YOUTUBE=false
+# Seconds between mock YouTube messages
+MOCK_MESSAGE_INTERVAL=2.0
+
+# Frontend
+# Absolute path to frontend/dist directory for static file serving
+FRONTEND_DIR=
+
+# Prometheus
+PROMETHEUS_MULTIPROC_DIR=/tmp/prometheus_multiproc
-FRONTEND_DIR=
\ No newline at end of file
+# Grafana Cloud (Prometheus remote_write)
+GCLOUD_HOSTED_METRICS_URL=
+GCLOUD_HOSTED_METRICS_ID=
+GCLOUD_RW_API_KEY=
\ No newline at end of file
diff --git a/.gitignore b/.gitignore
index f134569..c45a475 100644
--- a/.gitignore
+++ b/.gitignore
@@ -100,3 +100,8 @@ logs/
*.seed
tmp/
*.bak
+
+CLAUDE.md
+.claude
+
+data-alloy
\ No newline at end of file
diff --git a/Makefile b/Makefile
index 0178af1..2c8636a 100644
--- a/Makefile
+++ b/Makefile
@@ -22,7 +22,7 @@ help:
	@echo " make clean - Clean generated files"

run-backend:
-	cd backend && uvicorn app.main:app --reload --host 0.0.0.0 --port 8000
+	cd backend && PYTHONPATH=$(CURDIR) uvicorn app.main:app --reload --host 0.0.0.0 --port 8000

run-workers:
	python -m workers.runner
@@ -33,8 +33,11 @@ format:

lint:
	ruff check backend workers scripts
-	flake8 backend workers scripts --max-line-length=119 --ignore=D107,D212,E501,W503,W605,D203,D100
-	pylint backend workers scripts --disable=line-too-long,trailing-whitespace,missing-function-docstring,consider-using-f-string,import-error,too-few-public-methods,redefined-outer-name
+	flake8 backend workers scripts --max-line-length=119 --ignore=D107,D212,E501,W503,W605,D203,D100 \
+		--per-file-ignores="backend/alembic/*:E402,F401 backend/app/main.py:E402,F824 backend/app/db/models/migrations/*:W391 workers/*/worker.py:E402,F824 workers/*/mock_worker.py:E402,F824 workers/runner.py:E402 scripts/*:E402,E226"
+	pylint backend workers scripts \
+		--ignore-paths="backend/alembic/versions/" \
+		--disable=line-too-long,trailing-whitespace,missing-function-docstring,missing-module-docstring,missing-class-docstring,consider-using-f-string,import-error,too-few-public-methods,redefined-outer-name,wrong-import-position,wrong-import-order,ungrouped-imports,invalid-name,logging-fstring-interpolation,global-statement,global-variable-not-assigned,unnecessary-pass,fixme,pointless-string-statement,broad-exception-caught,duplicate-code,too-many-locals,too-many-arguments,too-many-branches,too-many-statements,too-many-nested-blocks,too-many-instance-attributes,unused-argument,unused-import,unused-variable,no-member,import-outside-toplevel,raise-missing-from,not-callable,singleton-comparison,no-else-continue,implicit-str-concat,keyword-arg-before-vararg,missing-timeout,subprocess-run-check,protected-access

test:
	pytest backend/tests workers -v
diff --git a/README.md b/README.md
index 6233a45..13c1cfb 100644
--- a/README.md
+++ b/README.md
@@ -44,6 +44,17 @@ youtube_polling worker ──► Redis queue
Comments flow from YouTube → Redis workers → Gemini AI for classification and embedding → pgvector for semantic clustering → answer generation → real-time WebSocket delivery to the teacher dashboard (and optionally back to the stream).

+## Features
+
+- **Real-time question clustering** — student comments are embedded and clustered live using a nearest-centroid algorithm with milestone triggers
+- **RAG-augmented answers** — AI-generated answers grounded in teacher-uploaded documents (PDF, DOCX, TXT)
+- **YouTube integration** — polls live chat, posts answers directly back to YouTube
+- **Content moderation** — Gemini-powered filtering before classification and before YouTube posting
+- **WebSocket dashboard** — real-time updates with exponential-backoff reconnection and a 100-message cap
+- **Teacher isolation** — every data endpoint enforces ownership; RAG retrieval is scoped per teacher
+- **Observability** — Prometheus metrics, a circuit-breaker pattern on all Gemini calls, structured logging
+- **Scheduled maintenance** — automatic daily quota reset and hourly expired-token cleanup
+
## Quick Start

### Prerequisites
@@ -84,28 +95,47 @@ This starts PostgreSQL, Redis, the FastAPI backend, and all workers. The API is
cd backend && alembic upgrade head
```

-## Running Without Docker
+## Running Without Docker (Native Development)
+
+**Prerequisites:**
+- Python 3.13+
+- Node.js 20+
+- PostgreSQL 15+ with the [pgvector extension](https://github.com/pgvector/pgvector)
+- Redis 7+
+
+**Steps:**
+
+1. **Clone and set up environment variables:**
+```bash
+cp .env.example .env.development
+# Fill in your GEMINI_API_KEY, SECRET_KEY, ENCRYPTION_KEY, and YouTube OAuth credentials
+```

-**Backend:**
+2. **Install backend dependencies:**
```bash
-pip install -r backend/requirements.txt
-uvicorn backend.app.main:app --reload
+cd backend
+python -m venv venv && source venv/bin/activate
+pip install -r requirements.txt
```

-**Workers:**
+3. **Install frontend dependencies:**
```bash
-python -m workers.classification.worker
-python -m workers.embeddings.worker
-python -m workers.clustering.worker
-python -m workers.answer_generation.worker
-python -m workers.trigger_monitor.worker
+cd frontend && npm install
```

-**Chrome extension:**
+4. **Run database migrations:**
```bash
-cd chrome-extension && npm install && npm run build
+make migrate
```
-Load `chrome-extension/dist` as an unpacked extension in Chrome.
+
+5. **Start all services in one command:**
+```bash
+./start_dev.sh
+```
+This opens a tmux session with 9 panes: the backend API, 6 AI workers, the scheduler, and the Vite dev server.
+
+6. **Open the app:**
+   Visit `http://localhost:5173`

## API
@@ -130,6 +160,13 @@ make lint # run linters
make test # run tests
```

+## Known Limitations
+
+- **No production deployment config** — docker-compose is development-oriented; nginx and a production Dockerfile are not included
+- **Chrome extension** — functional but not published to the Chrome Web Store
+- **YouTube quota** — the YouTube Data API v3 has daily quota limits; high-traffic sessions may hit them
+- **Single-region** — no multi-region or horizontal scaling configuration
+
## License

MIT
diff --git a/alloy/config.alloy b/alloy/config.alloy
new file mode 100644
index 0000000..dd397f3
--- /dev/null
+++ b/alloy/config.alloy
@@ -0,0 +1,22 @@
+prometheus.scrape "fastapi" {
+  targets = [{
+    __address__ = "localhost:8000",
+  }]
+  metrics_path    = "/metrics"
+  scrape_interval = "15s"
+  forward_to      = [prometheus.remote_write.grafana_cloud.receiver]
+}
+
+prometheus.remote_write "grafana_cloud" {
+  endpoint {
+    url = sys.env("GCLOUD_HOSTED_METRICS_URL")
+    basic_auth {
+      username = sys.env("GCLOUD_HOSTED_METRICS_ID")
+      password = sys.env("GCLOUD_RW_API_KEY")
+    }
+  }
+  external_labels = {
+    job         = "ai_doubt_manager",
+    environment = "development",
+  }
+}
diff --git a/backend/alembic/versions/6f04ebe5f0fb_add_hnsw_indexes_comments_rag_documents.py b/backend/alembic/versions/6f04ebe5f0fb_add_hnsw_indexes_comments_rag_documents.py
new file mode 100644
index 0000000..3ce0cfe
--- /dev/null
+++ b/backend/alembic/versions/6f04ebe5f0fb_add_hnsw_indexes_comments_rag_documents.py
@@ -0,0 +1,35 @@
+"""add hnsw indexes to comments and rag_documents embedding columns
+
+Revision ID: 6f04ebe5f0fb
+Revises: d4e5f6a7b8c9
+Create Date: 2026-03-15 00:00:00.000000
+
+"""
+
+from alembic import op
+
+# revision identifiers, used by Alembic.
+revision = "6f04ebe5f0fb"
+down_revision = "d4e5f6a7b8c9"
+branch_labels = None
+depends_on = None
+
+
+def upgrade() -> None:
+    op.execute("""
+        CREATE INDEX IF NOT EXISTS idx_comments_embedding_hnsw
+        ON comments
+        USING hnsw (embedding vector_cosine_ops)
+        WITH (m = 16, ef_construction = 64)
+    """)
+    op.execute("""
+        CREATE INDEX IF NOT EXISTS idx_rag_documents_embedding_hnsw
+        ON rag_documents
+        USING hnsw (embedding vector_cosine_ops)
+        WITH (m = 16, ef_construction = 64)
+    """)
+
+
+def downgrade() -> None:
+    op.execute("DROP INDEX IF EXISTS idx_rag_documents_embedding_hnsw")
+    op.execute("DROP INDEX IF EXISTS idx_comments_embedding_hnsw")
diff --git a/backend/alembic/versions/6fe440076f64_recreate_clusters_centroid_hnsw_with_params.py b/backend/alembic/versions/6fe440076f64_recreate_clusters_centroid_hnsw_with_params.py
new file mode 100644
index 0000000..a4a2e99
--- /dev/null
+++ b/backend/alembic/versions/6fe440076f64_recreate_clusters_centroid_hnsw_with_params.py
@@ -0,0 +1,34 @@
+"""recreate clusters centroid hnsw index with tuning params
+
+Revision ID: 6fe440076f64
+Revises: 6f04ebe5f0fb
+Create Date: 2026-03-15 00:00:00.000000
+
+"""
+
+from alembic import op
+
+# revision identifiers, used by Alembic.
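+# Note: m = 16 and ef_construction = 64 below are pgvector's documented HNSW defaults, written out explicitly.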
+revision = "6fe440076f64" +down_revision = "6f04ebe5f0fb" +branch_labels = None +depends_on = None + + +def upgrade() -> None: + op.execute("DROP INDEX IF EXISTS clusters_centroid_hnsw_idx") + op.execute(""" + CREATE INDEX IF NOT EXISTS idx_clusters_centroid_embedding_hnsw + ON clusters + USING hnsw (centroid_embedding vector_cosine_ops) + WITH (m = 16, ef_construction = 64) + """) + + +def downgrade() -> None: + op.execute("DROP INDEX IF EXISTS idx_clusters_centroid_embedding_hnsw") + op.execute(""" + CREATE INDEX IF NOT EXISTS clusters_centroid_hnsw_idx + ON clusters + USING hnsw (centroid_embedding vector_cosine_ops) + """) diff --git a/backend/alembic/versions/c3d4e5f6a7b8_add_hnsw_indexes.py b/backend/alembic/versions/c3d4e5f6a7b8_add_hnsw_indexes.py new file mode 100644 index 0000000..11a7646 --- /dev/null +++ b/backend/alembic/versions/c3d4e5f6a7b8_add_hnsw_indexes.py @@ -0,0 +1,35 @@ +"""add_hnsw_indexes + +Revision ID: c3d4e5f6a7b8 +Revises: b2c3d4e5f6a7 +Create Date: 2026-03-09 00:00:00.000000 + +""" + +from alembic import op + +# revision identifiers, used by Alembic. +revision = "c3d4e5f6a7b8" +down_revision = "b2c3d4e5f6a7" +branch_labels = None +depends_on = None + + +def upgrade() -> None: + op.execute(""" + CREATE INDEX IF NOT EXISTS idx_comments_embedding_hnsw + ON comments + USING hnsw (embedding vector_l2_ops) + WITH (m = 16, ef_construction = 64) + """) + op.execute(""" + CREATE INDEX IF NOT EXISTS idx_rag_documents_embedding_hnsw + ON rag_documents + USING hnsw (embedding vector_l2_ops) + WITH (m = 16, ef_construction = 64) + """) + + +def downgrade() -> None: + op.execute("DROP INDEX IF EXISTS idx_rag_documents_embedding_hnsw") + op.execute("DROP INDEX IF EXISTS idx_comments_embedding_hnsw") diff --git a/backend/alembic/versions/d4e5f6a7b8c9_add_clusters_centroid_hnsw.py b/backend/alembic/versions/d4e5f6a7b8c9_add_clusters_centroid_hnsw.py new file mode 100644 index 0000000..5a78da2 --- /dev/null +++ b/backend/alembic/versions/d4e5f6a7b8c9_add_clusters_centroid_hnsw.py @@ -0,0 +1,27 @@ +"""add clusters centroid hnsw index for cosine similarity + +Revision ID: d4e5f6a7b8c9 +Revises: c3d4e5f6a7b8 +Create Date: 2026-03-12 00:00:00.000000 + +""" + +from alembic import op + +# revision identifiers, used by Alembic. 
+revision = "d4e5f6a7b8c9" +down_revision = "c3d4e5f6a7b8" +branch_labels = None +depends_on = None + + +def upgrade() -> None: + op.execute(""" + CREATE INDEX IF NOT EXISTS clusters_centroid_hnsw_idx + ON clusters + USING hnsw (centroid_embedding vector_cosine_ops) + """) + + +def downgrade() -> None: + op.execute("DROP INDEX IF EXISTS clusters_centroid_hnsw_idx") diff --git a/backend/app/api/v1/dashboard.py b/backend/app/api/v1/dashboard.py index 4f1830d..23f7cec 100644 --- a/backend/app/api/v1/dashboard.py +++ b/backend/app/api/v1/dashboard.py @@ -1,6 +1,7 @@ """Teacher dashboard API routes.""" import logging +import re from datetime import ( datetime, timezone, @@ -32,6 +33,8 @@ BaseModel, Field, ) +from sqlalchemy import update +from sqlalchemy.exc import IntegrityError from sqlalchemy.orm import Session router = APIRouter(prefix="/dashboard", tags=["dashboard"]) @@ -70,7 +73,7 @@ async def submit_manual_question( if not session: raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail="Session not found") - texts = [t.strip() for t in payload.text.split("\n") if t.strip()] + texts = [re.sub(r"<[^>]+>", "", t).strip() for t in payload.text.split("\n") if t.strip()] created_count = 0 manager = QueueManager() @@ -82,7 +85,11 @@ async def submit_manual_question( text=text, ) db.add(comment) - db.flush() + try: + db.flush() + except IntegrityError: + db.rollback() + raise HTTPException(status_code=status.HTTP_409_CONFLICT, detail="Duplicate question submission.") manager.enqueue( QUEUE_CLASSIFICATION, ClassificationPayload( @@ -125,8 +132,18 @@ async def approve_answer( raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail="Answer not found") answer, cluster, session = result - if answer.is_posted: - raise HTTPException(status_code=status.HTTP_400_BAD_REQUEST, detail="Already posted") + + rows_updated = db.execute( + update(Answer) + .where(Answer.id == answer_id, Answer.is_posted == False) # noqa: E712 + .values(is_posted=True, posted_at=datetime.now(timezone.utc)) + ).rowcount + + if rows_updated == 0: + raise HTTPException(status_code=status.HTTP_409_CONFLICT, detail="Already approved") + + db.commit() + db.refresh(answer) yt_token = db.query(YouTubeToken).filter(YouTubeToken.teacher_id == current_user.id).first() @@ -140,16 +157,11 @@ async def approve_answer( ).to_dict(), ) logger.info(f"Enqueued answer {answer_id} for YouTube posting") - else: - answer.is_posted = True - answer.posted_at = datetime.now(timezone.utc) - db.commit() - db.refresh(answer) return answer -@router.post("/answers/{answer_id}/edit", response_model=AnswerResponse) +@router.patch("/answers/{answer_id}", response_model=AnswerResponse) async def edit_answer( answer_id: UUID, payload: AnswerUpdate, @@ -217,3 +229,48 @@ async def get_session_stats( "answers_generated": answers_generated, "answers_posted": answers_posted, } + + +@router.get("/clusters/{cluster_id}/representative") +async def get_representative_question( + cluster_id: UUID, + current_user: Teacher = Depends(get_current_active_user), + db: Session = Depends(get_db), +) -> dict: + """Return the comment whose embedding is closest to the cluster centroid.""" + from sqlalchemy import text as sa_text + + cluster = ( + db.query(Cluster) + .join(StreamingSession, Cluster.session_id == StreamingSession.id) + .filter( + Cluster.id == cluster_id, + StreamingSession.teacher_id == current_user.id, + ) + .first() + ) + if not cluster: + raise HTTPException(status_code=404, detail="Cluster not found") + if cluster.centroid_embedding is None: + 
+        raise HTTPException(status_code=404, detail="No centroid available")
+
+    centroid_str = "[" + ",".join(str(v) for v in cluster.centroid_embedding) + "]"
+
+    row = db.execute(
+        sa_text("""
+            SELECT c.id, c.text,
+                   1 - (c.embedding <=> CAST(:centroid AS vector)) AS similarity
+            FROM comments c
+            WHERE c.cluster_id = :cluster_id
+              AND c.is_question = TRUE
+              AND c.embedding IS NOT NULL
+            ORDER BY c.embedding <=> CAST(:centroid AS vector)
+            LIMIT 1
+        """),
+        {"centroid": centroid_str, "cluster_id": str(cluster_id)},
+    ).first()
+
+    if not row:
+        raise HTTPException(status_code=404, detail="No representative question found")
+
+    return {"comment_id": str(row.id), "text": row.text, "similarity": float(row.similarity)}
diff --git a/backend/app/api/v1/metrics.py b/backend/app/api/v1/metrics.py
index 080a5b4..9e2fd4c 100644
--- a/backend/app/api/v1/metrics.py
+++ b/backend/app/api/v1/metrics.py
@@ -2,6 +2,7 @@
from app.core.security import get_current_active_user
from app.db.models.answer import Answer
+from app.db.models.cluster import Cluster
from app.db.models.comment import Comment
from app.db.models.streaming_session import StreamingSession
from app.db.models.teacher import Teacher
@@ -20,13 +21,37 @@ async def get_metrics(
    current_user: Teacher = Depends(get_current_active_user),
    db: Session = Depends(get_db),
) -> dict:
-    """Get system metrics. Requires authentication.
+    """Get metrics scoped to current teacher. Requires authentication.

    Returns:
        Dict with active_sessions, questions_processed, and answers_generated counts.
    """
+    active_sessions = (
+        db.query(StreamingSession)
+        .filter(
+            StreamingSession.teacher_id == current_user.id,
+            StreamingSession.is_active.is_(True),
+        )
+        .count()
+    )
+
+    questions_processed = (
+        db.query(Comment)
+        .join(StreamingSession, Comment.session_id == StreamingSession.id)
+        .filter(StreamingSession.teacher_id == current_user.id)
+        .count()
+    )
+
+    answers_generated = (
+        db.query(Answer)
+        .join(Cluster, Answer.cluster_id == Cluster.id)
+        .join(StreamingSession, Cluster.session_id == StreamingSession.id)
+        .filter(StreamingSession.teacher_id == current_user.id)
+        .count()
+    )
+
    return {
-        "active_sessions": db.query(StreamingSession).filter(StreamingSession.is_active.is_(True)).count(),
-        "questions_processed": db.query(Comment).count(),
-        "answers_generated": db.query(Answer).count(),
+        "active_sessions": active_sessions,
+        "questions_processed": questions_processed,
+        "answers_generated": answers_generated,
    }
diff --git a/backend/app/api/v1/websocket.py b/backend/app/api/v1/websocket.py
index 46aca60..d789f93 100644
--- a/backend/app/api/v1/websocket.py
+++ b/backend/app/api/v1/websocket.py
@@ -41,19 +41,31 @@
    try:
        raw = await websocket.receive_text()
        first_msg = json.loads(raw)
-    except (json.JSONDecodeError, Exception):
-        await websocket.close(code=4001, reason="Auth message required")
+    except WebSocketDisconnect:
+        manager.disconnect(session_id, conn_id)
+        return
+    except Exception:
+        try:
+            await websocket.close(code=4001, reason="Auth message required")
+        except Exception:
+            pass
        manager.disconnect(session_id, conn_id)
        return

    if first_msg.get("type") != "auth" or not first_msg.get("token"):
-        await websocket.close(code=4001, reason="Auth message required")
+        try:
+            await websocket.close(code=4001, reason="Auth message required")
+        except Exception:
+            pass
        manager.disconnect(session_id, conn_id)
        return

    payload = verify_token(first_msg["token"])
    if not payload:
-        await websocket.close(code=4001, reason="Invalid token")
+        try:
+            await websocket.close(code=4001, reason="Invalid token")
+        except Exception:
+            pass
        manager.disconnect(session_id, conn_id)
        return
@@ -61,7 +73,10 @@
    try:
        session_obj = db.query(StreamingSession).filter(StreamingSession.id == session_id).first()
        if not session_obj or str(session_obj.teacher_id) != payload.get("sub"):
-            await websocket.close(code=4003, reason="Forbidden")
+            try:
+                await websocket.close(code=4003, reason="Forbidden")
+            except Exception:
+                pass
            manager.disconnect(session_id, conn_id)
            return
    finally:
@@ -103,3 +118,7 @@
        logger.error(f"WebSocket error: {e}")
        if conn_id:
            manager.disconnect(session_id, conn_id)
+        try:
+            await websocket.close(code=1011)
+        except Exception:
+            pass
diff --git a/backend/app/api/v1/youtube.py b/backend/app/api/v1/youtube.py
index 6d0105e..ed46673 100644
--- a/backend/app/api/v1/youtube.py
+++ b/backend/app/api/v1/youtube.py
@@ -105,8 +105,6 @@ async def oauth_callback(
        )

    data = json.loads(state_data_raw)
-    _redis.delete(f"yt_state:{state}")
-    _redis.delete(f"yt_state_teacher:{data['teacher_id']}")

    oauth_service = YouTubeOAuthService()
    try:
@@ -142,6 +140,10 @@
    db.commit()
    logger.info(f"YouTube token stored for teacher {teacher_id}")

+    # Delete Redis state after successful DB commit — if this fails, keys expire via TTL
+    _redis.delete(f"yt_state:{state}")
+    _redis.delete(f"yt_state_teacher:{data['teacher_id']}")
+
    return HTMLResponse(content=_OAUTH_SUCCESS_HTML)


@@ -158,9 +160,17 @@ async def refresh_token(
            detail="No YouTube token found",
        )

+    try:
+        decrypted_refresh = decrypt_data(token.refresh_token)
+    except Exception:
+        raise HTTPException(
+            status_code=status.HTTP_400_BAD_REQUEST,
+            detail="YouTube token is invalid or corrupted. Please reconnect your YouTube account.",
+        )
+
    oauth_service = YouTubeOAuthService()
    try:
-        refreshed = oauth_service.refresh_token(decrypt_data(token.refresh_token))
+        refreshed = oauth_service.refresh_token(decrypted_refresh)
    except Exception as e:
        logger.error(f"Token refresh failed: {e}")
        raise HTTPException(
@@ -219,7 +229,14 @@ async def get_video_info(
            detail="YouTube not connected",
        )

-    access_token = decrypt_data(token.access_token)
+    try:
+        access_token = decrypt_data(token.access_token)
+    except Exception:
+        raise HTTPException(
+            status_code=status.HTTP_400_BAD_REQUEST,
+            detail="YouTube token is invalid or corrupted. Please reconnect your YouTube account.",
+        )
+
    client = YouTubeClient(access_token)
    try:
        info = client.get_video_info(video_id)
@@ -249,7 +266,14 @@ async def validate_video(
    if not token:
        return {"valid": False, "is_live": False, "title": ""}

-    access_token = decrypt_data(token.access_token)
+    try:
+        access_token = decrypt_data(token.access_token)
+    except Exception:
+        raise HTTPException(
+            status_code=status.HTTP_400_BAD_REQUEST,
+            detail="YouTube token is invalid or corrupted. Please reconnect your YouTube account.",
+        )
+
    client = YouTubeClient(access_token)
    try:
        info = client.get_video_info(video_id)
diff --git a/backend/app/core/config.py b/backend/app/core/config.py
index 5956279..607ab1a 100644
--- a/backend/app/core/config.py
+++ b/backend/app/core/config.py
@@ -16,6 +16,15 @@
    SettingsConfigDict,
)

+from workers.common.queue import (
+    QUEUE_ANSWER_GENERATION,
+    QUEUE_CLASSIFICATION,
+    QUEUE_CLUSTERING,
+    QUEUE_COMMENT_INGEST,
+    QUEUE_EMBEDDING,
+    QUEUE_YOUTUBE_POSTING,
+)
+

class Settings(BaseSettings):
    """Application settings loaded from environment variables."""
@@ -88,18 +97,35 @@ def validate_encryption_key(cls, v: str) -> str:
    default_monthly_session_limit: int = 30

    # Worker queue names
-    queue_comment_ingest: str = "comment_ingest"
-    queue_classification: str = "classification"
-    queue_embedding: str = "embedding"
-    queue_clustering: str = "clustering"
-    queue_answer_generation: str = "answer_generation"
+    queue_comment_ingest: str = QUEUE_COMMENT_INGEST
+    queue_classification: str = QUEUE_CLASSIFICATION
+    queue_embedding: str = QUEUE_EMBEDDING
+    queue_clustering: str = QUEUE_CLUSTERING
+    queue_answer_generation: str = QUEUE_ANSWER_GENERATION
+    queue_youtube_posting: str = QUEUE_YOUTUBE_POSTING
+
+    # Worker thresholds
+    classification_confidence_threshold: float = 0.4
+    clustering_similarity_threshold: float = 0.65

    # Gemini AI
    gemini_api_key: str = Field(default="", description="Gemini API key")
+
+    @field_validator("gemini_api_key")
+    @classmethod
+    def validate_gemini_api_key(cls, v: str) -> str:
+        if not v or not v.strip():
+            raise ValueError("gemini_api_key must be set — Gemini workers cannot function without it")
+        return v
+
    gemini_model: str = "gemini-2.5-flash"
    gemini_embedding_model: str = "gemini-embedding-001"
    clustering_threshold: int = Field(default=5, description="Questions needed to trigger clustering")

+    # Mock / Testing
+    mock_youtube: bool = False
+    mock_message_interval: float = 2.0
+
    # Logging
    log_level: str = "INFO"
    log_json: bool = False
diff --git a/backend/app/core/metrics.py b/backend/app/core/metrics.py
index 166139e..e6c16eb 100644
--- a/backend/app/core/metrics.py
+++ b/backend/app/core/metrics.py
@@ -1,15 +1,23 @@
"""Prometheus metrics for observability."""

-from app.core.config import settings
-from prometheus_client import (
+import os
+
+# Must be set BEFORE importing prometheus_client for multiprocess mode
+os.environ.setdefault("PROMETHEUS_MULTIPROC_DIR", "/tmp/prometheus_multiproc")
+os.makedirs(os.environ["PROMETHEUS_MULTIPROC_DIR"], exist_ok=True)
+
+from app.core.config import settings  # noqa: E402
+from prometheus_client import (  # noqa: E402
    CONTENT_TYPE_LATEST,
+    CollectorRegistry,
    Counter,
    Gauge,
    Histogram,
    generate_latest,
+    multiprocess,
)
-from starlette.requests import Request
-from starlette.responses import Response
+from starlette.requests import Request  # noqa: E402
+from starlette.responses import Response  # noqa: E402

http_requests_total = Counter("http_requests_total", "Total HTTP requests", ["method", "endpoint", "status"])
@@ -18,7 +26,10 @@
)

websocket_connections_active = Gauge(
-    "websocket_connections_active", "Number of active WebSocket connections", ["session_id"]
+    "websocket_connections_active",
+    "Number of active WebSocket connections",
+    ["session_id"],
+    multiprocess_mode="liveall",
)

websocket_messages_total = Counter("websocket_messages_total", "Total WebSocket messages", ["type", "direction"])
@@ -31,30 +42,34 @@
redis_operations_total = Counter("redis_operations_total", "Total Redis operations", ["operation"])

-queue_size = Gauge("queue_size", "Number of items in queue", ["queue_name"])
+queue_size = Gauge("queue_size", "Number of items in queue", ["queue_name"], multiprocess_mode="liveall")

queue_processed_total = Counter("queue_processed_total", "Total queue items processed", ["queue_name", "status"])

-worker_heartbeat = Gauge("worker_heartbeat", "Worker last heartbeat timestamp", ["worker_name"])
+worker_heartbeat = Gauge(
+    "worker_heartbeat", "Worker last heartbeat timestamp", ["worker_name"], multiprocess_mode="liveall"
+)

-quota_usage = Gauge("quota_usage", "Quota usage", ["teacher_id", "quota_type"])
+quota_usage = Gauge("quota_usage", "Quota usage", ["teacher_id", "quota_type"], multiprocess_mode="liveall")

-quota_limit = Gauge("quota_limit", "Quota limit", ["teacher_id", "quota_type"])
+quota_limit = Gauge("quota_limit", "Quota limit", ["teacher_id", "quota_type"], multiprocess_mode="liveall")


async def metrics_endpoint(request: Request) -> Response:
-    """Prometheus metrics endpoint.
+    """Prometheus metrics endpoint using multiprocess collector.

    Args:
        request: Incoming request.

    Returns:
-        Metrics response.
+        Metrics response in Prometheus text format.
    """
    if not settings.enable_metrics:
        return Response("Metrics disabled", status_code=404)

-    metrics_data = generate_latest()
+    registry = CollectorRegistry()
+    multiprocess.MultiProcessCollector(registry)
+    metrics_data = generate_latest(registry)
    return Response(content=metrics_data, media_type=CONTENT_TYPE_LATEST)
diff --git a/backend/app/core/middleware.py b/backend/app/core/middleware.py
index de35bfc..63f25dd 100644
--- a/backend/app/core/middleware.py
+++ b/backend/app/core/middleware.py
@@ -9,6 +9,10 @@
)

from app.core.logging import get_logger
+from app.core.metrics import (
+    increment_http_requests,
+    observe_request_duration,
+)
from fastapi import (
    Request,
    Response,
@@ -65,6 +69,9 @@ async def dispatch(self, request: Request, call_next: Callable) -> Response:
            response.headers["X-Request-ID"] = request_id
            response.headers["X-Process-Time"] = str(process_time)

+            increment_http_requests(request.method, request.url.path, response.status_code)
+            observe_request_duration(request.method, request.url.path, process_time)
+
            logger.info(
                "Request completed",
                extra={
@@ -80,6 +87,8 @@
        except Exception as e:
            process_time = time.time() - start_time
+            increment_http_requests(request.method, request.url.path, 500)
+            observe_request_duration(request.method, request.url.path, process_time)
            logger.error(
                f"Request failed: {str(e)}",
                extra={
diff --git a/backend/app/db/models/migrations/__init__.py b/backend/app/db/models/migrations/__init__.py
index d4f52dc..fd8058a 100644
--- a/backend/app/db/models/migrations/__init__.py
+++ b/backend/app/db/models/migrations/__init__.py
@@ -1,2 +1 @@
"""Migrations directory."""
-
diff --git a/backend/app/main.py b/backend/app/main.py
index 14a3eca..8a550cb 100644
--- a/backend/app/main.py
+++ b/backend/app/main.py
@@ -7,11 +7,10 @@
"""FastAPI application main entry point."""

import asyncio
-import json
+import glob
import logging
import os

-import redis.asyncio as aioredis
from app.api.v1 import (
    answers,
    auth,
@@ -32,7 +31,10 @@
from app.core.middleware import RequestContextMiddleware
from app.core.rate_limit_middleware import RateLimitMiddleware
from app.services.websocket.manager import manager
-from fastapi import FastAPI
+from fastapi import (
+    FastAPI,
+    Request,
+)
from fastapi.middleware.cors import CORSMiddleware
from fastapi.staticfiles import StaticFiles
@@ -76,26 +78,6 @@
    logger.info(f"Serving frontend from {settings.frontend_dir} at /app")


-async def _relay_redis_events() -> None:
-    """Subscribe to worker-published Redis pub/sub events and relay via WebSocket."""
-    try:
-        r = aioredis.from_url(settings.redis_url, decode_responses=True)
-        pubsub = r.pubsub()
-        await pubsub.psubscribe("ws:session:*")
-        async for message in pubsub.listen():
-            if message["type"] != "pmessage":
-                continue
-            channel = message["channel"]  # "ws:session:{session_id}"
-            session_id = channel.split(":")[-1]
-            try:
-                event = json.loads(message["data"])
-                await manager.broadcast_to_session(session_id, event)
-            except Exception as e:
-                logger.error(f"Failed to relay Redis event for session {session_id}: {e}")
-    except Exception as e:
-        logger.error(f"Redis relay error: {e}")
-
-
@app.get("/")
async def root() -> dict:
    """Root endpoint."""
@@ -118,11 +100,8 @@ async def health() -> dict:

@app.get("/metrics")
-async def metrics():
+async def metrics(request: Request):
    """Prometheus metrics endpoint."""
-    from starlette.requests import Request
-
-    request = Request(scope={"type": "http"})
    return await metrics_endpoint(request)
@@ -133,11 +112,17 @@
async def startup_event():
    """Application startup event."""
    global _relay_task
+
+    # Clear stale multiprocess metric files from previous runs
+    multiproc_dir = os.environ.get("PROMETHEUS_MULTIPROC_DIR", "/tmp/prometheus_multiproc")
+    for f in glob.glob(os.path.join(multiproc_dir, "*.db")):
+        os.unlink(f)
+
    logger.info(
        f"Starting {settings.app_name} v{settings.app_version}",
        extra={"environment": settings.environment, "debug": settings.debug},
    )
-    _relay_task = asyncio.create_task(_relay_redis_events())
+    _relay_task = asyncio.create_task(manager.start_subscriber())


@app.on_event("shutdown")
diff --git a/backend/app/services/gemini/circuit_breaker.py b/backend/app/services/gemini/circuit_breaker.py
new file mode 100644
index 0000000..3a9960d
--- /dev/null
+++ b/backend/app/services/gemini/circuit_breaker.py
@@ -0,0 +1,76 @@
+"""Circuit breaker for Gemini API calls."""
+
+from __future__ import annotations
+
+import logging
+import time
+
+logger = logging.getLogger(__name__)
+
+
+class CircuitOpenError(Exception):
+    """Raised when circuit breaker is open — Gemini calls blocked."""
+
+    pass
+
+
+class GeminiCircuitBreaker:
+    """Per-process circuit breaker that fails fast during sustained Gemini outages."""
+
+    def __init__(
+        self,
+        failure_threshold: int = 5,
+        recovery_timeout: float = 30.0,
+        state_change_callback: callable | None = None,
+    ):
+        self._failure_threshold = failure_threshold
+        self._recovery_timeout = recovery_timeout
+        self._failure_count = 0
+        self._state = "closed"
+        self._opened_at = None
+        self._state_change_callback = state_change_callback
+
+    @property
+    def state(self) -> str:
+        """Returns 'closed', 'open', or 'half_open'."""
+        if self._state == "open" and time.monotonic() - self._opened_at >= self._recovery_timeout:
+            return "half_open"
+        return self._state
+
+    def record_success(self) -> None:
+        """Reset failure count, close circuit."""
+        was_open = self._state != "closed"
+        self._failure_count = 0
+        self._state = "closed"
+        self._opened_at = None
+        if was_open:
+            logger.info("Gemini circuit breaker closed after successful probe")
+            if self._state_change_callback:
+                self._state_change_callback(self.state)
+
+    def record_failure(self) -> None:
+        """Increment failure count. Open circuit if threshold reached."""
+        self._failure_count += 1
+        if self._failure_count >= self._failure_threshold and self._state == "closed":
+            self._state = "open"
+            self._opened_at = time.monotonic()
+            logger.warning(
+                "Gemini circuit breaker OPEN after %d consecutive failures. " "Calls blocked for %.0fs.",
+                self._failure_count,
+                self._recovery_timeout,
+            )
+            if self._state_change_callback:
+                self._state_change_callback(self.state)
+        elif self._state == "open" and self.state == "half_open":
+            self._opened_at = time.monotonic()
+            logger.warning("Gemini circuit breaker re-opened after failed probe")
+            if self._state_change_callback:
+                self._state_change_callback(self.state)
+
+    def ensure_closed(self) -> None:
+        """Raise CircuitOpenError if circuit is open. Allow if half_open or closed."""
+        current = self.state
+        if current == "open":
+            raise CircuitOpenError(f"Gemini circuit breaker is open. Retry after {self._recovery_timeout}s.")
+        if current == "half_open":
+            logger.info("Gemini circuit breaker half-open, allowing probe request")
diff --git a/backend/app/services/gemini/client.py b/backend/app/services/gemini/client.py
index caa2f7b..5bb147b 100644
--- a/backend/app/services/gemini/client.py
+++ b/backend/app/services/gemini/client.py
@@ -6,6 +6,10 @@

import numpy as np
from app.core.config import settings
+from app.services.gemini.circuit_breaker import (
+    CircuitOpenError,
+    GeminiCircuitBreaker,
+)
from google import genai
from google.genai import types
from tenacity import (
@@ -28,6 +32,7 @@ class GeminiClient:
    def __init__(self):
        self._client = genai.Client(api_key=settings.gemini_api_key)
        self._semaphore = threading.Semaphore(5)
+        self._circuit_breaker = GeminiCircuitBreaker()

    @retry(stop=stop_after_attempt(3), wait=wait_exponential(min=1, max=10))
    def generate_embedding(self, text: str) -> list[float]:
@@ -36,20 +41,52 @@ def generate_embedding(self, text: str) -> list[float]:
        Note: Google's embedding model requires normalization for dimensions
        other than 3072 to ensure accurate semantic similarity.
        """
-        with self._semaphore:
-            result = self._client.models.embed_content(
-                model=settings.gemini_embedding_model,
-                contents=text,
-                config=types.EmbedContentConfig(output_dimensionality=768),
-            )
-            # Get embedding values
-            embedding_values = result.embeddings[0].values
-
-            # Normalize (required for 768-dim per Google docs)
-            embedding_np = np.array(embedding_values)
-            normed_embedding = embedding_np / np.linalg.norm(embedding_np)
-
-            return normed_embedding.tolist()
+        self._circuit_breaker.ensure_closed()
+        try:
+            with self._semaphore:
+                result = self._client.models.embed_content(
+                    model=settings.gemini_embedding_model,
+                    contents=text,
+                    config=types.EmbedContentConfig(output_dimensionality=768),
+                )
+                # Get embedding values
+                embedding_values = result.embeddings[0].values
+
+                # Normalize (required for 768-dim per Google docs)
+                embedding_np = np.array(embedding_values)
+                normed_embedding = embedding_np / np.linalg.norm(embedding_np)
+
+                self._circuit_breaker.record_success()
+                return normed_embedding.tolist()
+        except CircuitOpenError:
+            raise
+        except Exception:
+            self._circuit_breaker.record_failure()
+            raise
+
+    CLASSIFICATION_SYSTEM_INSTRUCTION = (
+        "You are a Teaching Assistant for a Live Stream. Your job is to identify "
+        '"Student Doubts." A student doubt is any inquiry, confusion, or request '
+        "for clarification. Classify as a question if the student is seeking an "
+        "answer, even if they use informal language or omit question marks."
+    )
+
+    CLASSIFICATION_FEW_SHOT = (
+        "Examples:\n"
+        'Comment: "I dont get the list part" -> {"is_question": true, "confidence": 0.92}\n'
+        'Comment: "Wait, why is that true?" -> {"is_question": true, "confidence": 0.97}\n'
+        'Comment: "Hello from London" -> {"is_question": false, "confidence": 0.95}\n'
+        'Comment: "Can you repeat the last step?" -> {"is_question": true, "confidence": 0.96}\n'
+    )
+
+    CLASSIFICATION_RESPONSE_SCHEMA = {
+        "type": "object",
+        "properties": {
+            "is_question": {"type": "boolean"},
+            "confidence": {"type": "number"},
+        },
+        "required": ["is_question", "confidence"],
+    }

    @retry(stop=stop_after_attempt(3), wait=wait_exponential(min=1, max=10))
    def classify_question(self, text: str) -> dict:
@@ -58,18 +95,31 @@ def classify_question(self, text: str) -> dict:
        Returns:
            dict with keys 'is_question' (bool) and 'confidence' (float 0-1).
        """
-        with self._semaphore:
-            prompt = (
-                f'Is this a question? Return JSON only: {{"is_question": bool, "confidence": float 0-1}}\n'
-                f"Comment: {text}"
-            )
-            response = self._client.models.generate_content(model=settings.gemini_model, contents=prompt)
-            raw = response.text.strip().removeprefix("```json").removesuffix("```").strip()
-            result = json.loads(raw)
-            logger.debug(
-                f"Classified comment: is_question={result.get('is_question')}, confidence={result.get('confidence')}"
-            )
-            return result
+        self._circuit_breaker.ensure_closed()
+        try:
+            with self._semaphore:
+                prompt = f"{self.CLASSIFICATION_FEW_SHOT}\nComment: {text}"
+                response = self._client.models.generate_content(
+                    model=settings.gemini_model,
+                    contents=prompt,
+                    config=types.GenerateContentConfig(
+                        system_instruction=self.CLASSIFICATION_SYSTEM_INSTRUCTION,
+                        response_mime_type="application/json",
+                        response_schema=self.CLASSIFICATION_RESPONSE_SCHEMA,
+                    ),
+                )
+                result = json.loads(response.text)
+                logger.debug(
+                    f"Classified comment: is_question={result.get('is_question')}, "
+                    f"confidence={result.get('confidence')}"
+                )
+                self._circuit_breaker.record_success()
+                return result
+        except CircuitOpenError:
+            raise
+        except Exception:
+            self._circuit_breaker.record_failure()
+            raise

    @retry(stop=stop_after_attempt(3), wait=wait_exponential(min=1, max=10))
    def generate_answer(self, question: str, context: str | None) -> str:
@@ -82,21 +132,54 @@ def generate_answer(self, question: str, context: str | None) -> str:
        Returns:
            Answer text.
        """
-        with self._semaphore:
-            if context:
+        self._circuit_breaker.ensure_closed()
+        try:
+            with self._semaphore:
+                if context:
+                    prompt = (
+                        f"You are a teaching assistant answering student questions during a live class.\n"
+                        f"Answer concisely and clearly using only the provided context.\n\n"
+                        f"Context:\n{context}\n\n"
+                        f"Question(s):\n{question}"
+                    )
+                else:
+                    prompt = (
+                        f"You are a teaching assistant answering student questions during a live class.\n"
+                        f"No teacher-uploaded context is available. Answer concisely and clearly "
+                        f"using your general knowledge.\n\n"
+                        f"Question(s):\n{question}"
+                    )
+                response = self._client.models.generate_content(model=settings.gemini_model, contents=prompt)
+                logger.debug("Answer generated successfully")
+                self._circuit_breaker.record_success()
+                return response.text
+        except CircuitOpenError:
+            raise
+        except Exception:
+            self._circuit_breaker.record_failure()
+            raise
+
+    @retry(stop=stop_after_attempt(3), wait=wait_exponential(min=1, max=10))
+    def summarize_cluster(self, questions: list[str]) -> str:
+        """Summarize a cluster of questions in 8 words or fewer."""
+        self._circuit_breaker.ensure_closed()
+        try:
+            with self._semaphore:
+                joined = "\n".join(f"- {q}" for q in questions)
                prompt = (
-                    f"You are a teaching assistant answering student questions during a live class.\n"
-                    f"Answer concisely and clearly using only the provided context.\n\n"
-                    f"Context:\n{context}\n\n"
-                    f"Question(s):\n{question}"
+                    "Summarize what these questions are asking in 8 words or less. "
+                    "Return only the summary, no punctuation.\n\n"
+                    f"{joined}"
                )
-            else:
-                prompt = (
-                    f"You are a teaching assistant answering student questions during a live class.\n"
-                    f"No teacher-uploaded context is available. Answer concisely and clearly "
-                    f"using your general knowledge.\n\n"
-                    f"Question(s):\n{question}"
+                response = self._client.models.generate_content(
+                    model=settings.gemini_model,
+                    contents=prompt,
+                    config=types.GenerateContentConfig(max_output_tokens=20),
                )
-            response = self._client.models.generate_content(model=settings.gemini_model, contents=prompt)
-            logger.debug("Answer generated successfully")
-            return response.text
+                self._circuit_breaker.record_success()
+                return response.text.strip()
+        except CircuitOpenError:
+            raise
+        except Exception:
+            self._circuit_breaker.record_failure()
+            raise
diff --git a/backend/app/services/moderation.py b/backend/app/services/moderation.py
index 999ad4b..f055c02 100644
--- a/backend/app/services/moderation.py
+++ b/backend/app/services/moderation.py
@@ -1,35 +1,117 @@
-"""Content moderation service."""
+"""Content moderation service using Gemini AI."""

+import json
+import logging
from typing import Optional

+from app.core.config import settings
+from app.services.gemini.client import GeminiClient
+from google.genai import types
+
+logger = logging.getLogger(__name__)
+
+MODERATION_SYSTEM_INSTRUCTION = (
+    "You are a content moderator for an educational platform where students ask "
+    "questions to teachers during live YouTube sessions. "
+    "Your job is to identify content that is inappropriate for an academic setting."
+)
+
+COMMENT_MODERATION_SCHEMA = {
+    "type": "object",
+    "properties": {
+        "approved": {"type": "boolean"},
+        "reason": {"type": "string"},
+        "category": {
+            "type": "string",
+            "enum": ["safe", "spam", "offensive", "harmful", "irrelevant"],
+        },
+    },
+    "required": ["approved", "reason", "category"],
+}
+
+COMMENT_MODERATION_PROMPT = """Analyze this student comment from a live educational stream.
+
+Comment: "{text}"
+
+Approve if: genuine academic question or statement, non-English content, minor typos, informal language.
+Reject if: profanity, personal attacks, spam or promotional content, self-harm, explicit content.
+
+Respond only with JSON."""
+
+ANSWER_MODERATION_PROMPT = """Analyze this AI-generated answer that will be posted publicly to YouTube on behalf of a teacher.
+
+Answer: "{text}"
+
+Approve if: factual academic content, clear explanation, appropriate tone.
+Reject if: harmful advice, offensive language, factual content that could cause harm if wrong.
+
+Respond only with JSON."""
+

class ModerationService:
-    """Service for content moderation."""
+    """Service for content moderation using Gemini AI."""

    def __init__(self):
-        """Initialize moderation service."""
-        pass
+        self._gemini = GeminiClient()

    def moderate_comment(self, text: str) -> tuple[bool, Optional[str]]:
-        """Moderate a comment for inappropriate content.
-
-        Args:
-            text: Comment text to moderate.
+        """Moderate a student comment for inappropriate content.

        Returns:
            Tuple of (is_safe, reason_if_unsafe).
+            On any Gemini failure, approves by default to avoid blocking the pipeline.
        """
-        # TODO: Implement actual moderation logic
-        return (True, None)
+        try:
+            prompt = COMMENT_MODERATION_PROMPT.format(text=text)
+            response = self._gemini._client.models.generate_content(
+                model=settings.gemini_model,
+                contents=prompt,
+                config=types.GenerateContentConfig(
+                    system_instruction=MODERATION_SYSTEM_INSTRUCTION,
+                    response_mime_type="application/json",
+                    response_schema=COMMENT_MODERATION_SCHEMA,
+                ),
+            )
+            result = json.loads(response.text)
+            approved = result.get("approved", True)
+            reason = result.get("reason") if not approved else None
+            category = result.get("category", "safe")
+            logger.info(
+                "Comment moderation result",
+                extra={"approved": approved, "category": category, "reason": reason},
+            )
+            return (approved, reason)
+        except Exception as e:
+            logger.error(f"Moderation failed for comment, approving by default: {e}")
+            return (True, None)

    def moderate_answer(self, text: str) -> tuple[bool, Optional[str]]:
-        """Moderate an answer for inappropriate content.
-
-        Args:
-            text: Answer text to moderate.
+        """Moderate an AI-generated answer before it is posted to YouTube.

        Returns:
            Tuple of (is_safe, reason_if_unsafe).
+            On any Gemini failure, approves by default to avoid blocking the pipeline.
        """
-        # TODO: Implement actual moderation logic
-        return (True, None)
+        try:
+            prompt = ANSWER_MODERATION_PROMPT.format(text=text)
+            response = self._gemini._client.models.generate_content(
+                model=settings.gemini_model,
+                contents=prompt,
+                config=types.GenerateContentConfig(
+                    system_instruction=MODERATION_SYSTEM_INSTRUCTION,
+                    response_mime_type="application/json",
+                    response_schema=COMMENT_MODERATION_SCHEMA,
+                ),
+            )
+            result = json.loads(response.text)
+            approved = result.get("approved", True)
+            reason = result.get("reason") if not approved else None
+            category = result.get("category", "safe")
+            logger.info(
+                "Answer moderation result",
+                extra={"approved": approved, "category": category, "reason": reason},
+            )
+            return (approved, reason)
+        except Exception as e:
+            logger.error(f"Moderation failed for answer, approving by default: {e}")
+            return (True, None)
diff --git a/backend/app/services/rag/document_service.py b/backend/app/services/rag/document_service.py
index 16c9430..d382928 100644
--- a/backend/app/services/rag/document_service.py
+++ b/backend/app/services/rag/document_service.py
@@ -103,7 +103,12 @@ async def upload_document(
    base_title = file.filename or "document"

    for i, chunk in enumerate(chunks):
-        embedding = gemini.generate_embedding(chunk)
+        try:
+            embedding = gemini.generate_embedding(chunk)
+        except Exception as e:
+            logger.error(f"Embedding generation failed at chunk {i + 1}/{len(chunks)}: {e}")
+            db.rollback()
+            raise HTTPException(status_code=502, detail="Embedding generation failed. Please try again.")
        doc = RAGDocument(
            teacher_id=teacher_id,
            title=f"{base_title} (chunk {i + 1}/{len(chunks)})",
diff --git a/backend/app/services/sessions/__init__.py b/backend/app/services/sessions/__init__.py
deleted file mode 100644
index df2ca2f..0000000
--- a/backend/app/services/sessions/__init__.py
+++ /dev/null
@@ -1 +0,0 @@
-"""Sessions services package."""
diff --git a/backend/app/services/sessions/lifecycle.py b/backend/app/services/sessions/lifecycle.py
deleted file mode 100644
index 4f52018..0000000
--- a/backend/app/services/sessions/lifecycle.py
+++ /dev/null
@@ -1,55 +0,0 @@
-"""Streaming session lifecycle management."""
-
-from typing import Optional
-
-
-class SessionLifecycleService:
-    """Service for managing streaming session lifecycle."""
-
-    def __init__(self):
-        """Initialize session lifecycle service."""
-        pass
-
-    def create_session(self, teacher_id: int, youtube_video_id: str, title: Optional[str] = None) -> dict:
-        """Create a new streaming session.
-
-        Args:
-            teacher_id: Teacher ID.
-            youtube_video_id: YouTube video ID.
-            title: Optional session title.
-
-        Returns:
-            Session data dictionary.
-        """
-        # TODO: Implement actual session creation
-        return {
-            "id": 1,
-            "teacher_id": teacher_id,
-            "youtube_video_id": youtube_video_id,
-            "title": title,
-            "is_active": True,
-        }
-
-    def end_session(self, session_id: int) -> bool:
-        """End a streaming session.
-
-        Args:
-            session_id: Session ID to end.
-
-        Returns:
-            True if successful, False otherwise.
-        """
-        # TODO: Implement actual session ending
-        return True
-
-    def get_active_session(self, teacher_id: int) -> Optional[dict]:
-        """Get active session for a teacher.
-
-        Args:
-            teacher_id: Teacher ID.
-
-        Returns:
-            Session data dictionary or None if not found.
-        """
-        # TODO: Implement actual session retrieval
-        return None
diff --git a/backend/app/services/sessions/stats.py b/backend/app/services/sessions/stats.py
deleted file mode 100644
index 9c8417c..0000000
--- a/backend/app/services/sessions/stats.py
+++ /dev/null
@@ -1,42 +0,0 @@
-"""Streaming session statistics service."""
-
-
-class SessionStatsService:
-    """Service for calculating session statistics."""
-
-    def __init__(self):
-        """Initialize session stats service."""
-        pass
-
-    def get_session_stats(self, session_id: int) -> dict:
-        """Get statistics for a session.
-
-        Args:
-            session_id: Session ID.
-
-        Returns:
-            Statistics dictionary.
-        """
-        # TODO: Implement actual stats calculation
-        return {
-            "total_comments": 0,
-            "total_questions": 0,
-            "total_clusters": 0,
-            "total_answers": 0,
-        }
-
-    def get_teacher_stats(self, teacher_id: int) -> dict:
-        """Get statistics for a teacher.
-
-        Args:
-            teacher_id: Teacher ID.
-
-        Returns:
-            Statistics dictionary.
- """ - # TODO: Implement actual stats calculation - return { - "total_sessions": 0, - "total_comments": 0, - "total_answers": 0, - } diff --git a/backend/app/services/websocket/events.py b/backend/app/services/websocket/events.py index c2777f3..0709152 100644 --- a/backend/app/services/websocket/events.py +++ b/backend/app/services/websocket/events.py @@ -23,6 +23,7 @@ class WebSocketEventType(str, Enum): COMMENT_CREATED = "comment_created" COMMENT_CLASSIFIED = "comment_classified" + COMMENT_EMBEDDED = "comment_embedded" CLUSTER_CREATED = "cluster_created" CLUSTER_UPDATED = "cluster_updated" @@ -107,6 +108,21 @@ def create_comment_classified_event(self, comment_id: str, is_question: bool, co message=f"Comment classified as {'question' if is_question else 'not a question'}", ) + def create_comment_embedded_event(self, comment_id: str) -> Dict[str, Any]: + """Create a comment embedded event. + + Args: + comment_id: Comment identifier. + + Returns: + Event message dictionary. + """ + return self.create_base_event( + WebSocketEventType.COMMENT_EMBEDDED, + data={"comment_id": comment_id}, + message="Comment embedding generated", + ) + def create_cluster_created_event(self, cluster_data: Dict[str, Any]) -> Dict[str, Any]: """Create a cluster created event. diff --git a/backend/app/services/websocket/manager.py b/backend/app/services/websocket/manager.py index 4130e0b..b531891 100644 --- a/backend/app/services/websocket/manager.py +++ b/backend/app/services/websocket/manager.py @@ -1,7 +1,9 @@ """WebSocket connection manager.""" import asyncio +import json import logging +import uuid from datetime import ( datetime, timezone, @@ -12,6 +14,7 @@ Optional, ) +import redis.asyncio as aioredis from app.core.config import settings from fastapi import ( WebSocket, @@ -45,6 +48,7 @@ def __init__(self): """Initialize WebSocket manager.""" self.active_connections: Dict[str, Dict[str, ConnectionInfo]] = {} self.heartbeat_task: Optional[asyncio.Task] = None + self._redis: Optional[aioredis.Redis] = None async def connect(self, session_id: str, websocket: WebSocket, connection_id: Optional[str] = None) -> str: """Connect a WebSocket to a session. @@ -60,8 +64,6 @@ async def connect(self, session_id: str, websocket: WebSocket, connection_id: Op await websocket.accept() if connection_id is None: - import uuid - connection_id = str(uuid.uuid4()) if session_id not in self.active_connections: @@ -99,6 +101,52 @@ def disconnect(self, session_id: str, connection_id: str) -> None: if not self.active_connections[session_id]: del self.active_connections[session_id] + async def publish(self, session_id: str, message: Dict[str, Any]) -> None: + """Publish a message to Redis channel ws:{session_id}. + + Any subscriber process that owns a connection for this session + will pick it up and deliver it locally. + """ + try: + if self._redis is None: + self._redis = aioredis.from_url(settings.redis_url, decode_responses=True) + await self._redis.publish(f"ws:{session_id}", json.dumps(message)) + except Exception as e: + logger.error(f"Redis publish failed, resetting connection: {e}") + self._redis = None + raise + + async def start_subscriber(self) -> None: + """Subscribe to ws:* and deliver messages to locally held connections. + + Reconnects with exponential backoff on Redis failure. 
+ """ + backoff = 1 + while True: + r = None + try: + r = aioredis.from_url(settings.redis_url, decode_responses=True) + pubsub = r.pubsub() + await pubsub.psubscribe("ws:*") + backoff = 1 + async for message in pubsub.listen(): + if message["type"] != "pmessage": + continue + channel: str = message["channel"] # "ws:{session_id}" + session_id = channel[3:] # strip "ws:" prefix + try: + event = json.loads(message["data"]) + await self.broadcast_to_session(session_id, event) + except Exception as e: + logger.error(f"Failed to deliver WS event for session {session_id}: {e}") + except Exception as e: + logger.error(f"WS subscriber error, reconnecting in {backoff}s: {e}") + await asyncio.sleep(backoff) + backoff = min(backoff * 2, 30) + finally: + if r: + await r.aclose() + async def send_personal_message(self, session_id: str, connection_id: str, message: Dict[str, Any]) -> bool: """Send a message to a specific WebSocket. diff --git a/backend/app/tasks/monitoring.py b/backend/app/tasks/monitoring.py deleted file mode 100644 index a381f89..0000000 --- a/backend/app/tasks/monitoring.py +++ /dev/null @@ -1,21 +0,0 @@ -"""Monitoring background task.""" - -from app.core.logging import get_logger - -logger = get_logger(__name__) - - -async def collect_metrics() -> None: - """Collect system metrics. - - This task should run periodically to collect and report metrics. - """ - logger.info("Starting metrics collection") - # TODO: Implement actual metrics collection - logger.info("Metrics collection completed") - - -async def schedule_monitoring() -> None: - """Schedule monitoring tasks.""" - # TODO: Implement scheduling logic - pass diff --git a/backend/app/tasks/quota_reset.py b/backend/app/tasks/quota_reset.py index e415508..2e38fd4 100644 --- a/backend/app/tasks/quota_reset.py +++ b/backend/app/tasks/quota_reset.py @@ -1,21 +1,45 @@ -"""Quota reset background task.""" +"""Quota reset task — resets used counts for all expired quota periods.""" -from app.core.logging import get_logger +import logging +from datetime import ( + datetime, + timedelta, + timezone, +) -logger = get_logger(__name__) +from app.db.models.quota import Quota +from sqlalchemy.orm import Session +logger = logging.getLogger(__name__) -async def reset_quotas() -> None: - """Reset quotas for all teachers. - This task should run periodically to reset quota usage. +def reset_quotas(db: Session) -> None: + """Reset all quotas whose reset_at timestamp has passed. + + Sets used=0 and advances reset_at to the next period boundary. + Safe to run frequently — only touches rows where reset_at <= now. 
""" - logger.info("Starting quota reset task") - # TODO: Implement actual quota reset logic - logger.info("Quota reset task completed") + now = datetime.now(timezone.utc) + + expired = db.query(Quota).filter(Quota.reset_at <= now).all() + + if not expired: + logger.debug("No quotas due for reset") + return + reset_count = 0 + for quota in expired: + quota.used = 0 + if quota.period == "daily": + quota.reset_at = now + timedelta(days=1) + elif quota.period == "monthly": + # Advance by roughly one month (30 days) + quota.reset_at = now + timedelta(days=30) + else: + # Unknown period — advance by 1 day as safe fallback + logger.warning(f"Unknown quota period '{quota.period}' for quota {quota.id}, defaulting to daily") + quota.reset_at = now + timedelta(days=1) + reset_count += 1 -async def schedule_quota_reset() -> None: - """Schedule quota reset task.""" - # TODO: Implement scheduling logic - pass + db.commit() + logger.info(f"Reset {reset_count} quota(s)") diff --git a/backend/app/tasks/token_cleanup.py b/backend/app/tasks/token_cleanup.py index c281d02..daaf6ab 100644 --- a/backend/app/tasks/token_cleanup.py +++ b/backend/app/tasks/token_cleanup.py @@ -1,21 +1,41 @@ -"""Token cleanup background task.""" +"""Token cleanup task — removes unrecoverable expired YouTube tokens.""" -from app.core.logging import get_logger +import logging +from datetime import ( + datetime, + timezone, +) -logger = get_logger(__name__) +from app.db.models.youtube_token import YouTubeToken +from sqlalchemy.orm import Session +logger = logging.getLogger(__name__) -async def cleanup_expired_tokens() -> None: - """Clean up expired OAuth tokens. - This task should run periodically to remove expired tokens. +def cleanup_expired_tokens(db: Session) -> None: + """Delete YouTubeToken rows that are expired and have no refresh token. + + Tokens with a refresh_token can be renewed by the application — those are + left alone. Only tokens that are both expired AND unrefreshable are removed. """ - logger.info("Starting token cleanup task") - # TODO: Implement actual token cleanup logic - logger.info("Token cleanup task completed") + now = datetime.now(timezone.utc) + + deleted = ( + db.query(YouTubeToken) + .filter( + YouTubeToken.expires_at <= now, + YouTubeToken.refresh_token.is_(None), + ) + .all() + ) + + if not deleted: + logger.debug("No expired unrecoverable tokens found") + return + count = len(deleted) + for token in deleted: + db.delete(token) -async def schedule_token_cleanup() -> None: - """Schedule token cleanup task.""" - # TODO: Implement scheduling logic - pass + db.commit() + logger.info(f"Deleted {count} expired unrecoverable YouTube token(s)") diff --git a/backend/app/utils/text.py b/backend/app/utils/text.py deleted file mode 100644 index 01e2949..0000000 --- a/backend/app/utils/text.py +++ /dev/null @@ -1,42 +0,0 @@ -"""Text processing utilities.""" - -from typing import List - - -def clean_text(text: str) -> str: - """Clean and normalize text. - - Args: - text: Raw text input. - - Returns: - Cleaned text string. - """ - # TODO: Implement actual text cleaning - return text.strip() - - -def extract_hashtags(text: str) -> List[str]: - """Extract hashtags from text. - - Args: - text: Text to extract hashtags from. - - Returns: - List of hashtag strings. - """ - # TODO: Implement actual hashtag extraction - return [] - - -def is_question(text: str) -> bool: - """Check if text appears to be a question. - - Args: - text: Text to check. - - Returns: - True if text is a question, False otherwise. 
- """ - # TODO: Implement actual question detection - return text.strip().endswith("?") diff --git a/backend/app/utils/time.py b/backend/app/utils/time.py deleted file mode 100644 index 41d42e2..0000000 --- a/backend/app/utils/time.py +++ /dev/null @@ -1,32 +0,0 @@ -"""Time utility functions.""" - -from datetime import ( - datetime, - timezone, -) -from typing import Optional - - -def utc_now() -> datetime: - """Get current UTC datetime. - - Returns: - Current UTC datetime. - """ - return datetime.now(timezone.utc) - - -def parse_datetime(dt_str: str) -> Optional[datetime]: - """Parse datetime string to datetime object. - - Args: - dt_str: Datetime string. - - Returns: - Datetime object or None if parsing fails. - """ - # TODO: Implement actual datetime parsing - try: - return datetime.fromisoformat(dt_str.replace("Z", "+00:00")) - except Exception: - return None diff --git a/backend/pyproject.toml b/backend/pyproject.toml new file mode 100644 index 0000000..105bcac --- /dev/null +++ b/backend/pyproject.toml @@ -0,0 +1,4 @@ +[tool.pytest.ini_options] +asyncio_mode = "auto" +asyncio_default_fixture_loop_scope = "function" +testpaths = ["tests"] diff --git a/backend/requirements.txt b/backend/requirements.txt index 8270680..61b504d 100644 --- a/backend/requirements.txt +++ b/backend/requirements.txt @@ -4,6 +4,7 @@ aiosignal==1.4.0 alembic==1.14.0 annotated-types==0.7.0 anyio==4.12.0 +apscheduler==3.10.4 attrs==25.4.0 bcrypt==4.1.2 black==26.3.0 diff --git a/backend/tests/conftest.py b/backend/tests/conftest.py new file mode 100644 index 0000000..383b994 --- /dev/null +++ b/backend/tests/conftest.py @@ -0,0 +1,166 @@ +"""Shared test fixtures: test DB, async client, auth helpers.""" + +import os +import uuid +from collections.abc import AsyncGenerator +from unittest.mock import patch + +import pytest +import pytest_asyncio +from httpx import ( + ASGITransport, + AsyncClient, +) +from sqlalchemy import ( + create_engine, + event, + text, +) +from sqlalchemy.orm import sessionmaker + +os.environ.setdefault("GEMINI_API_KEY", "test-key-placeholder") + +TEST_DATABASE_URL = os.getenv( + "TEST_DATABASE_URL", + "postgresql://sarthak@localhost:5432/ai_doubt_manager_test", +) + +engine = create_engine(TEST_DATABASE_URL, echo=False) + + +@event.listens_for(engine, "connect") +def _enable_pgvector(dbapi_conn, connection_record): + cursor = dbapi_conn.cursor() + try: + cursor.execute("CREATE EXTENSION IF NOT EXISTS vector") + except Exception: + pass + finally: + cursor.close() + + +TestingSessionLocal = sessionmaker(autocommit=False, autoflush=False, bind=engine) + + +@pytest.fixture(scope="session", autouse=True) +def _create_tables(): + """Create all tables once per test session, drop after.""" + from app.db.base import Base + from app.db.models import ( # noqa: F401 — force model registration + Answer, + Cluster, + Comment, + Quota, + RAGDocument, + StreamingSession, + Teacher, + YouTubeToken, + ) + + Base.metadata.create_all(bind=engine) + yield + Base.metadata.drop_all(bind=engine) + + +def _override_get_db(): + db = TestingSessionLocal() + try: + yield db + finally: + db.close() + + +@pytest.fixture(autouse=True) +def _clean_tables(): + """Truncate all tables between tests for isolation.""" + yield + db = TestingSessionLocal() + try: + db.execute( + text( + "TRUNCATE answers, comments, clusters, streaming_sessions, teachers, youtube_tokens, quotas, rag_documents CASCADE" + ) + ) + db.commit() + finally: + db.close() + + +@pytest.fixture() +def db_session(): + """Provide a raw SQLAlchemy session for 
DB-level tests.""" + db = TestingSessionLocal() + try: + yield db + finally: + db.rollback() + db.close() + + +@pytest_asyncio.fixture() +async def client() -> AsyncGenerator[AsyncClient, None]: + """Async HTTP client wired to the FastAPI app with test DB + mocked Redis.""" + from app.db.session import get_db + from app.main import app + + app.dependency_overrides[get_db] = _override_get_db + + with ( + patch("app.services.token_blacklist.token_blacklist.is_blacklisted", return_value=False), + patch("app.services.token_blacklist.token_blacklist.blacklist_token"), + patch("app.core.rate_limit_middleware.RateLimitMiddleware.dispatch", side_effect=_passthrough_dispatch), + patch("workers.common.queue.QueueManager.enqueue", return_value=None), + patch("app.services.websocket.manager.manager.start_subscriber", return_value=None), + ): + transport = ASGITransport(app=app) + async with AsyncClient(transport=transport, base_url="http://test") as ac: + yield ac + + app.dependency_overrides.clear() + + +async def _passthrough_dispatch(request, call_next): + """Bypass rate limiting in tests.""" + return await call_next(request) + + +# --------------------------------------------------------------------------- +# Auth helper fixtures +# --------------------------------------------------------------------------- + + +async def _register_and_login(client: AsyncClient, email: str, name: str, password: str) -> dict: + """Register a teacher and log in, return auth headers.""" + await client.post( + "/api/v1/auth/register", + json={"email": email, "password": password, "name": name}, + ) + resp = await client.post( + "/api/v1/auth/login", + json={"email": email, "password": password}, + ) + token = resp.json()["access_token"] + return {"Authorization": f"Bearer {token}"} + + +@pytest_asyncio.fixture() +async def auth_headers(client: AsyncClient) -> dict: + """Register + login Teacher A, return Bearer headers.""" + return await _register_and_login(client, "teacher_a@test.com", "Teacher A", "password123") + + +@pytest_asyncio.fixture() +async def second_auth_headers(client: AsyncClient) -> dict: + """Register + login Teacher B, return Bearer headers.""" + return await _register_and_login(client, "teacher_b@test.com", "Teacher B", "password456") + + +@pytest_asyncio.fixture() +async def session_id(client: AsyncClient, auth_headers: dict) -> str: + """Create a streaming session for Teacher A, return its UUID string.""" + resp = await client.post( + "/api/v1/sessions/", + json={"youtube_video_id": f"test_video_{uuid.uuid4().hex[:8]}"}, + headers=auth_headers, + ) + return resp.json()["id"] diff --git a/backend/tests/test_auth.py b/backend/tests/test_auth.py new file mode 100644 index 0000000..e0dedcf --- /dev/null +++ b/backend/tests/test_auth.py @@ -0,0 +1,92 @@ +"""Black-box contract tests for auth endpoints.""" + +import pytest +from httpx import AsyncClient + + +@pytest.fixture() +def _teacher_data(): + return {"email": "auth_test@test.com", "password": "password123", "name": "Auth Tester"} + + +async def test_register_success(client: AsyncClient, _teacher_data: dict): + resp = await client.post("/api/v1/auth/register", json=_teacher_data) + assert resp.status_code == 201 + body = resp.json() + assert "id" in body + assert body["email"] == _teacher_data["email"] + assert body["name"] == _teacher_data["name"] + assert body["is_active"] is True + + +async def test_register_duplicate_email(client: AsyncClient, _teacher_data: dict): + await client.post("/api/v1/auth/register", json=_teacher_data) + resp = await 
client.post("/api/v1/auth/register", json=_teacher_data) + assert resp.status_code == 400 + + +async def test_login_success(client: AsyncClient, _teacher_data: dict): + await client.post("/api/v1/auth/register", json=_teacher_data) + resp = await client.post( + "/api/v1/auth/login", + json={"email": _teacher_data["email"], "password": _teacher_data["password"]}, + ) + assert resp.status_code == 200 + body = resp.json() + assert "access_token" in body + assert "refresh_token" in body + assert body["token_type"] == "bearer" + assert "expires_in" in body + + +async def test_login_wrong_password(client: AsyncClient, _teacher_data: dict): + await client.post("/api/v1/auth/register", json=_teacher_data) + resp = await client.post( + "/api/v1/auth/login", + json={"email": _teacher_data["email"], "password": "wrongpassword"}, + ) + assert resp.status_code == 401 + + +async def test_login_nonexistent_email(client: AsyncClient): + resp = await client.post( + "/api/v1/auth/login", + json={"email": "nobody@test.com", "password": "password123"}, + ) + assert resp.status_code == 401 + + +async def test_me_with_valid_token(client: AsyncClient, _teacher_data: dict): + await client.post("/api/v1/auth/register", json=_teacher_data) + login_resp = await client.post( + "/api/v1/auth/login", + json={"email": _teacher_data["email"], "password": _teacher_data["password"]}, + ) + token = login_resp.json()["access_token"] + + resp = await client.get("/api/v1/auth/me", headers={"Authorization": f"Bearer {token}"}) + assert resp.status_code == 200 + body = resp.json() + assert body["email"] == _teacher_data["email"] + assert body["name"] == _teacher_data["name"] + + +async def test_me_without_token(client: AsyncClient): + resp = await client.get("/api/v1/auth/me") + assert resp.status_code in [401, 403] + + +async def test_refresh_token(client: AsyncClient, _teacher_data: dict): + await client.post("/api/v1/auth/register", json=_teacher_data) + login_resp = await client.post( + "/api/v1/auth/login", + json={"email": _teacher_data["email"], "password": _teacher_data["password"]}, + ) + refresh_token = login_resp.json()["refresh_token"] + + resp = await client.post("/api/v1/auth/refresh", json={"refresh_token": refresh_token}) + assert resp.status_code == 200 + body = resp.json() + assert "access_token" in body + assert "refresh_token" in body + assert body["token_type"] == "bearer" diff --git a/backend/tests/test_dashboard.py b/backend/tests/test_dashboard.py new file mode 100644 index 0000000..f0f8ed6 --- /dev/null +++ b/backend/tests/test_dashboard.py @@ -0,0 +1,119 @@ +"""Black-box contract tests for dashboard endpoints.""" + +import uuid + +from httpx import AsyncClient +from sqlalchemy.orm import sessionmaker +from tests.conftest import engine + +TestingSessionLocal = sessionmaker(autocommit=False, autoflush=False, bind=engine) + + +def _create_cluster_and_answer(session_id: str) -> tuple[str, str]: + """Insert a cluster + answer directly via SQLAlchemy, return (answer_id, cluster_id).""" + from app.db.models.answer import Answer + from app.db.models.cluster import Cluster + + db = TestingSessionLocal() + try: + cluster = Cluster( + session_id=session_id, + title="Test Cluster", + similarity_threshold=0.8, + ) + db.add(cluster) + db.flush() + + answer = Answer( + cluster_id=cluster.id, + text="Original answer text", + ) + db.add(answer) + db.commit() + return str(answer.id), str(cluster.id) + finally: + db.close() + + +async def test_manual_question_creates_comments(client: AsyncClient, auth_headers: dict, 
session_id: str): + resp = await client.post( + f"/api/v1/dashboard/sessions/{session_id}/manual-question", + json={"text": "Q1\nQ2\nQ3"}, + headers=auth_headers, + ) + assert resp.status_code == 201 + assert resp.json() == {"created": 3} + + +async def test_manual_question_max_10(client: AsyncClient, auth_headers: dict, session_id: str): + questions = "\n".join(f"Question {i}" for i in range(15)) + resp = await client.post( + f"/api/v1/dashboard/sessions/{session_id}/manual-question", + json={"text": questions}, + headers=auth_headers, + ) + assert resp.status_code == 201 + assert resp.json() == {"created": 10} + + +async def test_manual_question_nonexistent_session(client: AsyncClient, auth_headers: dict): + fake_id = str(uuid.uuid4()) + resp = await client.post( + f"/api/v1/dashboard/sessions/{fake_id}/manual-question", + json={"text": "Some question"}, + headers=auth_headers, + ) + assert resp.status_code == 404 + + +async def test_session_stats_empty(client: AsyncClient, auth_headers: dict, session_id: str): + resp = await client.get( + f"/api/v1/dashboard/sessions/{session_id}/stats", + headers=auth_headers, + ) + assert resp.status_code == 200 + body = resp.json() + assert body["total_comments"] == 0 + assert body["questions"] == 0 + assert body["answered"] == 0 + assert body["clusters"] == 0 + assert body["answers_generated"] == 0 + assert body["answers_posted"] == 0 + + +async def test_edit_answer(client: AsyncClient, auth_headers: dict, session_id: str): + answer_id, _ = _create_cluster_and_answer(session_id) + resp = await client.patch( + f"/api/v1/dashboard/answers/{answer_id}", + json={"text": "Edited answer text"}, + headers=auth_headers, + ) + assert resp.status_code == 200 + body = resp.json() + assert body["text"] == "Edited answer text" + assert "id" in body + assert "cluster_id" in body + assert "created_at" in body + + +async def test_edit_answer_not_found(client: AsyncClient, auth_headers: dict): + fake_id = str(uuid.uuid4()) + resp = await client.patch( + f"/api/v1/dashboard/answers/{fake_id}", + json={"text": "Doesn't matter"}, + headers=auth_headers, + ) + assert resp.status_code == 404 + + +async def test_approve_answer(client: AsyncClient, auth_headers: dict, session_id: str): + answer_id, _ = _create_cluster_and_answer(session_id) + resp = await client.post( + f"/api/v1/dashboard/answers/{answer_id}/approve", + headers=auth_headers, + ) + assert resp.status_code == 200 + body = resp.json() + assert body["id"] == answer_id + assert "text" in body + assert "cluster_id" in body diff --git a/backend/tests/test_db_constraints.py b/backend/tests/test_db_constraints.py new file mode 100644 index 0000000..3263ed6 --- /dev/null +++ b/backend/tests/test_db_constraints.py @@ -0,0 +1,65 @@ +"""DB-level constraint tests via direct SQLAlchemy inserts.""" + +import uuid + +import pytest +from app.db.models.comment import Comment +from app.db.models.streaming_session import StreamingSession +from app.db.models.teacher import Teacher +from sqlalchemy.exc import IntegrityError + + +def _create_session_in_db(db) -> str: + """Insert a teacher + session directly, return session UUID string.""" + teacher = Teacher( + email=f"constraint_{uuid.uuid4().hex[:8]}@test.com", + name="Constraint Tester", + hashed_password="fakehash", + ) + db.add(teacher) + db.flush() + + session = StreamingSession( + teacher_id=teacher.id, + youtube_video_id=f"vid_{uuid.uuid4().hex[:8]}", + ) + db.add(session) + db.flush() + return str(session.id) + + +def 
test_comment_youtube_comment_id_not_null(db_session):
    session_id = _create_session_in_db(db_session)
    comment = Comment(
        session_id=session_id,
        youtube_comment_id=None,
        author_name="Test",
        text="Should fail",
    )
    db_session.add(comment)
    with pytest.raises(IntegrityError):
        db_session.flush()


def test_comment_youtube_comment_id_unique(db_session):
    session_id = _create_session_in_db(db_session)
    yt_id = f"dup_{uuid.uuid4().hex[:8]}"

    c1 = Comment(
        session_id=session_id,
        youtube_comment_id=yt_id,
        author_name="Test",
        text="First",
    )
    db_session.add(c1)
    db_session.flush()

    c2 = Comment(
        session_id=session_id,
        youtube_comment_id=yt_id,
        author_name="Test",
        text="Duplicate",
    )
    db_session.add(c2)
    with pytest.raises(IntegrityError):
        db_session.flush() diff --git a/backend/tests/test_rag.py b/backend/tests/test_rag.py new file mode 100644 index 0000000..41fa40f --- /dev/null +++ b/backend/tests/test_rag.py @@ -0,0 +1,141 @@ +"""Black-box contract tests for RAG document endpoints. + +Endpoint paths (from backend/app/api/v1/rag.py + main.py mount): + POST /api/v1/rag/documents — upload (multipart, field name "file") + GET /api/v1/rag/documents — list owned documents + DELETE /api/v1/rag/documents/{id} — delete owned document (204) + +Upload calls upload_document(), which invokes GeminiClient.generate_embedding. +The shared client fixture only stubs QueueManager.enqueue and other externals, +so each test below also patches the GeminiClient used inside document_service. +""" + +import io +import uuid +from unittest.mock import patch + +from httpx import AsyncClient + + +async def test_upload_document_appears_in_list(client: AsyncClient, auth_headers: dict):
    """Upload a small PDF → 2xx → GET list → document appears in response."""
    pdf_content = b"%PDF-1.4 fake pdf content with enough words " + b"word " * 50

    with (
        patch("app.services.rag.document_service.GeminiClient") as mock_gemini_cls,
        patch("app.services.rag.document_service._extract_text_pdf", return_value="Some test content " * 50),
    ):
        mock_gemini = mock_gemini_cls.return_value
        mock_gemini.generate_embedding.return_value = [0.1] * 768

        resp = await client.post(
            "/api/v1/rag/documents",
            files={"file": ("test.pdf", io.BytesIO(pdf_content), "application/pdf")},
            headers=auth_headers,
        )

    assert resp.status_code == 200
    body = resp.json()
    assert body["chunks_created"] >= 1
    assert len(body["document_ids"]) >= 1

    # Verify it appears in the list
    list_resp = await client.get("/api/v1/rag/documents", headers=auth_headers)
    assert list_resp.status_code == 200
    docs = list_resp.json()
    uploaded_ids = set(body["document_ids"])
    listed_ids = {d["id"] for d in docs}
    assert uploaded_ids.issubset(listed_ids)


async def test_teacher_only_sees_own_documents(client: AsyncClient, auth_headers: dict, second_auth_headers: dict):
    """Teacher A uploads → Teacher B lists → Teacher B sees 0 documents."""
    pdf_content = b"%PDF-1.4 fake pdf content with enough words " + b"word " * 50

    with (
        patch("app.services.rag.document_service.GeminiClient") as mock_gemini_cls,
        patch("app.services.rag.document_service._extract_text_pdf", return_value="Some test content " * 50),
    ):
        mock_gemini = mock_gemini_cls.return_value
        mock_gemini.generate_embedding.return_value = [0.1] * 768

        await client.post(
            "/api/v1/rag/documents",
            files={"file": ("test.pdf", io.BytesIO(pdf_content), "application/pdf")},
            headers=auth_headers,
        )

    # Teacher B should see nothing
    
list_resp = await client.get("/api/v1/rag/documents", headers=second_auth_headers) + assert list_resp.status_code == 200 + assert list_resp.json() == [] + + +async def test_delete_document_removes_it_from_list(client: AsyncClient, auth_headers: dict): + """Upload → delete → list → document gone.""" + pdf_content = b"%PDF-1.4 fake pdf content with enough words " + b"word " * 50 + + with ( + patch("app.services.rag.document_service.GeminiClient") as mock_gemini_cls, + patch("app.services.rag.document_service._extract_text_pdf", return_value="Some test content " * 50), + ): + mock_gemini = mock_gemini_cls.return_value + mock_gemini.generate_embedding.return_value = [0.1] * 768 + + resp = await client.post( + "/api/v1/rag/documents", + files={"file": ("test.pdf", io.BytesIO(pdf_content), "application/pdf")}, + headers=auth_headers, + ) + + doc_id = resp.json()["document_ids"][0] + + del_resp = await client.delete(f"/api/v1/rag/documents/{doc_id}", headers=auth_headers) + assert del_resp.status_code == 204 + + list_resp = await client.get("/api/v1/rag/documents", headers=auth_headers) + listed_ids = {d["id"] for d in list_resp.json()} + assert doc_id not in listed_ids + + +async def test_delete_nonexistent_document_returns_404(client: AsyncClient, auth_headers: dict): + """DELETE with random UUID → 404.""" + fake_id = str(uuid.uuid4()) + resp = await client.delete(f"/api/v1/rag/documents/{fake_id}", headers=auth_headers) + assert resp.status_code == 404 + + +async def test_teacher_b_cannot_delete_teacher_a_document( + client: AsyncClient, auth_headers: dict, second_auth_headers: dict +): + """Teacher A uploads → Teacher B tries to delete → 404 (ownership boundary).""" + pdf_content = b"%PDF-1.4 fake pdf content with enough words " + b"word " * 50 + + with ( + patch("app.services.rag.document_service.GeminiClient") as mock_gemini_cls, + patch("app.services.rag.document_service._extract_text_pdf", return_value="Some test content " * 50), + ): + mock_gemini = mock_gemini_cls.return_value + mock_gemini.generate_embedding.return_value = [0.1] * 768 + + resp = await client.post( + "/api/v1/rag/documents", + files={"file": ("test.pdf", io.BytesIO(pdf_content), "application/pdf")}, + headers=auth_headers, + ) + + doc_id = resp.json()["document_ids"][0] + + # Teacher B tries to delete Teacher A's document + del_resp = await client.delete(f"/api/v1/rag/documents/{doc_id}", headers=second_auth_headers) + assert del_resp.status_code == 404 + + +async def test_upload_invalid_file_type_is_rejected(client: AsyncClient, auth_headers: dict): + """Upload a .exe file → 415 (unsupported media type).""" + resp = await client.post( + "/api/v1/rag/documents", + files={"file": ("malware.exe", io.BytesIO(b"MZ fake exe"), "application/octet-stream")}, + headers=auth_headers, + ) + assert resp.status_code == 415 diff --git a/backend/tests/test_security.py b/backend/tests/test_security.py new file mode 100644 index 0000000..a2b1a7e --- /dev/null +++ b/backend/tests/test_security.py @@ -0,0 +1,72 @@ +"""Black-box ownership boundary tests: teacher A cannot access teacher B's resources.""" + +from httpx import AsyncClient + + +async def _create_session(client: AsyncClient, auth_headers: dict) -> str: + """Create a session via API, return its UUID string.""" + resp = await client.post( + "/api/v1/sessions/", + json={"youtube_video_id": "vid_security_test"}, + headers=auth_headers, + ) + return resp.json()["id"] + + +async def test_teacher_b_cannot_get_teacher_a_session( + client: AsyncClient, auth_headers: dict, 
second_auth_headers: dict +): + session_id = await _create_session(client, auth_headers) + resp = await client.get( + f"/api/v1/sessions/{session_id}", + headers=second_auth_headers, + ) + assert resp.status_code in [403, 404] + + +async def test_teacher_b_cannot_update_teacher_a_session( + client: AsyncClient, auth_headers: dict, second_auth_headers: dict +): + session_id = await _create_session(client, auth_headers) + resp = await client.patch( + f"/api/v1/sessions/{session_id}", + json={"title": "Hijacked"}, + headers=second_auth_headers, + ) + assert resp.status_code in [403, 404] + + +async def test_teacher_b_cannot_end_teacher_a_session( + client: AsyncClient, auth_headers: dict, second_auth_headers: dict +): + session_id = await _create_session(client, auth_headers) + resp = await client.post( + f"/api/v1/sessions/{session_id}/end", + headers=second_auth_headers, + ) + assert resp.status_code in [403, 404] + + +async def test_teacher_b_cannot_see_teacher_a_sessions_in_list( + client: AsyncClient, auth_headers: dict, second_auth_headers: dict +): + a_session_id = await _create_session(client, auth_headers) + b_session_id = await _create_session(client, second_auth_headers) + + resp = await client.get("/api/v1/sessions/", headers=second_auth_headers) + assert resp.status_code == 200 + ids = [s["id"] for s in resp.json()] + assert b_session_id in ids + assert a_session_id not in ids + + +async def test_teacher_b_cannot_submit_manual_question_to_teacher_a_session( + client: AsyncClient, auth_headers: dict, second_auth_headers: dict +): + session_id = await _create_session(client, auth_headers) + resp = await client.post( + f"/api/v1/dashboard/sessions/{session_id}/manual-question", + json={"text": "Unauthorized question"}, + headers=second_auth_headers, + ) + assert resp.status_code in [403, 404] diff --git a/backend/tests/test_sessions.py b/backend/tests/test_sessions.py new file mode 100644 index 0000000..1343196 --- /dev/null +++ b/backend/tests/test_sessions.py @@ -0,0 +1,69 @@ +"""Black-box contract tests for session endpoints.""" + +import uuid + +from httpx import AsyncClient + + +async def test_create_session(client: AsyncClient, auth_headers: dict): + resp = await client.post( + "/api/v1/sessions/", + json={"youtube_video_id": "vid_create_test"}, + headers=auth_headers, + ) + assert resp.status_code == 201 + body = resp.json() + assert "id" in body + assert body["youtube_video_id"] == "vid_create_test" + assert body["is_active"] is True + assert "teacher_id" in body + + +async def test_list_sessions_empty(client: AsyncClient, auth_headers: dict): + resp = await client.get("/api/v1/sessions/", headers=auth_headers) + assert resp.status_code == 200 + assert resp.json() == [] + + +async def test_list_sessions_returns_own(client: AsyncClient, auth_headers: dict, session_id: str): + resp = await client.get("/api/v1/sessions/", headers=auth_headers) + assert resp.status_code == 200 + sessions = resp.json() + assert len(sessions) >= 1 + ids = [s["id"] for s in sessions] + assert session_id in ids + + +async def test_get_session_by_id(client: AsyncClient, auth_headers: dict, session_id: str): + resp = await client.get(f"/api/v1/sessions/{session_id}", headers=auth_headers) + assert resp.status_code == 200 + body = resp.json() + assert body["id"] == session_id + assert body["is_active"] is True + + +async def test_update_session(client: AsyncClient, auth_headers: dict, session_id: str): + resp = await client.patch( + f"/api/v1/sessions/{session_id}", + json={"title": "Updated Title"}, + 
headers=auth_headers,
    )
    assert resp.status_code == 200
    assert resp.json()["title"] == "Updated Title"


async def test_end_session(client: AsyncClient, auth_headers: dict, session_id: str):
    resp = await client.post(
        f"/api/v1/sessions/{session_id}/end",
        headers=auth_headers,
    )
    assert resp.status_code == 200
    body = resp.json()
    assert body["is_active"] is False
    assert body["ended_at"] is not None


async def test_get_nonexistent_session(client: AsyncClient, auth_headers: dict):
    fake_id = str(uuid.uuid4())
    resp = await client.get(f"/api/v1/sessions/{fake_id}", headers=auth_headers)
    assert resp.status_code == 404 diff --git a/backend/tests/test_websocket.py b/backend/tests/test_websocket.py new file mode 100644 index 0000000..aed756e --- /dev/null +++ b/backend/tests/test_websocket.py @@ -0,0 +1,159 @@ +"""Black-box contract tests for the WebSocket endpoint. + +WebSocket path: /ws/{session_id} +Auth: first message must be JSON {"type": "auth", "token": "<JWT>"} +Close codes: 4001 (auth required / invalid token), 4003 (forbidden — wrong owner) + +Uses Starlette's TestClient for WebSocket since httpx does not support WS upgrade. + +Note: The WS handler uses SessionLocal() directly (not dependency injection), +so we patch app.api.v1.websocket.SessionLocal to return a test DB session. +""" + +import uuid +from unittest.mock import patch + +import pytest +from app.main import app +from starlette.testclient import TestClient +from starlette.websockets import WebSocketDisconnect +from tests.conftest import ( + TestingSessionLocal, + _override_get_db, +) + +_PATCHES = ( + patch("app.services.token_blacklist.token_blacklist.is_blacklisted", return_value=False), + patch("app.services.token_blacklist.token_blacklist.blacklist_token"), + patch("app.core.rate_limit_middleware.RateLimitMiddleware.dispatch", side_effect=None), + patch("workers.common.queue.QueueManager.enqueue", return_value=None), + patch("app.services.websocket.manager.manager.start_subscriber", return_value=None), +) + + +def _get_test_app():
    """Return the FastAPI app with test DB + mocked externals."""
    from app.db.session import get_db

    app.dependency_overrides[get_db] = _override_get_db
    return app


def _register_and_login_sync(client: TestClient, email: str, name: str, password: str) -> str:
    """Register + login synchronously via TestClient, return JWT access token."""
    client.post("/api/v1/auth/register", json={"email": email, "password": password, "name": name})
    resp = client.post("/api/v1/auth/login", json={"email": email, "password": password})
    return resp.json()["access_token"]


def _create_session_sync(client: TestClient, token: str) -> str:
    """Create a streaming session, return its UUID string."""
    resp = client.post(
        "/api/v1/sessions/",
        json={"youtube_video_id": f"ws_test_{uuid.uuid4().hex[:8]}"},
        headers={"Authorization": f"Bearer {token}"},
    )
    return resp.json()["id"]


async def _passthrough_dispatch(request, call_next):
    """Bypass rate limiting in tests."""
    return await call_next(request)


def test_websocket_rejects_connection_without_token():
    """Connect then send non-auth message → server closes with code 4001."""
    test_app = _get_test_app()
    session_id = str(uuid.uuid4())

    with (
        patch("app.services.token_blacklist.token_blacklist.is_blacklisted", return_value=False),
        patch("app.services.token_blacklist.token_blacklist.blacklist_token"),
        patch("app.core.rate_limit_middleware.RateLimitMiddleware.dispatch", 
side_effect=_passthrough_dispatch), + patch("workers.common.queue.QueueManager.enqueue", return_value=None), + patch("app.services.websocket.manager.manager.start_subscriber", return_value=None), + ): + with TestClient(test_app) as tc: + with pytest.raises(WebSocketDisconnect) as exc_info: + with tc.websocket_connect(f"/ws/{session_id}") as ws: + # Send a message that is valid JSON but not an auth message + ws.send_json({"type": "not_auth"}) + ws.receive_json() # triggers the disconnect exception + + assert exc_info.value.code == 4001 + + app.dependency_overrides.clear() + + +def test_websocket_rejects_invalid_token(): + """Connect with token='garbage' in auth message → close code 4001.""" + test_app = _get_test_app() + session_id = str(uuid.uuid4()) + + with ( + patch("app.services.token_blacklist.token_blacklist.is_blacklisted", return_value=False), + patch("app.services.token_blacklist.token_blacklist.blacklist_token"), + patch("app.core.rate_limit_middleware.RateLimitMiddleware.dispatch", side_effect=_passthrough_dispatch), + patch("workers.common.queue.QueueManager.enqueue", return_value=None), + patch("app.services.websocket.manager.manager.start_subscriber", return_value=None), + ): + with TestClient(test_app) as tc: + with pytest.raises(WebSocketDisconnect) as exc_info: + with tc.websocket_connect(f"/ws/{session_id}") as ws: + ws.send_json({"type": "auth", "token": "garbage"}) + ws.receive_json() + + assert exc_info.value.code == 4001 + + app.dependency_overrides.clear() + + +def test_websocket_accepts_valid_owner_connection(): + """Register → login → create session → WS connect with valid token → connection accepted.""" + test_app = _get_test_app() + + with ( + patch("app.services.token_blacklist.token_blacklist.is_blacklisted", return_value=False), + patch("app.services.token_blacklist.token_blacklist.blacklist_token"), + patch("app.core.rate_limit_middleware.RateLimitMiddleware.dispatch", side_effect=_passthrough_dispatch), + patch("workers.common.queue.QueueManager.enqueue", return_value=None), + patch("app.services.websocket.manager.manager.start_subscriber", return_value=None), + patch("app.api.v1.websocket.SessionLocal", TestingSessionLocal), + ): + with TestClient(test_app) as tc: + token = _register_and_login_sync(tc, "ws_owner@test.com", "WS Owner", "password123") + session_id = _create_session_sync(tc, token) + + with tc.websocket_connect(f"/ws/{session_id}") as ws: + ws.send_json({"type": "auth", "token": token}) + msg = ws.receive_json() + assert msg["type"] == "connected" + + app.dependency_overrides.clear() + + +def test_websocket_rejects_wrong_teacher_session(): + """Teacher A creates session → Teacher B connects with own token → close code 4003.""" + test_app = _get_test_app() + + with ( + patch("app.services.token_blacklist.token_blacklist.is_blacklisted", return_value=False), + patch("app.services.token_blacklist.token_blacklist.blacklist_token"), + patch("app.core.rate_limit_middleware.RateLimitMiddleware.dispatch", side_effect=_passthrough_dispatch), + patch("workers.common.queue.QueueManager.enqueue", return_value=None), + patch("app.services.websocket.manager.manager.start_subscriber", return_value=None), + patch("app.api.v1.websocket.SessionLocal", TestingSessionLocal), + ): + with TestClient(test_app) as tc: + token_a = _register_and_login_sync(tc, "ws_a@test.com", "Teacher A", "password123") + token_b = _register_and_login_sync(tc, "ws_b@test.com", "Teacher B", "password456") + session_id = _create_session_sync(tc, token_a) + + with 
pytest.raises(WebSocketDisconnect) as exc_info: + with tc.websocket_connect(f"/ws/{session_id}") as ws: + ws.send_json({"type": "auth", "token": token_b}) + ws.receive_json() + + assert exc_info.value.code == 4003 + + app.dependency_overrides.clear() diff --git a/docker-compose.yml b/docker-compose.yml index 0e672fd..f14e2b9 100644 --- a/docker-compose.yml +++ b/docker-compose.yml @@ -11,6 +11,7 @@ services: - "127.0.0.1:5432:5432" volumes: - postgres_data:/var/lib/postgresql/data + command: postgres -c max_connections=100 redis: image: redis:7-alpine diff --git a/docs/SYSTEM_DESIGN_REPORT.md b/docs/SYSTEM_DESIGN_REPORT.md new file mode 100644 index 0000000..ae446f0 --- /dev/null +++ b/docs/SYSTEM_DESIGN_REPORT.md @@ -0,0 +1,613 @@ +# System Design Specification Report: AI Live Doubt Manager + +> **Prepared for**: Senior Consultant Deep-Dive Audit +> **Date**: 2026-03-13 +> **Stack**: FastAPI 0.115 / React 19 / PostgreSQL 15 (pgvector) / Redis 7 / Google Gemini AI +> **Scope**: Full-stack architecture — backend, worker pipeline, frontend, infrastructure + +--- + +## 1. High-Level Architecture + +### 1.1 Core Pattern: Event-Driven Pipeline with Real-Time Relay + +The system follows a **producer-consumer pipeline architecture** with three distinct runtime tiers: + +| Tier | Technology | Role | +|------|-----------|------| +| **API Tier** | FastAPI, uvicorn (2 workers) | HTTP/WS ingress, auth, CRUD, real-time relay | +| **Worker Tier** | 6 independent Python processes | Asynchronous AI processing pipeline | +| **Data Tier** | PostgreSQL 15 + Redis 7 | Persistence, coordination, pub/sub | + +**Why this pattern**: Live YouTube sessions generate bursty comment traffic. Synchronous AI processing (classification → embedding → clustering → answer generation) would block API responses and create unacceptable latency. The pipeline decouples ingress from processing, allowing each stage to scale independently and fail independently without losing data — Redis queues persist tasks until consumed. + +### 1.2 System Topology + +``` +YouTube Live Chat API + │ + [Polling Worker] ──enqueue──▶ [Classification] ──▶ [Embedding] ──▶ [Clustering] ──▶ [Answer Gen] ──▶ [YT Posting] + │ │ │ │ │ │ + ▼ ▼ ▼ ▼ ▼ ▼ + PostgreSQL ◀──────────── all workers write directly ──────────▶ Redis pub/sub ──▶ WS Manager ──▶ Browser + ▲ ▲ + │ │ + [FastAPI API] ◀─── HTTP/WS ─── [React 19 SPA] │ + │ │ │ + └─── Redis (queues, pub/sub, rate limits, quota, token blacklist, caching) ──────────┘ +``` + +**Why direct DB writes from workers (not routing through the API)**: Workers need transactional guarantees — e.g., the clustering worker must atomically update the centroid vector and assign the comment in one transaction. Routing writes through the API would add latency, create a single point of failure, and complicate error handling. Each worker manages its own DB connection pool (`pool_size=2, max_overflow=3`) to keep total connections manageable. + +### 1.3 Communication Patterns + +| Pattern | Where Used | Why This Pattern | +|---------|-----------|-----------------| +| **Request-Response (HTTP)** | All API endpoints | Standard CRUD, synchronous auth flows | +| **Priority Queue (Redis ZSET)** | Worker pipeline (6 queues) | Ordered processing, priority support, atomic dequeue via `ZPOPMIN`. ZSET over LIST because it enables delayed retry (future timestamps as scores) | +| **Pub/Sub (Redis)** | WebSocket relay (`ws:{session_id}`) | Workers publish events; API subscriber delivers to browsers. 
Decouples worker processes from WebSocket connection state | +| **Polling (HTTP)** | YouTube Live Chat ingestion | YouTube API offers no webhooks for live chat; polling at 5s intervals is the only option. Capped at 10 concurrent threads via `ThreadPoolExecutor` | + +--- + +## 2. Data Modeling & Persistence + +### 2.1 PostgreSQL Schema (pgvector-enabled) + +**Entity-Relationship Overview**: + +``` +Teachers (1) ──▶ (M) StreamingSessions (1) ──▶ (M) Comments + (1) ──▶ (M) Clusters (1) ──▶ (M) Answers +Teachers (1) ──▶ (1) YouTubeTokens +Teachers (1) ──▶ (M) Quotas +Teachers (1) ──▶ (M) RAGDocuments +Comments (M) ──▶ (1) Clusters [SET NULL on cluster delete] +``` + +**Vector-enabled tables**: + +| Model | Column | Dimensions | Index | Purpose | +|-------|--------|-----------|-------|---------| +| `comments` | `embedding` | Vector(768) | None (sequential scan) | Semantic similarity for clustering | +| `clusters` | `centroid_embedding` | Vector(768) | None (sequential scan) | Running centroid for nearest-centroid matching | +| `rag_documents` | `embedding` | Vector(768) | None (sequential scan) | Cosine distance retrieval for answer grounding | + +**Why 768 dimensions (not Gemini's native 3072)**: 768 is the balance point — reduces storage and index cost by ~75% while retaining sufficient semantic fidelity for question clustering (not fine-grained retrieval). The code explicitly normalizes embeddings post-generation because Google requires normalization for non-3072 dimensions. + +**Why pgvector over a dedicated vector DB (Qdrant, Pinecone, etc.)**: The system already requires PostgreSQL for relational data. pgvector eliminates an infrastructure dependency. At the expected scale (hundreds to low thousands of comments per session), sequential scan is fast enough. The tradeoff: pgvector cannot handle billion-scale ANN, but this system doesn't need it. + +### 2.2 Key Schema Design Decisions + +| Decision | Implementation | Why | +|----------|---------------|-----| +| `youtube_comment_id` NOT NULL + UNIQUE | Manual comments use `f"manual:{uuid4()}"` prefix | Enables idempotent ingestion — polling worker checks for existing ID before insert, preventing duplicates across polling cycles | +| `Cluster.comment_count` denormalized | Updated atomically in clustering worker | Centroid update formula `(old * n + new) / (n + 1)` needs `n` in the same transaction. `COUNT(*)` would be slower and subject to phantom reads | +| Answers persisted before posting | `is_posted` boolean + async YouTube posting | Separates "answer generated" (always succeeds) from "answer posted" (may fail due to quota/auth). 
Dashboard shows pending answers immediately |
| CASCADE on `session_id` | Deleting session removes all child data | Session deletion is a "nuke everything" operation |
| SET NULL on `cluster_id` | Cluster deletion preserves comments | Comments may be re-clustered; destroying them would lose data |
| Fernet encryption on YouTube tokens | `encrypt_data`/`decrypt_data` via `backend/app/core/encryption.py` | A DB breach without the encryption key cannot expose YouTube OAuth tokens |

### 2.3 Composite Indexes

```
idx_session_teacher_active    (teacher_id, is_active)      — session list queries
idx_comment_session_question  (session_id, is_question)    — clustering worker queries
idx_comment_session_answered  (session_id, is_answered)    — dashboard stats
idx_comment_cluster           (cluster_id)                 — cluster detail views
idx_answer_cluster_posted     (cluster_id, is_posted)      — pending answers filter
idx_quota_teacher_type        (teacher_id, quota_type)     — quota lookups
```

### 2.4 Redis Usage Map (8 Distinct Roles)

| Role | Key Pattern | Data Structure | TTL | Why Redis |
|------|------------|---------------|-----|-----------|
| Task queues | `classification`, `embedding`, etc. | Sorted Set (ZSET) | None | Priority ordering via `score = priority * 1M + timestamp` |
| Dead letter queues | `{queue}_dlq` | ZSET | None | Failed task inspection after 3 retries |
| Rate limiting | `ratelimit:{ip}` | String (INCR) | 60s | Sliding window counter, per-IP |
| YouTube quota | `yt_quota:{teacher_id}:{date}` | String (INCRBY) | TTL to midnight | Per-teacher daily quota (10,000 units) |
| Token blacklist | `blacklist:token:{hash}` | String | Token's remaining TTL | JWT logout revocation (Redis GET per request) |
| YouTube cache | `youtube:poll:{session_id}:*` | String | 3600s | Caches `live_chat_id` to avoid repeated API calls (1 unit each) |
| WebSocket relay | `ws:{session_id}` | Pub/Sub channel | N/A | Cross-process event delivery to browsers |
| CSRF state | `yt_state:{state}` | String | 600s | OAuth flow protection (10 min window) |

**Why `volatile-lru` eviction policy**: Queue entries have no TTL and are protected from eviction. TTL-bearing keys (rate limits, cached chat IDs) are evictable under memory pressure — acceptable because they are regenerable.

---

## 3. Component Interactions

### 3.1 API Layer — Middleware Stack

Execution order (outermost → innermost):

1. **RateLimitMiddleware** (`backend/app/core/rate_limit_middleware.py`) — Redis-backed IP throttling (60 req/min). Skips `/health`, `/metrics`, `/docs`. **Why outermost**: Reject abusive traffic before auth or DB work.
2. **RequestContextMiddleware** (`backend/app/core/middleware.py`) — Injects `X-Request-ID` and tracks execution time via `contextvars`. **Why**: Distributed tracing without a full APM solution.
3. **CORSMiddleware** — Configured origins from env (`:5173` for Vite dev, `:8000`, `:8080`).

### 3.2 Auth Flow

```
Client ──Bearer token──▶ HTTPBearer ──▶ verify_token() ──▶ Redis blacklist check ──▶ DB Teacher lookup ──▶ is_active check
```

**Why Redis blacklist**: JWTs are stateless; without a blacklist, a logged-out token remains valid until expiry. Cost: one Redis GET per authenticated request.

**Multi-tenancy enforcement**: Every data-access endpoint JOINs to `StreamingSession` to verify `teacher_id == current_user.id`. This is the authorization boundary — there are no role-based permissions beyond ownership.

### 3.3 Worker Pipeline Detail

```
[1. 
Classification] Gemini 2.5-flash: "Is this a question?" → {is_question, confidence}
        │  GATE: Only enqueues if is_question=True (filters ~60-70% of comments)
        ▼
[2. Embedding] Gemini embedding-001: text → 768-dim normalized vector
        │  IDEMPOTENT: Skips if comment.embedding already exists
        ▼
[3. Clustering] pgvector cosine distance against session's cluster centroids
        │  Threshold ≥ 0.65 → join cluster; < 0.65 → create new
        │  Centroid update: new = normalize((old * n + vec) / (n + 1))
        │  Triggers answer gen on: new cluster OR milestones {3, 10, 25}
        ▼
[4. Answer Gen] RAG: top-5 nearest documents by centroid embedding
        │  Two-prompt: with-context vs. without-context (prevents hallucination)
        │  Semaphore: max 5 concurrent Gemini calls
        │  Auto-enqueues to YT posting if teacher has YouTube connected
        ▼
[5. YT Posting] Posts to YouTube Live Chat (200 char limit)
        │  Publishes WebSocket event on success
        ▼
      Done

[6. YT Polling] Independent 5s cycle, ThreadPoolExecutor (max 10 threads)
        Deduplicates via youtube_comment_id UNIQUE constraint
        Token auto-refresh on HTTP 401
```

**Why milestones {3, 10, 25}**: At 3, the cluster has enough signal for a meaningful title (also generated here). At 10 and 25, accumulated question variants provide richer context for a more comprehensive answer. This avoids regenerating on every question (Gemini quota) while updating answers as understanding deepens.

**Why semaphore(5)**: Rate-limits Gemini API calls across all threads sharing a `GeminiClient` instance. Uses `threading.Semaphore` (not asyncio) because workers are synchronous Python processes.

### 3.4 WebSocket Relay Architecture

```
Worker process ──publish──▶ Redis channel "ws:{session_id}" ──subscribe──▶ API process ──broadcast──▶ Browser WS clients
```

**Why not direct worker-to-browser**: Workers are separate OS processes (potentially separate containers). They have no access to the API's in-memory WebSocket registry. Redis pub/sub provides the cross-process bridge. Multiple API instances each subscribe independently and deliver to their own local connections — natural load distribution.

**WebSocket auth**: Client sends `{"type": "auth", "token": "<JWT>"}` as first message. **Why first-message auth over query param**: Query params appear in server logs and browser history.

### 3.5 YouTube OAuth Flow

```
Frontend ──GET /youtube/auth/url──▶ Backend generates OAuth URL + CSRF state (Redis, 10min TTL)
        │
        ▼ (popup window)
Google OAuth consent ──redirect──▶ Backend callback validates state, exchanges code
        │  Encrypts tokens (Fernet), stores in DB
        ▼  Returns HTML that postMessages to opener
Frontend receives message, closes popup, updates connection status
```

---

## 4. State Management & AI/ML Memory

### 4.1 Online Learning — No Model Persistence

The system uses **online nearest-centroid clustering**, not batch KMeans. State is the centroid vectors stored in the `clusters` table:

```python
# Centroid update formula (workers/clustering/worker.py)
new_centroid = (old_centroid * comment_count + new_embedding) / (comment_count + 1)
normalized_centroid = new_centroid / np.linalg.norm(new_centroid)  # new / ||new||
```

**Why online over batch KMeans**: Live sessions require immediate clustering of each incoming question. Batch KMeans would require periodic re-processing of all comments. The tradeoff: online nearest-centroid is order-dependent (different insertion orders produce different clusters), but for grouping similar student questions in real-time, this is acceptable.
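To make the assign-or-create step concrete, here is a minimal, self-contained sketch of the logic described above. It is illustrative only — the function name and in-memory lists are not the worker's actual API — and it assumes unit-normalized embeddings and the 0.65 similarity threshold:

```python
import numpy as np

SIMILARITY_THRESHOLD = 0.65  # mirrors CLUSTERING_SIMILARITY_THRESHOLD


def assign_to_cluster(embedding: np.ndarray, centroids: list[np.ndarray], counts: list[int]) -> int:
    """Join the nearest cluster if similar enough, else create one; return cluster index."""
    if centroids:
        # For unit-normalized vectors, cosine similarity reduces to a dot product.
        sims = np.array([embedding @ c for c in centroids])
        best = int(sims.argmax())
        if sims[best] >= SIMILARITY_THRESHOLD:
            n = counts[best]
            updated = (centroids[best] * n + embedding) / (n + 1)  # running mean
            centroids[best] = updated / np.linalg.norm(updated)    # re-normalize
            counts[best] += 1
            return best
    centroids.append(embedding)  # no close-enough centroid → new cluster
    counts.append(1)
    return len(centroids) - 1
```

Feeding the same embeddings in a different order can yield a different set of clusters — exactly the order-dependence trade-off noted above.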
+ +### 4.2 RAG Architecture + +``` +Teacher uploads document ──▶ Chunked + embedded (768-dim) ──▶ Stored in rag_documents table + │ +Answer Generation Worker ──pgvector cosine distance──▶ Top 5 nearest docs by cluster centroid + │ + ┌─────────────────────────┘ + ▼ + Two-prompt system: + ├─ WITH context: "Answer using only the provided context" + └─ WITHOUT context: "No context available, use general knowledge" +``` + +**Why centroid as query vector (not individual question text)**: The centroid represents the semantic center of all questions in the cluster. This retrieves documents relevant to the cluster's *theme*, not just one question's phrasing. + +**Why two separate prompts**: A single prompt with optional context leads to inconsistent behavior — the model may hallucinate when no context is provided, or ignore context when it exists. Explicit prompts produce predictable outputs. + +### 4.3 Gemini Model Usage + +| Operation | Model | Where | Concurrency | +|-----------|-------|-------|-------------| +| Classification | `gemini-2.5-flash` | Classification worker | Sequential (1 at a time) | +| Embeddings | `gemini-embedding-001` | Embedding worker | Sequential | +| Cluster summarization | `gemini-2.0-flash` | Clustering worker (at count=3) | Sequential | +| Answer generation | `gemini-2.5-flash` | Answer generation worker | Semaphore(5) | + +All operations use `tenacity` retry: 3 attempts, exponential backoff 1s → 10s. + +### 4.4 Frontend State Architecture + +| Scope | Mechanism | What Lives Here | +|-------|-----------|----------------| +| **Global** | `AuthContext` | JWT token, user email/name, login/logout/register | +| **Global** | `ThemeContext` | dark/light mode (localStorage, cross-tab sync) | +| **Session-scoped** | `DashboardPage` state | activeSession, sessionEvents (cap 200), quotaAlert | +| **Component-local** | `useState` hooks | Fetch states, forms, UI toggles, caches | +| **Real-time** | `useWebSocket` hook | WS messages (cap 100), connected/reconnecting status | + +**Why refetch-on-WS-event (not pure WS-driven state)**: WS events are notifications ("something changed"), not complete state snapshots. Debounced refetching (500-2000ms) ensures the dashboard always shows authoritative server state, preventing drift from missed or out-of-order messages. + +**Why localStorage for JWT (not httpOnly cookie)**: The WebSocket auth flow requires JavaScript access to the token (sent as first WS message). httpOnly cookies cannot be read by JavaScript. + +--- + +## 5. Infrastructure & DevOps + +### 5.1 Docker Compose Services + +| Service | Image | Port | Key Config | +|---------|-------|------|-----------| +| `postgres` | `pgvector/pgvector:pg15` | 127.0.0.1:5432 | `max_connections=100`, volume: `postgres_data` | +| `redis` | `redis:7-alpine` | 127.0.0.1:6379 | `maxmemory 256mb`, `volatile-lru`, RDB snapshots | +| `api` | Custom (Python 3.13-slim) | 8000 | `uvicorn --workers 2` | +| `workers` | Custom (Python 3.13-slim) | None | `python -m workers.runner` (all 6 workers in one container) | + +**Why `max_connections=100`**: Connection budget is 15 (API) + 30 (workers) = 45 active. 100 provides ~2x headroom for admin connections, migrations, and monitoring. + +**Why single workers container**: Development simplicity. Production should separate workers into individual containers for independent scaling and failure isolation. + +**Why `volatile-lru`**: Queue entries (no TTL) are protected from eviction. 
TTL-bearing keys (rate limits, caches) are evictable under memory pressure — they are regenerable. + +### 5.2 CI/CD Pipeline (GitHub Actions) + +``` +[Lint Job] [Test Job] + Python 3.13 Python 3.13 + black + isort + ruff Services: pgvector:pg15 + redis:7 + Checks: backend/, workers/ pytest backend/tests workers -v + Line length: 119 chars Dummy GEMINI_API_KEY +``` + +**Lint → Test** dependency chain. Both jobs run on push. + +### 5.3 Configuration Management + +`backend/app/core/config.py` — Pydantic `BaseSettings` with `@lru_cache` singleton. + +Key configuration groups: +- **Database**: pool_size=5, max_overflow=10, pool_recycle=3600s, pool_pre_ping=True +- **Redis**: max_connections=10, decode_responses=True +- **Security**: HS256, access_token=30min, refresh_token=7d, bcrypt_rounds=12 +- **Gemini**: api_key, model names, clustering_threshold +- **YouTube**: client_id, client_secret, redirect_uri +- **WebSocket**: heartbeat_interval=30s, timeout=300s +- **Rate limiting**: requests_per_minute, enabled flag +- **Encryption**: encryption_key (≥32 chars, validated at startup) + +Environment loading: `.env.{environment}` files with fallback. + +--- + +## 6. Critical Paths + +### 6.1 Path 1: Comment → Posted Answer (Highest Complexity) + +**Stages**: YouTube comment → Polling worker → DB insert → Classification → Embedding → Clustering → Answer generation → YouTube posting → WebSocket notification + +**Latency budget**: ~10-30 seconds total. Gemini API calls dominate: classification (~500ms), embedding (~300ms), answer generation (~2-5s). Each inter-stage hop adds ~1s (poll interval). + +**Failure recovery**: Tasks remain in Redis queues on worker crash (ZPOPMIN is atomic). `tenacity` retries transient Gemini failures. Queue-level retry (3 attempts, 60s delay) catches persistent failures. DLQ captures exhausted retries for manual inspection. + +### 6.2 Path 2: WebSocket Real-Time Delivery + +**Risk**: Redis pub/sub is fire-and-forget. If the API subscriber task crashes or disconnects, events are lost during reconnection (exponential backoff, max 30s). Frontend's debounced refetch partially mitigates stale data. + +### 6.3 Path 3: YouTube OAuth Token Lifecycle + +**Risk**: If the encryption key (`settings.encryption_key[:32]`) is lost or changed, all stored YouTube tokens become undecryptable, severing all YouTube connections system-wide. The key must be treated as infrastructure state, not a rotatable secret. + +--- + +## 7. Potential Bottlenecks & Availability Risks + +### 7.1 Single-Threaded Worker Bottleneck — **SEVERITY: HIGH** + +Each pipeline worker is a single-threaded Python process. During traffic spikes (popular live session, hundreds of comments/minute), the classification worker becomes the bottleneck — ~2 comments/second throughput (Gemini-bound). A spike of 10 comments/second creates a growing backlog. + +**Mitigation**: Horizontal scaling — run multiple instances per worker. `ZPOPMIN`-based dequeue is safe for concurrent consumers. No code changes needed. + +### 7.2 Redis Pub/Sub Message Loss — **SEVERITY: MEDIUM** + +Pub/sub delivers only to currently connected subscribers. API restart = lost events during reconnection window. Dashboard may show stale data. + +**Mitigation**: Replace pub/sub with Redis Streams (`XADD`/`XREAD` with consumer groups). Streams persist messages and support "read from last acknowledged" semantics. 
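As a sketch of that mitigation (hedged — `relay_session_events`, the group name, and the consumer layout are assumptions, not existing code), the subscriber loop could swap `psubscribe` for a consumer group so events survive an API restart; workers would publish with `XADD` instead of `PUBLISH`:

```python
# Sketch only: Streams-based replacement for the ws:{session_id} pub/sub relay.
import redis.asyncio as aioredis
from redis.exceptions import ResponseError


async def relay_session_events(redis_url: str, session_id: str, manager) -> None:
    r = aioredis.from_url(redis_url, decode_responses=True)
    stream, group = f"ws:{session_id}", "ws-relay"
    try:
        await r.xgroup_create(stream, group, id="0", mkstream=True)
    except ResponseError:
        pass  # group already exists
    while True:
        # ">" asks for entries never delivered to this group; entries left
        # pending by a crashed consumer can later be reclaimed via XAUTOCLAIM.
        batches = await r.xreadgroup(group, "api-1", {stream: ">"}, count=10, block=5000)
        for _stream, entries in batches or []:
            for entry_id, event in entries:
                await manager.broadcast_to_session(session_id, event)
                await r.xack(stream, group, entry_id)  # ack only after delivery
```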
+ +### 7.3 No pgvector Index on Vector Columns — **SEVERITY: MEDIUM (time-bomb)** + +Clustering worker's `ORDER BY centroid_embedding <=> :emb` performs sequential scan. Fine at O(100) clusters. Becomes a latency cliff at O(10,000+). + +**Mitigation**: Add HNSW index on `clusters.centroid_embedding` and `rag_documents.embedding`. Migration files exist for HNSW indexes but may not cover all vector columns. + +### 7.4 YouTube Quota Exhaustion — **SEVERITY: MEDIUM** + +Daily quota: 10,000 units/teacher. Poll cost: 5 units. At 5-second intervals: `5 × (86400/5) = 86,400 units/day` — **far exceeding the limit**. Polling effectively stops after ~2000 polls (~2.8 hours). + +**Mitigation**: Use YouTube API's `pollingIntervalMillis` response field for adaptive polling. Implement exponential backoff when no new messages arrive. + +### 7.5 Gemini API as Single Point of Failure — **SEVERITY: HIGH** + +All AI operations depend on one Gemini API key. Key revocation, rate limiting, or Gemini outage stalls the entire pipeline. `tenacity` handles transient failures but not sustained outages. + +**Mitigation**: Circuit breaker pattern with degraded-mode fallbacks (e.g., regex-based classification). Multiple API keys with rotation. + +### 7.6 Connection Pool Exhaustion Under Scale — **SEVERITY: LOW-MEDIUM** + +Current budget: 45/100 connections. Each horizontally-scaled worker instance adds 5 connections. 11+ additional instances exhaust the pool. + +**Mitigation**: Deploy PgBouncer for connection multiplexing between workers and PostgreSQL. + +### 7.7 JWT in localStorage — **SEVERITY: LOW (security note)** + +localStorage is vulnerable to XSS. A single XSS vulnerability exposes the JWT. However, this is a deliberate tradeoff — WebSocket auth requires JavaScript access to the token, and httpOnly cookies cannot be read by JS. + +**Mitigation**: Strict CSP headers, input sanitization, and regular XSS audits. Consider a dual-auth scheme (cookie for HTTP, short-lived token for WS). + +--- + +## Appendix: Key File Paths + +| Component | Path | +|-----------|------| +| API entry point | `backend/app/main.py` | +| Configuration | `backend/app/core/config.py` | +| Auth & security | `backend/app/core/security.py`, `encryption.py` | +| Database models | `backend/app/db/models/*.py` | +| API routes | `backend/app/api/v1/*.py` | +| WebSocket manager | `backend/app/services/websocket/manager.py` | +| Gemini AI client | `backend/app/services/gemini/client.py` | +| YouTube services | `backend/app/services/youtube/client.py`, `oauth.py`, `quota.py` | +| Queue infrastructure | `workers/common/queue.py` | +| Worker payloads | `workers/common/schemas.py` | +| Classification worker | `workers/classification/worker.py` | +| Embedding worker | `workers/embeddings/worker.py` | +| Clustering worker | `workers/clustering/worker.py` | +| Answer generation worker | `workers/answer_generation/worker.py` | +| YouTube polling worker | `workers/youtube_polling/worker.py` | +| YouTube posting worker | `workers/youtube_posting/worker.py` | +| Frontend entry | `frontend/src/main.jsx` → `App.jsx` | +| API service layer | `frontend/src/services/api.js` | +| WebSocket hook | `frontend/src/hooks/useWebSocket.js` | +| Dashboard page | `frontend/src/pages/DashboardPage.jsx` | +| Docker Compose | `docker-compose.yml` | +| CI/CD | `.github/workflows/ci.yml` | + +--- + +## 8. 
Scaling Roadmap + +### 8.1 Current Capacity Baseline + +| Resource | Current Limit | Utilization | Headroom | +|----------|--------------|-------------|----------| +| Gemini API concurrency | 5 (semaphore) | Burst-dependent | Low under load | +| YouTube quota | 10,000 units/teacher/day | 5 units/poll × 12 polls/min = 3,600/hr | Exhausts in ~2.8 hrs | +| DB connections (API) | 5 + 10 overflow = 15 | Request-dependent | 55 of 100 unused | +| DB connections (Workers) | 6 × (2 + 3) = 30 | Steady | See above | +| Redis memory | 256 MB | ~70-200 KB for queues | Ample | +| API rate limit | 60 req/min/IP | Per-IP | No per-user limiting | +| Worker throughput | 1 process per stage | ~2 comments/sec (Gemini-bound) | Backlog at >2/sec | + +### 8.2 Phase 1: Quick Wins (Week 1-2) + +| Change | Current | Target | Effort | Impact | +|--------|---------|--------|--------|--------| +| Gemini semaphore | 5 | 15-20 | 1 line (`client.py:30`) | 3-4x answer gen throughput | +| YouTube poll interval | 5s fixed | Adaptive (use API's `pollingIntervalMillis`) | Medium | 50-70% quota savings | +| Redis memory | 256 MB | 512 MB | Config change | 2x headroom | +| Worker pool size | 2+3 | 5+5 per worker | Config change (`common/db.py`) | Handle connection bursts | +| PostgreSQL max_connections | 100 | 200 | Docker config | Support horizontal workers | + +### 8.3 Phase 2: Horizontal Scaling (Month 1-2) + +**Worker horizontal scaling** — The ZPOPMIN-based queue dequeue is inherently safe for concurrent consumers. No code changes needed to run N instances of any worker: + +``` +# Scale classification to 3 instances +docker-compose up --scale classification-worker=3 +``` + +**Requires**: Split `workers` Docker service into per-worker services. Current single-container design bundles all 6 workers. + +**PgBouncer for connection multiplexing** — Each new worker instance adds 5 DB connections. At 20+ worker instances, PostgreSQL's 100-connection limit is reached. PgBouncer in transaction mode multiplexes many worker connections over fewer PostgreSQL connections. + +``` +Workers (100 connections) → PgBouncer (20 connections) → PostgreSQL +``` + +**Redis Sentinel for HA** — Single Redis instance is a SPOF for all queues, pub/sub, rate limits, and quota tracking. Redis Sentinel provides automatic failover with minimal configuration. + +### 8.4 Phase 3: High Volume (Month 3-6, 1000+ concurrent users) + +| Component | Strategy | Trigger | +|-----------|----------|---------| +| Comments table | Partition by `session_id` (range) | >10M rows | +| Embeddings | Local model fallback (e.g., `all-MiniLM-L6-v2`) | Gemini cost > $100/day | +| YouTube quota | Quota tiering (premium teachers get 50K/day) | Teachers hitting limits daily | +| Worker autoscaling | Scale on queue depth (>100 tasks → spawn pod) | Sustained backlog | +| pgvector | Add HNSW index on vector columns | >10K clusters per session | +| Redis | Redis Cluster (sharding) | >1GB memory or >50K ops/sec | +| API | Multiple uvicorn instances behind load balancer | >500 concurrent WebSocket connections | + +### 8.5 Phase 4: Multi-Region (Month 6-12) + +- **Database**: Read replicas for dashboard queries, write primary for ingestion +- **Workers**: Deploy regionally, share Redis Cluster +- **CDN**: Frontend static assets via CloudFront/Cloudflare +- **Gemini API**: Multi-key rotation across regions for quota distribution + +--- + +## 9. 
+## 9. Cost Modeling
+
+### 9.1 Gemini API Costs
+
+**Per-comment pipeline cost** (assuming ~60% of comments are questions):
+
+| Operation | Model | Input Tokens (est.) | Output Tokens (est.) | Cost/Call |
+|-----------|-------|-------------------|---------------------|-----------|
+| Classification | gemini-2.5-flash | ~100 | ~30 | ~$0.000015 |
+| Embedding | gemini-embedding-001 | ~100 | N/A | ~$0.000010 |
+| Cluster summary | gemini-2.5-flash | ~200 | ~20 | ~$0.000005 |
+| Answer generation | gemini-2.5-flash | ~500 (with RAG context) | ~200 | ~$0.000060 |
+
+**Per-session cost estimate** (1-hour session, 500 comments):
+
+| Stage | Calls | Cost |
+|-------|-------|------|
+| Classification | 500 | $0.0075 |
+| Embedding | 300 (60% questions) | $0.003 |
+| Cluster summaries | ~30 clusters | $0.00015 |
+| Answer generation | ~60 (30 clusters × 1-2 milestones) | $0.0036 |
+| **Total per session** | **~890 calls** | **~$0.014** |
+
+**Monthly projection** (10 teachers, 5 sessions/week each):
+
+```
+10 teachers × 5 sessions/week × 4 weeks × $0.014 = $2.80/month (Gemini only)
+```
+
+At scale (100 teachers, 10 sessions/week): **~$56/month** in Gemini costs.
+
+### 9.2 YouTube Quota Cost Analysis
+
+**Per-session quota burn** (1 hour, 5-second polling):
+
+| Operation | Calls | Units | Total |
+|-----------|-------|-------|-------|
+| Polling | 720 (3600s ÷ 5s) | 5 | 3,600 |
+| Get chat ID | 1 (cached after first) | 1 | 1 |
+| Post answers | ~30 (1 per cluster) | 50 | 1,500 |
+| **Total** | | | **5,101 units** |
+
+**Daily capacity**: 10,000 units → ~1.96 sessions/day at the current polling rate.
+
+**With adaptive polling** (10s average): ~3 sessions/day.
+
+**With the YouTube-recommended interval** (~15-30s): ~4-5 sessions/day. Beyond this, the 50-unit cost of posting answers dominates the budget, so longer polling intervals yield diminishing returns.
+
+### 9.3 Infrastructure Costs (Docker/Cloud)
+
+| Component | Minimum Spec | Est. Monthly Cost (AWS) |
+|-----------|-------------|------------------------|
+| PostgreSQL (pgvector) | db.t3.medium (2 vCPU, 4GB) | ~$50 |
+| Redis | cache.t3.micro (0.5GB) | ~$15 |
+| API (ECS/EC2) | t3.small (2 vCPU, 2GB) | ~$20 |
+| Workers (ECS/EC2) | t3.medium (2 vCPU, 4GB) | ~$35 |
+| Frontend (S3 + CloudFront) | Static hosting | ~$5 |
+| **Total** | | **~$125/month** |
+
+### 9.4 Cost Optimization Opportunities
+
+| Optimization | Savings | Effort |
+|-------------|---------|--------|
+| Embedding cache by text hash (avoid re-embedding identical questions) | 10-30% Gemini cost | Low |
+| Local embedding model fallback (sentence-transformers) | 90% embedding cost | Medium |
+| Adaptive YouTube polling (back off when idle) | 50-70% quota savings | Low |
+| Batch classification (group 5-10 comments per Gemini call) | 60-80% classification cost | Medium |
+| Gemini response caching (identical question patterns) | 20-40% answer gen cost | Medium |
+
+---
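+
+Of the optimizations in §9.4, the embedding cache is the cheapest to ship. A minimal sketch follows, assuming Redis as the cache and an `embed_fn` wrapper around the Gemini embedding call; both are illustrative names, not the project's actual interfaces.
+
+```python
+# Sketch: reuse embeddings for textually identical questions.
+import hashlib
+import json
+
+
+def cached_embed(redis_client, text, embed_fn, ttl_seconds=86400):
+    """Return a cached vector when an identical question was embedded before."""
+    normalized = " ".join(text.lower().split())
+    key = "emb:" + hashlib.sha256(normalized.encode()).hexdigest()
+    cached = redis_client.get(key)
+    if cached is not None:
+        return json.loads(cached)  # cache hit: no Gemini call
+    vector = embed_fn(text)  # cache miss: one embedding call
+    redis_client.setex(key, ttl_seconds, json.dumps(vector))
+    return vector
+```
+
+Live-chat questions repeat heavily within a session ("what is X?" arrives many times), which is why even this exact-match cache can capture the 10-30% savings estimated above.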
+## 10. Threat Model (STRIDE Analysis)
+
+### 10.1 Threat Matrix
+
+#### Spoofing
+
+| Threat | Vector | Severity | Current Mitigation | Gap |
+|--------|--------|----------|-------------------|-----|
+| JWT token theft | XSS → localStorage access | **HIGH** | Token blacklist on logout | Token in localStorage is XSS-readable |
+| Teacher impersonation | Stolen refresh token (7-day lifetime) | **HIGH** | None (rotation not implemented) | No refresh token rotation on use |
+| WebSocket hijacking | Intercepted auth message | **MEDIUM** | First-message JWT auth + ownership check | No message-level encryption (relies on WSS) |
+| OAuth state forgery | Brute-force 128-bit state | **LOW** | 10-min TTL + single-use deletion | None — secure by design |
+
+#### Tampering
+
+| Threat | Vector | Severity | Current Mitigation | Gap |
+|--------|--------|----------|-------------------|-----|
+| Answer text injection | Edit answer endpoint with malicious content | **MEDIUM** | Auth + ownership check | No content sanitization before YouTube posting |
+| Comment text overflow | Unbounded text field in schema | **MEDIUM** | SQLAlchemy Text column (no DB limit) | No `max_length` on CommentCreate schema |
+| Cluster centroid poisoning | Submit adversarial embeddings via manual questions | **LOW** | Online centroid averaging dilutes adversarial inputs | Requires many adversarial inputs to shift a centroid significantly |
+| Queue payload manipulation | Direct Redis access | **LOW** | Redis bound to 127.0.0.1 | No authentication on Redis (password not configured) |
+
+#### Repudiation
+
+| Threat | Vector | Severity | Current Mitigation | Gap |
+|--------|--------|----------|-------------------|-----|
+| Denied answer approval | Teacher claims they didn't approve a post | **MEDIUM** | `posted_at` timestamp on Answer model | No audit log of who approved what |
+| Session data deletion | Teacher deletes session (CASCADE) | **LOW** | Intentional feature | No soft-delete or audit trail |
+
+#### Information Disclosure
+
+| Threat | Vector | Severity | Current Mitigation | Gap |
+|--------|--------|----------|-------------------|-----|
+| YouTube token exposure | Database breach | **HIGH** | Fernet encryption at rest | Encryption key in env var — single key for all tokens |
+| Cross-tenant data leakage | Broken ownership check | **HIGH** | JOIN-based ownership verification on all endpoints | Relies on developer discipline (no automated test) |
+| JWT secret exposure | Env var leak / config dump | **HIGH** | Single HS256 secret in settings | No key rotation mechanism |
+| Error message leakage | Unhandled exceptions in API | **MEDIUM** | FastAPI default error handling | Debug mode configurable — ensure `debug=False` in production |
+
+#### Denial of Service
+
+| Threat | Vector | Severity | Current Mitigation | Gap |
+|--------|--------|----------|-------------------|-----|
+| API rate limit bypass | Distributed IPs | **HIGH** | Per-IP rate limiting (60/min) | No per-user or per-session rate limiting |
+| WebSocket flood | Send thousands of messages per second | **HIGH** | None detected | No per-connection message rate limit (sketch below) |
+| Queue flooding | Rapid manual question submission (10/request, no cooldown) | **MEDIUM** | Max 10 questions per request | No per-session cooldown or daily limit |
+| YouTube quota exhaustion | Create many sessions with polling | **MEDIUM** | Quota check per poll | No limit on concurrent active sessions per teacher |
+| Gemini API exhaustion | Trigger thousands of classifications | **MEDIUM** | Semaphore(5) limits concurrency | No per-teacher Gemini call budget |
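+
+The WebSocket flood gap above maps directly to a P0 recommendation in §10.2. Below is a minimal token-bucket sketch; the class name and limits are illustrative, not the actual API of `backend/app/services/websocket/manager.py`.
+
+```python
+# Sketch: per-connection token bucket, ~10 msg/sec with a burst of 20.
+import time
+
+
+class ConnectionRateLimiter:
+    def __init__(self, rate=10.0, burst=20):
+        self.rate = rate              # tokens refilled per second
+        self.capacity = float(burst)  # maximum bucket size
+        self.tokens = float(burst)
+        self.last = time.monotonic()
+
+    def allow(self):
+        """Spend one token; False means the frame should be dropped."""
+        now = time.monotonic()
+        self.tokens = min(self.capacity, self.tokens + (now - self.last) * self.rate)
+        self.last = now
+        if self.tokens >= 1.0:
+            self.tokens -= 1.0
+            return True
+        return False
+```
+
+The WebSocket handler would call `allow()` before processing each inbound frame and close the connection after repeated violations.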
+
+#### Elevation of Privilege
+
+| Threat | Vector | Severity | Current Mitigation | Gap |
+|--------|--------|----------|-------------------|-----|
+| Access other teacher's data | Modify session_id in API calls | **HIGH** | Ownership JOIN on every query | No RBAC — only an owner/not-owner model |
+| Admin escalation | No admin role exists | **N/A** | Single-role system (teacher only) | No admin panel or elevated access |
+| Worker process compromise | Worker has direct DB write access | **MEDIUM** | Workers share DB credentials with the API | No least-privilege DB users per component |
+
+### 10.2 Top 5 Actionable Recommendations
+
+| Priority | Recommendation | Addresses | Effort |
+|----------|---------------|-----------|--------|
+| **P0** | Add `max_length` validation on all text fields in Pydantic schemas | Tampering, DoS | Low |
+| **P0** | Add a per-connection WebSocket message rate limit (e.g., 10 msg/sec) | DoS | Low |
+| **P1** | Harden token storage: strict CSP headers plus the §7.7 dual-auth scheme (httpOnly cookie for HTTP, short-lived WS token) | Spoofing | Medium |
+| **P1** | Add a Redis AUTH password in production | Tampering | Low |
+| **P2** | Implement an audit log table for answer approvals and session deletions | Repudiation | Medium |
+
+### 10.3 Security Configuration Checklist (Production Deployment)
+
+```
+[ ] Set debug=False in FastAPI
+[ ] Set LOG_JSON=True for structured logging
+[ ] Set CORS origins to the production domain only
+[ ] Configure a Redis AUTH password
+[ ] Ensure ENCRYPTION_KEY is unique per environment (≥32 chars)
+[ ] Ensure SECRET_KEY is unique per environment
+[ ] Set RATE_LIMIT_ENABLED=true
+[ ] Verify PostgreSQL connections are SSL-encrypted
+[ ] Disable /docs and /redoc endpoints in production
+[ ] Add CSP, X-Frame-Options, X-Content-Type-Options headers
+[ ] Configure HTTPS termination (TLS 1.2+)
+[ ] Set up log aggregation for security event monitoring
+```
diff --git a/frontend/css/styles.css b/frontend/css/styles.css
deleted file mode 100644
index c0c0129..0000000
--- a/frontend/css/styles.css
+++ /dev/null
@@ -1,428 +0,0 @@
-/* ============================================================
-   Base Reset & Variables
-   ============================================================ */
-*, *::before, *::after { box-sizing: border-box; margin: 0; padding: 0; }
-[hidden] { display: none !important; }
-
-:root {
-  --color-primary: #2563eb;
-  --color-primary-hover: #1d4ed8;
-  --color-danger: #dc2626;
-  --color-danger-hover: #b91c1c;
-  --color-success: #16a34a;
-  --color-bg: #f8fafc;
-  --color-surface: #ffffff;
-  --color-border: #e2e8f0;
-  --color-text: #1e293b;
-  --color-muted: #64748b;
-  --radius: 8px;
-  --shadow: 0 1px 3px rgba(0,0,0,0.1);
-}
-
-body {
-  font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, sans-serif;
-  background: var(--color-bg);
-  color: var(--color-text);
-  font-size: 14px;
-  line-height: 1.5;
-}
-
-/* ============================================================
-   Auth View
-   ============================================================ */
-#auth-view {
-  min-height: 100vh;
-  display: flex;
-  align-items: center;
-  justify-content: center;
-  padding: 24px;
-}
-
-.auth-card {
-  background: var(--color-surface);
-  border: 1px solid var(--color-border);
-  border-radius: var(--radius);
-  box-shadow: var(--shadow);
-  padding: 32px;
-  width: 100%;
-  max-width: 400px;
-}
-
-.auth-card h1 {
-  font-size: 20px;
-  font-weight: 700;
-  color: var(--color-primary);
-  margin-bottom: 24px;
-  text-align: center;
-}
-
-.auth-card
h2 { - font-size: 16px; - font-weight: 600; - margin-bottom: 16px; -} - -.auth-card form { - display: flex; - flex-direction: column; - gap: 12px; -} - -.auth-card label { - display: flex; - flex-direction: column; - gap: 4px; - font-weight: 500; -} - -.error-msg { - background: #fef2f2; - border: 1px solid #fecaca; - color: var(--color-danger); - border-radius: 4px; - padding: 8px 12px; - font-size: 13px; - margin-bottom: 8px; -} - -/* ============================================================ - Header - ============================================================ */ -.app-header { - background: var(--color-surface); - border-bottom: 1px solid var(--color-border); - padding: 0 24px; - height: 56px; - display: flex; - align-items: center; - justify-content: space-between; - position: sticky; - top: 0; - z-index: 10; - box-shadow: var(--shadow); -} - -.logo { font-weight: 700; font-size: 16px; color: var(--color-primary); } -.user-name { color: var(--color-muted); margin-right: 12px; } -.header-right { display: flex; align-items: center; } - -/* ============================================================ - Main Layout - ============================================================ */ -.app-main { padding: 20px 24px; max-width: 1400px; margin: 0 auto; } - -.panels-grid { - display: grid; - grid-template-columns: 360px 1fr; - gap: 20px; -} - -.left-column, .right-column { - display: flex; - flex-direction: column; - gap: 16px; -} - -/* ============================================================ - Panel - ============================================================ */ -.panel { - background: var(--color-surface); - border: 1px solid var(--color-border); - border-radius: var(--radius); - padding: 16px; - box-shadow: var(--shadow); -} - -.panel h2 { - font-size: 14px; - font-weight: 600; - margin-bottom: 12px; - display: flex; - align-items: center; - gap: 8px; -} - -/* ============================================================ - Forms - ============================================================ */ -label { - display: flex; - flex-direction: column; - gap: 4px; - font-weight: 500; - font-size: 13px; - margin-bottom: 8px; -} - -input[type="text"], -input[type="email"], -input[type="password"], -textarea { - width: 100%; - padding: 8px 10px; - border: 1px solid var(--color-border); - border-radius: 6px; - font-size: 13px; - font-family: inherit; - color: var(--color-text); - background: var(--color-bg); - transition: border-color 0.15s; -} - -input:focus, textarea:focus { - outline: none; - border-color: var(--color-primary); - background: #fff; -} - -textarea { resize: vertical; min-height: 80px; } - -.hint { font-size: 12px; color: var(--color-muted); margin-bottom: 6px; } - -/* ============================================================ - Buttons - ============================================================ */ -.btn { - display: inline-flex; - align-items: center; - justify-content: center; - gap: 6px; - padding: 7px 14px; - border: 1px solid var(--color-border); - border-radius: 6px; - font-size: 13px; - font-weight: 500; - cursor: pointer; - background: var(--color-surface); - color: var(--color-text); - transition: background 0.15s, border-color 0.15s; - white-space: nowrap; -} - -.btn:hover { background: #f1f5f9; } - -.btn-primary { - background: var(--color-primary); - color: #fff; - border-color: var(--color-primary); - width: 100%; - margin-top: 4px; -} - -.btn-primary:hover { background: var(--color-primary-hover); border-color: var(--color-primary-hover); } - -.btn-danger { - 
background: var(--color-danger); - color: #fff; - border-color: var(--color-danger); - width: 100%; - margin-top: 8px; -} - -.btn-danger:hover { background: var(--color-danger-hover); } - -.btn-danger-sm { - background: #fff; - color: var(--color-danger); - border-color: #fecaca; - font-size: 12px; - padding: 4px 10px; -} - -.btn-danger-sm:hover { background: #fef2f2; } - -.btn-sm { padding: 5px 10px; font-size: 12px; } - -.btn-loading { - opacity: 0.65; - pointer-events: none; -} - -button[disabled] { opacity: 0.5; pointer-events: none; } - -/* ============================================================ - Badges - ============================================================ */ -.badge { - display: inline-flex; - align-items: center; - padding: 2px 8px; - border-radius: 12px; - font-size: 11px; - font-weight: 600; - white-space: nowrap; -} - -.badge-question { background: #dbeafe; color: #1e40af; } -.badge-not-question { background: #f1f5f9; color: #64748b; } -.badge-classifying { background: #fef9c3; color: #92400e; } -.badge-posted { background: #dcfce7; color: #166534; } -.badge-active { background: #dcfce7; color: #166534; } -.badge-disconnected { background: #f1f5f9; color: #64748b; } -.badge-connected { background: #dbeafe; color: #1e40af; } -.badge-pending { background: #fef3c7; color: #92400e; } - -/* ============================================================ - Questions Feed - ============================================================ */ -.questions-feed { - height: 400px; - overflow-y: auto; - scroll-behavior: smooth; - display: flex; - flex-direction: column; - gap: 6px; -} - -.feed-item { - display: flex; - align-items: flex-start; - gap: 8px; - padding: 8px 10px; - border: 1px solid var(--color-border); - border-radius: 6px; - background: var(--color-bg); - font-size: 13px; -} - -.feed-item-author { - font-weight: 600; - color: var(--color-primary); - white-space: nowrap; - flex-shrink: 0; - font-size: 12px; -} - -.feed-item-text { flex: 1; } -.feed-item-badge { flex-shrink: 0; } - -.empty-msg { color: var(--color-muted); font-size: 13px; text-align: center; padding: 24px 0; } - -/* ============================================================ - Clusters Panel - ============================================================ */ -#clusters-list { - display: flex; - flex-direction: column; - gap: 12px; - max-height: 600px; - overflow-y: auto; -} - -.cluster-card { - border: 1px solid var(--color-border); - border-radius: 6px; - padding: 12px; - background: var(--color-bg); -} - -.cluster-header { - display: flex; - align-items: center; - justify-content: space-between; - margin-bottom: 8px; -} - -.cluster-title { font-weight: 600; font-size: 13px; } -.cluster-count { color: var(--color-muted); font-size: 12px; } - -.cluster-answer { - background: #fff; - border: 1px solid var(--color-border); - border-radius: 6px; - padding: 10px; - font-size: 13px; - margin-bottom: 8px; - white-space: pre-wrap; - max-height: 120px; - overflow-y: auto; -} - -.cluster-actions { - display: flex; - gap: 8px; - flex-wrap: wrap; -} - -/* ============================================================ - YouTube Panel - ============================================================ */ -.yt-status-row { - margin-bottom: 10px; -} - -/* ============================================================ - Metrics Grid - ============================================================ */ -.metrics-grid { - display: grid; - grid-template-columns: 1fr 1fr; - gap: 10px; -} - -.metric-card { - background: var(--color-bg); - 
border: 1px solid var(--color-border); - border-radius: 6px; - padding: 10px 12px; - text-align: center; -} - -.metric-value { font-size: 24px; font-weight: 700; color: var(--color-primary); } -.metric-label { font-size: 11px; color: var(--color-muted); margin-top: 2px; } - -/* ============================================================ - Session Info - ============================================================ */ -.session-info { - display: flex; - align-items: center; - gap: 8px; - margin-bottom: 6px; -} - -/* ============================================================ - Toast Notifications - ============================================================ */ -#toast-container { - position: fixed; - bottom: 24px; - right: 24px; - display: flex; - flex-direction: column; - gap: 8px; - z-index: 1000; -} - -.toast { - padding: 10px 16px; - border-radius: 8px; - font-size: 13px; - font-weight: 500; - box-shadow: 0 4px 12px rgba(0,0,0,0.15); - animation: slideIn 0.2s ease; - max-width: 320px; -} - -.toast-success { background: #166534; color: #fff; } -.toast-error { background: #991b1b; color: #fff; } -.toast-info { background: #1e40af; color: #fff; } -.toast-warning { background: #92400e; color: #fff; } - -@keyframes slideIn { - from { transform: translateX(100%); opacity: 0; } - to { transform: translateX(0); opacity: 1; } -} - -/* ============================================================ - Responsive - ============================================================ */ -@media (max-width: 900px) { - .panels-grid { grid-template-columns: 1fr; } -} - -/* ============================================================ - Hidden utility - ============================================================ */ -.hidden { display: none !important; } diff --git a/frontend/index.html b/frontend/index.html index 1c366fa..98e0244 100644 --- a/frontend/index.html +++ b/frontend/index.html @@ -4,6 +4,9 @@ AI Live Doubt Manager + + +
diff --git a/frontend/js/api.js b/frontend/js/api.js deleted file mode 100644 index a185284..0000000 --- a/frontend/js/api.js +++ /dev/null @@ -1,155 +0,0 @@ -/** - * API client for AI Live Doubt Manager. - * Handles all fetch calls with auth, error handling, and 401 auto-logout. - */ - -class API { - constructor() { - this.token = localStorage.getItem('token'); - } - - async request(method, path, body = null) { - const opts = { - method, - headers: { - 'Content-Type': 'application/json', - ...(this.token ? { 'Authorization': `Bearer ${this.token}` } : {}), - }, - ...(body !== null ? { body: JSON.stringify(body) } : {}), - }; - - const resp = await fetch(path, opts); - - if (resp.status === 401) { - this.token = null; - localStorage.removeItem('token'); - // Emit custom event so app can react without causing reload loops - window.dispatchEvent(new CustomEvent('auth:expired')); - throw new Error('Unauthorized'); - } - - if (resp.status === 429) { - throw new Error('rate_limit'); - } - - if (!resp.ok) { - let message = `HTTP ${resp.status}`; - try { - const errBody = await resp.json(); - message = errBody.detail || errBody.message || message; - } catch { - // ignore parse error - } - throw new Error(message); - } - - if (resp.status === 204) return null; - return resp.json(); - } - - // ---------------------------------------------------------------- - // Auth - // ---------------------------------------------------------------- - - async login(email, password) { - const data = await this.request('POST', '/api/v1/auth/login', { - email, - password, - }); - this.token = data.access_token; - localStorage.setItem('token', this.token); - return data; - } - - async register(email, password, name) { - const data = await this.request('POST', '/api/v1/auth/register', { - email, password, name, - }); - return data; - } - - async logout() { - try { await this.request('POST', '/api/v1/auth/logout'); } catch {} - this.token = null; - localStorage.removeItem('token'); - window.location.reload(); - } - - async getMe() { - return this.request('GET', '/api/v1/auth/me'); - } - - // ---------------------------------------------------------------- - // Sessions - // ---------------------------------------------------------------- - - async getSessions() { - return this.request('GET', '/api/v1/sessions/'); - } - - async createSession(data) { - return this.request('POST', '/api/v1/sessions/', data); - } - - async endSession(id) { - return this.request('POST', `/api/v1/sessions/${id}/end`); - } - - async getSessionComments(id, limit = 100, offset = 0) { - return this.request('GET', `/api/v1/sessions/${id}/comments?limit=${limit}&offset=${offset}`); - } - - async getSessionClusters(id) { - return this.request('GET', `/api/v1/sessions/${id}/clusters`); - } - - async getSessionStats(id) { - return this.request('GET', `/api/v1/dashboard/sessions/${id}/stats`); - } - - // ---------------------------------------------------------------- - // YouTube - // ---------------------------------------------------------------- - - async getYouTubeAuthURL(returnUrl = '/app') { - return this.request('GET', `/api/v1/youtube/auth/url?return_url=${encodeURIComponent(returnUrl)}`); - } - - async getYouTubeStatus() { - return this.request('GET', '/api/v1/youtube/auth/status'); - } - - async disconnectYouTube() { - return this.request('DELETE', '/api/v1/youtube/auth/disconnect'); - } - - async validateVideo(videoId) { - return this.request('GET', `/api/v1/youtube/videos/${videoId}/validate`); - } - - // 
---------------------------------------------------------------- - // Dashboard - // ---------------------------------------------------------------- - - async submitManualQuestion(sessionId, text) { - return this.request('POST', `/api/v1/dashboard/sessions/${sessionId}/manual-question`, { text }); - } - - async approveAnswer(answerId) { - return this.request('POST', `/api/v1/dashboard/answers/${answerId}/approve`); - } - - async editAnswer(answerId, text) { - return this.request('POST', `/api/v1/dashboard/answers/${answerId}/edit`, { text }); - } - - // ---------------------------------------------------------------- - // Metrics - // ---------------------------------------------------------------- - - async getMetrics() { - return this.request('GET', '/api/v1/metrics'); - } -} - -window.api = new API(); diff --git a/frontend/js/app.js b/frontend/js/app.js deleted file mode 100644 index a29fd7d..0000000 --- a/frontend/js/app.js +++ /dev/null @@ -1,616 +0,0 @@ -/** - * Main application logic for AI Live Doubt Manager dashboard. - */ - -const app = (() => { - // ---------------------------------------------------------------- - // State - // ---------------------------------------------------------------- - let currentUser = null; - let activeSession = null; - let feedCount = 0; - let statsRefreshTimer = null; - - // ---------------------------------------------------------------- - // Toast Notifications - // ---------------------------------------------------------------- - function showToast(message, type = 'info') { - const container = document.getElementById('toast-container'); - const toast = document.createElement('div'); - toast.className = `toast toast-${type}`; - toast.textContent = message; - container.appendChild(toast); - setTimeout(() => toast.remove(), 4000); - } - - // ---------------------------------------------------------------- - // Loading state helpers - // ---------------------------------------------------------------- - function setLoading(btn, loading, loadingText = 'Loading...') { - if (!btn) return; - if (loading) { - btn._originalText = btn.textContent; - btn.textContent = loadingText; - btn.classList.add('btn-loading'); - btn.disabled = true; - } else { - btn.textContent = btn._originalText || btn.textContent; - btn.classList.remove('btn-loading'); - btn.disabled = false; - } - } - - // ---------------------------------------------------------------- - // View switching - // ---------------------------------------------------------------- - function showDashboard() { - document.getElementById('auth-view').hidden = true; - document.getElementById('dashboard-view').hidden = false; - } - - function showAuth() { - document.getElementById('auth-view').hidden = false; - document.getElementById('dashboard-view').hidden = true; - } - - function showLogin() { - document.getElementById('login-form').classList.remove('hidden'); - document.getElementById('register-form').classList.add('hidden'); - document.getElementById('login-error').classList.add('hidden'); - } - - function showRegister() { - document.getElementById('login-form').classList.add('hidden'); - document.getElementById('register-form').classList.remove('hidden'); - document.getElementById('register-error').classList.add('hidden'); - } - - // ---------------------------------------------------------------- - // Auth Handlers - // ---------------------------------------------------------------- - async function handleLogin(event) { - event.preventDefault(); - const email = 
document.getElementById('login-email').value; - const password = document.getElementById('login-password').value; - const btn = document.getElementById('login-btn'); - const errEl = document.getElementById('login-error'); - - errEl.classList.add('hidden'); - setLoading(btn, true, 'Signing in...'); - try { - await api.login(email, password); - await initDashboard(); - } catch (e) { - errEl.textContent = e.message || 'Login failed'; - errEl.classList.remove('hidden'); - } finally { - setLoading(btn, false); - } - } - - async function handleRegister(event) { - event.preventDefault(); - const name = document.getElementById('register-name').value; - const email = document.getElementById('register-email').value; - const password = document.getElementById('register-password').value; - const btn = document.getElementById('register-btn'); - const errEl = document.getElementById('register-error'); - - errEl.classList.add('hidden'); - setLoading(btn, true, 'Creating account...'); - try { - await api.register(email, password, name); - // Auto-login after registration - await api.login(email, password); - await initDashboard(); - } catch (e) { - errEl.textContent = e.message || 'Registration failed'; - errEl.classList.remove('hidden'); - } finally { - setLoading(btn, false); - } - } - - async function logout() { - await api.logout(); - } - - // ---------------------------------------------------------------- - // Dashboard Initialization - // ---------------------------------------------------------------- - async function initDashboard() { - try { - currentUser = await api.getMe(); - } catch (e) { - showAuth(); - return; - } - - document.getElementById('user-name').textContent = - currentUser.name || currentUser.email || ''; - - showDashboard(); - await loadYouTubeStatus(); - - // Load most recent active session if any - try { - const sessions = await api.getSessions(); - const active = sessions.find(s => s.is_active); - if (active) { - setActiveSession(active); - } - } catch (e) { - // ignore - } - } - - // ---------------------------------------------------------------- - // Session Management - // ---------------------------------------------------------------- - async function handleCreateSession(event) { - event.preventDefault(); - const title = document.getElementById('session-title').value.trim(); - const videoId = document.getElementById('session-video-id').value.trim(); - const btn = document.getElementById('create-session-btn'); - - setLoading(btn, true, 'Starting...'); - try { - const session = await api.createSession({ - title, - youtube_video_id: videoId || null, - }); - setActiveSession(session); - showToast('Session started!', 'success'); - } catch (e) { - showToast(e.message || 'Failed to create session', 'error'); - } finally { - setLoading(btn, false); - } - } - - function setActiveSession(session) { - activeSession = session; - - document.getElementById('no-session').hidden = true; - document.getElementById('active-session').hidden = false; - document.getElementById('active-session-title').textContent = session.title; - - const videoEl = document.getElementById('active-session-video'); - if (session.youtube_video_id) { - videoEl.textContent = `YouTube: ${session.youtube_video_id}`; - } else { - videoEl.textContent = 'Manual mode (no YouTube video)'; - } - - // Connect WebSocket - dashboardWS.disconnect(); - registerWebSocketHandlers(); - dashboardWS.connect(session.id); - - // Start stats refresh - refreshStats(); - if (statsRefreshTimer) clearInterval(statsRefreshTimer); - 
statsRefreshTimer = setInterval(refreshStats, 10000);
-
-    // Load existing comments and clusters
-    loadComments();
-    loadClusters();
-  }
-
-  async function endSession() {
-    if (!activeSession) return;
-    const btn = document.getElementById('end-session-btn');
-    setLoading(btn, true, 'Ending...');
-    try {
-      await api.endSession(activeSession.id);
-      activeSession = null;
-      dashboardWS.disconnect();
-      if (statsRefreshTimer) clearInterval(statsRefreshTimer);
-
-      document.getElementById('no-session').hidden = false;
-      document.getElementById('active-session').hidden = true;
-      document.getElementById('questions-feed').innerHTML =
-        '<div class="empty-msg">Session ended.</div>';
-      document.getElementById('clusters-list').innerHTML =
-        '<div class="empty-msg">No clusters yet.</div>
'; - feedCount = 0; - document.getElementById('feed-count').textContent = '0'; - showToast('Session ended', 'info'); - } catch (e) { - showToast(e.message || 'Failed to end session', 'error'); - } finally { - setLoading(btn, false); - } - } - - // ---------------------------------------------------------------- - // YouTube OAuth - // ---------------------------------------------------------------- - async function connectYouTube() { - const btn = document.getElementById('yt-connect-btn'); - setLoading(btn, true, 'Connecting...'); - try { - const data = await api.getYouTubeAuthURL('/app'); - const popup = window.open( - data.url, - 'youtube_oauth', - 'width=600,height=700,noopener' - ); - - // Listen for postMessage from OAuth result page - const onMessage = (event) => { - if (event.origin !== location.origin) return; - if (event.data && event.data.type === 'youtube_oauth_complete') { - window.removeEventListener('message', onMessage); - if (popup && !popup.closed) popup.close(); - loadYouTubeStatus(); - showToast('YouTube connected!', 'success'); - } - }; - window.addEventListener('message', onMessage); - - // Clean up if popup is closed without completing - const pollClosed = setInterval(() => { - if (popup && popup.closed) { - clearInterval(pollClosed); - window.removeEventListener('message', onMessage); - setLoading(btn, false); - loadYouTubeStatus(); - } - }, 500); - } catch (e) { - showToast(e.message || 'Failed to start YouTube OAuth', 'error'); - setLoading(btn, false); - } - } - - async function disconnectYouTube() { - const btn = document.getElementById('yt-disconnect-btn'); - setLoading(btn, true, 'Disconnecting...'); - try { - await api.disconnectYouTube(); - await loadYouTubeStatus(); - showToast('YouTube disconnected', 'info'); - } catch (e) { - showToast(e.message || 'Failed to disconnect', 'error'); - } finally { - setLoading(btn, false); - } - } - - async function loadYouTubeStatus() { - try { - const status = await api.getYouTubeStatus(); - const badge = document.getElementById('yt-status-badge'); - const connectRow = document.getElementById('yt-connect-row'); - const connectedRow = document.getElementById('yt-connected-row'); - const expiresEl = document.getElementById('yt-expires-at'); - - if (status.connected) { - badge.textContent = 'Connected'; - badge.className = 'badge badge-connected'; - connectRow.hidden = true; - connectedRow.hidden = false; - if (status.expires_at) { - expiresEl.textContent = `Token expires: ${new Date(status.expires_at).toLocaleString()}`; - } - } else { - badge.textContent = 'Disconnected'; - badge.className = 'badge badge-disconnected'; - connectRow.hidden = false; - connectedRow.hidden = true; - // Re-enable connect button in case it was loading - setLoading(document.getElementById('yt-connect-btn'), false); - } - } catch (e) { - // ignore — not critical - } - } - - // ---------------------------------------------------------------- - // Manual Questions - // ---------------------------------------------------------------- - async function submitManualQuestions() { - if (!activeSession) { - showToast('Start a session first', 'warning'); - return; - } - const textarea = document.getElementById('manual-textarea'); - const text = textarea.value.trim(); - if (!text) return; - - const btn = document.getElementById('manual-submit-btn'); - setLoading(btn, true, 'Submitting...'); - try { - const result = await api.submitManualQuestion(activeSession.id, text); - textarea.value = ''; - showToast(`${result.created} question(s) submitted`, 'success'); 
-    } catch (e) {
-      if (e.message === 'rate_limit') {
-        showToast('Rate limit hit, try again in 60s', 'warning');
-      } else {
-        showToast(e.message || 'Failed to submit questions', 'error');
-      }
-    } finally {
-      setLoading(btn, false);
-    }
-  }
-
-  // ----------------------------------------------------------------
-  // Feed (Questions)
-  // ----------------------------------------------------------------
-  async function loadComments() {
-    if (!activeSession) return;
-    try {
-      const comments = await api.getSessionComments(activeSession.id, 100, 0);
-      const feed = document.getElementById('questions-feed');
-      feed.innerHTML = '';
-      feedCount = 0;
-      comments.forEach(c => appendFeedItem(c));
-    } catch (e) {
-      // ignore
-    }
-  }
-
-  function appendFeedItem(comment) {
-    const feed = document.getElementById('questions-feed');
-
-    // Remove empty message if present
-    const empty = feed.querySelector('.empty-msg');
-    if (empty) empty.remove();
-
-    const item = document.createElement('div');
-    item.className = 'feed-item';
-    item.dataset.commentId = comment.id;
-
-    let badgeHtml = '<span class="badge badge-classifying">Classifying...</span>';
-    if (comment.is_question === true) {
-      badgeHtml = '<span class="badge badge-question">Question</span>';
-    } else if (comment.is_question === false) {
-      badgeHtml = '<span class="badge badge-not-question">Not a question</span>';
-    }
-
-    item.innerHTML = `
-      <span class="feed-item-author">${escHtml(comment.author_name || 'Unknown')}</span>
-      <span class="feed-item-text">${escHtml(comment.text)}</span>
-      <span class="feed-item-badge">${badgeHtml}</span>
-    `;
-
-    feed.prepend(item);
-    feedCount++;
-    document.getElementById('feed-count').textContent = feedCount;
-  }
-
-  function updateFeedItemBadge(commentId, isQuestion) {
-    const item = document.querySelector(`[data-comment-id="${commentId}"]`);
-    if (!item) return;
-    const badgeEl = item.querySelector('.feed-item-badge');
-    if (!badgeEl) return;
-    if (isQuestion) {
-      badgeEl.innerHTML = '<span class="badge badge-question">Question</span>';
-    } else {
-      badgeEl.innerHTML = '<span class="badge badge-not-question">Not a question</span>';
-    }
-  }
-
-  // ----------------------------------------------------------------
-  // Clusters
-  // ----------------------------------------------------------------
-  async function loadClusters() {
-    if (!activeSession) return;
-    try {
-      const clusters = await api.getSessionClusters(activeSession.id);
-      const list = document.getElementById('clusters-list');
-      list.innerHTML = '';
-      if (!clusters.length) {
-        list.innerHTML = '<div class="empty-msg">No clusters yet.</div>';
-        return;
-      }
-      clusters.forEach(cluster => upsertClusterCard(cluster));
-    } catch (e) {
-      // ignore
-    }
-  }
-
-  function upsertClusterCard(cluster) {
-    const list = document.getElementById('clusters-list');
-
-    // Remove empty message
-    const empty = list.querySelector('.empty-msg');
-    if (empty) empty.remove();
-
-    let card = document.querySelector(`[data-cluster-id="${cluster.id}"]`);
-    if (!card) {
-      card = document.createElement('div');
-      card.className = 'cluster-card';
-      card.dataset.clusterId = cluster.id;
-      list.prepend(card);
-    }
-
-    const answers = cluster.answers || [];
-    const latestAnswer = answers[answers.length - 1];
-
-    let answerHtml = '<div class="cluster-answer">Generating answer...</div>';
-    let actionsHtml = '';
-
-    if (latestAnswer) {
-      const postedBadge = latestAnswer.is_posted
-        ? '<span class="badge badge-posted">Posted</span>'
-        : '<span class="badge badge-pending">Pending</span>';
-
-      answerHtml = `
-        <div class="cluster-answer" id="answer-text-${latestAnswer.id}">${escHtml(latestAnswer.text)}</div>
-        ${postedBadge}
-      `;
-      actionsHtml = `
-        <button class="btn btn-sm" onclick="app.copyAnswer(${latestAnswer.id})">Copy</button>
-      `;
-      if (!latestAnswer.is_posted) {
-        actionsHtml += `
-          <button class="btn btn-sm" id="approve-btn-${latestAnswer.id}" onclick="app.approveAnswer(${latestAnswer.id})">Approve</button>
-        `;
-      }
-    }
-
-    card.innerHTML = `
-      <div class="cluster-header">
-        <span class="cluster-title">${escHtml(cluster.title || 'Untitled Cluster')}</span>
-        <span class="cluster-count">${cluster.comment_count || 0} questions</span>
-      </div>
-      ${answerHtml}
-      <div class="cluster-actions">${actionsHtml}</div>
-    `;
-  }
-
-  async function approveAnswer(answerId) {
-    const btn = document.getElementById(`approve-btn-${answerId}`);
-    setLoading(btn, true, 'Posting...');
-    try {
-      await api.approveAnswer(answerId);
-      showToast('Answer approved for posting', 'success');
-      loadClusters();
-    } catch (e) {
-      if (e.message === 'rate_limit') {
-        showToast('Rate limit hit, try again in 60s', 'warning');
-      } else {
-        showToast(e.message || 'Failed to approve answer', 'error');
-      }
-      setLoading(btn, false);
-    }
-  }
-
-  function copyAnswer(answerId) {
-    const el = document.getElementById(`answer-text-${answerId}`);
-    if (!el) return;
-    navigator.clipboard.writeText(el.textContent).then(() => {
-      showToast('Answer copied to clipboard', 'success');
-    }).catch(() => {
-      showToast('Failed to copy', 'error');
-    });
-  }
-
-  // ----------------------------------------------------------------
-  // Stats
-  // ----------------------------------------------------------------
-  async function refreshStats() {
-    if (!activeSession) return;
-    try {
-      const stats = await api.getSessionStats(activeSession.id);
-      document.getElementById('stat-total').textContent = stats.total_comments ?? '—';
-      document.getElementById('stat-questions').textContent = stats.questions ?? '—';
-      document.getElementById('stat-clusters').textContent = stats.clusters ?? '—';
-      document.getElementById('stat-posted').textContent = stats.answers_posted ?? '—';
-    } catch (e) {
-      // ignore
-    }
-  }
-
-  // ----------------------------------------------------------------
-  // WebSocket Event Handlers
-  // ----------------------------------------------------------------
-  function registerWebSocketHandlers() {
-    dashboardWS.on('connected', () => {
-      console.log('WebSocket connected');
-    });
-
-    dashboardWS.on('comment_created', (data) => {
-      appendFeedItem(data);
-      refreshStats();
-    });
-
-    dashboardWS.on('comment_classified', (data) => {
-      updateFeedItemBadge(data.comment_id, data.is_question);
-      refreshStats();
-    });
-
-    dashboardWS.on('cluster_created', (data) => {
-      upsertClusterCard(data);
-      refreshStats();
-    });
-
-    dashboardWS.on('cluster_updated', (data) => {
-      upsertClusterCard(data);
-      refreshStats();
-    });
-
-    dashboardWS.on('answer_ready', (data) => {
-      loadClusters();
-      showToast('New answer generated — review in Clusters panel', 'info');
-    });
-
-    dashboardWS.on('answer_posted', (data) => {
-      loadClusters();
-      refreshStats();
-      showToast('Answer posted to YouTube!', 'success');
-    });
-
-    dashboardWS.on('error', (data) => {
-      showToast(data.msg || 'Connection error', 'error');
-    });
-  }
-
-  // ----------------------------------------------------------------
-  // Utility
-  // ----------------------------------------------------------------
-  function escHtml(str) {
-    if (!str) return '';
-    return str
-      .replace(/&/g, '&amp;')
-      .replace(/</g, '&lt;')
-      .replace(/>/g, '&gt;')
-      .replace(/"/g, '&quot;')
-      .replace(/'/g, '&#039;');
-  }
-
-  // ----------------------------------------------------------------
-  // Bootstrap
-  // ----------------------------------------------------------------
-  async function init() {
-    // Handle auth expiry globally
-    window.addEventListener('auth:expired', () => {
-      currentUser = null;
-      activeSession = null;
-      dashboardWS.disconnect();
-      showAuth();
-      showLogin();
-    });
-
-    // Check for stored token
-    const token = localStorage.getItem('token');
-    if (token) {
-      api.token = token;
-      try {
-        await initDashboard();
-      } catch (e) {
-        // Token invalid — show login
-        localStorage.removeItem('token');
-        api.token = null;
-        showAuth();
-        showLogin();
-      }
-    } else {
- showAuth(); - showLogin(); - } - } - - // Start on DOMContentLoaded - document.addEventListener('DOMContentLoaded', init); - - // Public API - return { - handleLogin, - handleRegister, - logout, - showLogin, - showRegister, - handleCreateSession, - endSession, - connectYouTube, - disconnectYouTube, - submitManualQuestions, - approveAnswer, - copyAnswer, - }; -})(); diff --git a/frontend/js/websocket.js b/frontend/js/websocket.js deleted file mode 100644 index 12e12dc..0000000 --- a/frontend/js/websocket.js +++ /dev/null @@ -1,83 +0,0 @@ -/** - * WebSocket client with exponential backoff reconnection. - */ - -class DashboardWebSocket { - constructor() { - this.ws = null; - this.handlers = {}; - this.retryCount = 0; - this.maxRetries = 10; - this._sessionId = null; - } - - connect(sessionId) { - this._sessionId = sessionId; - const token = localStorage.getItem('token'); - const protocol = location.protocol === 'https:' ? 'wss' : 'ws'; - const tokenParam = token ? `&token=${encodeURIComponent(token)}` : ''; - const url = `${protocol}://${location.host}/ws/${sessionId}?connection_id=${Date.now()}${tokenParam}`; - - this.ws = new WebSocket(url); - - this.ws.onopen = () => { - this.retryCount = 0; - this._emit('connected', {}); - }; - - this.ws.onmessage = (e) => { - try { - const msg = JSON.parse(e.data); - this._emit(msg.type, msg.data || msg); - } catch (err) { - console.error('WS parse error', err); - } - }; - - this.ws.onclose = (e) => { - // Auth/forbidden errors — do not retry - if (e.code === 4001 || e.code === 4003) { - this._emit('error', { msg: 'WebSocket auth error' }); - return; - } - if (this.retryCount >= this.maxRetries) { - this._emit('error', { msg: 'Connection lost after maximum retries' }); - return; - } - const delay = Math.min(1000 * Math.pow(2, this.retryCount), 30000); - this.retryCount++; - setTimeout(() => { - if (this._sessionId) this.connect(this._sessionId); - }, delay); - }; - - this.ws.onerror = () => { - this._emit('error', { msg: 'WebSocket error' }); - }; - } - - on(type, cb) { - this.handlers[type] = cb; - } - - _emit(type, data) { - if (this.handlers[type]) this.handlers[type](data); - } - - send(obj) { - if (this.ws && this.ws.readyState === WebSocket.OPEN) { - this.ws.send(JSON.stringify(obj)); - } - } - - disconnect() { - this._sessionId = null; - if (this.ws) { - this.ws.onclose = null; // prevent reconnect - this.ws.close(); - this.ws = null; - } - } -} - -window.dashboardWS = new DashboardWebSocket(); diff --git a/frontend/src/App.jsx b/frontend/src/App.jsx index b853323..5184eb3 100644 --- a/frontend/src/App.jsx +++ b/frontend/src/App.jsx @@ -7,6 +7,7 @@ import { RegisterPage } from './pages/RegisterPage'; import { DashboardPage } from './pages/DashboardPage'; import LandingPage from './pages/LandingPage'; import { SettingsPage } from './pages/SettingsPage'; +import { ErrorBoundary } from './components/ErrorBoundary'; import { ToastContainer } from './components/Toast/Toast'; import { GlobalShortcutsHandler } from './components/GlobalShortcutsHandler'; @@ -23,7 +24,9 @@ export default function App() { path="/dashboard" element={ - + + + } /> @@ -31,7 +34,9 @@ export default function App() { path="/settings" element={ - + + + } /> diff --git a/frontend/src/components/Dashboard/ActivityLog.jsx b/frontend/src/components/Dashboard/ActivityLog.jsx index 973d97a..6fdb06a 100644 --- a/frontend/src/components/Dashboard/ActivityLog.jsx +++ b/frontend/src/components/Dashboard/ActivityLog.jsx @@ -30,10 +30,10 @@ export function ActivityLog({ sessionEvents }) { 
return (
- {events.map((msg, i) => { + {events.map((msg) => { const meta = EVENT_META[msg.type]; return ( -
+
{meta.icon} {meta.label(msg.data)} {relativeTime(msg.timestamp)} diff --git a/frontend/src/components/Dashboard/AnalyticsPanel.jsx b/frontend/src/components/Dashboard/AnalyticsPanel.jsx index 18e40ad..4e31c9c 100644 --- a/frontend/src/components/Dashboard/AnalyticsPanel.jsx +++ b/frontend/src/components/Dashboard/AnalyticsPanel.jsx @@ -3,8 +3,9 @@ import { BarChart, Bar, LineChart, Line, XAxis, YAxis, CartesianGrid, Tooltip, ResponsiveContainer, } from 'recharts'; -import { getSessionAnalytics, getSessionClusters, fetchAllComments } from '../../services/api'; +import { getSessionAnalytics, getSessionClusters, getClusterComments } from '../../services/api'; import { ActivityLog } from './ActivityLog'; +import { Skeleton } from '../Skeleton'; const ANALYTICS_EVENTS = new Set([ 'comment_created', 'comment_classified', @@ -70,15 +71,18 @@ export function AnalyticsPanel({ sessionId, token, sessionEvents }) { async function handleExportCSV() { setExporting(true); try { - const [clusters, comments] = await Promise.all([ - getSessionClusters(sessionId, token), - fetchAllComments(sessionId, token), - ]); + const clusters = await getSessionClusters(sessionId, token); const rows = [['Question', 'Answer', 'Cluster', 'Timestamp', 'Is Posted']]; - (clusters || []).forEach(cluster => { - const clusterComments = (comments || []).filter(c => c.cluster_id === cluster.id); + for (const cluster of (clusters || [])) { + let comments; + try { + comments = await getClusterComments(cluster.id, token); + } catch (e) { + console.warn(`Skipping cluster ${cluster.id} in export:`, e.message); + continue; + } const latestAnswer = cluster.answers?.[cluster.answers.length - 1]; - clusterComments.forEach(comment => { + for (const comment of (comments || [])) { rows.push([ comment.text, latestAnswer?.text || '', @@ -86,8 +90,8 @@ export function AnalyticsPanel({ sessionId, token, sessionEvents }) { new Date(comment.created_at).toLocaleString(), latestAnswer?.is_posted ? 'Yes' : 'No', ]); - }); - }); + } + } const csv = rows .map(row => row.map(cell => `"${String(cell ?? '').replace(/"/g, '""')}"`).join(',')) .join('\n'); @@ -102,20 +106,29 @@ export function AnalyticsPanel({ sessionId, token, sessionEvents }) { async function handleExportJSON() { setExporting(true); try { - const [clusters, comments] = await Promise.all([ - getSessionClusters(sessionId, token), - fetchAllComments(sessionId, token), - ]); - const output = (clusters || []).map(cluster => ({ - cluster_id: cluster.id, - title: cluster.title, - comment_count: cluster.comment_count, - answer: cluster.answers?.[cluster.answers.length - 1]?.text || null, - is_posted: cluster.answers?.[cluster.answers.length - 1]?.is_posted ?? false, - questions: (comments || []) - .filter(c => c.cluster_id === cluster.id) - .map(c => ({ text: c.text, author: c.author_name, timestamp: c.created_at })), - })); + const clusters = await getSessionClusters(sessionId, token); + const output = []; + for (const cluster of (clusters || [])) { + let comments; + try { + comments = await getClusterComments(cluster.id, token); + } catch (e) { + console.warn(`Skipping cluster ${cluster.id} in export:`, e.message); + continue; + } + output.push({ + cluster_id: cluster.id, + title: cluster.title, + comment_count: cluster.comment_count, + answer: cluster.answers?.[cluster.answers.length - 1]?.text || null, + is_posted: cluster.answers?.[cluster.answers.length - 1]?.is_posted ?? 
false, + questions: (comments || []).map(c => ({ + text: c.text, + author: c.author_name, + timestamp: c.created_at, + })), + }); + } downloadBlob( JSON.stringify(output, null, 2), 'application/json', @@ -128,7 +141,20 @@ export function AnalyticsPanel({ sessionId, token, sessionEvents }) { } } - if (loading) return

Loading analytics...

; + if (loading) return ( +
+

Session Analytics

+
+ {[1, 2, 3, 4].map(i => ( +
+ + +
+ ))} +
+ +
+ ); if (error) return

{error}

; // Derive cumulative line chart data @@ -203,7 +229,16 @@ export function AnalyticsPanel({ sessionId, token, sessionEvents }) {
) : ( -

No time data yet.

+
+ + + + + + +

No data yet

+

Analytics will appear once questions start coming in

+
)} {data.top_clusters.length > 0 && ( diff --git a/frontend/src/components/Dashboard/ClusterDetailsModal.jsx b/frontend/src/components/Dashboard/ClusterDetailsModal.jsx index d11baa7..9103bcd 100644 --- a/frontend/src/components/Dashboard/ClusterDetailsModal.jsx +++ b/frontend/src/components/Dashboard/ClusterDetailsModal.jsx @@ -1,3 +1,5 @@ +import { Skeleton } from '../Skeleton'; + export function ClusterDetailsModal({ cluster, comments, onClose }) { const answers = cluster.answers ?? []; const latestAnswer = answers.length > 0 ? answers[answers.length - 1] : null; @@ -10,9 +12,24 @@ export function ClusterDetailsModal({ cluster, comments, onClose }) {
{comments === null ? ( -

Loading questions...

+
+ {[1, 2, 3, 4].map(i => ( +
+ + +
+ ))} +
) : comments.length === 0 ? ( -

No questions assigned yet.

+
+ + + + + +

No questions assigned

+

Questions will appear here once grouped into this cluster

+
) : ( comments.map(c => (
diff --git a/frontend/src/components/Dashboard/ClustersPanel.jsx b/frontend/src/components/Dashboard/ClustersPanel.jsx index 2d5c856..48ace26 100644 --- a/frontend/src/components/Dashboard/ClustersPanel.jsx +++ b/frontend/src/components/Dashboard/ClustersPanel.jsx @@ -1,7 +1,8 @@ import { useState, useEffect, useRef } from 'react'; -import { getSessionClusters, approveAnswer, editAnswer, getClusterComments } from '../../services/api'; +import { getSessionClusters, approveAnswer, editAnswer, getClusterComments, getRepresentativeQuestion } from '../../services/api'; import { showToast } from '../../hooks/useToast'; import { ClusterDetailsModal } from './ClusterDetailsModal'; +import { Skeleton } from '../Skeleton'; const REFETCH_EVENTS = new Set(['cluster_created', 'cluster_updated', 'answer_ready', 'answer_posted']); @@ -16,7 +17,11 @@ export function ClustersPanel({ sessionId, token, wsMessages, approveFirstRef }) const [clusterFilter, setClusterFilter] = useState('all'); const [selectedCluster, setSelectedCluster] = useState(null); const [modalComments, setModalComments] = useState(null); + const [expandedIds, setExpandedIds] = useState(new Set()); + const [repQuestions, setRepQuestions] = useState({}); const commentCache = useRef(new Map()); + const debounceRef = useRef(null); + const fetchedClusterIds = useRef(new Set()); async function fetchClusters() { const data = await getSessionClusters(sessionId, token); @@ -54,24 +59,54 @@ export function ClustersPanel({ sessionId, token, wsMessages, approveFirstRef }) handleApprove(latest.id); } }; - return () => { approveFirstRef.current = null; }; // cleanup on unmount — prevents stale calls + return () => { approveFirstRef.current = null; }; }, [clusters, approveFirstRef]); - // WS-triggered refetch — targeted cache invalidation + // WS-triggered refetch — debounced useEffect(() => { if (!wsMessages || wsMessages.length === 0) return; const last = wsMessages[wsMessages.length - 1]; if (last && REFETCH_EVENTS.has(last.type)) { const affectedId = last.data?.cluster_id ?? last.data?.id ?? null; - if (affectedId) { - commentCache.current.delete(affectedId); - } else { - commentCache.current.clear(); - } - fetchClusters().catch(() => {}); + clearTimeout(debounceRef.current); + debounceRef.current = setTimeout(() => { + if (affectedId) commentCache.current.delete(affectedId); + else commentCache.current.clear(); + fetchClusters().catch(() => {}); + }, 1000); } + return () => clearTimeout(debounceRef.current); }, [wsMessages]); + // Reset repQuestions on session change + useEffect(() => { + fetchedClusterIds.current = new Set(); + setRepQuestions({}); + }, [sessionId]); + + // Fetch representative question for each cluster (once per cluster id) + useEffect(() => { + clusters.forEach(cluster => { + if (cluster.comment_count <= 1) return; + if (fetchedClusterIds.current.has(cluster.id)) return; + fetchedClusterIds.current.add(cluster.id); + getRepresentativeQuestion(cluster.id, token) + .then(data => { + if (data?.text) setRepQuestions(prev => ({ ...prev, [cluster.id]: data.text })); + }) + .catch(() => {}); + }); + }, [clusters]); + + function toggleExpand(id) { + setExpandedIds(prev => { + const next = new Set(prev); + if (next.has(id)) next.delete(id); + else next.add(id); + return next; + }); + } + async function openClusterModal(cluster) { setSelectedCluster(cluster); if (commentCache.current.has(cluster.id)) { @@ -145,8 +180,11 @@ export function ClustersPanel({ sessionId, token, wsMessages, approveFirstRef }) }); return ( -
-

Clusters & Answers

+
+

+ Clusters & Answers + {clusters.length} +

{['all', 'pending', 'approved'].map(tab => ( @@ -162,14 +200,12 @@ export function ClustersPanel({ sessionId, token, wsMessages, approveFirstRef }) {isLoadingInitial ? (
- {[1, 2].map(i => ( + {[1, 2, 3].map(i => (
-
-
-
+
+ +
-
-
))}
@@ -179,10 +215,20 @@ export function ClustersPanel({ sessionId, token, wsMessages, approveFirstRef })
{filteredClusters.length === 0 ? (
- 🤖 -

{clusters.length === 0 ? 'No clusters yet' : 'No clusters match this filter'}

+ + + + + + + +

+ {clusters.length === 0 ? 'No clusters yet' : 'No clusters match this filter'} +

{clusters.length === 0 && ( -

Questions cluster automatically after 5 similar ones arrive

+

+ Clusters form automatically once enough questions arrive +

)}
) : ( @@ -190,87 +236,104 @@ export function ClustersPanel({ sessionId, token, wsMessages, approveFirstRef }) const answers = cluster.answers || []; const latestAnswer = answers[answers.length - 1]; const isEditing = latestAnswer && editingAnswerId === latestAnswer.id; + const isExpanded = expandedIds.has(cluster.id); + const isApproved = latestAnswer?.is_posted === true; + return ( -
-
- openClusterModal(cluster)} - > +
+
toggleExpand(cluster.id)}> + {cluster.title || 'Untitled Cluster'} + {cluster.comment_count || 0}q + {isApproved && ( + ✓ POSTED + )} openClusterModal(cluster)} + className="cluster-expand-icon" + onClick={e => { e.stopPropagation(); openClusterModal(cluster); }} + title="View details" > - {cluster.comment_count || 0} questions + ▼
- {latestAnswer ? ( - <> - {isEditing ? ( -