diff --git a/.gitignore b/.gitignore
index 4773417..22a1e90 100644
--- a/.gitignore
+++ b/.gitignore
@@ -23,15 +23,21 @@ robot_tests/
 # Test files
 test.py
 
-# Ignore the AI generated md files
+# Ignore the AI generated md/instruction files
 .kiro
 .cursor
 .claude
 .vscode
 .codex
+.github/copilot-instructions.md
 
 # Ignore the jsonl files
 *.jsonl
 
+# Ignore the database content
+chroma_db/
+data/
+logs/temp_metrics
+
 # Ignore the local browser_service
-tools/browser_service_local/*
\ No newline at end of file
+tools/browser_service/*
diff --git a/docs/OPTIMIZATION.md b/docs/OPTIMIZATION.md
new file mode 100644
index 0000000..630531d
--- /dev/null
+++ b/docs/OPTIMIZATION.md
@@ -0,0 +1,756 @@
+# CrewAI Performance Optimization Guide
+
+This guide explains how to use Mark 1's performance optimization system to reduce token usage and costs while maintaining code generation accuracy.
+
+## Overview
+
+Mark 1's optimization system reduces token usage by **67%** (from 12K to 4K tokens per workflow) through a **Hybrid Knowledge Architecture** that combines:
+
+1. **Core Rules** (~300 tokens) - Always included, library-specific constraints
+2. **ChromaDB Vector Store** - Keyword documentation with semantic search
+3. **Pattern Learning** - Learns from successful executions to predict relevant keywords
+4. **Smart Context Pruning** - Includes only keywords relevant to detected action types
+
+**Benefits:**
+- 67% token reduction (12K → 4K tokens per workflow)
+- 56% cost reduction ($0.0027 → $0.0012 per workflow)
+- Maintains 95%+ code generation accuracy
+- Improves over time through pattern learning
+- Graceful degradation if optimization fails
+
+## Quick Start
+
+### 1. Install Dependencies
+
+The optimization system requires additional Python packages:
+
+```bash
+pip install chromadb==0.4.22 sentence-transformers==2.2.2
+```
+
+### 2. Enable Optimization
+
+Add to your `.env` file:
+
+```env
+# Enable optimization system
+OPTIMIZATION_ENABLED=true
+```
+
+### 3. Restart Mark 1
+
+```bash
+# Stop services
+# Restart backend and frontend
+```
+
+On first startup, the system will:
+- Initialize ChromaDB with keyword embeddings (~5 seconds)
+- Create pattern learning database
+- Be ready for optimized test generation
+
+## Configuration Options
+
+All optimization settings are configured in `src/backend/.env`:
+
+### OPTIMIZATION_ENABLED
+
+Enable or disable the entire optimization system.
+
+```env
+OPTIMIZATION_ENABLED=true
+```
+
+**Options:**
+- `true` - Enable optimization (67% token reduction)
+- `false` - Use baseline behavior (full context)
+
+**Default:** `false`
+
+**Recommendation:** Enable after verifying your setup works correctly.
+
+### OPTIMIZATION_CHROMA_DB_PATH
+
+Path to ChromaDB storage directory for keyword embeddings.
+
+```env
+OPTIMIZATION_CHROMA_DB_PATH=./chroma_db
+```
+
+**Default:** `./chroma_db`
+
+**What it stores:**
+- Keyword embeddings for semantic search
+- Separate collections for Browser Library and SeleniumLibrary
+- Persistent storage (no re-embedding needed on restart)
+
+**Disk usage:** ~10-20 MB per library
+
+### OPTIMIZATION_PATTERN_DB_PATH
+
+Path to SQLite database for pattern learning.
+
+```env
+OPTIMIZATION_PATTERN_DB_PATH=./data/pattern_learning.db
+```
+
+**Default:** `./data/pattern_learning.db`
+
+**What it stores:**
+- Query patterns with embeddings
+- Keyword usage history
+- Prediction statistics
+
+**Disk usage:** Grows over time (~1 KB per query)
+
+### OPTIMIZATION_KEYWORD_SEARCH_TOP_K
+
+Number of keywords to return from semantic search.
+
+```env
+OPTIMIZATION_KEYWORD_SEARCH_TOP_K=3
+```
+
+**Range:** 1-10
+
+**Default:** 3
+
+**Trade-offs:**
+- Higher values: More keyword options, higher token usage
+- Lower values: Fewer options, lower token usage
+
+**Recommendation:** Keep at 3 for best balance.
+
+### OPTIMIZATION_PATTERN_CONFIDENCE_THRESHOLD
+
+Minimum confidence for pattern prediction (0.0-1.0).
+
+```env
+OPTIMIZATION_PATTERN_CONFIDENCE_THRESHOLD=0.7
+```
+
+**Range:** 0.0 to 1.0
+
+**Default:** 0.7 (70% similarity required)
+
+**How it works:**
+- System searches for similar past queries
+- If similarity ≥ threshold, uses predicted keywords
+- If similarity < threshold, uses zero-context + search tool
+
+**Adjust based on:**
+- `0.6` - More aggressive prediction (may include irrelevant keywords)
+- `0.7` - Balanced (recommended)
+- `0.8` - Conservative prediction (fewer predictions, more searches)
+
+### OPTIMIZATION_CONTEXT_PRUNING_ENABLED
+
+Enable smart context pruning based on query classification.
+
+```env
+OPTIMIZATION_CONTEXT_PRUNING_ENABLED=true
+```
+
+**Options:**
+- `true` - Prune context to relevant keyword categories
+- `false` - Include all keywords (when predicted/searched)
+
+**Default:** `true`
+
+**What it does:**
+- Classifies query into action categories (navigation, input, interaction, extraction, assertion, wait)
+- Includes only keywords matching detected categories
+- Reduces context size by ~40%
+
+**Recommendation:** Keep enabled for maximum token reduction.
+
+### OPTIMIZATION_CONTEXT_PRUNING_THRESHOLD
+
+Minimum confidence for category classification (0.0-1.0).
+
+```env
+OPTIMIZATION_CONTEXT_PRUNING_THRESHOLD=0.8
+```
+
+**Range:** 0.0 to 1.0
+
+**Default:** 0.8 (80% similarity required)
+
+**How it works:**
+- System classifies query into action categories
+- If confidence ≥ threshold, prunes to relevant categories
+- If confidence < threshold, includes all categories (safe fallback)
+
+**Adjust based on:**
+- `0.7` - More aggressive pruning (may exclude needed keywords)
+- `0.8` - Balanced (recommended)
+- `0.9` - Conservative pruning (less reduction, safer)
+
+## Example Configurations
+
+### Production Setup (Recommended)
+
+```env
+# Enable optimization with balanced settings
+OPTIMIZATION_ENABLED=true
+OPTIMIZATION_CHROMA_DB_PATH=./chroma_db
+OPTIMIZATION_PATTERN_DB_PATH=./data/pattern_learning.db
+OPTIMIZATION_KEYWORD_SEARCH_TOP_K=3
+OPTIMIZATION_PATTERN_CONFIDENCE_THRESHOLD=0.7
+OPTIMIZATION_CONTEXT_PRUNING_ENABLED=true
+OPTIMIZATION_CONTEXT_PRUNING_THRESHOLD=0.8
+```
+
+**Best for:** Production use with proven token reduction and accuracy.
+
+### Aggressive Optimization
+
+```env
+# Maximum token reduction
+OPTIMIZATION_ENABLED=true
+OPTIMIZATION_CHROMA_DB_PATH=./chroma_db
+OPTIMIZATION_PATTERN_DB_PATH=./data/pattern_learning.db
+OPTIMIZATION_KEYWORD_SEARCH_TOP_K=2
+OPTIMIZATION_PATTERN_CONFIDENCE_THRESHOLD=0.6
+OPTIMIZATION_CONTEXT_PRUNING_ENABLED=true
+OPTIMIZATION_CONTEXT_PRUNING_THRESHOLD=0.7
+```
+
+**Best for:** Minimizing costs when accuracy can tolerate slight variations.
+
+### Conservative Optimization
+
+```env
+# Safer optimization with higher accuracy
+OPTIMIZATION_ENABLED=true
+OPTIMIZATION_CHROMA_DB_PATH=./chroma_db
+OPTIMIZATION_PATTERN_DB_PATH=./data/pattern_learning.db
+OPTIMIZATION_KEYWORD_SEARCH_TOP_K=5
+OPTIMIZATION_PATTERN_CONFIDENCE_THRESHOLD=0.8
+OPTIMIZATION_CONTEXT_PRUNING_ENABLED=true
+OPTIMIZATION_CONTEXT_PRUNING_THRESHOLD=0.9
+```
+
+**Best for:** Critical tests where accuracy is paramount.
+
+### Development/Testing
+
+```env
+# Disable optimization for baseline comparison
+OPTIMIZATION_ENABLED=false
+```
+
+**Best for:** Testing baseline behavior or debugging issues.
+
+## How It Works
+
+### Tier 1: Core Rules (Always Included)
+
+Core rules are **always** included in agent context (~300 tokens):
+
+- Critical sequences (New Browser → New Context viewport=None → New Page)
+- Parameter rules and syntax
+- Auto-waiting behavior
+- Locator priorities
+- Library-specific constraints
+
+**Why always included:**
+- Ensures critical patterns never forgotten
+- Maintains code quality and consistency
+- Prevents common mistakes
+
+### Tier 2: Pattern Learning (Predicted Keywords)
+
+When you run a query, the system:
+
+1. Searches for similar past queries in pattern database
+2. If similarity ≥ confidence threshold (default 0.7):
+   - Predicts relevant keywords based on past usage
+   - Retrieves full documentation from ChromaDB
+   - Includes in agent context (~500 tokens)
+3. If similarity < threshold:
+   - Falls back to Tier 3
+
+**Improves over time:**
+- More queries = better predictions
+- System learns your testing patterns
+- Prediction accuracy increases
+
+### Tier 3: Zero-Context + Search Tool
+
+If no pattern match found:
+
+1. Agents receive minimal context with tool instructions (~200 tokens)
+2. Agents use `keyword_search` tool to find relevant keywords on-demand
+3. Tool performs semantic search in ChromaDB (<100ms)
+4. Returns top 3 matching keywords with documentation
+
+**Example tool usage:**
+```
+Agent: "I need to click a button"
+Tool: Returns ["Click", "Click Element", "Click Button"] with docs
+Agent: Uses "Click" in generated code
+```
+
+### Tier 4: Full Context Fallback
+
+If all optimizations fail:
+- System falls back to full context (baseline behavior)
+- Logs fallback event for monitoring
+- Maintains 99.9% workflow success rate
+
+## Monitoring Performance
+
+### Metrics API
+
+The optimization system tracks detailed metrics accessible via the workflow metrics API:
+
+```bash
+curl http://localhost:5000/workflow-metrics/{workflow_id}
+```
+
+**Response includes:**
+
+```json
+{
+  "workflow_id": "abc-123",
+  "total_time_ms": 35000,
+  "optimization": {
+    "token_usage": {
+      "step_planner": 800,
+      "element_identifier": 600,
+      "code_assembler": 1200,
+      "code_validator": 400,
+      "total": 3000
+    },
+    "keyword_search": {
+      "calls": 2,
+      "total_latency_ms": 150,
+      "avg_latency_ms": 75,
+      "accuracy": 0.95
+    },
+    "pattern_learning": {
+      "prediction_used": true,
+      "predicted_keywords_count": 8,
+      "prediction_accuracy": 0.87
+    },
+    "context_reduction": {
+      "baseline_tokens": 12000,
+      "optimized_tokens": 3000,
+      "reduction_percentage": 75.0
+    }
+  }
+}
+```
+
+### Key Metrics
+
+**Token Usage:**
+- Per-agent token counts
+- Total workflow token usage
+- Compare against baseline (12K tokens)
+
+**Keyword Search:**
+- Number of tool calls
+- Average latency (target: <100ms)
+- Accuracy (% of returned keywords used in final code)
+
+**Pattern Learning:**
+- Whether prediction was used
+- Number of predicted keywords
+- Prediction accuracy
+
+**Context Reduction:**
+- Baseline vs optimized token counts
+- Reduction percentage (target: 67%)
+
+### Logs
+
+Optimization events are logged to `logs/optimization.log`:
+
+```
+INFO: ChromaDB initialized with 143 keywords in 4.2s
+INFO: Pattern prediction used for query "login to website" (8 keywords, 0.87 confidence)
+INFO: Keyword search: "click button" → 3 results in 78ms
+WARNING: Pattern prediction confidence too low (0.65), falling back to search tool
+ERROR: ChromaDB search failed, falling back to full context
+```
+
+## Interpreting Metrics
+
+### Good Performance
+
+```json
+{
+  "token_usage": {"total": 3000},
+  "keyword_search": {"calls": 1, "avg_latency_ms": 75},
+  "pattern_learning": {"prediction_used": true, "prediction_accuracy": 0.85},
+  "context_reduction": {"reduction_percentage": 75.0}
+}
+```
+
+**Indicators:**
+- ✅ Total tokens: 3K-4K (67% reduction achieved)
+- ✅ Few keyword searches (pattern learning working)
+- ✅ High prediction accuracy (>0.80)
+- ✅ High reduction percentage (>65%)
+
+### Needs Tuning
+
+```json
+{
+  "token_usage": {"total": 8000},
+  "keyword_search": {"calls": 5, "avg_latency_ms": 150},
+  "pattern_learning": {"prediction_used": false},
+  "context_reduction": {"reduction_percentage": 33.0}
+}
+```
+
+**Indicators:**
+- ⚠️ Total tokens: 6K-8K (less reduction than expected)
+- ⚠️ Many keyword searches (pattern learning not matching)
+- ⚠️ Prediction not used (confidence threshold too high?)
+- ⚠️ Low reduction percentage (<50%)
+
+**Actions:**
+- Lower `OPTIMIZATION_PATTERN_CONFIDENCE_THRESHOLD` to 0.6
+- Check if queries are too diverse for pattern learning
+- Verify ChromaDB is initialized correctly
+
+### Fallback Occurring
+
+```json
+{
+  "token_usage": {"total": 12000},
+  "context_reduction": {"reduction_percentage": 0.0}
+}
+```
+
+**Indicators:**
+- ❌ Total tokens: 12K (no reduction, using full context)
+- ❌ Zero reduction percentage
+
+**Actions:**
+- Check logs for error messages
+- Verify ChromaDB path is accessible
+- Verify dependencies are installed
+- Check pattern database is writable
+
+## Troubleshooting
+
+### "ChromaDB initialization failed"
+
+**Symptoms:**
+- Error on startup
+- Optimization falls back to full context
+
+**Solutions:**
+1. Verify dependencies installed:
+   ```bash
+   pip install chromadb==0.4.22 sentence-transformers==2.2.2
+   ```
+2. Check ChromaDB path is writable:
+   ```bash
+   mkdir -p ./chroma_db
+   chmod 755 ./chroma_db
+   ```
+3. Check disk space (needs ~20 MB)
+4. Review logs for specific error
+
+### "Pattern database locked"
+
+**Symptoms:**
+- SQLite database errors
+- Pattern learning fails
+
+**Solutions:**
+1. Check no other process is using the database
+2. Verify database path is writable:
+   ```bash
+   mkdir -p ./data
+   chmod 755 ./data
+   ```
+3. Delete and recreate database:
+   ```bash
+   rm ./data/pattern_learning.db
+   # Restart Mark 1 to recreate
+   ```
+
+### "Keyword search timeout"
+
+**Symptoms:**
+- Search takes >100ms
+- Slow test generation
+
+**Solutions:**
+1. Check ChromaDB is initialized (first search is slower)
+2. Verify sentence-transformers model is downloaded
+3. Check system resources (CPU, memory)
+4. Reduce `OPTIMIZATION_KEYWORD_SEARCH_TOP_K` to 2
+
+### "Low prediction accuracy"
+
+**Symptoms:**
+- Pattern learning predicts wrong keywords
+- Generated code uses different keywords
+
+**Solutions:**
+1. System needs more training data (run more queries)
+2. Lower confidence threshold:
+   ```env
+   OPTIMIZATION_PATTERN_CONFIDENCE_THRESHOLD=0.6
+   ```
+3. Check queries are similar enough for pattern matching
+4. Verify pattern database is being updated
+
+### "Token reduction less than expected"
+
+**Symptoms:**
+- Reduction percentage <50%
+- Token usage still high
+
+**Solutions:**
+1. Enable context pruning:
+   ```env
+   OPTIMIZATION_CONTEXT_PRUNING_ENABLED=true
+   ```
+2. Lower pruning threshold:
+   ```env
+   OPTIMIZATION_CONTEXT_PRUNING_THRESHOLD=0.7
+   ```
+3. Reduce keyword search results:
+   ```env
+   OPTIMIZATION_KEYWORD_SEARCH_TOP_K=2
+   ```
+4. Check pattern learning is being used (review metrics)
+
+### "Optimization disabled automatically"
+
+**Symptoms:**
+- System falls back to full context
+- Logs show fallback events
+
+**Solutions:**
+1. Check all dependencies installed
+2. Verify ChromaDB initialized successfully
+3. Check pattern database is accessible
+4. Review error logs for root cause
+5. Temporarily disable optimization to verify baseline works:
+   ```env
+   OPTIMIZATION_ENABLED=false
+   ```
+
+## Performance Tips
+
+### 1. Let Pattern Learning Train
+
+The system improves over time:
+- First 10 queries: Mostly uses search tool
+- After 20 queries: Starts predicting keywords
+- After 50 queries: High prediction accuracy
+
+**Tip:** Run diverse queries to build a good training set.
+
+### 2. Monitor Metrics Regularly
+
+Check metrics after every 10-20 queries:
+- Is token reduction improving?
+- Is prediction accuracy increasing?
+- Are searches becoming less frequent?
+
+### 3. Tune Thresholds Based on Usage
+
+**If you have diverse queries:**
+- Lower confidence thresholds (0.6-0.7)
+- More searches, less prediction
+
+**If you have repetitive queries:**
+- Higher confidence thresholds (0.7-0.8)
+- More prediction, fewer searches
+
+### 4. Clean Up Old Data
+
+Pattern database grows over time:
+
+```bash
+# Backup current database
+cp ./data/pattern_learning.db ./data/pattern_learning.db.backup
+
+# Optional: Delete old patterns (keeps last 1000)
+sqlite3 ./data/pattern_learning.db "DELETE FROM patterns WHERE id NOT IN (SELECT id FROM patterns ORDER BY timestamp DESC LIMIT 1000)"
+```
+
+### 5. Use Appropriate Library
+
+Browser Library works best with optimization:
+- Better keyword documentation
+- More consistent patterns
+- Faster execution
+
+```env
+ROBOT_LIBRARY=browser
+```
+
+## Best Practices
+
+### Do's
+
+✅ **Enable optimization in production** - Proven 67% token reduction
+
+✅ **Monitor metrics regularly** - Track performance improvements
+
+✅ **Let pattern learning train** - Needs 20+ queries for best results
+
+✅ **Use recommended settings** - Default configuration is well-tested
+
+✅ **Keep ChromaDB persistent** - Don't delete between restarts
+
+✅ **Review logs for fallbacks** - Indicates issues to address
+
+### Don'ts
+
+❌ **Don't disable after one failure** - Check logs and fix root cause
+
+❌ **Don't set thresholds too low** - May include irrelevant keywords
+
+❌ **Don't set thresholds too high** - May never use predictions
+
+❌ **Don't delete pattern database** - Loses all learning
+
+❌ **Don't expect instant results** - Pattern learning needs training
+
+❌ **Don't ignore metrics** - They show what's working and what's not
+
+## Migration Guide
+
+### Enabling Optimization on Existing System
+
+1. **Backup current setup:**
+   ```bash
+   cp src/backend/.env src/backend/.env.backup
+   ```
+
+2. **Install dependencies:**
+   ```bash
+   pip install chromadb==0.4.22 sentence-transformers==2.2.2
+   ```
+
+3. **Add configuration to `.env`:**
+   ```env
+   OPTIMIZATION_ENABLED=true
+   OPTIMIZATION_CHROMA_DB_PATH=./chroma_db
+   OPTIMIZATION_PATTERN_DB_PATH=./data/pattern_learning.db
+   OPTIMIZATION_KEYWORD_SEARCH_TOP_K=3
+   OPTIMIZATION_PATTERN_CONFIDENCE_THRESHOLD=0.7
+   OPTIMIZATION_CONTEXT_PRUNING_ENABLED=true
+   OPTIMIZATION_CONTEXT_PRUNING_THRESHOLD=0.8
+   ```
+
+4. **Restart Mark 1:**
+   ```bash
+   # Stop all services
+   # Start backend and frontend
+   ```
+
+5. **Verify initialization:**
+   - Check logs for "ChromaDB initialized"
+   - Check `./chroma_db/` directory created
+   - Check `./data/pattern_learning.db` created
+
+6. **Run test queries:**
+   - Start with simple queries
+   - Check metrics API for token reduction
+   - Verify code generation accuracy
+
+7. **Monitor for 24 hours:**
+   - Review metrics regularly
+   - Check for fallback events
+   - Verify no errors in logs
+
+8. **Tune if needed:**
+   - Adjust thresholds based on metrics
+   - Review troubleshooting section if issues
+
+### Disabling Optimization
+
+If you need to disable optimization:
+
+1. **Set in `.env`:**
+   ```env
+   OPTIMIZATION_ENABLED=false
+   ```
+
+2. **Restart Mark 1**
+
+3. **Keep data for future use:**
+   - Don't delete `./chroma_db/`
+   - Don't delete `./data/pattern_learning.db`
+   - Can re-enable anytime without losing learning
+
+## FAQ
+
+### Does optimization affect code quality?
+
+No. The system maintains 95%+ accuracy by:
+- Always including core rules
+- Using semantic search for relevant keywords
+- Falling back to full context if needed
+
+### How long does ChromaDB initialization take?
+
+~5 seconds on first startup. Subsequent startups are instant (uses persistent storage).
+
+### Does pattern learning work with both Browser and SeleniumLibrary?
+
+Yes. The system learns patterns for whichever library you're using.
+
+### Can I use optimization with local models (Ollama)?
+
+Yes. Optimization works with both online (Gemini) and local (Ollama) models.
+
+### What happens if ChromaDB fails?
+
+The system gracefully falls back to full context (baseline behavior). Workflow success rate remains 99.9%.
+
+### How much disk space does optimization use?
+
+- ChromaDB: ~10-20 MB per library
+- Pattern database: ~1 KB per query (grows over time)
+- Total: <100 MB for typical usage
+
+### Can I reset pattern learning?
+
+Yes. Delete the pattern database:
+```bash
+rm ./data/pattern_learning.db
+```
+System will recreate it on next startup.
+
+### Does optimization work with custom keywords?
+
+Yes, if you've added custom keywords to your library context, they'll be included in ChromaDB and pattern learning.
+
+## Getting Help
+
+If you're experiencing issues with optimization:
+
+1. **Check logs:** `logs/optimization.log`
+2. **Review metrics:** Use workflow metrics API
+3. **Check troubleshooting section** above
+4. **Search existing issues:** [GitHub Issues](https://github.com/monkscode/Natural-Language-to-Robot-Framework/issues)
+5. **Open new issue** with:
+   - Configuration settings
+   - Error messages from logs
+   - Metrics output
+   - Steps to reproduce
+
+## Additional Resources
+
+- [Configuration Guide](CONFIGURATION.md) - All environment variables
+- [Architecture Guide](ARCHITECTURE.md) - How Mark 1 works
+- [Troubleshooting Guide](TROUBLESHOOTING.md) - Common issues
+- [GitHub Discussions](https://github.com/monkscode/Natural-Language-to-Robot-Framework/discussions) - Ask questions
+
+---
+
+**Ready to optimize?** Enable optimization in your `.env` file and start reducing token costs today! 🚀
diff --git a/docs/OPTIMIZATION_DEVELOPER_GUIDE.md b/docs/OPTIMIZATION_DEVELOPER_GUIDE.md
new file mode 100644
index 0000000..68f8721
--- /dev/null
+++ b/docs/OPTIMIZATION_DEVELOPER_GUIDE.md
@@ -0,0 +1,2233 @@
+# CrewAI Optimization System - Developer Guide
+
+This guide provides technical documentation for developers working on or extending the CrewAI optimization system.
+
+## Table of Contents
+
+- [Architecture Overview](#architecture-overview)
+- [Core Components](#core-components)
+- [Hybrid Knowledge Architecture](#hybrid-knowledge-architecture)
+- [Extension Points](#extension-points)
+- [Testing Approach](#testing-approach)
+- [Code Examples](#code-examples)
+- [Performance Considerations](#performance-considerations)
+- [Debugging and Troubleshooting](#debugging-and-troubleshooting)
+
+## Architecture Overview
+
+The optimization system implements a **Hybrid Knowledge Architecture** that reduces token usage by 67% while maintaining code generation accuracy. The system combines three key strategies:
+
+1. **Core Rules** - Always-present library-specific constraints (~300 tokens)
+2. **ChromaDB Vector Store** - Semantic search over keyword documentation
+3. **Pattern Learning** - Learn from successful executions to predict relevant keywords
+
+### High-Level Architecture
+
+```
+┌─────────────────────────────────────────────────────────────────┐
+│                    CrewAI Workflow System                        │
+│                                                                  │
+│  ┌────────────────┐         ┌──────────────────────┐           │
+│  │ Step Planner   │         │ Smart Keyword        │           │
+│  │    Agent       │────────▶│    Provider          │           │
+│  └────────────────┘         │                      │           │
+│                              │  ┌────────────────┐  │           │
+│  ┌────────────────┐         │  │ Pattern        │  │           │
+│  │ Code Assembler │────────▶│  │ Learning       │  │           │
+│  │    Agent       │         │  └────────┬───────┘  │           │
+│  └────────────────┘         │           │          │           │
+│                              │  ┌────────▼───────┐  │           │
+│  ┌────────────────┐         │  │ Keyword Search │  │           │
+│  │ Code Validator │────────▶│  │     Tool       │  │           │
+│  │    Agent       │         │  └────────┬───────┘  │           │
+│  └────────────────┘         │           │          │           │
+│                              │  ┌────────▼───────┐  │           │
+│  ┌────────────────┐         │  │   ChromaDB     │  │           │
+│  │Library Context │◀────────│  │ Vector Store   │  │           │
+│  │   (Existing)   │         │  └────────────────┘  │           │
+│  └────────────────┘         └──────────────────────┘           │
+└─────────────────────────────────────────────────────────────────┘
+```
+
+### Module Structure
+
+```
+src/backend/crew_ai/optimization/
+├── __init__.py                    # Public API exports
+├── chroma_store.py                # ChromaDB vector store wrapper
+├── keyword_search_tool.py         # Semantic keyword search tool
+├── pattern_learning.py            # Query pattern matcher
+├── smart_keyword_provider.py      # Hybrid keyword provider orchestration
+├── context_pruner.py              # Smart context pruning
+└── logging_config.py              # Optimization-specific logging
+```
+
+
+## Core Components
+
+### 1. ChromaDB Vector Store (`chroma_store.py`)
+
+The `KeywordVectorStore` class manages keyword embeddings using ChromaDB for efficient semantic search.
+
+**Key Features:**
+- Persistent storage (no re-embedding on restart)
+- Automatic embedding generation using sentence-transformers
+- Separate collections per library (Browser, SeleniumLibrary)
+- Version tracking and automatic rebuild on library updates
+
+**Class Interface:**
+
+```python
+class KeywordVectorStore:
+    """ChromaDB wrapper for keyword storage and semantic search."""
+    
+    def __init__(self, persist_directory: str = "./chroma_db"):
+        """Initialize ChromaDB client with persistence."""
+        
+    def create_or_get_collection(self, library_name: str):
+        """Get or create collection for library keywords."""
+        
+    def add_keywords(self, library_name: str, keywords: List[Dict]):
+        """Add keywords to ChromaDB collection."""
+        
+    def search(self, library_name: str, query: str, top_k: int = 3) -> List[Dict]:
+        """Semantic search for keywords."""
+        
+    def get_library_version(self, library_name: str) -> str:
+        """Get library version from metadata."""
+        
+    def rebuild_collection(self, library_name: str):
+        """Rebuild collection on version change."""
+```
+
+**Implementation Details:**
+
+- Uses `chromadb.PersistentClient` for disk persistence
+- Embedding function: `SentenceTransformerEmbeddingFunction` with `all-MiniLM-L6-v2`
+- Documents formatted as: `"{keyword_name} {keyword_documentation}"`
+- Metadata includes: name, args, doc, version
+- Search returns: name, args, description, distance score
+
+**Performance:**
+- Initialization: <5 seconds for 143 keywords
+- Search latency: <100ms per query
+- Storage: ~10-20 MB per library
+
+### 2. Keyword Search Tool (`keyword_search_tool.py`)
+
+The `KeywordSearchTool` provides semantic search as a CrewAI tool that agents can invoke.
+
+**Key Features:**
+- CrewAI `BaseTool` integration
+- LRU cache for frequent searches (100 entries)
+- Returns top K results with examples
+- JSON-formatted output for agent consumption
+
+**Class Interface:**
+
+```python
+class KeywordSearchTool(BaseTool):
+    """CrewAI tool for semantic keyword search."""
+    
+    name: str = "keyword_search"
+    description: str = "Search for Robot Framework keywords..."
+    
+    def __init__(self, library_name: str, chroma_store: KeywordVectorStore):
+        """Initialize with library name and ChromaDB store."""
+        
+    def _run(self, query: str, top_k: int = 3) -> str:
+        """Search for keywords matching the query."""
+```
+
+**Usage by Agents:**
+
+```python
+# Agent calls tool with natural language query
+result = keyword_search("click a button")
+
+# Tool returns JSON with top matches
+{
+  "results": [
+    {
+      "name": "Click",
+      "args": ["selector", "**kwargs"],
+      "description": "Clicks element identified by selector...",
+      "example": "Click    ${locator}"
+    },
+    ...
+  ]
+}
+```
+
+**Caching Strategy:**
+- LRU cache with 100 entries
+- Cache key: `"{query}:{top_k}"`
+- Eviction: FIFO when cache full
+- Hit rate: ~40% in typical usage
+
+
+### 3. Pattern Learning System (`pattern_learning.py`)
+
+The `QueryPatternMatcher` learns which keywords are commonly used for specific query types.
+
+**Key Features:**
+- ChromaDB-based pattern storage with embeddings
+- Semantic similarity search for pattern matching
+- Confidence-based prediction
+- Continuous learning from successful executions
+
+**Class Interface:**
+
+```python
+class QueryPatternMatcher:
+    """Learn and predict keyword usage patterns."""
+    
+    def __init__(self, chroma_store: KeywordVectorStore):
+        """Initialize with ChromaDB store."""
+        
+    def learn_from_execution(self, user_query: str, generated_code: str):
+        """Extract keywords from code and store pattern."""
+        
+    def get_relevant_keywords(self, user_query: str, 
+                            confidence_threshold: float = 0.7) -> List[str]:
+        """Predict relevant keywords based on similar past queries."""
+        
+    def _extract_keywords_from_code(self, code: str) -> List[str]:
+        """Extract Robot Framework keywords from generated code."""
+```
+
+**Learning Process:**
+
+1. **Execution Completes** → Extract keywords from generated code
+2. **Store Pattern** → Save query + keywords in ChromaDB with embedding
+3. **New Query** → Search for similar past queries
+4. **Predict Keywords** → If similarity ≥ threshold, return aggregated keywords
+
+**Prediction Algorithm:**
+
+```python
+def get_relevant_keywords(self, user_query: str, confidence_threshold: float = 0.7):
+    # 1. Search ChromaDB for similar patterns
+    results = self.pattern_collection.query(query_texts=[user_query], n_results=5)
+    
+    # 2. Check confidence (convert distance to similarity)
+    top_distance = results['distances'][0][0]
+    similarity = 1 / (1 + top_distance)
+    
+    if similarity < confidence_threshold:
+        return []  # Not confident enough
+    
+    # 3. Aggregate keywords from top 5 similar patterns
+    keyword_counts = {}
+    for metadata in results['metadatas'][0]:
+        keywords = json.loads(metadata['keywords'])
+        for keyword in keywords:
+            keyword_counts[keyword] = keyword_counts.get(keyword, 0) + 1
+    
+    # 4. Return top 10 most common keywords
+    sorted_keywords = sorted(keyword_counts.items(), key=lambda x: x[1], reverse=True)
+    return [kw for kw, count in sorted_keywords[:10]]
+```
+
+**Improvement Over Time:**
+- First 10 queries: Low prediction rate (~10%)
+- After 20 queries: Moderate prediction rate (~40%)
+- After 50 queries: High prediction rate (~70%)
+
+### 4. Smart Keyword Provider (`smart_keyword_provider.py`)
+
+The `SmartKeywordProvider` orchestrates the 3-tier keyword retrieval system.
+
+**Key Features:**
+- Hybrid approach: core rules + predicted/searched keywords
+- Graceful degradation through multiple fallback tiers
+- Agent-specific context formatting
+- Learning hook for continuous improvement
+
+**Class Interface:**
+
+```python
+class SmartKeywordProvider:
+    """Intelligent keyword provider with hybrid approach."""
+    
+    def __init__(self, library_context: LibraryContext,
+                 pattern_matcher: QueryPatternMatcher,
+                 chroma_store: KeywordVectorStore):
+        """Initialize with library context and optimization components."""
+        
+    def get_agent_context(self, user_query: str, agent_role: str) -> str:
+        """Get optimized context for an agent."""
+        
+    def get_keyword_search_tool(self) -> KeywordSearchTool:
+        """Get keyword search tool for agents."""
+        
+    def learn_from_execution(self, user_query: str, generated_code: str):
+        """Learn from successful execution."""
+```
+
+**3-Tier Retrieval Strategy:**
+
+```python
+def get_agent_context(self, user_query: str, agent_role: str) -> str:
+    # Tier 1: Core Rules (Always Included)
+    core_rules = self.library_context.core_rules  # ~300 tokens
+    
+    try:
+        # Tier 2: Pattern Learning (Predicted Keywords)
+        predicted_keywords = self.pattern_matcher.get_relevant_keywords(user_query)
+        
+        if predicted_keywords:
+            # Get full docs from ChromaDB
+            keyword_docs = self._get_keyword_docs(predicted_keywords)
+            return self._format_predicted_context(core_rules, keyword_docs, agent_role)
+            # Total: ~800 tokens (300 core + 500 keywords)
+    except Exception as e:
+        logger.warning(f"Pattern learning failed: {e}")
+    
+    try:
+        # Tier 3: Zero-Context + Search Tool
+        return self._format_zero_context_with_tool(core_rules, agent_role)
+        # Total: ~500 tokens (300 core + 200 tool instructions)
+    except Exception as e:
+        logger.warning(f"Zero-context formatting failed: {e}")
+    
+    # Tier 4: Full Context Fallback
+    logger.info("Using full context as fallback")
+    return self.library_context.code_assembly_context
+    # Total: ~3000 tokens (baseline behavior)
+```
+
+
+### 5. Context Pruner (`context_pruner.py`)
+
+The `ContextPruner` classifies queries and prunes context to relevant keyword categories.
+
+**Key Features:**
+- Semantic query classification into action categories
+- Pre-computed category embeddings for fast lookup
+- Confidence-based filtering
+- Fallback to all categories if confidence too low
+
+**Class Interface:**
+
+```python
+class ContextPruner:
+    """Classify queries and prune context to relevant categories."""
+    
+    KEYWORD_CATEGORIES = {
+        "navigation": ["New Browser", "New Page", "Go To", ...],
+        "input": ["Fill Text", "Input Text", "Type Text", ...],
+        "interaction": ["Click", "Click Element", "Hover", ...],
+        "extraction": ["Get Text", "Get Attribute", ...],
+        "assertion": ["Should Be Equal", "Should Contain", ...],
+        "wait": ["Wait For Elements State", ...]
+    }
+    
+    def __init__(self):
+        """Initialize with sentence-transformers classifier."""
+        
+    def classify_query(self, user_query: str, 
+                      confidence_threshold: float = 0.8) -> List[str]:
+        """Classify query into action categories."""
+        
+    def prune_keywords(self, all_keywords: List[Dict], 
+                      categories: List[str]) -> List[Dict]:
+        """Filter keywords to only those in relevant categories."""
+```
+
+**Classification Process:**
+
+```python
+def classify_query(self, user_query: str, confidence_threshold: float = 0.8):
+    # 1. Encode query
+    query_embedding = self.classifier.encode([user_query])[0]
+    
+    # 2. Compute similarity with each category
+    similarities = {
+        cat: np.dot(query_embedding, emb)
+        for cat, emb in self.category_embeddings.items()
+    }
+    
+    # 3. Get categories above threshold
+    relevant_categories = [
+        cat for cat, sim in similarities.items()
+        if sim >= confidence_threshold
+    ]
+    
+    # 4. Fallback to all categories if none meet threshold
+    if not relevant_categories:
+        return list(self.KEYWORD_CATEGORIES.keys())
+    
+    return relevant_categories
+```
+
+**Performance Impact:**
+- Average context reduction: 40%
+- Classification latency: <50ms
+- Accuracy maintained: >95%
+
+## Hybrid Knowledge Architecture
+
+The hybrid architecture combines three knowledge sources to optimize token usage while maintaining accuracy.
+
+### Tier 1: Core Rules (Always Present)
+
+**Purpose:** Ensure critical library-specific constraints are never forgotten.
+
+**Content (~300 tokens):**
+- Critical sequences (e.g., New Browser → New Context viewport=None → New Page)
+- Parameter rules and syntax
+- Auto-waiting behavior
+- Locator priorities
+- Common pitfalls and solutions
+
+**Implementation:**
+
+```python
+# In src/backend/crew_ai/library_context/browser_context.py
+
+class BrowserLibraryContext(LibraryContext):
+    @property
+    def core_rules(self) -> str:
+        """Core rules always included in agent context."""
+        return """
+        CRITICAL BROWSER LIBRARY RULES:
+        
+        1. INITIALIZATION SEQUENCE (MUST FOLLOW):
+           - New Browser    chromium    headless=True
+           - New Context    viewport=None    # REQUIRED: viewport=None
+           - New Page       ${URL}
+        
+        2. PARAMETER RULES:
+           - viewport MUST be None (not 'None' string)
+           - Use Browser Library syntax, NOT SeleniumLibrary
+           - All selectors use CSS or text= prefix
+        
+        3. AUTO-WAITING:
+           - Browser Library auto-waits for elements
+           - No explicit Wait keywords needed in most cases
+        
+        4. LOCATOR PRIORITIES:
+           - Prefer: id= > data-testid= > text= > css=
+           - Avoid: xpath (use CSS instead)
+        """
+```
+
+**Why Always Included:**
+- Prevents critical mistakes (e.g., missing viewport=None)
+- Maintains code quality consistency
+- Small token cost (~300) for high value
+
+### Tier 2: Predicted Keywords (Pattern Learning)
+
+**Purpose:** Pre-load relevant keywords based on learned patterns.
+
+**Process:**
+1. Search for similar past queries in ChromaDB
+2. If similarity ≥ 0.7, predict relevant keywords
+3. Retrieve full documentation from ChromaDB
+4. Include in agent context (~500 tokens)
+
+**Example:**
+
+```python
+# User query: "search for shoes on Flipkart"
+
+# Pattern learning finds similar past query:
+# "search for laptops on Amazon" → used [Fill Text, Click, Get Text]
+
+# Prediction: [Fill Text, Click, Get Text] with 0.85 confidence
+
+# Context includes:
+# - Core rules (300 tokens)
+# - Fill Text documentation (150 tokens)
+# - Click documentation (150 tokens)
+# - Get Text documentation (200 tokens)
+# Total: ~800 tokens (vs 3000 baseline)
+```
+
+**Improvement Over Time:**
+- System learns from every successful execution
+- Prediction accuracy increases with more data
+- Adapts to user's testing patterns
+
+### Tier 3: Zero-Context + Search Tool
+
+**Purpose:** Provide minimal context with on-demand keyword retrieval.
+
+**Process:**
+1. If no pattern match, provide minimal context
+2. Include tool usage instructions (~200 tokens)
+3. Agent uses keyword_search tool when needed
+4. Tool returns top 3 matches from ChromaDB (<100ms)
+
+**Example:**
+
+```python
+# Agent context:
+"""
+You are an expert Robot Framework developer using Browser Library.
+
+CORE RULES:
+[... core rules ~300 tokens ...]
+
+KEYWORD SEARCH TOOL:
+You have access to a keyword_search tool to find relevant keywords on-demand.
+
+Examples:
+- Need to click? Search: "click button element"
+- Need to input text? Search: "type text input field"
+- Need to wait? Search: "wait element visible"
+
+The tool returns the top 3 matching keywords with documentation.
+Use the exact keyword names and syntax from the tool results.
+"""
+
+# Agent workflow:
+# 1. Reads query: "click the login button"
+# 2. Calls: keyword_search("click button")
+# 3. Receives: [Click, Click Element, Click Button] with docs
+# 4. Uses: Click    id=login-button
+```
+
+**Benefits:**
+- Minimal context (~500 tokens total)
+- Flexible - works for any query
+- Fast - search completes in <100ms
+
+### Tier 4: Full Context Fallback
+
+**Purpose:** Ensure reliability if all optimizations fail.
+
+**Trigger Conditions:**
+- ChromaDB initialization fails
+- Keyword search tool fails
+- Pattern learning database corrupted
+- Any unexpected error
+
+**Behavior:**
+- Falls back to baseline behavior (full context)
+- Logs fallback event for monitoring
+- Maintains 99.9% workflow success rate
+
+**Implementation:**
+
+```python
+def get_agent_context(self, user_query: str, agent_role: str) -> str:
+    try:
+        # Try optimized approaches
+        return self._get_optimized_context(user_query, agent_role)
+    except Exception as e:
+        logger.error(f"Optimization failed: {e}, falling back to full context")
+        return self.library_context.code_assembly_context
+```
+
+
+## Extension Points
+
+The optimization system is designed to be extensible. Here are the key extension points:
+
+### 1. Adding New Libraries
+
+To add optimization support for a new Robot Framework library:
+
+**Step 1: Add Core Rules**
+
+```python
+# In src/backend/crew_ai/library_context/your_library_context.py
+
+class YourLibraryContext(LibraryContext):
+    @property
+    def core_rules(self) -> str:
+        """Define core rules for your library."""
+        return """
+        CRITICAL YOUR_LIBRARY RULES:
+        
+        1. INITIALIZATION:
+           - [Your library-specific initialization]
+        
+        2. PARAMETER RULES:
+           - [Your library-specific parameters]
+        
+        3. COMMON PATTERNS:
+           - [Your library-specific patterns]
+        """
+```
+
+**Step 2: Initialize ChromaDB Collection**
+
+```python
+# In your initialization code
+from src.backend.crew_ai.optimization import KeywordVectorStore
+
+chroma_store = KeywordVectorStore()
+
+# Extract keywords from your library
+keywords = extract_keywords_from_library("YourLibrary")
+
+# Add to ChromaDB
+chroma_store.add_keywords("YourLibrary", keywords)
+```
+
+**Step 3: Configure Pattern Learning**
+
+```python
+# Pattern learning works automatically for any library
+# Just ensure keywords are extracted correctly from generated code
+
+def _extract_keywords_from_code(self, code: str) -> List[str]:
+    # Add your library-specific keyword extraction logic
+    # Default implementation works for most Robot Framework libraries
+    pass
+```
+
+### 2. Custom Embedding Models
+
+To use a different embedding model:
+
+**Step 1: Update ChromaDB Configuration**
+
+```python
+# In src/backend/crew_ai/optimization/chroma_store.py
+
+def _get_embedding_function(self):
+    """Get custom embedding function."""
+    from chromadb.utils import embedding_functions
+    
+    # Option 1: Different sentence-transformers model
+    return embedding_functions.SentenceTransformerEmbeddingFunction(
+        model_name="all-mpnet-base-v2"  # More accurate but slower
+    )
+    
+    # Option 2: OpenAI embeddings (requires API key)
+    return embedding_functions.OpenAIEmbeddingFunction(
+        api_key="your-api-key",
+        model_name="text-embedding-3-small"
+    )
+    
+    # Option 3: Custom embedding function
+    class CustomEmbeddingFunction:
+        def __call__(self, texts: List[str]) -> List[List[float]]:
+            # Your custom embedding logic
+            return embeddings
+    
+    return CustomEmbeddingFunction()
+```
+
+**Step 2: Update Configuration**
+
+```env
+# In .env
+OPTIMIZATION_EMBEDDING_MODEL=all-mpnet-base-v2
+```
+
+**Trade-offs:**
+- `all-MiniLM-L6-v2` (default): Fast, 384 dimensions, good accuracy
+- `all-mpnet-base-v2`: Slower, 768 dimensions, better accuracy
+- OpenAI embeddings: Requires API, costs money, excellent accuracy
+
+### 3. Custom Context Pruning Strategies
+
+To add new pruning strategies:
+
+**Step 1: Extend ContextPruner**
+
+```python
+# In src/backend/crew_ai/optimization/context_pruner.py
+
+class ContextPruner:
+    def classify_query_advanced(self, user_query: str, 
+                               website_type: str = None) -> List[str]:
+        """Advanced classification with website-specific logic."""
+        
+        # Base classification
+        categories = self.classify_query(user_query)
+        
+        # Website-specific adjustments
+        if website_type == "ecommerce":
+            # E-commerce sites often need extraction keywords
+            if "extraction" not in categories:
+                categories.append("extraction")
+        
+        elif website_type == "form":
+            # Form-heavy sites need input keywords
+            if "input" not in categories:
+                categories.append("input")
+        
+        return categories
+```
+
+**Step 2: Add New Category Mappings**
+
+```python
+KEYWORD_CATEGORIES = {
+    # Existing categories
+    "navigation": [...],
+    "input": [...],
+    
+    # New categories
+    "file_handling": ["Upload File", "Download File", "Choose File"],
+    "authentication": ["Login", "Logout", "Set Cookie"],
+    "api_testing": ["GET Request", "POST Request", "Validate Response"],
+}
+```
+
+### 4. Custom Pattern Learning Strategies
+
+To implement advanced pattern learning:
+
+**Step 1: Extend QueryPatternMatcher**
+
+```python
+# In src/backend/crew_ai/optimization/pattern_learning.py
+
+class AdvancedPatternMatcher(QueryPatternMatcher):
+    def get_relevant_keywords_with_context(self, 
+                                          user_query: str,
+                                          website_url: str = None,
+                                          previous_queries: List[str] = None) -> List[str]:
+        """Advanced prediction with additional context."""
+        
+        # Base prediction
+        keywords = self.get_relevant_keywords(user_query)
+        
+        # Website-specific patterns
+        if website_url:
+            website_patterns = self._get_website_patterns(website_url)
+            keywords.extend(website_patterns)
+        
+        # Sequential patterns (workflow context)
+        if previous_queries:
+            sequential_keywords = self._predict_next_keywords(previous_queries)
+            keywords.extend(sequential_keywords)
+        
+        return list(set(keywords))  # Remove duplicates
+    
+    def _get_website_patterns(self, website_url: str) -> List[str]:
+        """Get common keywords for specific website."""
+        # Query patterns filtered by website
+        pass
+    
+    def _predict_next_keywords(self, previous_queries: List[str]) -> List[str]:
+        """Predict next keywords based on workflow sequence."""
+        # Analyze common sequences (e.g., search → filter → select)
+        pass
+```
+
+### 5. Custom Metrics and Monitoring
+
+To add custom metrics:
+
+**Step 1: Extend WorkflowMetrics**
+
+```python
+# In src/backend/metrics/workflow_metrics.py
+
+class WorkflowMetrics:
+    def __init__(self):
+        # Existing metrics
+        self.token_usage = {...}
+        
+        # Custom metrics
+        self.custom_metrics = {
+            "keyword_reuse_rate": 0.0,
+            "pattern_cache_hit_rate": 0.0,
+            "avg_keywords_per_query": 0.0,
+        }
+    
+    def track_keyword_reuse(self, keywords_used: List[str], 
+                           keywords_predicted: List[str]):
+        """Track how many predicted keywords were actually used."""
+        if not keywords_predicted:
+            return
+        
+        reused = len(set(keywords_used) & set(keywords_predicted))
+        self.custom_metrics["keyword_reuse_rate"] = reused / len(keywords_predicted)
+```
+
+**Step 2: Add to API Response**
+
+```python
+def to_dict(self) -> Dict:
+    base_dict = super().to_dict()
+    base_dict["optimization"]["custom"] = self.custom_metrics
+    return base_dict
+```
+
+### 6. Alternative Storage Backends
+
+To use a different storage backend instead of ChromaDB:
+
+**Step 1: Create Storage Interface**
+
+```python
+# In src/backend/crew_ai/optimization/storage_interface.py
+
+from abc import ABC, abstractmethod
+
+class VectorStoreInterface(ABC):
+    """Abstract interface for vector storage."""
+    
+    @abstractmethod
+    def add_keywords(self, library_name: str, keywords: List[Dict]):
+        """Add keywords to storage."""
+        pass
+    
+    @abstractmethod
+    def search(self, library_name: str, query: str, top_k: int) -> List[Dict]:
+        """Search for keywords."""
+        pass
+```
+
+**Step 2: Implement Alternative Backend**
+
+```python
+# In src/backend/crew_ai/optimization/faiss_store.py
+
+import faiss
+import numpy as np
+
+class FAISSVectorStore(VectorStoreInterface):
+    """FAISS-based vector storage."""
+    
+    def __init__(self, persist_directory: str):
+        self.persist_directory = persist_directory
+        self.indexes = {}  # library_name -> FAISS index
+        self.embedder = SentenceTransformer('all-MiniLM-L6-v2')
+    
+    def add_keywords(self, library_name: str, keywords: List[Dict]):
+        # Generate embeddings
+        texts = [f"{kw['name']} {kw.get('doc', '')}" for kw in keywords]
+        embeddings = self.embedder.encode(texts)
+        
+        # Create FAISS index
+        dimension = embeddings.shape[1]
+        index = faiss.IndexFlatL2(dimension)
+        index.add(embeddings)
+        
+        # Store index and metadata
+        self.indexes[library_name] = {
+            "index": index,
+            "keywords": keywords
+        }
+        
+        # Persist to disk
+        faiss.write_index(index, f"{self.persist_directory}/{library_name}.index")
+    
+    def search(self, library_name: str, query: str, top_k: int) -> List[Dict]:
+        # Encode query
+        query_embedding = self.embedder.encode([query])
+        
+        # Search FAISS index
+        index_data = self.indexes[library_name]
+        distances, indices = index_data["index"].search(query_embedding, top_k)
+        
+        # Format results
+        results = []
+        for i, idx in enumerate(indices[0]):
+            keyword = index_data["keywords"][idx]
+            results.append({
+                "name": keyword["name"],
+                "args": keyword.get("args", []),
+                "description": keyword.get("doc", ""),
+                "distance": float(distances[0][i])
+            })
+        
+        return results
+```
+
+**Step 3: Update Configuration**
+
+```python
+# In src/backend/core/config.py
+
+OPTIMIZATION_STORAGE_BACKEND = Field(
+    default="chromadb",
+    description="Vector storage backend: chromadb, faiss, or custom"
+)
+```
+
+
+## Testing Approach
+
+The optimization system uses a comprehensive testing strategy covering unit, integration, and performance tests.
+
+### Unit Tests
+
+Unit tests focus on individual components in isolation.
+
+**Test Structure:**
+
+```
+tests/
+├── test_chroma_store.py           # ChromaDB vector store tests
+├── test_keyword_search_tool.py    # Keyword search tool tests
+├── test_pattern_learning.py       # Pattern learning tests
+├── test_context_pruner.py         # Context pruning tests
+└── test_integration_optimization.py  # Integration tests
+```
+
+**Example: Testing ChromaDB Store**
+
+```python
+# tests/test_chroma_store.py
+
+import pytest
+from src.backend.crew_ai.optimization import KeywordVectorStore
+
+@pytest.fixture
+def chroma_store():
+    """Create temporary ChromaDB store for testing."""
+    import tempfile
+    temp_dir = tempfile.mkdtemp()
+    store = KeywordVectorStore(persist_directory=temp_dir)
+    yield store
+    # Cleanup
+    import shutil
+    shutil.rmtree(temp_dir)
+
+def test_collection_creation(chroma_store):
+    """Test creating collections for different libraries."""
+    # Create Browser collection
+    collection = chroma_store.create_or_get_collection("Browser")
+    assert collection is not None
+    assert collection.name == "keywords_browser"
+    
+    # Create SeleniumLibrary collection
+    collection = chroma_store.create_or_get_collection("SeleniumLibrary")
+    assert collection is not None
+    assert collection.name == "keywords_seleniumlibrary"
+
+def test_keyword_ingestion(chroma_store):
+    """Test adding keywords to ChromaDB."""
+    keywords = [
+        {"name": "Click", "args": ["selector"], "doc": "Clicks element"},
+        {"name": "Fill Text", "args": ["selector", "text"], "doc": "Fills text"},
+    ]
+    
+    chroma_store.add_keywords("Browser", keywords)
+    
+    # Verify keywords stored
+    collection = chroma_store.create_or_get_collection("Browser")
+    results = collection.get(ids=["Click", "Fill Text"])
+    assert len(results["ids"]) == 2
+
+def test_semantic_search(chroma_store):
+    """Test semantic search returns relevant keywords."""
+    # Add test keywords
+    keywords = [
+        {"name": "Click", "args": ["selector"], "doc": "Clicks element identified by selector"},
+        {"name": "Fill Text", "args": ["selector", "text"], "doc": "Fills text into input field"},
+        {"name": "Get Text", "args": ["selector"], "doc": "Gets text content from element"},
+    ]
+    chroma_store.add_keywords("Browser", keywords)
+    
+    # Search for clicking
+    results = chroma_store.search("Browser", "click a button", top_k=2)
+    assert len(results) == 2
+    assert results[0]["name"] == "Click"
+    
+    # Search for text input
+    results = chroma_store.search("Browser", "type text into field", top_k=2)
+    assert len(results) == 2
+    assert results[0]["name"] == "Fill Text"
+
+def test_version_tracking(chroma_store):
+    """Test library version tracking and rebuild."""
+    keywords = [{"name": "Click", "args": ["selector"], "doc": "Clicks element"}]
+    
+    # Add keywords with version 1.0.0
+    chroma_store.add_keywords("Browser", keywords)
+    version = chroma_store.get_library_version("Browser")
+    assert version == "1.0.0"
+    
+    # Simulate version change
+    chroma_store.rebuild_collection("Browser", new_version="1.1.0")
+    version = chroma_store.get_library_version("Browser")
+    assert version == "1.1.0"
+```
+
+**Example: Testing Pattern Learning**
+
+```python
+# tests/test_pattern_learning.py
+
+import pytest
+from src.backend.crew_ai.optimization import QueryPatternMatcher, KeywordVectorStore
+
+@pytest.fixture
+def pattern_matcher():
+    """Create pattern matcher with temporary storage."""
+    import tempfile
+    temp_dir = tempfile.mkdtemp()
+    chroma_store = KeywordVectorStore(persist_directory=temp_dir)
+    matcher = QueryPatternMatcher(chroma_store=chroma_store)
+    yield matcher
+    # Cleanup
+    import shutil
+    shutil.rmtree(temp_dir)
+
+def test_keyword_extraction(pattern_matcher):
+    """Test extracting keywords from Robot Framework code."""
+    code = """
+*** Test Cases ***
+Test Login
+    New Browser    chromium    headless=True
+    New Page    https://example.com
+    Fill Text    id=username    testuser
+    Click    id=login-button
+    Get Text    id=welcome-message
+    """
+    
+    keywords = pattern_matcher._extract_keywords_from_code(code)
+    
+    assert "New Browser" in keywords
+    assert "New Page" in keywords
+    assert "Fill Text" in keywords
+    assert "Click" in keywords
+    assert "Get Text" in keywords
+
+def test_pattern_storage(pattern_matcher):
+    """Test storing patterns in ChromaDB."""
+    query = "login to website"
+    code = """
+*** Test Cases ***
+Test
+    Fill Text    id=username    user
+    Click    id=login
+    """
+    
+    # Learn from execution
+    pattern_matcher.learn_from_execution(query, code)
+    
+    # Verify pattern stored
+    collection = pattern_matcher.pattern_collection
+    results = collection.get()
+    assert len(results["ids"]) > 0
+
+def test_pattern_prediction(pattern_matcher):
+    """Test predicting keywords from similar queries."""
+    # Learn from multiple executions
+    pattern_matcher.learn_from_execution(
+        "search for shoes on Flipkart",
+        "*** Test Cases ***\nTest\n    Fill Text    name=q    shoes\n    Click    id=search"
+    )
+    pattern_matcher.learn_from_execution(
+        "search for laptops on Amazon",
+        "*** Test Cases ***\nTest\n    Fill Text    id=search-box    laptops\n    Click    css=.search-button"
+    )
+    
+    # Predict for similar query
+    predicted = pattern_matcher.get_relevant_keywords("search for phones on eBay")
+    
+    assert "Fill Text" in predicted
+    assert "Click" in predicted
+
+def test_confidence_threshold(pattern_matcher):
+    """Test confidence threshold filtering."""
+    # Learn pattern
+    pattern_matcher.learn_from_execution(
+        "login to website",
+        "*** Test Cases ***\nTest\n    Fill Text    id=user    test\n    Click    id=login"
+    )
+    
+    # Similar query should predict (high confidence)
+    predicted = pattern_matcher.get_relevant_keywords("login to portal", confidence_threshold=0.7)
+    assert len(predicted) > 0
+    
+    # Dissimilar query should not predict (low confidence)
+    predicted = pattern_matcher.get_relevant_keywords("download file", confidence_threshold=0.7)
+    assert len(predicted) == 0
+
+def test_improvement_over_time(pattern_matcher):
+    """Test prediction accuracy improves with more data."""
+    # Learn from 20 diverse queries
+    queries = [
+        ("search for products", "Fill Text\nClick"),
+        ("login to account", "Fill Text\nClick"),
+        ("add to cart", "Click\nGet Text"),
+        # ... 17 more queries
+    ]
+    
+    for query, code in queries:
+        pattern_matcher.learn_from_execution(query, f"*** Test Cases ***\nTest\n    {code}")
+    
+    # Test prediction accuracy
+    test_query = "search for items"
+    predicted = pattern_matcher.get_relevant_keywords(test_query)
+    
+    # Should predict Fill Text and Click (common for search queries)
+    assert "Fill Text" in predicted
+    assert "Click" in predicted
+```
+
+**Example: Testing Context Pruning**
+
+```python
+# tests/test_context_pruner.py
+
+import pytest
+from src.backend.crew_ai.optimization import ContextPruner
+
+@pytest.fixture
+def pruner():
+    """Create context pruner instance."""
+    return ContextPruner()
+
+def test_query_classification(pruner):
+    """Test classifying queries into categories."""
+    # Navigation query
+    categories = pruner.classify_query("open website and go to login page")
+    assert "navigation" in categories
+    
+    # Input query
+    categories = pruner.classify_query("fill form with user details")
+    assert "input" in categories
+    
+    # Interaction query
+    categories = pruner.classify_query("click the submit button")
+    assert "interaction" in categories
+    
+    # Extraction query
+    categories = pruner.classify_query("get the product name and price")
+    assert "extraction" in categories
+    
+    # Mixed query
+    categories = pruner.classify_query("search for products and click first result")
+    assert "input" in categories
+    assert "interaction" in categories
+
+def test_keyword_pruning(pruner):
+    """Test pruning keywords to relevant categories."""
+    all_keywords = [
+        {"name": "New Browser", "category": "navigation"},
+        {"name": "Click", "category": "interaction"},
+        {"name": "Fill Text", "category": "input"},
+        {"name": "Get Text", "category": "extraction"},
+    ]
+    
+    # Prune to only interaction keywords
+    pruned = pruner.prune_keywords(all_keywords, ["interaction"])
+    assert len(pruned) == 1
+    assert pruned[0]["name"] == "Click"
+    
+    # Prune to input and interaction
+    pruned = pruner.prune_keywords(all_keywords, ["input", "interaction"])
+    assert len(pruned) == 2
+    assert any(kw["name"] == "Fill Text" for kw in pruned)
+    assert any(kw["name"] == "Click" for kw in pruned)
+
+def test_confidence_threshold(pruner):
+    """Test confidence threshold behavior."""
+    # High confidence query
+    categories = pruner.classify_query("click button", confidence_threshold=0.8)
+    assert len(categories) > 0
+    
+    # Low confidence query (should return all categories)
+    categories = pruner.classify_query("do something", confidence_threshold=0.9)
+    assert len(categories) == len(pruner.KEYWORD_CATEGORIES)
+
+def test_context_reduction(pruner):
+    """Test context size reduction."""
+    all_keywords = [
+        {"name": f"Keyword{i}", "category": cat}
+        for i in range(50)
+        for cat in ["navigation", "input", "interaction", "extraction"]
+    ]
+    
+    # Classify query
+    categories = pruner.classify_query("fill form and submit")
+    
+    # Prune keywords
+    pruned = pruner.prune_keywords(all_keywords, categories)
+    
+    # Should reduce context significantly
+    reduction = (len(all_keywords) - len(pruned)) / len(all_keywords) * 100
+    assert reduction > 30  # At least 30% reduction
+```
+
+### Integration Tests
+
+Integration tests verify the optimization system works correctly with the full CrewAI workflow.
+
+```python
+# tests/test_integration_optimization.py
+
+import pytest
+from src.backend.crew_ai.crew import run_crew
+from src.backend.core.config import settings
+
+@pytest.fixture(autouse=True)
+def enable_optimization():
+    """Enable optimization for integration tests."""
+    original = settings.OPTIMIZATION_ENABLED
+    settings.OPTIMIZATION_ENABLED = True
+    yield
+    settings.OPTIMIZATION_ENABLED = original
+
+def test_optimized_workflow():
+    """Test full workflow with optimization enabled."""
+    result, crew = run_crew(
+        query="search for shoes on Flipkart and get first product name",
+        model_provider="online",
+        model_name="gemini-2.0-flash-exp",
+        library_type="browser"
+    )
+    
+    # Verify result
+    assert result is not None
+    assert "Fill Text" in result.raw
+    assert "Get Text" in result.raw
+    
+    # Verify optimization metrics
+    metrics = crew.metrics
+    assert metrics.optimization.token_usage["total"] < 5000  # Less than baseline
+    assert metrics.optimization.context_reduction["reduction_percentage"] > 50
+
+def test_pattern_learning_integration():
+    """Test pattern learning improves over multiple queries."""
+    queries = [
+        "search for laptops",
+        "search for phones",
+        "search for tablets",
+    ]
+    
+    prediction_used = []
+    
+    for query in queries:
+        result, crew = run_crew(
+            query=query,
+            model_provider="online",
+            model_name="gemini-2.0-flash-exp"
+        )
+        
+        # Track if prediction was used
+        prediction_used.append(
+            crew.metrics.optimization.pattern_learning_stats["prediction_used"]
+        )
+    
+    # Later queries should use predictions more often
+    assert sum(prediction_used[1:]) > sum(prediction_used[:1])
+
+def test_graceful_degradation():
+    """Test fallback when optimization fails."""
+    # Simulate ChromaDB failure
+    with patch('src.backend.crew_ai.optimization.KeywordVectorStore') as mock:
+        mock.side_effect = Exception("ChromaDB failed")
+        
+        # Should still work with full context
+        result, crew = run_crew(
+            query="search for shoes",
+            model_provider="online",
+            model_name="gemini-2.0-flash-exp"
+        )
+        
+        assert result is not None
+        # Should use full context (no reduction)
+        assert crew.metrics.optimization.context_reduction["reduction_percentage"] == 0
+
+def test_keyword_search_tool_usage():
+    """Test agents can use keyword search tool."""
+    # Disable pattern learning to force tool usage
+    with patch('src.backend.crew_ai.optimization.QueryPatternMatcher.get_relevant_keywords') as mock:
+        mock.return_value = []  # No predictions
+        
+        result, crew = run_crew(
+            query="click the login button",
+            model_provider="online",
+            model_name="gemini-2.0-flash-exp"
+        )
+        
+        # Verify tool was used
+        assert crew.metrics.optimization.keyword_search_stats["calls"] > 0
+        assert result is not None
+
+def test_core_rules_preservation():
+    """Test core rules are always present in generated code."""
+    result, crew = run_crew(
+        query="open Flipkart website",
+        model_provider="online",
+        model_name="gemini-2.0-flash-exp",
+        library_type="browser"
+    )
+    
+    # Verify critical sequence present
+    assert "New Browser" in result.raw
+    assert "New Context" in result.raw
+    assert "viewport=None" in result.raw  # Critical parameter
+    assert "New Page" in result.raw
+```
+
+### Performance Tests
+
+Performance tests verify the system meets latency and throughput requirements.
+
+```python
+# tests/test_performance_validation.py
+
+import pytest
+import time
+from src.backend.crew_ai.optimization import KeywordVectorStore, KeywordSearchTool
+
+def test_chromadb_initialization_time():
+    """Test ChromaDB initialization completes within 5 seconds."""
+    import tempfile
+    temp_dir = tempfile.mkdtemp()
+    
+    start = time.time()
+    store = KeywordVectorStore(persist_directory=temp_dir)
+    
+    # Add 143 keywords (Browser Library size)
+    keywords = [
+        {"name": f"Keyword{i}", "args": [], "doc": f"Documentation for keyword {i}"}
+        for i in range(143)
+    ]
+    store.add_keywords("Browser", keywords)
+    
+    duration = time.time() - start
+    
+    assert duration < 5.0  # 5 second requirement
+    
+    # Cleanup
+    import shutil
+    shutil.rmtree(temp_dir)
+
+def test_keyword_search_latency():
+    """Test keyword search completes within 100ms."""
+    import tempfile
+    temp_dir = tempfile.mkdtemp()
+    
+    # Setup
+    store = KeywordVectorStore(persist_directory=temp_dir)
+    keywords = [
+        {"name": "Click", "args": ["selector"], "doc": "Clicks element"},
+        {"name": "Fill Text", "args": ["selector", "text"], "doc": "Fills text"},
+        {"name": "Get Text", "args": ["selector"], "doc": "Gets text"},
+    ]
+    store.add_keywords("Browser", keywords)
+    
+    tool = KeywordSearchTool("Browser", store)
+    
+    # Measure search latency
+    start = time.time()
+    result = tool._run("click a button", top_k=3)
+    latency = (time.time() - start) * 1000  # Convert to ms
+    
+    assert latency < 100  # 100ms requirement
+    
+    # Cleanup
+    import shutil
+    shutil.rmtree(temp_dir)
+
+def test_pattern_prediction_latency():
+    """Test pattern prediction completes quickly."""
+    import tempfile
+    temp_dir = tempfile.mkdtemp()
+    
+    # Setup
+    store = KeywordVectorStore(persist_directory=temp_dir)
+    matcher = QueryPatternMatcher(chroma_store=store)
+    
+    # Learn some patterns
+    for i in range(10):
+        matcher.learn_from_execution(
+            f"test query {i}",
+            f"*** Test Cases ***\nTest\n    Keyword{i}"
+        )
+    
+    # Measure prediction latency
+    start = time.time()
+    predicted = matcher.get_relevant_keywords("test query similar")
+    latency = (time.time() - start) * 1000
+    
+    assert latency < 200  # Should be fast
+    
+    # Cleanup
+    import shutil
+    shutil.rmtree(temp_dir)
+
+def test_end_to_end_workflow_time():
+    """Test optimized workflow completes in reasonable time."""
+    start = time.time()
+    
+    result, crew = run_crew(
+        query="search for shoes on Flipkart",
+        model_provider="online",
+        model_name="gemini-2.0-flash-exp"
+    )
+    
+    duration = time.time() - start
+    
+    # Should complete in 30-40 seconds (vs 40-50 baseline)
+    assert duration < 45
+    assert result is not None
+```
+
+### Running Tests
+
+```bash
+# Run all tests
+pytest tests/
+
+# Run specific test file
+pytest tests/test_chroma_store.py
+
+# Run with coverage
+pytest --cov=src/backend/crew_ai/optimization tests/
+
+# Run performance tests only
+pytest tests/test_performance_validation.py -v
+
+# Run integration tests only
+pytest tests/test_integration_optimization.py -v
+```
+
+
+## Code Examples
+
+### Example 1: Basic Optimization Setup
+
+```python
+# In src/backend/crew_ai/crew.py
+
+from src.backend.crew_ai.optimization import (
+    KeywordVectorStore,
+    QueryPatternMatcher,
+    SmartKeywordProvider
+)
+from src.backend.core.config import settings
+
+def run_crew(query: str, model_provider: str, model_name: str, 
+             library_type: str = None, workflow_id: str = ""):
+    """Run CrewAI workflow with optimization."""
+    
+    # Load library context
+    library_context = get_library_context(library_type or settings.ROBOT_LIBRARY)
+    
+    # Initialize optimization if enabled
+    if settings.OPTIMIZATION_ENABLED:
+        # Initialize ChromaDB store
+        chroma_store = KeywordVectorStore(
+            persist_directory=settings.OPTIMIZATION_CHROMA_DB_PATH
+        )
+        
+        # Initialize pattern matcher
+        pattern_matcher = QueryPatternMatcher(chroma_store=chroma_store)
+        
+        # Initialize smart provider
+        smart_provider = SmartKeywordProvider(
+            library_context=library_context,
+            pattern_matcher=pattern_matcher,
+            chroma_store=chroma_store
+        )
+        
+        # Get optimized context
+        optimized_context = smart_provider.get_agent_context(query, "assembler")
+        keyword_search_tool = smart_provider.get_keyword_search_tool()
+    else:
+        # Use baseline behavior
+        optimized_context = library_context.code_assembly_context
+        keyword_search_tool = None
+    
+    # Initialize agents
+    agents = RobotAgents(
+        model_provider,
+        model_name,
+        library_context,
+        optimized_context=optimized_context,
+        keyword_search_tool=keyword_search_tool
+    )
+    
+    # Run workflow
+    crew = Crew(
+        agents=[
+            agents.step_planner_agent(),
+            agents.element_identifier_agent(),
+            agents.code_assembler_agent(),
+            agents.code_validator_agent()
+        ],
+        tasks=[...],
+        verbose=True
+    )
+    
+    result = crew.kickoff()
+    
+    # Learn from successful execution
+    if settings.OPTIMIZATION_ENABLED and result:
+        smart_provider.learn_from_execution(query, result.raw)
+    
+    return result, crew
+```
+
+### Example 2: Custom Keyword Search
+
+```python
+# Custom keyword search with filtering
+
+from src.backend.crew_ai.optimization import KeywordSearchTool
+
+class FilteredKeywordSearchTool(KeywordSearchTool):
+    """Keyword search with custom filtering."""
+    
+    def __init__(self, library_name: str, chroma_store: KeywordVectorStore,
+                 excluded_keywords: List[str] = None):
+        super().__init__(library_name, chroma_store)
+        self.excluded_keywords = excluded_keywords or []
+    
+    def _run(self, query: str, top_k: int = 3) -> str:
+        """Search with filtering."""
+        # Get base results
+        results = self.chroma_store.search(
+            library_name=self.library_name,
+            query=query,
+            top_k=top_k * 2  # Get more to account for filtering
+        )
+        
+        # Filter out excluded keywords
+        filtered = [
+            r for r in results
+            if r["name"] not in self.excluded_keywords
+        ][:top_k]
+        
+        # Format results
+        return json.dumps(filtered, indent=2)
+
+# Usage
+tool = FilteredKeywordSearchTool(
+    "Browser",
+    chroma_store,
+    excluded_keywords=["Deprecated Keyword", "Old Keyword"]
+)
+```
+
+### Example 3: Advanced Pattern Learning
+
+```python
+# Pattern learning with website-specific patterns
+
+from src.backend.crew_ai.optimization import QueryPatternMatcher
+
+class WebsiteAwarePatternMatcher(QueryPatternMatcher):
+    """Pattern matcher with website-specific learning."""
+    
+    def learn_from_execution_with_website(self, 
+                                         user_query: str,
+                                         generated_code: str,
+                                         website_url: str):
+        """Learn pattern with website context."""
+        # Extract keywords
+        keywords = self._extract_keywords_from_code(generated_code)
+        
+        if not keywords:
+            return
+        
+        # Store pattern with website metadata
+        pattern_id = f"pattern_{int(time.time() * 1000)}"
+        self.pattern_collection.add(
+            documents=[user_query],
+            ids=[pattern_id],
+            metadatas=[{
+                "keywords": json.dumps(keywords),
+                "website": website_url,
+                "timestamp": datetime.now().isoformat()
+            }]
+        )
+    
+    def get_relevant_keywords_for_website(self,
+                                         user_query: str,
+                                         website_url: str,
+                                         confidence_threshold: float = 0.7) -> List[str]:
+        """Get keywords filtered by website."""
+        # Search for similar patterns
+        results = self.pattern_collection.query(
+            query_texts=[user_query],
+            n_results=10,
+            where={"website": website_url}  # Filter by website
+        )
+        
+        # Check confidence
+        if not results['ids'][0]:
+            return []
+        
+        top_distance = results['distances'][0][0]
+        similarity = 1 / (1 + top_distance)
+        
+        if similarity < confidence_threshold:
+            return []
+        
+        # Aggregate keywords
+        keyword_counts = {}
+        for metadata in results['metadatas'][0]:
+            keywords = json.loads(metadata['keywords'])
+            for keyword in keywords:
+                keyword_counts[keyword] = keyword_counts.get(keyword, 0) + 1
+        
+        # Return top keywords
+        sorted_keywords = sorted(keyword_counts.items(), key=lambda x: x[1], reverse=True)
+        return [kw for kw, count in sorted_keywords[:10]]
+
+# Usage
+matcher = WebsiteAwarePatternMatcher(chroma_store)
+
+# Learn with website context
+matcher.learn_from_execution_with_website(
+    "search for products",
+    generated_code,
+    "https://flipkart.com"
+)
+
+# Predict for same website
+keywords = matcher.get_relevant_keywords_for_website(
+    "add to cart",
+    "https://flipkart.com"
+)
+```
+
+### Example 4: Custom Context Formatting
+
+```python
+# Custom context formatting for different agent roles
+
+from src.backend.crew_ai.optimization import SmartKeywordProvider
+
+class CustomSmartKeywordProvider(SmartKeywordProvider):
+    """Smart provider with custom context formatting."""
+    
+    def _format_predicted_context(self, 
+                                  predicted_keywords: List[str],
+                                  agent_role: str) -> str:
+        """Custom formatting based on agent role."""
+        # Get core rules
+        core_rules = self.library_context.core_rules
+        
+        # Get keyword docs
+        keyword_docs = self._get_keyword_docs(predicted_keywords)
+        
+        if agent_role == "planner":
+            # Planner needs high-level overview
+            return f"""
+{core_rules}
+
+AVAILABLE KEYWORDS (High-Level):
+{self._format_keyword_list(keyword_docs)}
+
+Focus on planning the test structure and identifying required actions.
+"""
+        
+        elif agent_role == "assembler":
+            # Assembler needs detailed syntax
+            return f"""
+{core_rules}
+
+KEYWORD DOCUMENTATION (Detailed):
+{self._format_keyword_details(keyword_docs)}
+
+Generate Robot Framework code using these exact keywords and syntax.
+"""
+        
+        elif agent_role == "validator":
+            # Validator needs validation rules
+            return f"""
+{core_rules}
+
+VALIDATION RULES:
+- Verify all keywords are from the approved list
+- Check parameter syntax matches documentation
+- Ensure proper indentation and structure
+
+APPROVED KEYWORDS:
+{self._format_keyword_list(keyword_docs)}
+"""
+        
+        return core_rules
+    
+    def _format_keyword_list(self, keyword_docs: List[Dict]) -> str:
+        """Format keywords as simple list."""
+        return "\n".join([
+            f"- {kw['name']}: {kw['description'][:100]}..."
+            for kw in keyword_docs
+        ])
+    
+    def _format_keyword_details(self, keyword_docs: List[Dict]) -> str:
+        """Format keywords with full details."""
+        formatted = []
+        for kw in keyword_docs:
+            formatted.append(f"""
+Keyword: {kw['name']}
+Arguments: {', '.join(kw['args'])}
+Description: {kw['description']}
+Example: {kw['example']}
+""")
+        return "\n".join(formatted)
+
+# Usage
+provider = CustomSmartKeywordProvider(library_context, pattern_matcher, chroma_store)
+
+# Get context for different roles
+planner_context = provider.get_agent_context(query, "planner")
+assembler_context = provider.get_agent_context(query, "assembler")
+validator_context = provider.get_agent_context(query, "validator")
+```
+
+### Example 5: Metrics Collection and Analysis
+
+```python
+# Collecting and analyzing optimization metrics
+
+from src.backend.metrics.workflow_metrics import WorkflowMetrics
+
+def analyze_optimization_performance(workflow_ids: List[str]) -> Dict:
+    """Analyze optimization performance across multiple workflows."""
+    
+    metrics_list = []
+    for workflow_id in workflow_ids:
+        metrics = get_workflow_metrics(workflow_id)
+        metrics_list.append(metrics)
+    
+    # Calculate averages
+    avg_token_usage = sum(m.optimization.token_usage["total"] for m in metrics_list) / len(metrics_list)
+    avg_reduction = sum(m.optimization.context_reduction["reduction_percentage"] for m in metrics_list) / len(metrics_list)
+    avg_search_calls = sum(m.optimization.keyword_search_stats["calls"] for m in metrics_list) / len(metrics_list)
+    
+    # Calculate prediction rate
+    prediction_used_count = sum(1 for m in metrics_list if m.optimization.pattern_learning_stats["prediction_used"])
+    prediction_rate = prediction_used_count / len(metrics_list) * 100
+    
+    # Calculate cost savings
+    baseline_cost = 12000 * 0.000225  # 12K tokens at $0.225 per 1M tokens
+    optimized_cost = avg_token_usage * 0.000225
+    cost_savings = (baseline_cost - optimized_cost) / baseline_cost * 100
+    
+    return {
+        "avg_token_usage": avg_token_usage,
+        "avg_reduction_percentage": avg_reduction,
+        "avg_search_calls": avg_search_calls,
+        "prediction_rate": prediction_rate,
+        "cost_savings_percentage": cost_savings,
+        "total_workflows": len(metrics_list)
+    }
+
+# Usage
+workflow_ids = ["abc-123", "def-456", "ghi-789"]
+analysis = analyze_optimization_performance(workflow_ids)
+
+print(f"Average token usage: {analysis['avg_token_usage']:.0f}")
+print(f"Average reduction: {analysis['avg_reduction_percentage']:.1f}%")
+print(f"Prediction rate: {analysis['prediction_rate']:.1f}%")
+print(f"Cost savings: {analysis['cost_savings_percentage']:.1f}%")
+```
+
+### Example 6: Debugging Optimization Issues
+
+```python
+# Debugging optimization system
+
+from src.backend.crew_ai.optimization import logging_config
+
+# Enable debug logging
+import logging
+logging.getLogger("crew_ai.optimization").setLevel(logging.DEBUG)
+
+def debug_optimization_workflow(query: str):
+    """Run workflow with detailed debugging."""
+    
+    # Initialize components
+    chroma_store = KeywordVectorStore()
+    pattern_matcher = QueryPatternMatcher(chroma_store)
+    smart_provider = SmartKeywordProvider(library_context, pattern_matcher, chroma_store)
+    
+    # Debug pattern learning
+    print("=== Pattern Learning ===")
+    predicted = pattern_matcher.get_relevant_keywords(query)
+    print(f"Predicted keywords: {predicted}")
+    
+    if not predicted:
+        print("No predictions found, checking pattern database...")
+        collection = pattern_matcher.pattern_collection
+        results = collection.get()
+        print(f"Total patterns in database: {len(results['ids'])}")
+    
+    # Debug keyword search
+    print("\n=== Keyword Search ===")
+    tool = smart_provider.get_keyword_search_tool()
+    search_result = tool._run("click button", top_k=3)
+    print(f"Search results: {search_result}")
+    
+    # Debug context generation
+    print("\n=== Context Generation ===")
+    context = smart_provider.get_agent_context(query, "assembler")
+    print(f"Context length: {len(context)} characters")
+    print(f"Context preview: {context[:500]}...")
+    
+    # Run workflow
+    print("\n=== Running Workflow ===")
+    result, crew = run_crew(query, "online", "gemini-2.0-flash-exp")
+    
+    # Debug metrics
+    print("\n=== Metrics ===")
+    metrics = crew.metrics
+    print(f"Token usage: {metrics.optimization.token_usage}")
+    print(f"Keyword search: {metrics.optimization.keyword_search_stats}")
+    print(f"Pattern learning: {metrics.optimization.pattern_learning_stats}")
+    print(f"Context reduction: {metrics.optimization.context_reduction}")
+    
+    return result, crew
+
+# Usage
+result, crew = debug_optimization_workflow("search for shoes on Flipkart")
+```
+
+
+## Performance Considerations
+
+### Memory Usage
+
+**ChromaDB Storage:**
+- In-memory index: ~50-100 MB for 143 keywords
+- Disk storage: ~10-20 MB per library
+- Embedding cache: ~80 MB (sentence-transformers model)
+
+**Pattern Learning:**
+- ChromaDB collection: Grows with usage (~1 KB per pattern)
+- In-memory cache: Minimal (<1 MB)
+
+**Optimization:**
+- Use persistent storage (ChromaDB handles this automatically)
+- Limit pattern database size (keep last 1000 patterns)
+- Monitor memory usage in production
+
+### CPU Usage
+
+**Embedding Generation:**
+- One-time cost at startup (~5 seconds for 143 keywords)
+- Uses CPU for sentence-transformers inference
+- Batched processing for efficiency (32 keywords at a time)
+
+**Semantic Search:**
+- Fast vector similarity computation (<100ms)
+- Uses numpy for vectorized operations
+- Minimal CPU overhead per search
+
+**Optimization:**
+- Pre-compute embeddings at startup
+- Use caching for frequent searches
+- Consider GPU acceleration for large-scale deployments
+
+### Disk I/O
+
+**ChromaDB Persistence:**
+- Writes to disk on collection updates
+- Reads from disk on startup (fast with persistent storage)
+- Minimal I/O during normal operation
+
+**Pattern Learning:**
+- Writes to ChromaDB on each successful execution
+- Reads from ChromaDB on each query prediction
+- ChromaDB handles persistence automatically
+
+**Optimization:**
+- Use SSD for better performance
+- Monitor disk space (grows with patterns)
+- Implement pattern cleanup for long-running systems
+
+### Network Latency
+
+**No External Dependencies:**
+- All processing is local (no API calls)
+- No network latency for embeddings or search
+- Faster and more reliable than cloud-based solutions
+
+**Optimization:**
+- Keep all components local
+- Avoid external embedding APIs
+- Use local models for maximum performance
+
+### Scaling Considerations
+
+**Horizontal Scaling:**
+- Each instance has its own ChromaDB storage
+- Pattern learning is instance-specific
+- Consider shared storage for collaborative learning
+
+**Vertical Scaling:**
+- More CPU → Faster embedding generation
+- More RAM → Larger in-memory caches
+- More disk → More pattern storage
+
+**Optimization Strategies:**
+
+```python
+# Shared ChromaDB storage for multiple instances
+class SharedKeywordVectorStore(KeywordVectorStore):
+    """ChromaDB store with shared network storage."""
+    
+    def __init__(self, shared_directory: str):
+        """Initialize with shared network directory."""
+        super().__init__(persist_directory=shared_directory)
+        self._lock = FileLock(f"{shared_directory}/.lock")
+    
+    def add_keywords(self, library_name: str, keywords: List[Dict]):
+        """Thread-safe keyword addition."""
+        with self._lock:
+            super().add_keywords(library_name, keywords)
+
+# Distributed pattern learning
+class DistributedPatternMatcher(QueryPatternMatcher):
+    """Pattern matcher with distributed storage."""
+    
+    def __init__(self, redis_client):
+        """Initialize with Redis for distributed patterns."""
+        self.redis = redis_client
+        super().__init__(chroma_store)
+    
+    def learn_from_execution(self, user_query: str, generated_code: str):
+        """Store pattern in both local and distributed storage."""
+        # Store locally
+        super().learn_from_execution(user_query, generated_code)
+        
+        # Store in Redis for sharing
+        pattern = {
+            "query": user_query,
+            "keywords": self._extract_keywords_from_code(generated_code),
+            "timestamp": datetime.now().isoformat()
+        }
+        self.redis.lpush("patterns", json.dumps(pattern))
+```
+
+## Debugging and Troubleshooting
+
+### Logging Configuration
+
+The optimization system uses structured logging for debugging:
+
+```python
+# In src/backend/crew_ai/optimization/logging_config.py
+
+import logging
+
+# Create optimization logger
+optimization_logger = logging.getLogger("crew_ai.optimization")
+optimization_logger.setLevel(logging.INFO)
+
+# Add file handler
+file_handler = logging.FileHandler("logs/optimization.log")
+file_handler.setFormatter(logging.Formatter(
+    '%(asctime)s - %(name)s - %(levelname)s - %(message)s'
+))
+optimization_logger.addHandler(file_handler)
+
+# Add console handler for development
+console_handler = logging.StreamHandler()
+console_handler.setLevel(logging.WARNING)
+optimization_logger.addHandler(console_handler)
+```
+
+**Log Levels:**
+- `DEBUG`: Detailed information for debugging (search queries, predictions, etc.)
+- `INFO`: Normal operation (predictions used, search calls, etc.)
+- `WARNING`: Fallback triggered (component failed, using baseline)
+- `ERROR`: Critical failure (optimization disabled entirely)
+
+**Example Logs:**
+
+```
+2024-01-15 10:30:15 - crew_ai.optimization - INFO - ChromaDB initialized with 143 keywords in 4.2s
+2024-01-15 10:30:20 - crew_ai.optimization - INFO - Pattern prediction used for query "login to website" (8 keywords, 0.87 confidence)
+2024-01-15 10:30:25 - crew_ai.optimization - DEBUG - Keyword search: "click button" → 3 results in 78ms
+2024-01-15 10:30:30 - crew_ai.optimization - WARNING - Pattern prediction confidence too low (0.65), falling back to search tool
+2024-01-15 10:30:35 - crew_ai.optimization - ERROR - ChromaDB search failed: Connection timeout, falling back to full context
+```
+
+### Common Issues and Solutions
+
+#### Issue 1: ChromaDB Initialization Fails
+
+**Symptoms:**
+```
+ERROR - ChromaDB initialization failed: Cannot connect to database
+```
+
+**Diagnosis:**
+```python
+# Check ChromaDB directory
+import os
+print(f"ChromaDB path exists: {os.path.exists('./chroma_db')}")
+print(f"ChromaDB path writable: {os.access('./chroma_db', os.W_OK)}")
+
+# Check dependencies
+try:
+    import chromadb
+    print(f"ChromaDB version: {chromadb.__version__}")
+except ImportError:
+    print("ChromaDB not installed")
+```
+
+**Solutions:**
+1. Verify ChromaDB installed: `pip install chromadb==0.4.22`
+2. Check directory permissions: `chmod 755 ./chroma_db`
+3. Check disk space: `df -h`
+4. Review logs for specific error
+
+#### Issue 2: Keyword Search Returns No Results
+
+**Symptoms:**
+```
+WARNING - Keyword search returned 0 results for query "click button"
+```
+
+**Diagnosis:**
+```python
+# Check if keywords are in ChromaDB
+store = KeywordVectorStore()
+collection = store.create_or_get_collection("Browser")
+results = collection.get()
+print(f"Total keywords in collection: {len(results['ids'])}")
+print(f"Sample keywords: {results['ids'][:10]}")
+
+# Test search directly
+search_results = store.search("Browser", "click button", top_k=3)
+print(f"Search results: {search_results}")
+```
+
+**Solutions:**
+1. Verify keywords ingested: Check collection has keywords
+2. Rebuild collection: `store.rebuild_collection("Browser")`
+3. Check query format: Ensure query is descriptive
+4. Lower top_k: Try `top_k=1` to see if any results
+
+#### Issue 3: Pattern Learning Not Predicting
+
+**Symptoms:**
+```
+INFO - Pattern prediction not used (confidence too low: 0.45)
+```
+
+**Diagnosis:**
+```python
+# Check pattern database
+matcher = QueryPatternMatcher(chroma_store)
+collection = matcher.pattern_collection
+results = collection.get()
+print(f"Total patterns: {len(results['ids'])}")
+
+# Test prediction
+predicted = matcher.get_relevant_keywords("test query", confidence_threshold=0.5)
+print(f"Predicted keywords: {predicted}")
+```
+
+**Solutions:**
+1. Need more training data: Run 20+ diverse queries
+2. Lower confidence threshold: Set to 0.6 instead of 0.7
+3. Check pattern storage: Verify patterns are being saved
+4. Review query similarity: Ensure queries are similar enough
+
+#### Issue 4: High Token Usage (No Reduction)
+
+**Symptoms:**
+```
+INFO - Token usage: 11500 (expected: 4000)
+```
+
+**Diagnosis:**
+```python
+# Check optimization status
+print(f"Optimization enabled: {settings.OPTIMIZATION_ENABLED}")
+
+# Check context generation
+provider = SmartKeywordProvider(library_context, pattern_matcher, chroma_store)
+context = provider.get_agent_context(query, "assembler")
+print(f"Context length: {len(context)} characters")
+print(f"Context preview: {context[:200]}...")
+
+# Check metrics
+metrics = crew.metrics
+print(f"Context reduction: {metrics.optimization.context_reduction}")
+```
+
+**Solutions:**
+1. Verify optimization enabled: Check `OPTIMIZATION_ENABLED=true`
+2. Check fallback: Review logs for fallback events
+3. Enable context pruning: Set `OPTIMIZATION_CONTEXT_PRUNING_ENABLED=true`
+4. Lower thresholds: Reduce confidence thresholds
+
+#### Issue 5: Slow Performance
+
+**Symptoms:**
+```
+WARNING - Keyword search took 250ms (expected: <100ms)
+```
+
+**Diagnosis:**
+```python
+import time
+
+# Measure ChromaDB search
+start = time.time()
+results = store.search("Browser", "click button", top_k=3)
+latency = (time.time() - start) * 1000
+print(f"Search latency: {latency:.2f}ms")
+
+# Measure pattern prediction
+start = time.time()
+predicted = matcher.get_relevant_keywords("test query")
+latency = (time.time() - start) * 1000
+print(f"Prediction latency: {latency:.2f}ms")
+```
+
+**Solutions:**
+1. Check system resources: CPU, memory, disk I/O
+2. Verify ChromaDB initialized: First search is slower
+3. Use caching: Enable LRU cache in KeywordSearchTool
+4. Reduce top_k: Lower number of results
+
+### Debugging Tools
+
+**1. Optimization Status Check:**
+
+```python
+def check_optimization_status():
+    """Check optimization system status."""
+    from src.backend.crew_ai.optimization import KeywordVectorStore, QueryPatternMatcher
+    
+    print("=== Optimization Status ===")
+    print(f"Enabled: {settings.OPTIMIZATION_ENABLED}")
+    print(f"ChromaDB path: {settings.OPTIMIZATION_CHROMA_DB_PATH}")
+    
+    # Check ChromaDB
+    try:
+        store = KeywordVectorStore()
+        collection = store.create_or_get_collection("Browser")
+        results = collection.get()
+        print(f"✓ ChromaDB: {len(results['ids'])} keywords")
+    except Exception as e:
+        print(f"✗ ChromaDB: {e}")
+    
+    # Check pattern learning
+    try:
+        matcher = QueryPatternMatcher(store)
+        collection = matcher.pattern_collection
+        results = collection.get()
+        print(f"✓ Pattern Learning: {len(results['ids'])} patterns")
+    except Exception as e:
+        print(f"✗ Pattern Learning: {e}")
+    
+    print("=== Status Check Complete ===")
+
+# Usage
+check_optimization_status()
+```
+
+**2. Performance Profiler:**
+
+```python
+import cProfile
+import pstats
+
+def profile_optimization(query: str):
+    """Profile optimization performance."""
+    profiler = cProfile.Profile()
+    profiler.enable()
+    
+    # Run workflow
+    result, crew = run_crew(query, "online", "gemini-2.0-flash-exp")
+    
+    profiler.disable()
+    
+    # Print stats
+    stats = pstats.Stats(profiler)
+    stats.sort_stats('cumulative')
+    stats.print_stats(20)  # Top 20 functions
+    
+    return result, crew
+
+# Usage
+profile_optimization("search for shoes")
+```
+
+**3. Metrics Dashboard:**
+
+```python
+def print_optimization_dashboard(workflow_ids: List[str]):
+    """Print optimization metrics dashboard."""
+    print("=== Optimization Dashboard ===\n")
+    
+    for workflow_id in workflow_ids:
+        metrics = get_workflow_metrics(workflow_id)
+        
+        print(f"Workflow: {workflow_id}")
+        print(f"  Token Usage: {metrics.optimization.token_usage['total']}")
+        print(f"  Reduction: {metrics.optimization.context_reduction['reduction_percentage']:.1f}%")
+        print(f"  Prediction Used: {metrics.optimization.pattern_learning_stats['prediction_used']}")
+        print(f"  Search Calls: {metrics.optimization.keyword_search_stats['calls']}")
+        print()
+    
+    print("=== Dashboard Complete ===")
+
+# Usage
+print_optimization_dashboard(["abc-123", "def-456", "ghi-789"])
+```
+
+## Best Practices
+
+### Development
+
+1. **Test with optimization disabled first** - Verify baseline behavior works
+2. **Enable optimization incrementally** - Start with one component at a time
+3. **Monitor metrics closely** - Track token usage, prediction rate, search calls
+4. **Use debug logging** - Enable DEBUG level during development
+5. **Write unit tests** - Test each component in isolation
+6. **Profile performance** - Identify bottlenecks early
+
+### Production
+
+1. **Start with conservative settings** - Higher confidence thresholds
+2. **Monitor fallback rate** - Should be <10%
+3. **Track prediction accuracy** - Should improve over time
+4. **Set up alerts** - For high token usage, slow searches, errors
+5. **Regular pattern cleanup** - Keep database size manageable
+6. **Backup ChromaDB** - Before major updates
+
+### Code Quality
+
+1. **Follow type hints** - Use Python type annotations
+2. **Document public APIs** - Clear docstrings for all public methods
+3. **Handle errors gracefully** - Always provide fallback behavior
+4. **Log important events** - Use appropriate log levels
+5. **Write comprehensive tests** - Unit, integration, and performance tests
+6. **Keep components decoupled** - Easy to swap implementations
+
+## Contributing
+
+### Adding New Features
+
+1. **Discuss in GitHub issue** - Propose feature and get feedback
+2. **Follow existing patterns** - Match code style and architecture
+3. **Add tests** - Unit tests for new components
+4. **Update documentation** - Both user and developer docs
+5. **Submit PR** - With clear description and examples
+
+### Code Review Checklist
+
+- [ ] Code follows existing patterns and style
+- [ ] All public methods have docstrings
+- [ ] Type hints used throughout
+- [ ] Unit tests added for new functionality
+- [ ] Integration tests pass
+- [ ] Performance tests pass (if applicable)
+- [ ] Documentation updated
+- [ ] No breaking changes (or clearly documented)
+- [ ] Error handling and logging added
+- [ ] Graceful degradation implemented
+
+## Additional Resources
+
+- [User Guide](OPTIMIZATION.md) - Configuration and usage
+- [Architecture Guide](ARCHITECTURE.md) - Overall system architecture
+- [Configuration Guide](CONFIGURATION.md) - All environment variables
+- [Troubleshooting Guide](TROUBLESHOOTING.md) - Common issues
+- [GitHub Repository](https://github.com/monkscode/Natural-Language-to-Robot-Framework)
+- [GitHub Discussions](https://github.com/monkscode/Natural-Language-to-Robot-Framework/discussions)
+
+---
+
+**Questions or feedback?** Open an issue on GitHub or start a discussion!
diff --git a/src/backend/.env.example b/src/backend/.env.example
index 0b5a649..314fe18 100644
--- a/src/backend/.env.example
+++ b/src/backend/.env.example
@@ -64,3 +64,44 @@ PREFER_REMOTE_DOCKER_IMAGE=true
 # Leave empty to use the default: monkscode/nlrf:latest
 # Example: your-org/custom-nlrf:latest
 REMOTE_DOCKER_IMAGE=monkscode/nlrf:latest
+
+
+# --- CrewAI Performance Optimization Configuration ---
+# Enable/disable the optimization system (pattern learning, ChromaDB, semantic search)
+# When enabled, reduces token usage by 67% through hybrid knowledge architecture
+# Default: false (disabled until fully tested)
+OPTIMIZATION_ENABLED=true
+
+# Path to ChromaDB storage directory for keyword embeddings
+# ChromaDB stores keyword documentation with semantic search capabilities
+# Default: ./chroma_db
+OPTIMIZATION_CHROMA_DB_PATH=./chroma_db
+
+# Path to SQLite database for pattern learning
+# Stores query patterns and keyword usage history for prediction
+# Default: ./data/pattern_learning.db
+OPTIMIZATION_PATTERN_DB_PATH=./data/pattern_learning.db
+
+# Number of keywords to return from semantic search
+# Higher values provide more options but increase token usage
+# Valid range: 1-10
+# Default: 3
+OPTIMIZATION_KEYWORD_SEARCH_TOP_K=3
+
+# Minimum confidence threshold for pattern prediction (0.0-1.0)
+# Higher values require stronger similarity matches before using predictions
+# 0.7 = 70% similarity required
+# Default: 0.7
+OPTIMIZATION_PATTERN_CONFIDENCE_THRESHOLD=0.7
+
+# Enable/disable smart context pruning based on query classification
+# When enabled, only includes keywords relevant to detected action types
+# Reduces context size by ~40% while maintaining accuracy
+# Default: true
+OPTIMIZATION_CONTEXT_PRUNING_ENABLED=true
+
+# Minimum confidence threshold for category classification (0.0-1.0)
+# Higher values require stronger category matches before pruning
+# 0.6 = 60% similarity required
+# Default: 0.6
+OPTIMIZATION_CONTEXT_PRUNING_THRESHOLD=0.6
diff --git a/src/backend/api/endpoints.py b/src/backend/api/endpoints.py
index 73a4209..e7349dc 100644
--- a/src/backend/api/endpoints.py
+++ b/src/backend/api/endpoints.py
@@ -14,6 +14,7 @@ class Query(BaseModel):
 
 class ExecuteRequest(BaseModel):
     robot_code: str
+    user_query: str = None  # Optional: original user query for pattern learning
 
 @router.post('/generate-test')
 async def generate_test_only(query: Query):
@@ -40,14 +41,22 @@ async def execute_test_only(request: ExecuteRequest):
     """
     Execute provided Robot Framework test code in Docker container.
     Accepts user-edited or manually-written code.
+    
+    Optional: Pass user_query for pattern learning from successful executions.
     """
     robot_code = request.robot_code
+    user_query = request.user_query  # Optional: for pattern learning
+    
     if not robot_code or not robot_code.strip():
         raise HTTPException(status_code=400, detail="Robot code not provided")
 
     logging.info(f"[EXECUTE ONLY] Executing user-provided test code ({len(robot_code)} characters)")
+    if user_query:
+        logging.info(f"[EXECUTE ONLY] ✅ User query provided for pattern learning: {user_query[:50]}...")
+    else:
+        logging.warning("[EXECUTE ONLY] ⚠️ No user query provided - pattern learning will be skipped")
 
-    return StreamingResponse(stream_execute_only(robot_code), media_type="text/event-stream")
+    return StreamingResponse(stream_execute_only(robot_code, user_query), media_type="text/event-stream")
 
 @router.post('/generate-and-run')
 async def generate_and_run_streaming(query: Query):
diff --git a/src/backend/core/config.py b/src/backend/core/config.py
index fe5ff33..4acacf4 100644
--- a/src/backend/core/config.py
+++ b/src/backend/core/config.py
@@ -36,6 +36,16 @@ class Settings(BaseSettings):
     MAX_LOCATOR_STRATEGIES: int = Field(default=21, description="Maximum number of locator strategies to try")
     TRACK_LLM_COSTS: bool = Field(default=True, description="Enable/disable LLM cost tracking and logging")
     
+    # Optimization Configuration
+    OPTIMIZATION_ENABLED: bool = Field(default=False, description="Enable/disable optimization system (pattern learning, ChromaDB)")
+    OPTIMIZATION_CHROMA_DB_PATH: str = Field(default="./chroma_db", description="Path to ChromaDB storage directory")
+    OPTIMIZATION_PATTERN_DB_PATH: str = Field(default="./data/pattern_learning.db", description="Path to pattern learning SQLite database")
+    OPTIMIZATION_EMBEDDING_MODEL: str = Field(default="all-MiniLM-L6-v2", description="Sentence transformer model for embeddings (used by ChromaDB)")
+    OPTIMIZATION_KEYWORD_SEARCH_TOP_K: int = Field(default=3, description="Number of keywords to return from search")
+    OPTIMIZATION_PATTERN_CONFIDENCE_THRESHOLD: float = Field(default=0.7, description="Minimum confidence for pattern prediction (0.0-1.0)")
+    OPTIMIZATION_CONTEXT_PRUNING_ENABLED: bool = Field(default=True, description="Enable smart context pruning")
+    OPTIMIZATION_CONTEXT_PRUNING_THRESHOLD: float = Field(default=0.6, description="Minimum confidence for category classification (0.0-1.0)")
+    
     @validator('ROBOT_LIBRARY')
     def validate_robot_library(cls, v):
         """Validate that ROBOT_LIBRARY is either 'selenium' or 'browser'."""
@@ -63,6 +73,13 @@ def validate_max_locator_strategies(cls, v):
         if v < 1 or v > 50:
             raise ValueError(f"MAX_LOCATOR_STRATEGIES must be between 1 and 50, got {v}")
         return v
+    
+    @validator('OPTIMIZATION_PATTERN_CONFIDENCE_THRESHOLD', 'OPTIMIZATION_CONTEXT_PRUNING_THRESHOLD')
+    def validate_confidence_threshold(cls, v):
+        """Validate that confidence thresholds are between 0.0 and 1.0."""
+        if not 0.0 <= v <= 1.0:
+            raise ValueError(f"Confidence threshold must be between 0.0 and 1.0, got {v}")
+        return v
 
     class Config:
         env_file = ".env"
diff --git a/src/backend/core/workflow_metrics.py b/src/backend/core/workflow_metrics.py
index 54a241d..c6137d1 100644
--- a/src/backend/core/workflow_metrics.py
+++ b/src/backend/core/workflow_metrics.py
@@ -49,10 +49,117 @@ class WorkflowMetrics:
     custom_action_usage_count: int = 0
     session_id: Optional[str] = None
     
+    # Optimization metrics (NEW)
+    token_usage: Dict[str, int] = None
+    keyword_search_stats: Dict[str, Any] = None
+    pattern_learning_stats: Dict[str, Any] = None
+    context_reduction: Dict[str, Any] = None
+    
+    def __post_init__(self):
+        """Initialize optimization metrics with default values if not provided."""
+        if self.token_usage is None:
+            self.token_usage = {
+                "step_planner": 0,
+                "element_identifier": 0,
+                "code_assembler": 0,
+                "code_validator": 0,
+                "total": 0
+            }
+        
+        if self.keyword_search_stats is None:
+            self.keyword_search_stats = {
+                "calls": 0,
+                "total_latency_ms": 0.0,
+                "avg_latency_ms": 0.0,
+                "returned_keywords": [],
+                "accuracy": 0.0
+            }
+        
+        if self.pattern_learning_stats is None:
+            self.pattern_learning_stats = {
+                "prediction_used": False,
+                "predicted_keywords_count": 0,
+                "prediction_accuracy": 0.0
+            }
+        
+        if self.context_reduction is None:
+            self.context_reduction = {
+                "baseline_tokens": 0,
+                "optimized_tokens": 0,
+                "reduction_percentage": 0.0
+            }
+    
+    def track_token_usage(self, agent_name: str, token_count: int) -> None:
+        """
+        Track token usage per agent.
+        
+        Args:
+            agent_name: Name of the agent (step_planner, element_identifier, code_assembler, code_validator)
+            token_count: Number of tokens used by the agent
+        """
+        if agent_name in self.token_usage:
+            self.token_usage[agent_name] = token_count
+            self.token_usage["total"] = sum(
+                v for k, v in self.token_usage.items() if k != "total"
+            )
+    
+    def track_keyword_search(self, latency_ms: float, returned_keywords: List[str]) -> None:
+        """
+        Track keyword search tool usage.
+        
+        Args:
+            latency_ms: Search latency in milliseconds
+            returned_keywords: List of keyword names returned by search
+        """
+        self.keyword_search_stats["calls"] += 1
+        self.keyword_search_stats["total_latency_ms"] += latency_ms
+        self.keyword_search_stats["avg_latency_ms"] = (
+            self.keyword_search_stats["total_latency_ms"] / 
+            self.keyword_search_stats["calls"]
+        )
+        # Store returned keywords for accuracy calculation later
+        self.keyword_search_stats["returned_keywords"].extend(returned_keywords)
+    
+    def track_pattern_learning(self, predicted: bool, keyword_count: int, accuracy: float = 0.0) -> None:
+        """
+        Track pattern learning usage.
+        
+        Args:
+            predicted: Whether prediction was used
+            keyword_count: Number of predicted keywords
+            accuracy: Prediction accuracy (0.0-1.0)
+        """
+        self.pattern_learning_stats["prediction_used"] = predicted
+        self.pattern_learning_stats["predicted_keywords_count"] = keyword_count
+        self.pattern_learning_stats["prediction_accuracy"] = accuracy
+    
+    def track_context_reduction(self, baseline: int, optimized: int) -> None:
+        """
+        Track context size reduction.
+        
+        Args:
+            baseline: Baseline token count (without optimization)
+            optimized: Optimized token count (with optimization)
+        """
+        self.context_reduction["baseline_tokens"] = baseline
+        self.context_reduction["optimized_tokens"] = optimized
+        self.context_reduction["reduction_percentage"] = (
+            ((baseline - optimized) / baseline * 100) if baseline > 0 else 0.0
+        )
+    
     def to_dict(self) -> Dict[str, Any]:
         """Convert to dictionary with ISO format timestamp."""
         data = asdict(self)
         data['timestamp'] = self.timestamp.isoformat()
+        
+        # Add optimization metrics section
+        data['optimization'] = {
+            'token_usage': self.token_usage,
+            'keyword_search': self.keyword_search_stats,
+            'pattern_learning': self.pattern_learning_stats,
+            'context_reduction': self.context_reduction
+        }
+        
         return data
     
     @classmethod
@@ -111,6 +218,21 @@ def from_dict(cls, data: Dict[str, Any]) -> 'WorkflowMetrics':
         data.setdefault('custom_action_usage_count', 0)
         data.setdefault('session_id', None)
         
+        # Handle optimization metrics (backward compatibility)
+        # Check if optimization section exists in data
+        if 'optimization' in data:
+            opt = data.pop('optimization')
+            data.setdefault('token_usage', opt.get('token_usage'))
+            data.setdefault('keyword_search_stats', opt.get('keyword_search'))
+            data.setdefault('pattern_learning_stats', opt.get('pattern_learning'))
+            data.setdefault('context_reduction', opt.get('context_reduction'))
+        else:
+            # Set defaults for optimization metrics if not present
+            data.setdefault('token_usage', None)
+            data.setdefault('keyword_search_stats', None)
+            data.setdefault('pattern_learning_stats', None)
+            data.setdefault('context_reduction', None)
+        
         return cls(**data)
 
 
@@ -261,6 +383,37 @@ def get_workflow_metrics_collector() -> WorkflowMetricsCollector:
     return _metrics_collector
 
 
+def count_tokens(text: str) -> int:
+    """
+    Count tokens in text using simple word-based estimation.
+    
+    This is a simple approximation: 1 token ≈ 0.75 words (or 1 word ≈ 1.33 tokens).
+    For more accurate counting, consider using tiktoken library.
+    
+    Args:
+        text: Text to count tokens for
+    
+    Returns:
+        Estimated token count
+    
+    Example:
+        >>> count_tokens("Hello world, this is a test")
+        8
+    """
+    if not text:
+        return 0
+    
+    # Simple word-based estimation
+    # Split on whitespace and count words
+    words = text.split()
+    
+    # Approximate: 1 word ≈ 1.33 tokens (or 0.75 words per token)
+    # This is a rough estimate based on typical English text
+    estimated_tokens = int(len(words) * 1.33)
+    
+    return estimated_tokens
+
+
 def calculate_crewai_cost(usage_metrics: dict, model_name: str = "gemini-2.0-flash-exp") -> dict:
     """
     Calculate cost from CrewAI usage_metrics.
diff --git a/src/backend/crew_ai/agents.py b/src/backend/crew_ai/agents.py
index 67adce5..76d0a23 100644
--- a/src/backend/crew_ai/agents.py
+++ b/src/backend/crew_ai/agents.py
@@ -50,7 +50,10 @@ def get_llm(model_provider, model_name):
 
 
 class RobotAgents:
-    def __init__(self, model_provider, model_name, library_context=None):
+    def __init__(self, model_provider, model_name, library_context=None, 
+                 optimized_context=None, keyword_search_tool=None,
+                 planner_context=None, identifier_context=None,
+                 assembler_context=None, validator_context=None):
         """
         Initialize Robot Framework agents.
 
@@ -58,19 +61,98 @@ def __init__(self, model_provider, model_name, library_context=None):
             model_provider: "local" or "online"
             model_name: Model identifier
             library_context: LibraryContext instance (optional, for dynamic keyword knowledge)
+            optimized_context: DEPRECATED - Use assembler_context instead (kept for backward compatibility)
+            keyword_search_tool: KeywordSearchTool instance (optional, added to code assembler tools)
+            planner_context: Optimized context for Test Automation Planner (optional)
+            identifier_context: Optimized context for Element Identifier (optional, currently unused)
+            assembler_context: Optimized context for Code Assembler (optional)
+            validator_context: Optimized context for Code Validator (optional)
         """
         self.llm = get_llm(model_provider, model_name)
         self.library_context = library_context
+        self.keyword_search_tool = keyword_search_tool
+        
+        # Handle backward compatibility for optimized_context (deprecated)
+        if optimized_context is not None and assembler_context is None:
+            logger.warning(
+                "⚠️ DEPRECATION WARNING: 'optimized_context' parameter is deprecated. "
+                "Use 'assembler_context' instead for clarity and consistency."
+            )
+            assembler_context = optimized_context
+        
+        # Role-specific optimized contexts
+        self.planner_context = planner_context
+        self.identifier_context = identifier_context  # Currently unused by element_identifier_agent
+        self.assembler_context = assembler_context
+        self.validator_context = validator_context
+
+    def _get_agent_context(self, agent_type: str) -> str:
+        """
+        Unified context retrieval with consistent priority chain.
+        
+        Priority:
+        1. Optimized context (from SmartKeywordProvider - pattern learning/zero-context+tool)
+        2. Library context (static context from library_context)
+        3. Empty string (graceful degradation)
+        
+        Args:
+            agent_type: "planner", "assembler", or "validator"
+        
+        Returns:
+            Context string with appropriate formatting
+        """
+        # Map agent type to optimized context attribute
+        optimized_context_map = {
+            "planner": self.planner_context,
+            "assembler": self.assembler_context,
+            "validator": self.validator_context
+        }
+        
+        # Map agent type to library context property
+        library_context_map = {
+            "planner": "planning_context",
+            "assembler": "code_assembly_context",
+            "validator": "validation_context"
+        }
+        
+        optimized_context = optimized_context_map.get(agent_type)
+        
+        # Priority 1: Use optimized context if available
+        if optimized_context:
+            logger.info(f"🎯 {agent_type.capitalize()} using optimized context")
+            return f"\n\n{optimized_context}"
+        
+        # Priority 2: Fall back to library context
+        if self.library_context:
+            library_property = library_context_map.get(agent_type)
+            if library_property:
+                static_context = getattr(self.library_context, library_property)
+                logger.info(f"📚 {agent_type.capitalize()} using static library context (optimization not available)")
+                return f"\n\n{static_context}"
+        
+        # Priority 3: Graceful degradation
+        logger.warning(f"⚠️ {agent_type.capitalize()} has no context available - using minimal validation")
+        return ""
 
     def step_planner_agent(self) -> Agent:
-        # Get library-specific context if available
-        library_knowledge = ""
+        # Step Planner needs MINIMAL context - just library name and core principles
+        # It doesn't need keyword details - that's for the Code Assembler
+        library_name = self.library_context.library_name if self.library_context else 'Robot Framework'
+        
+        # Minimal library-specific guidance (no keyword lists!)
+        library_guidance = ""
         if self.library_context:
-            library_knowledge = f"\n\n{self.library_context.planning_context}"
+            library_guidance = f"""
+
+**{library_name} CORE PRINCIPLES:**
+- Use appropriate keywords for: navigation, input, clicking, text extraction
+- Browser Library has auto-waiting (no explicit waits needed)
+- Focus on high-level actions, not implementation details
+"""
 
         return Agent(
             role="Test Automation Planner",
-            goal=f"Break down a natural language query into a structured series of high-level test steps for Robot Framework using {self.library_context.library_name if self.library_context else 'Robot Framework'}. ONLY include elements and actions explicitly mentioned in the user's query.",
+            goal=f"Break down a natural language query into a structured series of high-level test steps for Robot Framework using {library_name}. ONLY include elements and actions explicitly mentioned in the user's query.",
             backstory=(
                 "You are an expert test automation planner with a strict focus on user requirements. "
                 "Your task is to analyze the user's query and convert ONLY the explicitly mentioned actions into structured test steps. "
@@ -81,8 +163,9 @@ def step_planner_agent(self) -> Agent:
                 "4. The browser automation will handle popups contextually - you don't need to\n"
                 "5. If user says 'search for shoes', create steps for: search input + enter. Nothing else.\n"
                 "6. If user says 'get product name', create step for: get product name. Nothing else.\n"
-                "7. Be meticulous but ONLY for what user explicitly asked for."
-                f"{library_knowledge}"
+                "7. Be meticulous but ONLY for what user explicitly asked for.\n"
+                "8. Create HIGH-LEVEL steps - the Code Assembler will handle keyword details."
+                f"{library_guidance}"
             ),
             llm=self.llm,
             verbose=True,
@@ -92,139 +175,13 @@ def step_planner_agent(self) -> Agent:
     def element_identifier_agent(self) -> Agent:
         return Agent(
             role="Advanced Web Element Locator Specialist with Batch Vision AI",
-            goal="Use the batch_browser_automation tool to find ALL web element locators in ONE browser session with full context. Process all elements together for maximum efficiency and context awareness.",
+            goal="Use batch_browser_automation to find ALL element locators in ONE call.",
             backstory=(
-                "You are an expert in web element identification for Robot Framework automation "
-                "with cutting-edge BATCH vision AI capabilities powered by browser-use. "
-                "\n\n⚠️ **CRITICAL REQUIREMENT - BATCH PROCESSING MODE**\n"
-                "You have ONE PRIMARY TOOL: batch_browser_automation\n"
-                "You MUST collect ALL elements from the test steps and process them in ONE batch call.\n"
-                "This keeps the browser session alive, preserves context, and handles popups intelligently.\n"
-                "\n\n**YOUR WORKFLOW:**\n"
-                "1. **Analyze Context:** Read ALL test steps from the plan\n"
-                "2. **Collect Elements:** Build a list of ALL elements that need locators\n"
-                "3. **Extract URL:** Identify the target URL from the steps (e.g., Open Browser step)\n"
-                "4. **Call Batch Tool ONCE:** Use batch_browser_automation with ALL elements\n"
-                "5. **Map Results:** Add the returned locators to each corresponding step\n"
-                "\n\n**BATCH TOOL FORMAT (USE THIS):**\n"
-                "```\n"
-                "Action: batch_browser_automation\n"
-                "Action Input: {\n"
-                "    \"elements\": [\n"
-                "        {\"id\": \"element_1\", \"description\": \"search box in header\", \"action\": \"input\"},\n"
-                "        {\"id\": \"element_2\", \"description\": \"first product card\", \"action\": \"click\"},\n"
-                "        {\"id\": \"element_3\", \"description\": \"product price in first card\", \"action\": \"get_text\"}\n"
-                "    ],\n"
-                "    \"url\": \"https://www.flipkart.com\",\n"
-                "    \"user_query\": \"Search for shoes and get first product price\"\n"
-                "}\n"
-                "```\n"
-                "\n\n**CONCRETE EXAMPLE:**\n"
-                "\n**Input Steps:**\n"
-                "```\n"
-                "[\n"
-                "    {\"keyword\": \"Open Browser\", \"value\": \"https://www.flipkart.com\"},\n"
-                "    {\"keyword\": \"Input Text\", \"element_description\": \"search box\", \"value\": \"shoes\"},\n"
-                "    {\"keyword\": \"Press Keys\", \"element_description\": \"search box\", \"value\": \"RETURN\"},\n"
-                "    {\"keyword\": \"Get Text\", \"element_description\": \"first product name\"},\n"
-                "    {\"keyword\": \"Get Text\", \"element_description\": \"first product price\"}\n"
-                "]\n"
-                "```\n"
-                "\n**What You Do:**\n"
-                "1. Identify URL: https://www.flipkart.com\n"
-                "2. Collect elements needing locators:\n"
-                "   - search box (for steps 2 & 3)\n"
-                "   - first product name (for step 4)\n"
-                "   - first product price (for step 5)\n"
-                "\n3. Call batch tool:\n"
-                "```\n"
-                "Action: batch_browser_automation\n"
-                "Action Input: {\n"
-                "    \"elements\": [\n"
-                "        {\"id\": \"elem_1\", \"description\": \"search box in header\", \"action\": \"input\"},\n"
-                "        {\"id\": \"elem_2\", \"description\": \"first product name element in search results\", \"action\": \"get_text\"},\n"
-                "        {\"id\": \"elem_3\", \"description\": \"first product price element in search results\", \"action\": \"get_text\"}\n"
-                "    ],\n"
-                "    \"url\": \"https://www.flipkart.com\",\n"
-                "    \"user_query\": \"Search for shoes and get first product name and price\"\n"
-                "}\n"
-                "```\n"
-                "\n4. Receive response:\n"
-                "```json\n"
-                "{\n"
-                "    \"locator_mapping\": {\n"
-                "        \"elem_1\": {\"best_locator\": \"name=q\", \"found\": true},\n"
-                "        \"elem_2\": {\"best_locator\": \"xpath=(//div[@class='product'])[1]//span[@class='name']\", \"found\": true},\n"
-                "        \"elem_3\": {\"best_locator\": \"xpath=(//div[@class='product'])[1]//span[@class='price']\", \"found\": true}\n"
-                "    }\n"
-                "}\n"
-                "```\n"
-                "\n5. Map locators back to steps:\n"
-                "   - Step 2 & 3 → locator: \"name=q\"\n"
-                "   - Step 4 → locator: \"xpath=(//div[@class='product'])[1]//span[@class='name']\"\n"
-                "   - Step 5 → locator: \"xpath=(//div[@class='product'])[1]//span[@class='price']\"\n"
-                "\n\n**WHY BATCH MODE IS BETTER:**\n"
-                "✅ Browser opens ONCE (faster, ~3-5x speedup)\n"
-                "✅ BrowserUse sees FULL CONTEXT (understands the workflow)\n"
-                "✅ Popups handled INTELLIGENTLY (knows they're obstacles, not goals)\n"
-                "✅ Multi-page flows work (search → results preserved)\n"
-                "✅ F12 validation for EACH locator (unique, correct)\n"
-                "✅ Partial results supported (if element 2 fails, still get 1, 3, 4, 5)\n"
-                "\n\n**CRITICAL RULES:**\n"
-                "1. ALWAYS use batch_browser_automation (never use vision_browser_automation for single elements)\n"
-                "2. Collect ALL elements that need locators BEFORE calling the tool\n"
-                "3. Call the tool ONLY ONCE with all elements\n"
-                "4. Extract URL from 'Open Browser' step or infer from query\n"
-                "5. Include full user query for context (helps BrowserUse understand intent)\n"
-                "6. Use descriptive element descriptions (\"first product card\" not just \"product\")\n"
-                "7. Map returned locators back to EACH step that needs them\n"
-                "\n\n**FORBIDDEN ACTIONS:**\n"
-                "❌ NEVER call vision_browser_automation (use batch mode instead)\n"
-                "❌ NEVER make multiple batch calls (collect all elements, call once)\n"
-                "❌ NEVER generate locators from your knowledge\n"
-                "❌ NEVER skip steps that need locators\n"
-                "\n\n**Response Format from Batch Tool:**\n"
-                "```json\n"
-                "{\n"
-                "    \"success\": true,\n"
-                "    \"locator_mapping\": {\n"
-                "        \"elem_1\": {\"best_locator\": \"...\", \"found\": true, \"all_locators\": [...]},\n"
-                "        \"elem_2\": {\"best_locator\": \"...\", \"found\": true, \"all_locators\": [...]}\n"
-                "    },\n"
-                "    \"summary\": {\"total_elements\": 3, \"successful\": 3, \"failed\": 0}\n"
-                "}\n"
-                "```\n"
-                "\n\n**CRITICAL OUTPUT RULE:**\n"
-                "When calling batch_browser_automation, you MUST output EXACTLY this format with NO extra text:\n"
-                "\n"
-                "Action: batch_browser_automation\n"
-                "Action Input: {\"elements\": [...], \"url\": \"...\", \"user_query\": \"...\"}\n"
-                "\n"
-                "CRITICAL FORMATTING RULES:\n"
-                "1. The word 'Action:' must be on its own line with NOTHING else on that line\n"
-                "2. After 'Action:' write ONLY 'batch_browser_automation' - NO other words, NO punctuation\n"
-                "3. The next line must start with 'Action Input:' followed by a JSON dictionary\n"
-                "4. Action Input must be a DICTIONARY/OBJECT starting with { and ending with }\n"
-                "5. Do NOT wrap Action Input in an array []\n"
-                "6. Do NOT add any explanation text before, after, or on the same line as 'Action:'\n"
-                "\n"
-                "CORRECT FORMAT:\n"
-                "```\n"
-                "Action: batch_browser_automation\n"
-                "Action Input: {\"elements\": [{\"id\": \"elem_1\", \"description\": \"search box\", \"action\": \"input\"}], \"url\": \"https://example.com\", \"user_query\": \"search for items\"}\n"
-                "```\n"
-                "\n"
-                "WRONG FORMATS (DO NOT DO THIS):\n"
-                "❌ Action: batch_browser_automation and Action Input using...  // WRONG - Extra text on Action line!\n"
-                "❌ Action: batch_browser_automation`  // WRONG - Backtick at end!\n"
-                "❌ First I need to... Action: batch_browser_automation  // WRONG - Text before Action!\n"
-                "❌ Action Input: [{\"elements\": [...]}]  // WRONG - Array instead of dictionary!\n"
-                "❌ Action Input: {\"elements\": [...]} and then...  // WRONG - Text after Action Input!\n"
-                "\n"
-                "REMEMBER: The Action line must contain ONLY 'Action: batch_browser_automation' with NO other text.\n"
-                "\n"
-                "**Remember:** Batch mode is ALWAYS better because BrowserUse works best with full context. "
-                "Even for 1-2 elements, use batch mode. NO EXCEPTIONS."
+                "Expert web element locator using batch vision AI. "
+                "Workflow: (1) Collect ALL elements from test steps, (2) Extract URL, (3) Call batch_browser_automation ONCE with all elements, (4) Map locators to steps. "
+                "Tool format: Action: batch_browser_automation | Action Input: {\"elements\": [{\"id\": \"elem_1\", \"description\": \"...\", \"action\": \"input/click/get_text\"}], \"url\": \"...\", \"user_query\": \"...\"}. "
+                "CRITICAL: Action line must have ONLY 'batch_browser_automation' with NO extra text. Action Input must be a dict {}, NOT array []. "
+                "Benefits: Browser opens once (3-5x faster), full context awareness, intelligent popup handling, validated locators."
             ),
             # NEW: Batch processing tool for multiple elements
             tools=[batch_browser_use_tool],
@@ -234,10 +191,8 @@ def element_identifier_agent(self) -> Agent:
         )
 
     def code_assembler_agent(self) -> Agent:
-        # Get library-specific context if available
-        library_knowledge = ""
-        if self.library_context:
-            library_knowledge = f"\n\n{self.library_context.code_assembly_context}"
+        # Get context via unified method with consistent priority chain
+        library_knowledge = self._get_agent_context("assembler")
 
         return Agent(
             role="Robot Framework Code Generator (Output ONLY Code)",
@@ -302,6 +257,7 @@ def code_assembler_agent(self) -> Agent:
                 "Your goal is to learn from validation feedback and produce corrected code that passes validation."
                 f"{library_knowledge}"
             ),
+            tools=[self.keyword_search_tool] if self.keyword_search_tool else [],
             llm=self.llm,
             verbose=True,
             allow_delegation=True,
@@ -311,46 +267,27 @@ def code_validator_agent(self) -> Agent:
         # Import settings to access MAX_AGENT_ITERATIONS
         from ..core.config import settings
 
-        # Get library-specific context if available
-        library_knowledge = ""
-        if self.library_context:
-            library_knowledge = f"\n\n{self.library_context.validation_context}"
+        # Get context via unified method with consistent priority chain
+        library_knowledge = self._get_agent_context("validator")
+
+        # Build tools list - add keyword_search_tool if available
+        # This allows validator to look up keyword details for validation
+        tools = []
+        if self.keyword_search_tool:
+            tools.append(self.keyword_search_tool)
+            logger.info("🔧 Validator has keyword_search_tool access for keyword verification")
 
         return Agent(
             role="Robot Framework Linter and Quality Assurance Engineer",
-            goal=f"Validate the generated Robot Framework code for correctness and adherence to {self.library_context.library_name if self.library_context else 'Robot Framework'} rules, and delegate fixes to Code Assembly Agent if errors are found.",
+            goal=f"Validate Robot Framework code for {self.library_context.library_name if self.library_context else 'Robot Framework'} correctness. Delegate fixes if errors found.",
             backstory=(
-                "You are an expert Robot Framework linter. Your sole task is to validate the provided "
-                "Robot Framework code for syntax errors, correct keyword usage, and adherence to critical rules. "
-                "You must be thorough and provide a clear validation result.\n\n"
-                "**DELEGATION WORKFLOW:**\n"
-                "When you find errors in the code, you MUST follow this workflow:\n"
-                "1. Identify and document all syntax errors, incorrect keyword usage, and rule violations\n"
-                "2. Create a detailed fix request with:\n"
-                "   - Specific line numbers where errors occur\n"
-                "   - Clear description of each error\n"
-                "   - Examples of correct syntax for each issue\n"
-                "   - Relevant Robot Framework rules being violated\n"
-                "3. Delegate the fix request to the Code Assembly Agent with clear, actionable instructions\n"
-                "4. The Code Assembly Agent will regenerate the code incorporating your feedback\n"
-                "5. You will then validate the regenerated code and repeat if necessary\n\n"
-                "**CRITICAL DELEGATION INSTRUCTIONS:**\n"
-                "When you find errors, create a detailed fix request and delegate to Code Assembly Agent.\n"
-                "Your delegation message should include:\n"
-                "- A summary of all errors found\n"
-                "- Specific corrections needed for each error\n"
-                "- Code examples showing the correct implementation\n"
-                "- Priority ranking if multiple errors exist (fix critical syntax errors first)\n\n"
-                "**VALIDATION CRITERIA:**\n"
-                "- Syntax correctness (indentation, spacing, structure)\n"
-                "- Correct keyword usage for the target library\n"
-                "- Proper variable assignments for keywords that return values\n"
-                "- Valid locator formats\n"
-                "- Correct test case structure\n\n"
-                "If the code is valid, clearly state 'VALID' and provide a brief summary. "
-                "If errors are found, immediately delegate to Code Assembly Agent with detailed fix instructions."
+                "Expert Robot Framework validator. Check: syntax, keyword usage, variable assignments, locator formats, test structure. "
+                "Use keyword_search tool to verify keyword details (arguments, return values, syntax) when needed. "
+                "If VALID: Return JSON {\"valid\": true, \"reason\": \"...\"}. "
+                "If INVALID: Document errors with line numbers, then delegate to Code Assembly Agent with fix instructions."
                 f"{library_knowledge}"
             ),
+            tools=tools,
             llm=self.llm,
             verbose=True,
             allow_delegation=True,
diff --git a/src/backend/crew_ai/crew.py b/src/backend/crew_ai/crew.py
index 4a100a3..2a55742 100644
--- a/src/backend/crew_ai/crew.py
+++ b/src/backend/crew_ai/crew.py
@@ -2,6 +2,8 @@
 from src.backend.crew_ai.agents import RobotAgents
 from src.backend.crew_ai.tasks import RobotTasks
 from src.backend.crew_ai.llm_output_cleaner import LLMOutputCleaner, formatting_monitor
+from src.backend.core.workflow_metrics import WorkflowMetrics, count_tokens
+from datetime import datetime
 import re
 import logging
 
@@ -64,6 +66,7 @@ def run_crew(query: str, model_provider: str, model_name: str, library_type: str
       are now used without wrappers as Google Gemini API has sufficient rate limits.
     - Popup handling is done contextually by BrowserUse agents, not as a separate step.
     - Library context is loaded dynamically based on ROBOT_LIBRARY config setting.
+    - Optimization system (pattern learning, ChromaDB) can be enabled via OPTIMIZATION_ENABLED config.
     """
     # Load library context based on configuration
     from src.backend.core.config import settings
@@ -78,8 +81,139 @@ def run_crew(query: str, model_provider: str, model_name: str, library_type: str
     logger.info(
         f"✅ Loaded {library_context.library_name} context with dynamic keywords")
 
+    # Initialize metrics for optimization tracking
+    optimization_metrics = None
+    if settings.OPTIMIZATION_ENABLED:
+        # Create a temporary metrics object for tracking optimization metrics
+        # This will be merged with the main workflow metrics later
+        optimization_metrics = WorkflowMetrics(
+            workflow_id=workflow_id or "temp",
+            timestamp=datetime.now(),
+            url=extract_url_from_query(query),
+            total_llm_calls=0,
+            total_cost=0.0,
+            execution_time=0.0
+        )
+    
+    # Initialize optimization system if enabled
+    optimized_context = None
+    keyword_search_tool = None
+    smart_provider = None
+    baseline_context_tokens = 0
+    optimized_context_tokens = 0
+    
+    if settings.OPTIMIZATION_ENABLED:
+        try:
+            logger.info("🚀 Optimization system enabled - initializing components")
+            from src.backend.crew_ai.optimization import (
+                KeywordVectorStore,
+                QueryPatternMatcher,
+                SmartKeywordProvider,
+                ContextPruner
+            )
+            
+            # Initialize ChromaDB vector store
+            vector_store = KeywordVectorStore(
+                persist_directory=settings.OPTIMIZATION_CHROMA_DB_PATH
+            )
+            
+            # Ensure collection is ready (auto-rebuild if version mismatch)
+            vector_store.ensure_collection_ready(library_context.library_name)
+            
+            # Initialize pattern matcher (with ChromaDB for query embeddings)
+            pattern_matcher = QueryPatternMatcher(
+                db_path=settings.OPTIMIZATION_PATTERN_DB_PATH,
+                chroma_store=vector_store  # Pass ChromaDB store for query embeddings
+            )
+            
+            # Initialize context pruner if enabled
+            context_pruner = None
+            if settings.OPTIMIZATION_CONTEXT_PRUNING_ENABLED:
+                try:
+                    logger.info("🔍 Initializing context pruner...")
+                    context_pruner = ContextPruner()
+                    logger.info("✅ Context pruner initialized")
+                except Exception as e:
+                    logger.warning(f"⚠️ Failed to initialize context pruner: {e}")
+                    logger.warning("   Context pruning will be disabled")
+            
+            # Initialize smart keyword provider with metrics
+            smart_provider = SmartKeywordProvider(
+                library_context=library_context,
+                pattern_matcher=pattern_matcher,
+                vector_store=vector_store,
+                context_pruner=context_pruner,
+                pruning_enabled=settings.OPTIMIZATION_CONTEXT_PRUNING_ENABLED,
+                pruning_threshold=settings.OPTIMIZATION_CONTEXT_PRUNING_THRESHOLD,
+                metrics=optimization_metrics
+            )
+            
+            # Calculate baseline context size (full context)
+            baseline_context = library_context.code_assembly_context
+            baseline_context_tokens = count_tokens(baseline_context)
+            
+            # Get optimized contexts for ALL agents
+            logger.info("🎯 Generating optimized contexts for all agents...")
+            planner_context = smart_provider.get_agent_context(query, "planner")
+            # Identifier context skipped - element_identifier_agent doesn't use context
+            # It only needs batch_browser_automation tool, no keyword knowledge required
+            identifier_context = None
+            assembler_context = smart_provider.get_agent_context(query, "assembler")
+            validator_context = smart_provider.get_agent_context(query, "validator")
+            
+            # Calculate total optimized tokens (skip None values)
+            planner_tokens = count_tokens(planner_context)
+            identifier_tokens = 0  # Not generated, saves ~50-100ms per workflow
+            assembler_tokens = count_tokens(assembler_context)
+            validator_tokens = count_tokens(validator_context)
+            optimized_context_tokens = assembler_tokens  # For backward compatibility metric
+            
+            logger.info(f"📊 Context sizes: Planner={planner_tokens}, Identifier=N/A (skipped), Assembler={assembler_tokens}, Validator={validator_tokens}")
+            
+            # Track context reduction (using assembler as reference)
+            if optimization_metrics:
+                optimization_metrics.track_context_reduction(
+                    baseline=baseline_context_tokens,
+                    optimized=optimized_context_tokens
+                )
+                logger.info(
+                    f"📊 Context reduction (assembler): {baseline_context_tokens} -> {optimized_context_tokens} tokens "
+                    f"({optimization_metrics.context_reduction['reduction_percentage']:.1f}% reduction)"
+                )
+            
+            # Get keyword search tool
+            keyword_search_tool = smart_provider.get_keyword_search_tool()
+            
+            logger.info("✅ Optimization system initialized successfully for ALL agents")
+            
+        except Exception as e:
+            logger.error(f"❌ Failed to initialize optimization system: {e}")
+            logger.warning("⚠️ Falling back to baseline behavior (full context)")
+            planner_context = None
+            identifier_context = None
+            assembler_context = None
+            validator_context = None
+            keyword_search_tool = None
+            smart_provider = None
+            optimization_metrics = None
+    else:
+        logger.info("ℹ️ Optimization system disabled (OPTIMIZATION_ENABLED=False)")
+        planner_context = None
+        identifier_context = None
+        assembler_context = None
+        validator_context = None
+
     # Initialize agents and tasks with library context and workflow_id
-    agents = RobotAgents(model_provider, model_name, library_context)
+    agents = RobotAgents(
+        model_provider, 
+        model_name, 
+        library_context,
+        assembler_context=assembler_context,  # Use consistent naming with other contexts
+        keyword_search_tool=keyword_search_tool,
+        planner_context=planner_context,
+        identifier_context=identifier_context,
+        validator_context=validator_context
+    )
     tasks = RobotTasks(library_context, workflow_id=workflow_id)
 
     # Define Agents (removed popup_strategy_agent - let BrowserUse handle popups contextually)
@@ -101,6 +235,7 @@ def run_crew(query: str, model_provider: str, model_name: str, library_type: str
         tasks=[plan_steps, identify_elements, assemble_code, validate_code],
         process=Process.sequential,
         verbose=True,
+        embedder=None,  # Disable automatic knowledge/embedding system
     )
 
     logger.info("🚀 Starting CrewAI workflow execution...")
@@ -114,7 +249,17 @@ def run_crew(query: str, model_provider: str, model_name: str, library_type: str
         logger.info("✅ CrewAI workflow completed successfully")
         logger.info(f"🏁 Crew execution finished - delegation cycle complete")
         logger.info(f"📊 Final LLM Stats: {formatting_monitor.get_stats()}")
-        return result, crew
+        
+        # NOTE: Pattern learning is NOT done here!
+        # Learning should only happen AFTER test execution succeeds (test_status == "passed")
+        # This ensures we only learn from validated, working code.
+        # The learning is triggered in workflow_service.py after Docker execution completes successfully.
+        
+        # Return optimization metrics separately (Crew object doesn't allow dynamic attributes)
+        if optimization_metrics:
+            logger.info("📊 Optimization metrics collected")
+        
+        return result, crew, optimization_metrics
 
     except Exception as e:
         error_msg = str(e)
diff --git a/src/backend/crew_ai/library_context/base.py b/src/backend/crew_ai/library_context/base.py
index 2d8978c..83e589f 100644
--- a/src/backend/crew_ai/library_context/base.py
+++ b/src/backend/crew_ai/library_context/base.py
@@ -118,6 +118,27 @@ def get_viewport_config_code(self) -> str:
         """
         pass
 
+    @property
+    @abstractmethod
+    def core_rules(self) -> str:
+        """
+        Return core library rules that must always be included in agent context.
+        
+        These are critical rules that should never be omitted, even in optimized mode.
+        Target: ~300 tokens
+        
+        Should include:
+        - Critical keyword sequences (e.g., New Browser → New Context → New Page)
+        - Parameter rules (e.g., viewport=None requirement)
+        - Auto-waiting behavior
+        - Locator priorities
+        - Common pitfalls to avoid
+        
+        Returns:
+            str: Core rules text (~300 tokens)
+        """
+        pass
+
     def get_full_context(self, agent_role: str) -> str:
         """
         Get complete context for a specific agent role.
diff --git a/src/backend/crew_ai/library_context/browser_context.py b/src/backend/crew_ai/library_context/browser_context.py
index 350ff74..9decad3 100644
--- a/src/backend/crew_ai/library_context/browser_context.py
+++ b/src/backend/crew_ai/library_context/browser_context.py
@@ -19,6 +19,9 @@ class BrowserLibraryContext(LibraryContext):
     def __init__(self):
         """Initialize with dynamic documentation extractor."""
         self._doc_extractor = DynamicLibraryDocumentation("Browser")
+        # Lazy-loaded caches for contexts
+        self._planning_context_cache = None
+        self._code_assembly_context_cache = None
 
     @property
     def library_name(self) -> str:
@@ -46,59 +49,74 @@ def get_viewport_config_code(self) -> str:
         return "    New Context    viewport=None"
 
     @property
-    def planning_context(self) -> str:
+    def core_rules(self) -> str:
         """
-        Context for Step Planner Agent.
-        Combines dynamic keywords with static best practices.
+        Core Browser Library rules that must always be included (~300 tokens).
+        
+        These critical rules ensure correct code generation even in optimized mode.
         """
-        # Get dynamic keywords from installed library (top 25 most common)
-        dynamic_keywords = self._doc_extractor.get_keywords_summary(
-            max_keywords=25)
-
-        # Add complete keyword list (lightweight - just names)
-        from .dynamic_context import get_all_keywords_list
-        all_keywords = get_all_keywords_list("Browser")
-
-        # Add static best practices
-        best_practices = """
-
-**BEST PRACTICES:**
-
-1. **Browser Initialization:**
-   - Always use "New Browser" before "New Page"
-   - Browser types: chromium (recommended), firefox, webkit
-   - Set headless=True for CI/CD environments
-
-2. **Auto-Waiting:**
-   - Browser Library automatically waits for elements to be actionable
-   - Explicit waits rarely needed (unlike SeleniumLibrary)
-   - Elements must be visible, enabled, and stable before interaction
-
-3. **Locator Strategy (Browser Library Advantages):**
-   - **text=<value>** → Find by visible text (most stable!)
-   - **role=<role>[name="<name>"]** → Find by ARIA role (accessibility-first)
-   - **data-testid=<value>** → Find by test ID
-   - **id=<value>** → Find by ID
-   - **<css_selector>** → CSS selector (no prefix needed)
-   - **xpath=<expression>** → XPath (no prefix needed)
-
-4. **Priority Order:**
-   - text > role > data-testid > id > css > xpath
-   - Text and role selectors are more stable than CSS/XPath
-
-**KEY DIFFERENCES FROM SELENIUM:**
-- ✅ Auto-waiting built-in (no explicit waits needed)
-- ✅ Strict mode ensures locators are unique
-- ✅ Better locator strategies (text, role)
-- ✅ Faster execution (Playwright engine)
+        return """
+**BROWSER LIBRARY CORE RULES:**
+
+1. **CRITICAL SEQUENCE (MUST FOLLOW):**
+   New Browser → New Context viewport=None → New Page
+   
+   Example:
+   ```robot
+   New Browser    chromium    headless=True
+   New Context    viewport=None    ← REQUIRED!
+   New Page    https://example.com
+   ```
+
+2. **VIEWPORT REQUIREMENT:**
+   - ALWAYS include "New Context    viewport=None" after New Browser
+   - Default viewport (800x600) causes element detection failures
+   - This is the #1 cause of Browser Library test failures
+
+3. **PARAMETER RULES:**
+   - Browser Library uses: browser=chromium, headless=True
+   - NOT SeleniumLibrary syntax (no 'options' parameter)
+   - Valid browsers: chromium, firefox, webkit
+
+4. **AUTO-WAITING:**
+   - Browser Library auto-waits for elements (built-in)
+   - Explicit waits rarely needed
+   - Elements must be visible, enabled, stable
+
+5. **LOCATOR PRIORITY:**
+   text > role > data-testid > id > css > xpath
+   - text=<value> → Most stable
+   - role=<role>[name="<name>"] → Accessibility-first
+   - CSS selectors need no prefix
+
+6. **COMMON PITFALLS:**
+   ❌ Missing viewport config → Elements not found
+   ❌ Using SeleniumLibrary syntax → Keyword errors
+   ❌ Wrong sequence → Browser not initialized
 """
 
-        return dynamic_keywords + all_keywords + best_practices
+    @property
+    def planning_context(self) -> str:
+        """
+        Minimal context for Test Automation Planner Agent.
+        Returns high-level action categories without detailed keyword information.
+        Uses lazy loading with caching for performance.
+        """
+        if self._planning_context_cache is None:
+            self._planning_context_cache = self._doc_extractor.get_minimal_planning_context()
+        return self._planning_context_cache
 
     @property
     def code_assembly_context(self) -> str:
-        """Context for Code Assembler Agent - Browser Library specific"""
-        return """
+        """
+        Detailed context for Code Assembler Agent.
+        Focuses on code structure and syntax rules.
+        Keyword details are available via keyword_search_tool.
+        Uses lazy loading with caching for performance.
+        """
+        if self._code_assembly_context_cache is None:
+            # Code structure template with critical syntax rules
+            code_structure = """
 --- BROWSER LIBRARY CODE STRUCTURE ---
 
 **MANDATORY STRUCTURE:**
@@ -175,42 +193,43 @@ def code_assembly_context(self) -> str:
 4. Browser Library auto-waits, so explicit waits are rarely needed
 5. Locators can be CSS selectors without prefix
 6. Text and role selectors are preferred for stability
+
+**KEYWORD REFERENCE:**
+Use the keyword_search_tool to look up specific keyword details when needed.
+Common keywords: New Browser, New Context, New Page, Fill Text, Click, Get Text, 
+Keyboard Key, Wait For Elements State, Close Browser
 """
+            
+            self._code_assembly_context_cache = code_structure
+        
+        return self._code_assembly_context_cache
 
     @property
     def validation_context(self) -> str:
-        """Context for Code Validator Agent - Browser Library specific"""
+        """
+        Context for Code Validator Agent - Browser Library specific (OPTIMIZED)
+        
+        PURPOSE: Provide LIBRARY-SPECIFIC syntax rules that differ from SeleniumLibrary.
+        This is the "what changes between libraries" context.
+        
+        SCOPE: Minimal, focused rules (~50 tokens)
+        - Library imports (Browser vs SeleniumLibrary)
+        - Browser initialization keywords (New Browser vs Open Browser)
+        - Parameter differences (browser/headless vs options)
+        - Keyword naming differences (Fill Text vs Input Text)
+        
+        NOT INCLUDED: Generic validation workflow, error reporting format, delegation logic
+        (That's in tasks.py validate_code_task description - ~500 tokens)
+        
+        SEPARATION OF CONCERNS:
+        - validation_context = Library-specific SYNTAX rules (here)
+        - Task description = Generic validation WORKFLOW (tasks.py)
+        - Optimized context = Query-specific KEYWORDS (smart_provider)
+        """
         return """
---- BROWSER LIBRARY VALIDATION RULES ---
-
-**VALIDATION CHECKLIST:**
-1. Library Browser is imported
-2. New Browser is called before New Page
-3. All keywords have correct arguments
-4. Variables are properly declared
-5. Locators use valid Browser Library format
-
-**COMMON ERRORS TO CHECK:**
-
-1. **Missing New Browser**
-   ❌ WRONG: New Page    https://example.com
-   ✅ CORRECT:
-      New Browser    chromium    headless=True
-      New Page    https://example.com
-
-2. **Incorrect Assignment Syntax**
-   ❌ WRONG: Get Text    ${locator}    ${result}
-   ✅ CORRECT: ${result}=    Get Text    ${locator}
-
-3. **Missing Library Import**
-   ❌ WRONG: (no *** Settings *** section)
-   ✅ CORRECT:
-      *** Settings ***
-      Library    Browser
-
-4. **Using SeleniumLibrary keywords**
-   ❌ WRONG: Open Browser    https://example.com
-   ✅ CORRECT: 
-      New Browser    chromium    headless=True
-      New Page    https://example.com
+**BROWSER LIBRARY RULES:**
+• Library Browser must be imported
+• New Browser before New Page
+• Variable assignment: ${var}= Get Text ${loc}
+• No SeleniumLibrary keywords (use New Browser, not Open Browser)
 """
diff --git a/src/backend/crew_ai/library_context/dynamic_context.py b/src/backend/crew_ai/library_context/dynamic_context.py
index 8f560ff..7091514 100644
--- a/src/backend/crew_ai/library_context/dynamic_context.py
+++ b/src/backend/crew_ai/library_context/dynamic_context.py
@@ -176,6 +176,41 @@ def sort_key(kw):
             logger.warning(f"Could not generate keywords summary: {e}")
             return f"--- {self.library_name.upper()} KEYWORDS ---\n\nCould not load dynamic documentation.\n"
     
+    def get_minimal_planning_context(self) -> str:
+        """
+        Get minimal keyword guidance for test planning phase.
+        Returns only high-level action categories without detailed keyword info.
+        
+        This method provides conceptual guidance about available actions
+        without listing specific keywords, parameters, or descriptions.
+        Designed to keep token usage under 400 tokens (~1600 characters).
+        
+        Returns:
+            Formatted string with minimal keyword guidance for planning
+        """
+        try:
+            # Verify library is available (uses cache if already loaded)
+            doc_data = self.get_library_documentation()
+            version = doc_data.get('version', 'Unknown')
+            library_display = f"{self.library_name} v{version}"
+        except Exception as e:
+            logger.warning(f"Could not load library documentation for {self.library_name}: {e}")
+            logger.info("Using fallback minimal planning context")
+            library_display = self.library_name
+        
+        # Generate minimal context with action categories only
+        context = f"--- {library_display.upper()} ACTION CATEGORIES ---\n\n"
+        context += "Available action types for test planning:\n\n"
+        context += "• Browser Management: Opening/closing browsers, navigation\n"
+        context += "• Element Interaction: Clicking, inputting text, selecting options\n"
+        context += "• Data Extraction: Getting text, attributes, URLs\n"
+        context += "• Keyboard Actions: Pressing keys, keyboard combinations\n"
+        context += "• Waiting: Waiting for elements, conditions\n"
+        context += "• Validation: Assertions and checks\n\n"
+        context += "Note: Focus on HIGH-LEVEL test steps. The Code Assembler will handle keyword details.\n"
+        
+        return context
+    
     def _get_generic_locator_guide(self) -> str:
         """Fallback locator guide if extraction fails."""
         if self.library_name == 'Browser':
diff --git a/src/backend/crew_ai/library_context/selenium_context.py b/src/backend/crew_ai/library_context/selenium_context.py
index cec93dd..cd74f03 100644
--- a/src/backend/crew_ai/library_context/selenium_context.py
+++ b/src/backend/crew_ai/library_context/selenium_context.py
@@ -19,6 +19,9 @@ class SeleniumLibraryContext(LibraryContext):
     def __init__(self):
         """Initialize with dynamic documentation extractor."""
         self._doc_extractor = DynamicLibraryDocumentation("SeleniumLibrary")
+        # Lazy-loaded caches for contexts
+        self._planning_context_cache = None
+        self._code_assembly_context_cache = None
 
     @property
     def library_name(self) -> str:
@@ -31,50 +34,25 @@ def library_import(self) -> str:
     @property
     def planning_context(self) -> str:
         """
-        Context for Step Planner Agent.
-        Combines dynamic keywords with static best practices.
+        Minimal context for Test Automation Planner Agent.
+        Returns high-level action categories without detailed keyword information.
+        Uses lazy loading with caching for performance.
         """
-        # Get dynamic keywords from installed library (top 25 most common)
-        dynamic_keywords = self._doc_extractor.get_keywords_summary(
-            max_keywords=25)
-
-        # Add complete keyword list (lightweight - just names)
-        from .dynamic_context import get_all_keywords_list
-        all_keywords = get_all_keywords_list("SeleniumLibrary")
-
-        # Add static best practices
-        best_practices = """
-
-**BEST PRACTICES:**
-
-1. **Search Optimization:**
-   - For search operations: Use "Press Keys" with "RETURN" instead of clicking search button
-   - Works on Google, Flipkart, Amazon, and most modern websites
-   - Faster and more reliable than finding/clicking search buttons
-
-2. **Locator Strategy:**
-   - Priority: id > name > data-* > aria-* > css > xpath
-   - Avoid dynamic classes (e.g., class names with random numbers)
-   - Use explicit locators from the element identifier agent
-
-3. **Wait Strategy:**
-   - Use "Wait Until Element Is Visible" for dynamic content
-   - Default timeout: 10 seconds
-   - Add waits after navigation or AJAX operations
-
-**LOCATOR FORMATS:**
-- id=<value>          → Find by ID attribute
-- name=<value>        → Find by name attribute  
-- xpath=<expression>  → Find by XPath
-- css=<selector>      → Find by CSS selector
-"""
-
-        return dynamic_keywords + all_keywords + best_practices
+        if self._planning_context_cache is None:
+            self._planning_context_cache = self._doc_extractor.get_minimal_planning_context()
+        return self._planning_context_cache
 
     @property
     def code_assembly_context(self) -> str:
-        """Context for Code Assembler Agent - extracted from existing tasks.py"""
-        return """
+        """
+        Detailed context for Code Assembler Agent.
+        Focuses on code structure and syntax rules.
+        Keyword details are available via keyword_search_tool.
+        Uses lazy loading with caching for performance.
+        """
+        if self._code_assembly_context_cache is None:
+            # Code structure template with critical syntax rules
+            code_structure = """
 --- SELENIUMLIBRARY CODE STRUCTURE ---
 
 **MANDATORY STRUCTURE:**
@@ -164,7 +142,16 @@ def code_assembly_context(self) -> str:
 3. Locators must be stored in variables
 4. Include proper indentation (4 spaces)
 5. Add documentation to test cases
+
+**KEYWORD REFERENCE:**
+Use the keyword_search_tool to look up specific keyword details when needed.
+Common keywords: Open Browser, Input Text, Press Keys, Click Element, Get Text,
+Wait Until Element Is Visible, Should Be True, Close Browser
 """
+            
+            self._code_assembly_context_cache = code_structure
+        
+        return self._code_assembly_context_cache
 
     @property
     def browser_init_params(self) -> dict:
@@ -198,68 +185,81 @@ def get_viewport_config_code(self) -> str:
         """
         return ""
 
+    @property
+    def core_rules(self) -> str:
+        """
+        Core SeleniumLibrary rules that must always be included (~300 tokens).
+        
+        These critical rules ensure correct code generation even in optimized mode.
+        """
+        return """
+**SELENIUMLIBRARY CORE RULES:**
+
+1. **BROWSER INITIALIZATION:**
+   Open Browser    <url>    chrome    options=${options}
+   
+   Example:
+   ```robot
+   ${browser}    chrome
+   ${options}    add_argument("--headless");add_argument("--no-sandbox");add_argument("--incognito")
+   Open Browser    https://example.com    ${browser}    options=${options}
+   ```
+
+2. **PARAMETER RULES:**
+   - SeleniumLibrary uses: browser=chrome, options=${options}
+   - NOT Browser Library syntax (no separate headless parameter)
+   - Options format: add_argument("--headless");add_argument("--no-sandbox")
+
+3. **WAIT STRATEGY:**
+   - SeleniumLibrary does NOT auto-wait (unlike Browser Library)
+   - Use "Wait Until Element Is Visible" for dynamic content
+   - Default timeout: 10 seconds
+   - Add waits after navigation or AJAX operations
+
+4. **LOCATOR PRIORITY:**
+   id > name > data-* > aria-* > css > xpath
+   - id=<value> → Most reliable
+   - name=<value> → Good for forms
+   - xpath=<expression> → Last resort
+
+5. **VARIABLE ASSIGNMENT:**
+   - Use ${variable}= syntax for assignments
+   - Example: ${text}=    Get Text    ${locator}
+   - NOT: Get Text    ${locator}    ${text}
+
+6. **COMMON PITFALLS:**
+   ❌ Missing options parameter → Browser fails to start
+   ❌ No explicit waits → Elements not found
+   ❌ Wrong assignment syntax → Variables not set
+"""
+
     @property
     def validation_context(self) -> str:
-        """Context for Code Validator Agent - extracted from existing tasks.py"""
+        """
+        Context for Code Validator Agent - SeleniumLibrary (OPTIMIZED)
+        
+        PURPOSE: Provide LIBRARY-SPECIFIC syntax rules that differ from Browser Library.
+        This is the "what changes between libraries" context.
+        
+        SCOPE: Minimal, focused rules (~50 tokens)
+        - Library imports (SeleniumLibrary, BuiltIn)
+        - Variable assignment syntax
+        - Locator prefix requirements (id=, name=, xpath=)
+        - Conditional keyword syntax (Run Keyword If)
+        
+        NOT INCLUDED: Generic validation workflow, error reporting format, delegation logic
+        (That's in tasks.py validate_code_task description - ~500 tokens)
+        
+        SEPARATION OF CONCERNS:
+        - validation_context = Library-specific SYNTAX rules (here)
+        - Task description = Generic validation WORKFLOW (tasks.py)
+        - Optimized context = Query-specific KEYWORDS (smart_provider)
+        """
         return """
---- SELENIUMLIBRARY VALIDATION RULES ---
-
-**VALIDATION CHECKLIST:**
-1. All required libraries are imported (SeleniumLibrary, BuiltIn, String if needed)
-2. All keywords have the correct number of arguments
-3. Variables are properly declared before use
-4. Should Be True statements have valid expressions
-5. Run Keyword If statements have proper syntax
-6. Price/numeric comparisons use proper conversion (Evaluate)
-
-**COMMON ERRORS TO CHECK:**
-
-1. **Missing Variable Declaration**
-   ❌ WRONG: Get Text    name=q
-   ✅ CORRECT: 
-      *** Variables ***
-      ${search_locator}    name=q
-      
-      *** Test Cases ***
-      Test
-          Get Text    ${search_locator}
-
-2. **Incorrect Assignment Syntax**
-   ❌ WRONG: Get Text    ${locator}    ${result}
-   ✅ CORRECT: ${result}=    Get Text    ${locator}
-
-3. **Missing Library Import**
-   ❌ WRONG: (no *** Settings *** section)
-   ✅ CORRECT:
-      *** Settings ***
-      Library    SeleniumLibrary
-      Library    BuiltIn
-
-4. **Invalid Locator Format**
-   ❌ WRONG: Get Text    search-box
-   ✅ CORRECT: Get Text    id=search-box
-
-5. **Missing Browser Config**
-   ❌ WRONG: Open Browser    https://example.com
-   ✅ CORRECT: Open Browser    https://example.com    chrome    options=${options}
-
-6. **Incorrect Should Be True Syntax**
-   ❌ WRONG: Should Be True    price < 1000
-   ✅ CORRECT: Should Be True    ${price} < 1000
-
-7. **Get Text without locator argument**
-   ❌ WRONG: ${text}=    Get Text
-   ✅ CORRECT: ${text}=    Get Text    ${locator}
-
-8. **Invalid expressions in Should Be True**
-   ❌ WRONG: Should Be True    product_price < 1000
-   ✅ CORRECT: Should Be True    ${product_price} < 1000
-
-9. **Missing variable assignments**
-   ❌ WRONG: Get Text    ${locator}
-   ✅ CORRECT: ${result}=    Get Text    ${locator}
-
-10. **Incorrect conditional syntax**
-    ❌ WRONG: If    ${total} > 100    Input Text    ${locator}    text
-    ✅ CORRECT: Run Keyword If    ${total} > 100    Input Text    ${locator}    text
+**SELENIUMLIBRARY RULES:**
+• Import SeleniumLibrary, BuiltIn
+• Variable assignment: ${var}= Get Text ${loc}
+• Locators need prefix: id=, name=, xpath=, css=
+• Variables in expressions: Should Be True ${price} < 1000
+• Conditionals: Run Keyword If ${cond} Keyword Args
 """
diff --git a/src/backend/crew_ai/optimization/__init__.py b/src/backend/crew_ai/optimization/__init__.py
new file mode 100644
index 0000000..f1c4145
--- /dev/null
+++ b/src/backend/crew_ai/optimization/__init__.py
@@ -0,0 +1,38 @@
+"""
+Optimization module for CrewAI-based Robot Framework code generation.
+
+This module provides:
+- ChromaDB vector store for keyword embeddings
+- Semantic keyword search tool for agents
+- Pattern learning from successful executions
+- Smart keyword provider with hybrid architecture
+- Centralized logging configuration
+"""
+
+from .chroma_store import KeywordVectorStore
+from .keyword_search_tool import KeywordSearchTool
+from .pattern_learning import QueryPatternMatcher
+from .smart_keyword_provider import SmartKeywordProvider
+from .context_pruner import ContextPruner
+from .logging_config import (
+    get_optimization_logger,
+    configure_optimization_logging,
+    LogMessages,
+    log_fallback,
+    log_critical_failure,
+    log_performance_metric,
+)
+
+__all__ = [
+    "KeywordVectorStore",
+    "KeywordSearchTool",
+    "QueryPatternMatcher",
+    "SmartKeywordProvider",
+    "ContextPruner",
+    "get_optimization_logger",
+    "configure_optimization_logging",
+    "LogMessages",
+    "log_fallback",
+    "log_critical_failure",
+    "log_performance_metric",
+]
diff --git a/src/backend/crew_ai/optimization/chroma_store.py b/src/backend/crew_ai/optimization/chroma_store.py
new file mode 100644
index 0000000..626cd9f
--- /dev/null
+++ b/src/backend/crew_ai/optimization/chroma_store.py
@@ -0,0 +1,378 @@
+"""
+ChromaDB vector store for keyword embeddings and semantic search.
+
+This module provides persistent storage and semantic search for Robot Framework
+keywords using ChromaDB with sentence-transformers embeddings.
+"""
+
+import json
+import logging
+from typing import List, Dict, Optional
+import chromadb
+from chromadb.config import Settings
+from chromadb.utils import embedding_functions
+
+logger = logging.getLogger(__name__)
+
+
+class KeywordVectorStore:
+    """
+    ChromaDB-based vector store for Robot Framework keywords.
+    
+    Provides:
+    - Persistent storage of keyword embeddings
+    - Semantic search over keywords
+    - Library-specific collections
+    - Version tracking and auto-rebuild
+    """
+    
+    def __init__(self, persist_directory: str = "./chroma_db"):
+        """
+        Initialize ChromaDB client with persistence.
+        
+        Args:
+            persist_directory: Path to ChromaDB storage directory
+        """
+        self.persist_directory = persist_directory
+        
+        try:
+            # Initialize ChromaDB client with persistence
+            self.client = chromadb.PersistentClient(
+                path=persist_directory,
+                settings=Settings(
+                    anonymized_telemetry=False,
+                    allow_reset=True
+                )
+            )
+            
+            # Initialize embedding function (sentence-transformers)
+            self.embedding_function = embedding_functions.SentenceTransformerEmbeddingFunction(
+                model_name="all-MiniLM-L6-v2"
+            )
+            
+            logger.info(f"ChromaDB initialized at {persist_directory}")
+            
+        except Exception as e:
+            logger.error(f"Failed to initialize ChromaDB: {e}")
+            raise
+    
+    def create_or_get_collection(self, library_name: str):
+        """
+        Get or create collection for library keywords.
+        
+        Args:
+            library_name: "Browser" or "SeleniumLibrary"
+            
+        Returns:
+            ChromaDB collection for keywords
+        """
+        collection_name = f"keywords_{library_name.lower()}"
+        
+        try:
+            collection = self.client.get_or_create_collection(
+                name=collection_name,
+                embedding_function=self.embedding_function,
+                metadata={"library": library_name}
+            )
+            logger.debug(f"Collection '{collection_name}' ready")
+            return collection
+            
+        except Exception as e:
+            logger.error(f"Failed to create/get collection '{collection_name}': {e}")
+            raise
+    
+    def get_or_create_pattern_collection(self):
+        """
+        Get or create collection for query patterns (used by pattern learning).
+        
+        Returns:
+            ChromaDB collection for query patterns
+        """
+        collection_name = "query_patterns"
+        
+        try:
+            collection = self.client.get_or_create_collection(
+                name=collection_name,
+                embedding_function=self.embedding_function,
+                metadata={"type": "query_patterns"}
+            )
+            logger.debug(f"Collection '{collection_name}' ready")
+            return collection
+            
+        except Exception as e:
+            logger.error(f"Failed to create/get collection '{collection_name}': {e}")
+            raise
+
+    
+    def add_keywords(self, library_name: str, keywords: List[Dict]) -> None:
+        """
+        Add keywords to ChromaDB collection.
+        
+        Args:
+            library_name: "Browser" or "SeleniumLibrary"
+            keywords: List of keyword dictionaries with name, doc, args
+        """
+        if not keywords:
+            logger.warning(f"No keywords provided for {library_name}")
+            return
+        
+        collection = self.create_or_get_collection(library_name)
+        
+        try:
+            # Prepare documents (keyword name + documentation for embedding)
+            documents = []
+            ids = []
+            metadatas = []
+            
+            for kw in keywords:
+                name = kw.get('name', '')
+                doc = kw.get('doc', '')
+                args = kw.get('args', [])
+                
+                if not name:
+                    continue
+                
+                # Create searchable text: keyword name + documentation
+                searchable_text = f"{name} {doc}"
+                documents.append(searchable_text)
+                ids.append(name)
+                
+                # Store metadata (truncate long docs to 500 chars)
+                metadatas.append({
+                    "name": name,
+                    "args": json.dumps(args),
+                    "doc": doc[:500] if doc else ""
+                })
+            
+            if not documents:
+                logger.warning(f"No valid keywords to add for {library_name}")
+                return
+            
+            # Add to collection (ChromaDB handles embedding generation)
+            collection.add(
+                documents=documents,
+                ids=ids,
+                metadatas=metadatas
+            )
+            
+            logger.info(f"Added {len(documents)} keywords to {library_name} collection")
+            
+        except Exception as e:
+            logger.error(f"Failed to add keywords to {library_name}: {e}")
+            raise
+    
+    def ingest_library_keywords(self, library_name: str) -> None:
+        """
+        Extract and ingest all keywords from a library using DynamicLibraryDocumentation.
+        
+        Args:
+            library_name: "Browser" or "SeleniumLibrary"
+        """
+        try:
+            # Import here to avoid circular dependency
+            from ..library_context.dynamic_context import DynamicLibraryDocumentation
+            
+            logger.info(f"Extracting keywords from {library_name}...")
+            doc_extractor = DynamicLibraryDocumentation(library_name)
+            doc_data = doc_extractor.get_library_documentation()
+            
+            keywords = doc_data.get('keywords', [])
+            
+            # Filter out internal/deprecated keywords
+            public_keywords = [
+                kw for kw in keywords 
+                if not kw['name'].startswith('_') and 'deprecated' not in kw.get('doc', '').lower()
+            ]
+            
+            logger.info(f"Found {len(public_keywords)} public keywords in {library_name}")
+            
+            # Add to ChromaDB
+            self.add_keywords(library_name, public_keywords)
+            
+        except Exception as e:
+            logger.error(f"Failed to ingest keywords from {library_name}: {e}")
+            raise
+
+    
+    def search(self, library_name: str, query: str, top_k: int = 3) -> List[Dict]:
+        """
+        Semantic search for keywords using ChromaDB.
+        
+        Args:
+            library_name: "Browser" or "SeleniumLibrary"
+            query: Natural language query describing what you want to do
+            top_k: Number of results to return (default: 3)
+            
+        Returns:
+            List of matching keywords with metadata and similarity scores
+            Format: [{"name": str, "args": list, "description": str, "distance": float}, ...]
+        """
+        collection = self.create_or_get_collection(library_name)
+        
+        try:
+            # Query ChromaDB (it handles embedding generation automatically)
+            results = collection.query(
+                query_texts=[query],
+                n_results=top_k
+            )
+            
+            # Check if we have results
+            if not results['ids'] or not results['ids'][0]:
+                logger.warning(f"No results found for query: {query}")
+                return []
+            
+            # Format results
+            keywords = []
+            for i in range(len(results['ids'][0])):
+                metadata = results['metadatas'][0][i]
+                distance = results['distances'][0][i] if results.get('distances') else 0.0
+                
+                keywords.append({
+                    "name": metadata['name'],
+                    "args": json.loads(metadata['args']),
+                    "description": metadata['doc'],
+                    "distance": distance,
+                    "similarity": 1 / (1 + distance)  # Convert distance to similarity score
+                })
+            
+            logger.debug(f"Found {len(keywords)} keywords for query: {query}")
+            return keywords
+            
+        except Exception as e:
+            logger.error(f"Search failed for query '{query}': {e}")
+            return []
+
+    
+    def get_library_version(self, library_name: str) -> Optional[str]:
+        """
+        Get the version of the installed library.
+        
+        Args:
+            library_name: "Browser" or "SeleniumLibrary"
+            
+        Returns:
+            Version string or None if not found
+        """
+        try:
+            from ..library_context.dynamic_context import DynamicLibraryDocumentation
+            
+            doc_extractor = DynamicLibraryDocumentation(library_name)
+            doc_data = doc_extractor.get_library_documentation()
+            version = doc_data.get('version', None)
+            
+            logger.debug(f"{library_name} version: {version}")
+            return version
+            
+        except Exception as e:
+            logger.warning(f"Could not get version for {library_name}: {e}")
+            return None
+    
+    def get_collection_version(self, library_name: str) -> Optional[str]:
+        """
+        Get the version stored in the ChromaDB collection metadata.
+        
+        Args:
+            library_name: "Browser" or "SeleniumLibrary"
+            
+        Returns:
+            Version string or None if not found
+        """
+        try:
+            collection = self.create_or_get_collection(library_name)
+            metadata = collection.metadata
+            return metadata.get('version', None)
+            
+        except Exception as e:
+            logger.warning(f"Could not get collection version for {library_name}: {e}")
+            return None
+    
+    def needs_rebuild(self, library_name: str) -> bool:
+        """
+        Check if collection needs to be rebuilt due to version mismatch.
+        
+        Args:
+            library_name: "Browser" or "SeleniumLibrary"
+            
+        Returns:
+            True if rebuild needed, False otherwise
+        """
+        try:
+            current_version = self.get_library_version(library_name)
+            stored_version = self.get_collection_version(library_name)
+            
+            # If no stored version, need to build
+            if stored_version is None:
+                logger.info(f"No stored version for {library_name}, rebuild needed")
+                return True
+            
+            # If versions don't match, need to rebuild
+            if current_version != stored_version:
+                logger.info(f"Version mismatch for {library_name}: {stored_version} -> {current_version}, rebuild needed")
+                return True
+            
+            logger.debug(f"{library_name} version matches ({current_version}), no rebuild needed")
+            return False
+            
+        except Exception as e:
+            logger.warning(f"Could not check rebuild status for {library_name}: {e}")
+            return False
+    
+    def rebuild_collection(self, library_name: str) -> None:
+        """
+        Rebuild collection by deleting and re-ingesting keywords.
+        
+        Args:
+            library_name: "Browser" or "SeleniumLibrary"
+        """
+        try:
+            collection_name = f"keywords_{library_name.lower()}"
+            
+            # Delete existing collection
+            try:
+                self.client.delete_collection(name=collection_name)
+                logger.info(f"Deleted existing collection: {collection_name}")
+            except Exception as e:
+                logger.debug(f"Collection {collection_name} does not exist or could not be deleted: {e}")
+            
+            # Get current library version
+            current_version = self.get_library_version(library_name)
+            
+            # Create new collection with version metadata
+            collection = self.client.create_collection(
+                name=collection_name,
+                embedding_function=self.embedding_function,
+                metadata={
+                    "library": library_name,
+                    "version": current_version or "unknown"
+                }
+            )
+            
+            logger.info(f"Created new collection: {collection_name} (version: {current_version})")
+            
+            # Ingest keywords
+            self.ingest_library_keywords(library_name)
+            
+            logger.info(f"Successfully rebuilt collection for {library_name}")
+            
+        except Exception as e:
+            logger.error(f"Failed to rebuild collection for {library_name}: {e}")
+            raise
+    
+    def ensure_collection_ready(self, library_name: str) -> None:
+        """
+        Ensure collection is ready and up-to-date.
+        Auto-rebuilds if version mismatch detected.
+        
+        Args:
+            library_name: "Browser" or "SeleniumLibrary"
+        """
+        try:
+            if self.needs_rebuild(library_name):
+                logger.info(f"Rebuilding collection for {library_name}...")
+                self.rebuild_collection(library_name)
+            else:
+                logger.debug(f"Collection for {library_name} is up-to-date")
+                
+        except Exception as e:
+            logger.error(f"Failed to ensure collection ready for {library_name}: {e}")
+            raise
diff --git a/src/backend/crew_ai/optimization/context_pruner.py b/src/backend/crew_ai/optimization/context_pruner.py
new file mode 100644
index 0000000..d98b72f
--- /dev/null
+++ b/src/backend/crew_ai/optimization/context_pruner.py
@@ -0,0 +1,204 @@
+"""
+Context Pruner for Smart Keyword Filtering
+
+This module classifies user queries into action categories and prunes
+keyword context to include only relevant keywords, reducing token usage
+while maintaining code generation accuracy.
+"""
+
+import logging
+import numpy as np
+from typing import List, Dict
+from sentence_transformers import SentenceTransformer
+
+logger = logging.getLogger(__name__)
+
+
+class ContextPruner:
+    """
+    Classify queries and prune context to relevant keyword categories.
+    
+    Uses semantic similarity to classify queries into action categories
+    (navigation, input, interaction, extraction, assertion, wait) and
+    filters keywords to only those in relevant categories.
+    """
+    
+    # Keyword category mappings
+    KEYWORD_CATEGORIES = {
+        "navigation": [
+            "New Browser", "New Page", "Go To", "Go Back", "Go Forward",
+            "Close Browser", "Close Page", "Switch Page", "New Context"
+        ],
+        "input": [
+            "Fill Text", "Input Text", "Type Text", "Press Keys", 
+            "Upload File", "Type Secret", "Clear Text"
+        ],
+        "interaction": [
+            "Click", "Click Element", "Hover", "Drag And Drop",
+            "Select Options By", "Check Checkbox", "Uncheck Checkbox"
+        ],
+        "extraction": [
+            "Get Text", "Get Attribute", "Get Element Count", 
+            "Get Property", "Get Style", "Get Url", "Get Title"
+        ],
+        "assertion": [
+            "Should Be Equal", "Should Contain", "Should Be Visible",
+            "Should Not Be Visible", "Should Be Enabled", "Should Be Disabled"
+        ],
+        "wait": [
+            "Wait For Elements State", "Wait Until Element Is Visible",
+            "Wait For Condition", "Wait For Load State", "Sleep"
+        ]
+    }
+    
+    def __init__(self, model_name: str = "all-MiniLM-L6-v2"):
+        """
+        Initialize with sentence transformer model for classification.
+        
+        Args:
+            model_name: Name of sentence-transformers model to use
+        """
+        logger.info(f"Initializing ContextPruner with model: {model_name}")
+        self.model = SentenceTransformer(model_name)
+        self._init_category_embeddings()
+        logger.info("ContextPruner initialized successfully")
+    
+    def _init_category_embeddings(self):
+        """
+        Pre-compute embeddings for category descriptions.
+        
+        Creates semantic representations of each category for fast
+        similarity comparison during query classification.
+        """
+        logger.debug("Pre-computing category embeddings")
+        
+        # Define category descriptions for semantic matching
+        category_descriptions = {
+            "navigation": "open browser navigate to website go to page url address",
+            "input": "type text fill form input data enter information write",
+            "interaction": "click button press element hover drag drop select",
+            "extraction": "get text retrieve data extract information read content",
+            "assertion": "verify check validate assert should be equal confirm",
+            "wait": "wait for element visible ready loaded appear timeout"
+        }
+        
+        # Pre-compute embeddings for all categories
+        self.category_embeddings = {}
+        for category, description in category_descriptions.items():
+            embedding = self.model.encode([description])[0]
+            self.category_embeddings[category] = embedding
+            logger.debug(f"Category '{category}' embedding shape: {embedding.shape}")
+        
+        logger.info(f"Pre-computed embeddings for {len(self.category_embeddings)} categories")
+    
+    def classify_query(self, user_query: str, confidence_threshold: float = 0.8) -> List[str]:
+        """
+        Classify query into action categories using semantic similarity.
+        
+        Computes similarity between the query and each category description.
+        Returns categories that meet the confidence threshold, or all categories
+        if no category meets the threshold (graceful degradation).
+        
+        Args:
+            user_query: User's natural language query
+            confidence_threshold: Minimum similarity for category inclusion (0.0-1.0)
+            
+        Returns:
+            List of relevant category names (e.g., ["input", "interaction"])
+            Returns all categories if confidence too low (fallback)
+        """
+        logger.debug(f"Classifying query: {user_query[:50]}...")
+        
+        # Encode query
+        query_embedding = self.model.encode([user_query])[0]
+        
+        # Compute similarity with each category
+        similarities = {}
+        for category, category_embedding in self.category_embeddings.items():
+            # Cosine similarity using dot product (embeddings are normalized)
+            similarity = np.dot(query_embedding, category_embedding)
+            similarities[category] = similarity
+            logger.debug(f"Category '{category}' similarity: {similarity:.3f}")
+        
+        # Get categories above threshold
+        relevant_categories = [
+            category for category, similarity in similarities.items()
+            if similarity >= confidence_threshold
+        ]
+        
+        # If no categories meet threshold, return all (fallback)
+        if not relevant_categories:
+            logger.warning(
+                f"No categories met threshold {confidence_threshold}, "
+                f"max similarity: {max(similarities.values()):.3f}. "
+                "Falling back to all categories."
+            )
+            return list(self.KEYWORD_CATEGORIES.keys())
+        
+        logger.info(
+            f"Query classified into {len(relevant_categories)} categories: "
+            f"{', '.join(relevant_categories)}"
+        )
+        return relevant_categories
+    
+    def prune_keywords(self, all_keywords: List[Dict], categories: List[str]) -> List[Dict]:
+        """
+        Filter keywords to only those in relevant categories.
+        
+        Args:
+            all_keywords: All available keywords (list of dicts with 'name' key)
+            categories: Relevant categories from classification
+            
+        Returns:
+            Filtered list of keywords matching the categories
+        """
+        logger.debug(f"Pruning keywords for categories: {', '.join(categories)}")
+        
+        # Collect all keyword names from relevant categories
+        relevant_keyword_names = set()
+        for category in categories:
+            category_keywords = self.KEYWORD_CATEGORIES.get(category, [])
+            relevant_keyword_names.update(category_keywords)
+            logger.debug(f"Category '{category}': {len(category_keywords)} keywords")
+        
+        # Filter keywords
+        pruned_keywords = [
+            kw for kw in all_keywords
+            if kw.get('name') in relevant_keyword_names
+        ]
+        
+        logger.info(
+            f"Pruned keywords: {len(all_keywords)} -> {len(pruned_keywords)} "
+            f"({len(pruned_keywords)/len(all_keywords)*100:.1f}% retained)"
+        )
+        
+        return pruned_keywords
+    
+    def get_pruning_stats(self, original_count: int, pruned_count: int) -> Dict[str, float]:
+        """
+        Calculate pruning statistics.
+        
+        Args:
+            original_count: Number of keywords before pruning
+            pruned_count: Number of keywords after pruning
+            
+        Returns:
+            Dictionary with pruning statistics
+        """
+        if original_count == 0:
+            return {
+                "original_count": 0,
+                "pruned_count": 0,
+                "reduction_percentage": 0.0,
+                "retention_percentage": 0.0
+            }
+        
+        reduction_percentage = ((original_count - pruned_count) / original_count) * 100
+        retention_percentage = (pruned_count / original_count) * 100
+        
+        return {
+            "original_count": original_count,
+            "pruned_count": pruned_count,
+            "reduction_percentage": reduction_percentage,
+            "retention_percentage": retention_percentage
+        }
diff --git a/src/backend/crew_ai/optimization/keyword_search_tool.py b/src/backend/crew_ai/optimization/keyword_search_tool.py
new file mode 100644
index 0000000..8152bf9
--- /dev/null
+++ b/src/backend/crew_ai/optimization/keyword_search_tool.py
@@ -0,0 +1,169 @@
+"""
+Keyword search tool for CrewAI agents.
+
+Provides semantic search over Robot Framework keywords, allowing agents
+to find relevant keywords on-demand without having all keywords in context.
+"""
+
+import json
+import logging
+import time
+from typing import Optional
+from crewai.tools import BaseTool
+from .chroma_store import KeywordVectorStore
+
+logger = logging.getLogger(__name__)
+
+
+class KeywordSearchTool(BaseTool):
+    """
+    CrewAI tool for semantic keyword search using ChromaDB.
+    
+    Agents call this tool when they need to find relevant keywords for an action.
+    Returns top K matching keywords with descriptions and examples.
+    """
+    
+    name: str = "keyword_search"
+    description: str = """
+Search for Robot Framework keywords by describing what you want to do.
+Use this when you need to find the right keyword for an action.
+
+Input: Natural language query (e.g., "click a button", "wait for element", "fill text input")
+Output: Top 3 matching keywords with descriptions, arguments, and examples
+
+Example usage:
+- To find click keywords: "click a button"
+- To find input keywords: "type text into field"
+- To find wait keywords: "wait for element to be visible"
+"""
+    
+    # Use Pydantic's PrivateAttr for internal state
+    _library_name: str
+    _vector_store: KeywordVectorStore
+    _cache: dict
+    _metrics: Optional[object]
+    
+    def __init__(self, library_name: str, vector_store: KeywordVectorStore, metrics: Optional[object] = None):
+        """
+        Initialize with library name and ChromaDB vector store.
+        
+        Args:
+            library_name: "Browser" or "SeleniumLibrary"
+            vector_store: KeywordVectorStore instance
+            metrics: Optional WorkflowMetrics instance for tracking
+        """
+        super().__init__()
+        object.__setattr__(self, '_library_name', library_name)
+        object.__setattr__(self, '_vector_store', vector_store)
+        object.__setattr__(self, '_cache', {})
+        object.__setattr__(self, '_metrics', metrics)
+    
+    def _run(self, query: str, top_k: int = 3) -> str:
+        """
+        Search for keywords matching the query.
+        
+        Args:
+            query: Natural language description of what you want to do
+            top_k: Number of results to return (default: 3)
+            
+        Returns:
+            JSON string with top matching keywords
+        """
+        # Start timing for metrics
+        start_time = time.time()
+        
+        # Check cache
+        cache_key = f"{query}:{top_k}"
+        if cache_key in self._cache:
+            logger.debug(f"Cache hit for query: {query}")
+            return self._cache[cache_key]
+        
+        try:
+            # Search ChromaDB
+            keywords = self._vector_store.search(
+                library_name=self._library_name,
+                query=query,
+                top_k=top_k
+            )
+            
+            if not keywords:
+                return json.dumps({
+                    "message": "No keywords found for your query. Try rephrasing or use a more general term.",
+                    "results": []
+                })
+            
+            # Format results for agent consumption
+            results = []
+            for kw in keywords:
+                # Generate usage example
+                example = self._get_example(kw['name'], kw['args'])
+                
+                results.append({
+                    "name": kw['name'],
+                    "args": kw['args'],
+                    "description": kw['description'][:200] if kw['description'] else "No description available",
+                    "example": example,
+                    "similarity": round(kw['similarity'], 3)
+                })
+            
+            result_json = json.dumps({
+                "query": query,
+                "library": self._library_name,
+                "results": results
+            }, indent=2)
+            
+            # Cache result (limit cache size to 100 entries)
+            if len(self._cache) >= 100:
+                # Remove oldest entry (simple FIFO)
+                self._cache.pop(next(iter(self._cache)))
+            self._cache[cache_key] = result_json
+            
+            # Track metrics if available
+            if self._metrics:
+                latency_ms = (time.time() - start_time) * 1000
+                returned_keyword_names = [r['name'] for r in results]
+                self._metrics.track_keyword_search(latency_ms, returned_keyword_names)
+            
+            logger.info(f"Keyword search for '{query}' returned {len(results)} results")
+            return result_json
+            
+        except Exception as e:
+            logger.error(f"Keyword search failed: {e}")
+            return json.dumps({
+                "error": "Search failed. Please try again or use keywords you already know.",
+                "results": []
+            })
+    
+    def _get_example(self, keyword_name: str, args: list) -> str:
+        """
+        Generate usage example for keyword.
+        
+        Args:
+            keyword_name: Name of the keyword
+            args: List of arguments
+            
+        Returns:
+            Example usage string
+        """
+        # Format arguments
+        if args:
+            # Handle both string and dict formats
+            arg_names = []
+            for arg in args:
+                if isinstance(arg, dict):
+                    arg_name = arg.get('name', '')
+                else:
+                    arg_name = str(arg).split('=')[0].split(':')[0].strip()
+                
+                if arg_name and arg_name not in ['self', 'cls']:
+                    arg_names.append(f"<{arg_name}>")
+            
+            arg_str = '    '.join(arg_names) if arg_names else ""
+        else:
+            arg_str = ""
+        
+        # Generate example based on keyword name
+        if arg_str:
+            return f"{keyword_name}    {arg_str}"
+        else:
+            return f"{keyword_name}"
diff --git a/src/backend/crew_ai/optimization/logging_config.py b/src/backend/crew_ai/optimization/logging_config.py
new file mode 100644
index 0000000..a8da45a
--- /dev/null
+++ b/src/backend/crew_ai/optimization/logging_config.py
@@ -0,0 +1,207 @@
+"""
+Logging configuration for the CrewAI optimization system.
+
+This module provides a centralized logging configuration for all optimization
+components, ensuring consistent logging behavior across the system.
+
+Logging Levels:
+- INFO: Normal operation (predictions used, search calls, successful operations)
+- WARNING: Fallback triggered (component failed, using baseline behavior)
+- ERROR: Critical failure (optimization disabled entirely, unrecoverable errors)
+- DEBUG: Detailed diagnostic information (for development/troubleshooting)
+"""
+
+import logging
+import sys
+from typing import Optional
+
+
+# Optimization-specific logger name
+OPTIMIZATION_LOGGER_NAME = "crew_ai.optimization"
+
+
+def get_optimization_logger(name: str) -> logging.Logger:
+    """
+    Get a logger for optimization components.
+    
+    Args:
+        name: Module name (typically __name__)
+        
+    Returns:
+        Configured logger instance
+        
+    Example:
+        >>> logger = get_optimization_logger(__name__)
+        >>> logger.info("Pattern learning predicted 8 keywords")
+    """
+    # Create logger with optimization namespace
+    if not name.startswith(OPTIMIZATION_LOGGER_NAME):
+        # If called from optimization module, use the module name
+        if "optimization" in name:
+            logger_name = name
+        else:
+            logger_name = f"{OPTIMIZATION_LOGGER_NAME}.{name}"
+    else:
+        logger_name = name
+    
+    return logging.getLogger(logger_name)
+
+
+def configure_optimization_logging(
+    level: str = "INFO",
+    log_file: Optional[str] = None,
+    format_string: Optional[str] = None
+) -> None:
+    """
+    Configure logging for the optimization system.
+    
+    This function sets up the optimization logger with appropriate handlers
+    and formatters. It should be called once during system initialization.
+    
+    Args:
+        level: Logging level (DEBUG, INFO, WARNING, ERROR)
+        log_file: Optional file path for logging output
+        format_string: Optional custom format string
+        
+    Example:
+        >>> configure_optimization_logging(level="INFO", log_file="logs/optimization.log")
+    """
+    # Get the root optimization logger
+    logger = logging.getLogger(OPTIMIZATION_LOGGER_NAME)
+    logger.setLevel(getattr(logging, level.upper()))
+    
+    # Remove existing handlers to avoid duplicates
+    logger.handlers.clear()
+    
+    # Default format string
+    if format_string is None:
+        format_string = (
+            "%(asctime)s - %(name)s - %(levelname)s - %(message)s"
+        )
+    
+    formatter = logging.Formatter(format_string)
+    
+    # Console handler (always enabled)
+    console_handler = logging.StreamHandler(sys.stdout)
+    console_handler.setLevel(getattr(logging, level.upper()))
+    console_handler.setFormatter(formatter)
+    logger.addHandler(console_handler)
+    
+    # File handler (optional)
+    if log_file:
+        try:
+            file_handler = logging.FileHandler(log_file)
+            file_handler.setLevel(getattr(logging, level.upper()))
+            file_handler.setFormatter(formatter)
+            logger.addHandler(file_handler)
+            logger.info(f"Optimization logging configured with file output: {log_file}")
+        except Exception as e:
+            logger.warning(f"Failed to configure file logging: {e}")
+    
+    # Prevent propagation to root logger to avoid duplicate logs
+    logger.propagate = False
+    
+    logger.info(f"Optimization logging configured at {level} level")
+
+
+# Standard log messages for common scenarios
+class LogMessages:
+    """
+    Standard log messages for optimization system.
+    
+    This class provides consistent log messages across all optimization
+    components, making it easier to monitor and troubleshoot the system.
+    """
+    
+    # INFO level messages (normal operation)
+    PATTERN_LEARNING_PREDICTION = "Pattern learning predicted {count} keywords with confidence {confidence:.3f}"
+    PATTERN_LEARNING_LEARNED = "Learned pattern from query: {query}"
+    KEYWORD_SEARCH_SUCCESS = "Keyword search for '{query}' returned {count} results in {latency:.1f}ms"
+    CONTEXT_PRUNING_SUCCESS = "Context pruning: {original} -> {pruned} keywords ({reduction:.1f}% reduction)"
+    CHROMA_INITIALIZED = "ChromaDB initialized at {path}"
+    COLLECTION_READY = "Collection '{name}' ready with {count} keywords"
+    
+    # WARNING level messages (fallback triggered)
+    PATTERN_LEARNING_FALLBACK = "Pattern learning failed: {error}, falling back to zero-context"
+    KEYWORD_SEARCH_FALLBACK = "Keyword search failed: {error}, providing full context to agent"
+    CONTEXT_PRUNING_FALLBACK = "Context pruning failed: {error}, using all predicted keywords"
+    EMBEDDING_FALLBACK = "Embedding generation failed: {error}, disabling semantic search"
+    FULL_CONTEXT_FALLBACK = "Using full context as fallback - optimization failed"
+    NO_PREDICTIONS = "No predictions from pattern learning, using zero-context + tool"
+    LOW_CONFIDENCE = "Top similarity {similarity:.3f} below threshold {threshold:.3f}"
+    NO_CATEGORIES = "No categories met threshold {threshold:.3f}, max similarity: {max_sim:.3f}"
+    
+    # ERROR level messages (critical failures)
+    CHROMA_INIT_FAILED = "Failed to initialize ChromaDB: {error}"
+    COLLECTION_CREATE_FAILED = "Failed to create/get collection '{name}': {error}"
+    KEYWORD_INGESTION_FAILED = "Failed to ingest keywords from {library}: {error}"
+    PATTERN_LEARNING_ERROR = "Failed to learn from execution: {error}"
+    KEYWORD_SEARCH_ERROR = "Keyword search failed: {error}"
+    ZERO_CONTEXT_ERROR = "Zero-context formatting failed: {error}, falling back to full context"
+    
+    # DEBUG level messages (detailed diagnostics)
+    CACHE_HIT = "Cache hit for query: {query}"
+    EXTRACTED_KEYWORDS = "Extracted {count} keywords from code: {keywords}"
+    CATEGORY_SIMILARITY = "Category '{category}' similarity: {similarity:.3f}"
+    QUERY_CLASSIFICATION = "Query classified into {count} categories: {categories}"
+
+
+# Convenience functions for common log patterns
+def log_fallback(logger: logging.Logger, component: str, error: Exception, fallback_action: str) -> None:
+    """
+    Log a fallback event with consistent formatting.
+    
+    Args:
+        logger: Logger instance
+        component: Component name (e.g., "Pattern Learning", "Keyword Search")
+        error: Exception that triggered the fallback
+        fallback_action: Description of fallback action taken
+        
+    Example:
+        >>> log_fallback(logger, "Pattern Learning", e, "using zero-context + tool")
+    """
+    logger.warning(
+        f"{component} failed: {error}, falling back to {fallback_action}",
+        exc_info=False  # Don't include stack trace for fallbacks
+    )
+
+
+def log_critical_failure(logger: logging.Logger, component: str, error: Exception) -> None:
+    """
+    Log a critical failure with full stack trace.
+    
+    Args:
+        logger: Logger instance
+        component: Component name
+        error: Exception that caused the failure
+        
+    Example:
+        >>> log_critical_failure(logger, "ChromaDB Initialization", e)
+    """
+    logger.error(
+        f"{component} failed critically: {error}",
+        exc_info=True  # Include full stack trace for critical errors
+    )
+
+
+def log_performance_metric(logger: logging.Logger, operation: str, duration_ms: float, threshold_ms: float) -> None:
+    """
+    Log a performance metric with threshold checking.
+    
+    Args:
+        logger: Logger instance
+        operation: Operation name
+        duration_ms: Duration in milliseconds
+        threshold_ms: Performance threshold in milliseconds
+        
+    Example:
+        >>> log_performance_metric(logger, "Keyword Search", 75.5, 100.0)
+    """
+    if duration_ms > threshold_ms:
+        logger.warning(
+            f"{operation} took {duration_ms:.1f}ms (threshold: {threshold_ms:.1f}ms)"
+        )
+    else:
+        logger.info(
+            f"{operation} completed in {duration_ms:.1f}ms"
+        )
diff --git a/src/backend/crew_ai/optimization/pattern_learning.py b/src/backend/crew_ai/optimization/pattern_learning.py
new file mode 100644
index 0000000..ae0beef
--- /dev/null
+++ b/src/backend/crew_ai/optimization/pattern_learning.py
@@ -0,0 +1,308 @@
+"""
+Pattern Learning System for Query-Keyword Association
+
+This module implements a pattern learning system that learns which keywords
+are commonly used for specific query types and predicts relevant keywords
+for new queries based on similarity to past queries.
+
+Uses ChromaDB for semantic similarity search (efficient) and SQLite for usage statistics.
+"""
+
+import sqlite3
+import json
+import time
+import logging
+from datetime import datetime
+from typing import List, Dict, Optional
+from pathlib import Path
+
+logger = logging.getLogger(__name__)
+
+
+class QueryPatternMatcher:
+    """
+    Learn and predict keyword usage patterns using ChromaDB for embeddings and SQLite for statistics.
+    Uses ChromaDB for semantic similarity search (efficient) and SQLite for usage tracking.
+    """
+    
+    def __init__(self, db_path: str = "./data/pattern_learning.db", chroma_store=None):
+        """
+        Initialize with SQLite database path and ChromaDB store.
+        
+        Args:
+            db_path: Path to SQLite database file (for usage statistics)
+            chroma_store: KeywordVectorStore instance (for query embeddings)
+        """
+        self.db_path = db_path
+        self.chroma_store = chroma_store
+        
+        # Ensure data directory exists
+        Path(self.db_path).parent.mkdir(parents=True, exist_ok=True)
+        
+        # Initialize database schema (SQLite for statistics only)
+        self._init_database()
+        
+        # Get or create ChromaDB collection for query patterns
+        if self.chroma_store:
+            self.pattern_collection = self.chroma_store.get_or_create_pattern_collection()
+        else:
+            logger.warning("No ChromaDB store provided, pattern learning will be limited")
+            self.pattern_collection = None
+        
+        logger.info(f"QueryPatternMatcher initialized with database: {db_path}")
+    
+    def _init_database(self):
+        """Create database schema if it doesn't exist (SQLite for statistics only)."""
+        conn = sqlite3.connect(self.db_path)
+        cursor = conn.cursor()
+        
+        # Create keyword_stats table (usage tracking)
+        cursor.execute("""
+            CREATE TABLE IF NOT EXISTS keyword_stats (
+                keyword_name TEXT PRIMARY KEY,
+                usage_count INTEGER DEFAULT 1,
+                last_used TEXT NOT NULL
+            )
+        """)
+        
+        # Create index for performance
+        cursor.execute("""
+            CREATE INDEX IF NOT EXISTS idx_keyword_stats_name 
+            ON keyword_stats(keyword_name)
+        """)
+        
+        conn.commit()
+        conn.close()
+        
+        logger.info("Database schema initialized successfully")
+    
+    def _extract_keywords_from_code(self, code: str) -> List[str]:
+        """
+        Extract Robot Framework keywords from generated code.
+        
+        Args:
+            code: Generated Robot Framework code
+            
+        Returns:
+            List of unique keyword names used in code
+        """
+        keywords = set()
+        
+        # Parse code line by line
+        in_test_case = False
+        test_case_name_next = False
+        
+        for line in code.split('\n'):
+            original_line = line
+            line = line.strip()
+            
+            # Skip empty lines and comments
+            if not line or line.startswith('#'):
+                continue
+            
+            # Check if we're in test case section
+            if line.startswith('*** Test Cases ***'):
+                in_test_case = True
+                test_case_name_next = True
+                continue
+            
+            # Skip section headers
+            if line.startswith('***'):
+                in_test_case = False
+                test_case_name_next = False
+                continue
+            
+            # Skip test case names (they appear right after *** Test Cases ***)
+            if in_test_case and test_case_name_next and not original_line.startswith('    '):
+                # This is a test case name, skip it
+                test_case_name_next = False
+                continue
+            
+            # Extract keywords from test case lines (must be indented)
+            if in_test_case and original_line.startswith('    ') and not line.startswith('['):
+                # Split by multiple spaces (Robot Framework separator)
+                parts = [p.strip() for p in line.split('    ') if p.strip()]
+                
+                if parts:
+                    # First part might be a variable assignment
+                    first_part = parts[0]
+                    
+                    # Check if it's a variable assignment (${var}= or ${var} =)
+                    if '=' in first_part and first_part.strip().startswith('${'):
+                        # Keyword is the second part
+                        if len(parts) > 1:
+                            keyword = parts[1]
+                            if not keyword.startswith('${') and not keyword.startswith('@{'):
+                                keywords.add(keyword)
+                    else:
+                        # First part is the keyword
+                        if not first_part.startswith('${') and not first_part.startswith('@{'):
+                            keywords.add(first_part)
+        
+        logger.debug(f"Extracted {len(keywords)} keywords from code: {keywords}")
+        return list(keywords)
+    
+    def learn_from_execution(self, user_query: str, generated_code: str):
+        """
+        Extract keywords from generated code and store pattern in ChromaDB + SQLite.
+        
+        Args:
+            user_query: Original user query
+            generated_code: Successfully generated Robot Framework code
+        """
+        try:
+            # Extract keywords used in code
+            used_keywords = self._extract_keywords_from_code(generated_code)
+            
+            if not used_keywords:
+                logger.warning("No keywords extracted from code, skipping pattern learning")
+                return
+            
+            timestamp = datetime.now().isoformat()
+            
+            # Store pattern in ChromaDB (for semantic search)
+            if self.pattern_collection:
+                pattern_id = f"pattern_{int(time.time() * 1000)}"
+                self.pattern_collection.add(
+                    documents=[user_query],
+                    ids=[pattern_id],
+                    metadatas=[{
+                        "keywords": json.dumps(used_keywords),
+                        "timestamp": timestamp
+                    }]
+                )
+                logger.debug(f"Stored pattern in ChromaDB: {pattern_id}")
+            
+            # Update keyword statistics in SQLite
+            conn = sqlite3.connect(self.db_path)
+            cursor = conn.cursor()
+            
+            for keyword in used_keywords:
+                cursor.execute("""
+                    INSERT INTO keyword_stats (keyword_name, usage_count, last_used)
+                    VALUES (?, 1, ?)
+                    ON CONFLICT(keyword_name) DO UPDATE SET
+                        usage_count = usage_count + 1,
+                        last_used = ?
+                """, (keyword, timestamp, timestamp))
+            
+            conn.commit()
+            conn.close()
+            
+            logger.info(f"Learned pattern: query='{user_query[:50]}...', keywords={used_keywords}")
+            
+        except Exception as e:
+            logger.error(f"Failed to learn from execution: {e}", exc_info=True)
+    
+    def get_relevant_keywords(self, user_query: str, confidence_threshold: float = 0.7) -> List[str]:
+        """
+        Predict relevant keywords based on similar past queries using ChromaDB.
+        
+        Args:
+            user_query: New user query
+            confidence_threshold: Minimum similarity score (0.0-1.0)
+            
+        Returns:
+            List of predicted keyword names (empty if confidence too low)
+        """
+        try:
+            if not self.pattern_collection:
+                logger.debug("No ChromaDB pattern collection available")
+                return []
+            
+            # Search for similar patterns in ChromaDB
+            results = self.pattern_collection.query(
+                query_texts=[user_query],
+                n_results=5  # Get top 5 similar patterns
+            )
+            
+            # Check if we have results
+            if not results['ids'][0]:
+                logger.debug("No patterns in ChromaDB yet")
+                return []
+            
+            # Check confidence (ChromaDB returns distances, lower is better)
+            # Convert distance to similarity: similarity = 1 / (1 + distance)
+            top_distance = results['distances'][0][0]
+            similarity = 1 / (1 + top_distance)
+            
+            if similarity < confidence_threshold:
+                logger.debug(f"Top similarity {similarity:.3f} below threshold {confidence_threshold}")
+                return []
+            
+            # Aggregate keywords from similar patterns
+            keyword_counts = {}
+            for i, metadata in enumerate(results['metadatas'][0]):
+                # Get distance for this result
+                distance = results['distances'][0][i]
+                result_similarity = 1 / (1 + distance)
+                
+                # Only use results above threshold
+                if result_similarity >= confidence_threshold:
+                    keywords = json.loads(metadata['keywords'])
+                    for keyword in keywords:
+                        keyword_counts[keyword] = keyword_counts.get(keyword, 0) + 1
+            
+            # Return top 10 most common keywords
+            sorted_keywords = sorted(keyword_counts.items(), key=lambda x: x[1], reverse=True)
+            predicted_keywords = [kw for kw, count in sorted_keywords[:10]]
+            
+            logger.info(f"Predicted {len(predicted_keywords)} keywords with confidence {similarity:.3f}")
+            logger.debug(f"Predicted keywords: {predicted_keywords}")
+            
+            return predicted_keywords
+            
+        except Exception as e:
+            logger.error(f"Failed to predict keywords: {e}", exc_info=True)
+            return []
+
+    
+    def get_keyword_stats(self) -> Dict[str, Dict]:
+        """
+        Get statistics about keyword usage.
+        
+        Returns:
+            Dictionary mapping keyword names to usage statistics
+        """
+        try:
+            conn = sqlite3.connect(self.db_path)
+            cursor = conn.cursor()
+            
+            cursor.execute("""
+                SELECT keyword_name, usage_count, last_used
+                FROM keyword_stats
+                ORDER BY usage_count DESC
+            """)
+            
+            stats = {}
+            for keyword_name, usage_count, last_used in cursor.fetchall():
+                stats[keyword_name] = {
+                    "usage_count": usage_count,
+                    "last_used": last_used
+                }
+            
+            conn.close()
+            return stats
+            
+        except Exception as e:
+            logger.error(f"Failed to get keyword stats: {e}", exc_info=True)
+            return {}
+    
+    def get_pattern_count(self) -> int:
+        """
+        Get the number of patterns stored in ChromaDB.
+        
+        Returns:
+            Number of patterns
+        """
+        try:
+            if not self.pattern_collection:
+                return 0
+            
+            # Get count from ChromaDB collection
+            count = self.pattern_collection.count()
+            return count
+            
+        except Exception as e:
+            logger.error(f"Failed to get pattern count: {e}", exc_info=True)
+            return 0
diff --git a/src/backend/crew_ai/optimization/smart_keyword_provider.py b/src/backend/crew_ai/optimization/smart_keyword_provider.py
new file mode 100644
index 0000000..cf5d684
--- /dev/null
+++ b/src/backend/crew_ai/optimization/smart_keyword_provider.py
@@ -0,0 +1,335 @@
+"""
+Smart Keyword Provider with Hybrid Architecture
+
+This module orchestrates the 3-tier keyword retrieval system:
+1. Core Rules (always included, ~300 tokens)
+2. Predicted Keywords (from pattern learning) OR Zero-Context + Tool
+3. Full Context Fallback (if both fail)
+"""
+
+import logging
+from typing import Optional, List, Dict
+from .pattern_learning import QueryPatternMatcher
+from .chroma_store import KeywordVectorStore
+from .keyword_search_tool import KeywordSearchTool
+from .context_pruner import ContextPruner
+
+logger = logging.getLogger(__name__)
+
+
+class SmartKeywordProvider:
+    """
+    Intelligent keyword provider with hybrid approach:
+    - Tier 1: Core Rules (always included)
+    - Tier 2: Predicted Keywords OR Zero-Context + Tool
+    - Tier 3: Full Context Fallback
+    """
+    
+    def __init__(self,
+                 library_context,
+                 pattern_matcher: QueryPatternMatcher,
+                 vector_store: KeywordVectorStore,
+                 context_pruner: Optional['ContextPruner'] = None,
+                 pruning_enabled: bool = False,
+                 pruning_threshold: float = 0.8,
+                 metrics: Optional[object] = None):
+        """
+        Initialize with library context and optimization components.
+        
+        Args:
+            library_context: LibraryContext instance (e.g., BrowserLibraryContext)
+            pattern_matcher: QueryPatternMatcher for pattern learning
+            vector_store: KeywordVectorStore for semantic search
+            context_pruner: Optional ContextPruner for smart keyword filtering
+            pruning_enabled: Whether to enable context pruning
+            pruning_threshold: Confidence threshold for category classification (0.0-1.0)
+            metrics: Optional WorkflowMetrics instance for tracking
+        """
+        self.library_context = library_context
+        self.pattern_matcher = pattern_matcher
+        self.vector_store = vector_store
+        self.context_pruner = context_pruner
+        self.pruning_enabled = pruning_enabled and context_pruner is not None
+        self.pruning_threshold = pruning_threshold
+        self.metrics = metrics
+        
+        logger.info(f"SmartKeywordProvider initialized for {library_context.library_name}")
+        if self.pruning_enabled:
+            logger.info(f"Context pruning enabled with threshold {pruning_threshold}")
+    
+    def _get_core_rules(self) -> str:
+        """
+        Get core library rules that are always included.
+        
+        Returns:
+            Core rules string (~300 tokens)
+        """
+        return self.library_context.core_rules
+    
+    def _format_zero_context_with_tool(self, agent_role: str) -> str:
+        """
+        Format minimal context with keyword search tool instructions.
+        
+        Used when no predictions are available from pattern learning.
+        Target: core rules (300) + tool instructions (200) = 500 tokens
+        
+        Args:
+            agent_role: "planner", "assembler", or "validator"
+            
+        Returns:
+            Formatted context string with core rules + tool usage instructions
+        """
+        core_rules = self._get_core_rules()
+        
+        return f"""
+You are an expert Robot Framework developer using {self.library_context.library_name}.
+
+{core_rules}
+
+**KEYWORD SEARCH TOOL AVAILABLE:**
+
+You have access to a keyword_search tool to find relevant keywords on-demand.
+When you need a keyword, search for it by describing what you want to do.
+
+**How to use the tool:**
+- Need to click? Search: "click button element"
+- Need to input text? Search: "type text input field"
+- Need to wait? Search: "wait element visible"
+- Need to get text? Search: "get text from element"
+
+The tool will return the top 3 matching keywords with documentation and examples.
+Use the exact keyword names and syntax from the tool results.
+
+**Examples:**
+```
+Action: keyword_search
+Action Input: "click button"
+
+Result: Click, Click Element, Click Button (with docs and examples)
+```
+
+Use this tool whenever you need to find the right keyword for an action.
+"""
+    
+    def _format_predicted_context(self, predicted_keywords: List[str], agent_role: str, user_query: str = "") -> str:
+        """
+        Format context with predicted keywords from pattern learning.
+        
+        Gets full documentation for predicted keywords from ChromaDB.
+        Optionally applies context pruning to filter keywords by category.
+        Target: core rules (300) + predicted keywords (500) = 800 tokens
+        
+        Args:
+            predicted_keywords: List of keyword names predicted by pattern learning
+            agent_role: "planner", "assembler", or "validator"
+            user_query: User's query (used for pruning if enabled)
+            
+        Returns:
+            Formatted context string with core rules + predicted keyword docs
+        """
+        # Get core rules
+        core_rules = self._get_core_rules()
+        
+        # Apply context pruning if enabled
+        keywords_to_fetch = predicted_keywords[:5]  # Limit to top 5 for efficiency
+        
+        if self.pruning_enabled and user_query:
+            try:
+                # Classify query into categories
+                relevant_categories = self.context_pruner.classify_query(
+                    user_query, 
+                    confidence_threshold=self.pruning_threshold
+                )
+                
+                # Create keyword dicts for pruning
+                keyword_dicts = [{'name': kw} for kw in keywords_to_fetch]
+                
+                # Prune keywords to relevant categories
+                pruned_keyword_dicts = self.context_pruner.prune_keywords(
+                    keyword_dicts, 
+                    relevant_categories
+                )
+                
+                # Extract pruned keyword names
+                keywords_to_fetch = [kw['name'] for kw in pruned_keyword_dicts]
+                
+                # Log pruning stats
+                stats = self.context_pruner.get_pruning_stats(
+                    len(keyword_dicts), 
+                    len(pruned_keyword_dicts)
+                )
+                logger.info(
+                    f"Context pruning: {stats['original_count']} -> {stats['pruned_count']} keywords "
+                    f"({stats['reduction_percentage']:.1f}% reduction)"
+                )
+            except Exception as e:
+                logger.warning(f"Context pruning failed: {e}, using all predicted keywords")
+        
+        # Get full documentation for keywords from ChromaDB
+        logger.info(f"Fetching documentation for {len(keywords_to_fetch)} keywords")
+        keyword_docs = []
+        for keyword_name in keywords_to_fetch:
+            # Search for exact keyword in ChromaDB
+            results = self.vector_store.search(
+                library_name=self.library_context.library_name,
+                query=keyword_name,
+                top_k=1
+            )
+            
+            if results and results[0]['name'] == keyword_name:
+                kw = results[0]
+                # Format keyword documentation - MINIMAL format to reduce tokens
+                # Only include essential info: name and first 2 args
+                args_list = kw['args'][:2] if kw['args'] else []
+                args_str = ', '.join([str(arg) for arg in args_list])
+                if len(kw['args']) > 2:
+                    args_str += ', ...'
+                
+                # Very short description (50 chars max)
+                doc_str = kw['description'][:50] if kw['description'] else ''
+                
+                # Compact format: one line per keyword
+                keyword_docs.append(f"• {kw['name']}({args_str}): {doc_str}")
+        
+        logger.info(f"Formatted {len(keyword_docs)} keyword docs in compact format")
+        
+        # Combine core rules + predicted keywords
+        predicted_docs = '\n'.join(keyword_docs) if keyword_docs else 'No predicted keywords available'
+        
+        return f"""
+You are an expert Robot Framework developer using {self.library_context.library_name}.
+
+{core_rules}
+
+**RELEVANT KEYWORDS (from similar queries):**
+{predicted_docs}
+
+Use keyword_search tool if you need additional keywords.
+"""
+    
+    def get_agent_context(self, user_query: str, agent_role: str) -> str:
+        """
+        Get optimized context for an agent based on query and role.
+        
+        Implements 3-tier retrieval:
+        1. Core Rules (always)
+        2. Predicted Keywords OR Zero-Context + Tool
+        3. Full Context Fallback
+        
+        Args:
+            user_query: User's natural language query
+            agent_role: "planner", "assembler", or "validator"
+            
+        Returns:
+            Optimized context string with minimal, relevant keywords
+        """
+        # Tier 1: Always include core rules
+        core_rules = self._get_core_rules()
+        
+        logger.info(f"Building context for {agent_role} agent")
+        logger.debug(f"Core rules: {len(core_rules)} chars")
+        
+        # Tier 2: Try pattern learning for keyword prediction
+        try:
+            predicted_keywords = self.pattern_matcher.get_relevant_keywords(user_query)
+            
+            if predicted_keywords:
+                logger.info(f"Pattern learning predicted {len(predicted_keywords)} keywords")
+                
+                # Track pattern learning metrics
+                if self.metrics:
+                    self.metrics.track_pattern_learning(
+                        predicted=True,
+                        keyword_count=len(predicted_keywords),
+                        accuracy=0.0  # Accuracy will be calculated after execution
+                    )
+                
+                try:
+                    return self._format_predicted_context(predicted_keywords, agent_role, user_query)
+                except Exception as e:
+                    logger.warning(f"Failed to format predicted context: {e}, falling back to zero-context")
+            else:
+                logger.info("No predictions from pattern learning, using zero-context + tool")
+                
+                # Track that no prediction was used
+                if self.metrics:
+                    self.metrics.track_pattern_learning(
+                        predicted=False,
+                        keyword_count=0,
+                        accuracy=0.0
+                    )
+        except Exception as e:
+            logger.warning(f"Pattern learning failed: {e}, falling back to zero-context")
+            
+            # Track that prediction failed
+            if self.metrics:
+                self.metrics.track_pattern_learning(
+                    predicted=False,
+                    keyword_count=0,
+                    accuracy=0.0
+                )
+        
+        # Tier 2 Fallback: Zero-context + tool instructions
+        try:
+            return self._format_zero_context_with_tool(agent_role)
+        except Exception as e:
+            logger.error(f"Zero-context formatting failed: {e}, falling back to full context")
+        
+        # Tier 3: Full context fallback (baseline behavior)
+        logger.warning("Using full context as fallback - optimization failed")
+        return self._get_full_context_fallback(agent_role)
+    
+    def _get_full_context_fallback(self, agent_role: str) -> str:
+        """
+        Get full context as fallback when optimization fails.
+        
+        This ensures graceful degradation to baseline behavior.
+        
+        Args:
+            agent_role: "planner", "assembler", or "validator"
+            
+        Returns:
+            Full context string from library_context
+        """
+        logger.info(f"Fallback to full context for {agent_role} agent")
+        
+        if agent_role == "planner":
+            return self.library_context.planning_context
+        elif agent_role == "identifier":
+            # Element identifier doesn't need keyword context, just minimal guidance
+            return "Expert web element locator. Use batch_browser_automation tool to find all elements in one call."
+        elif agent_role == "assembler":
+            return self.library_context.code_assembly_context
+        elif agent_role == "validator":
+            return self.library_context.validation_context
+        else:
+            # Default to code assembly context
+            logger.warning(f"Unknown agent role '{agent_role}', using code_assembly_context")
+            return self.library_context.code_assembly_context
+    
+    def get_keyword_search_tool(self) -> KeywordSearchTool:
+        """
+        Get keyword search tool for agents.
+        
+        Returns:
+            KeywordSearchTool instance configured for this library
+        """
+        return KeywordSearchTool(
+            library_name=self.library_context.library_name,
+            vector_store=self.vector_store,
+            metrics=self.metrics
+        )
+    
+    def learn_from_execution(self, user_query: str, generated_code: str):
+        """
+        Learn from successful execution.
+        
+        Args:
+            user_query: Original user query
+            generated_code: Successfully generated Robot Framework code
+        """
+        try:
+            self.pattern_matcher.learn_from_execution(user_query, generated_code)
+            logger.info(f"Learned pattern from query: {user_query[:50]}...")
+        except Exception as e:
+            logger.error(f"Failed to learn from execution: {e}")
diff --git a/src/backend/crew_ai/tasks.py b/src/backend/crew_ai/tasks.py
index 980c936..5f637b0 100644
--- a/src/backend/crew_ai/tasks.py
+++ b/src/backend/crew_ai/tasks.py
@@ -29,22 +29,20 @@ def __init__(self, library_context=None, workflow_id: str = ""):
         self.workflow_id = workflow_id
 
     def _get_keyword_guidelines(self) -> str:
-        """Get keyword guidelines from library context or use defaults."""
+        """Get MINIMAL keyword guidelines for planning phase."""
         if self.library_context:
-            # Use dynamic keywords from library context
+            # Use minimal planning context instead of detailed keywords
             return self.library_context.planning_context
         else:
-            # Fallback to basic guidelines (backward compatibility)
+            # Fallback to minimal guidance
             return """
-            *   `Open Browser`: For starting a new browser session.
-            *   `Input Text`: For typing text into input fields.
-            *   `Press Keys`: For pressing keyboard keys (e.g., ENTER, TAB, ESC).
-            *   `Click Element`: For clicking buttons, links, etc.
-            *   `Get Text`: For retrieving text from an element.
-            *   `Close Browser`: For ending the test session.
+            Available action types:
+            • Browser Management: Opening/closing browsers
+            • Element Interaction: Clicking, inputting text
+            • Data Extraction: Getting text from elements
+            • Keyboard Actions: Pressing keys
             
-            --- SEARCH OPTIMIZATION ---
-            *   For search operations: Use `Press Keys` with `RETURN` after `Input Text`.
+            Focus on HIGH-LEVEL steps. Code Assembler handles details.
             """
 
     def _get_code_structure_template(self) -> str:
diff --git a/src/backend/requirements.txt b/src/backend/requirements.txt
index cea7429..19791e7 100644
--- a/src/backend/requirements.txt
+++ b/src/backend/requirements.txt
@@ -23,4 +23,12 @@ langchain-ollama
 browser_use==0.7.10
 robotframework-browser[bb]
 playwright
-browser-service>=1.0.0
\ No newline at end of file
+browser-service>=1.0.0
+
+# ChromaDB Performance Optimization Dependencies (Requirement 7.1)
+# chromadb: Vector database for semantic keyword search and pattern learning storage
+chromadb==0.4.22
+# sentence-transformers: Generate embeddings for semantic similarity search
+sentence-transformers==2.2.2
+# numpy: Required by sentence-transformers for vector operations and similarity calculations
+numpy==1.24.3
\ No newline at end of file
diff --git a/src/backend/services/workflow_service.py b/src/backend/services/workflow_service.py
index 5586b91..6c55636 100644
--- a/src/backend/services/workflow_service.py
+++ b/src/backend/services/workflow_service.py
@@ -78,7 +78,7 @@ def run_agentic_workflow(natural_language_query: str, model_provider: str, model
         
         # Run CrewAI workflow (this takes most of the time - 10-15 seconds)
         # User sees progress messages above while this runs
-        validation_output, crew_with_results = run_crew(
+        validation_output, crew_with_results, optimization_metrics = run_crew(
             natural_language_query, model_provider, model_name, library_type=None, workflow_id=workflow_id)
         
         # Stage 3: Generating (50-75%)
@@ -446,10 +446,14 @@ async def stream_generate_only(user_query: str, model_provider: str, model_name:
     logging.info("✅ Test generation complete. Ready for user review.")
 
 
-async def stream_execute_only(robot_code: str) -> Generator[str, None, None]:
+async def stream_execute_only(robot_code: str, user_query: str = None) -> Generator[str, None, None]:
     """
     Executes provided Robot Framework test code in Docker container.
     Accepts user-edited or manually-written code.
+    
+    Args:
+        robot_code: Robot Framework test code to execute
+        user_query: Optional original user query for pattern learning
     """
     if not robot_code or not robot_code.strip():
         yield f"data: {json.dumps({'stage': 'execution', 'status': 'error', 'message': 'No test code provided'})}\n\n"
@@ -481,6 +485,39 @@ async def stream_execute_only(robot_code: str) -> Generator[str, None, None]:
         logging.info(f"🚀 Executing test: {test_filename}")
         result = run_test_in_container(client, run_id, test_filename)
         yield f"data: {json.dumps({'stage': 'execution', **result})}\n\n"
+        
+        # Pattern learning: ONLY learn from PASSED tests
+        # This ensures we only learn from validated, working code
+        if result.get('test_status') == 'passed':
+            if user_query:
+                try:
+                    from src.backend.core.config import settings
+                    if settings.OPTIMIZATION_ENABLED:
+                        # Initialize optimization components to learn from this successful execution
+                        from src.backend.crew_ai.optimization import SmartKeywordProvider, QueryPatternMatcher, KeywordVectorStore
+                        from src.backend.crew_ai.library_context import get_library_context
+                        
+                        logging.info("📚 Test PASSED - Learning from successful execution...")
+                        
+                        # Initialize components
+                        library_context = get_library_context(settings.ROBOT_LIBRARY)
+                        chroma_store = KeywordVectorStore(persist_directory=settings.OPTIMIZATION_CHROMA_DB_PATH)
+                        pattern_matcher = QueryPatternMatcher(db_path=settings.OPTIMIZATION_PATTERN_DB_PATH, chroma_store=chroma_store)
+                        smart_provider = SmartKeywordProvider(
+                            library_context=library_context,
+                            pattern_matcher=pattern_matcher,
+                            vector_store=chroma_store
+                        )
+                        
+                        # Learn from the successful execution
+                        smart_provider.learn_from_execution(user_query, robot_code)
+                        logging.info("✅ Pattern learning completed - learned from PASSED test")
+                except Exception as e:
+                    logging.warning(f"⚠️ Failed to learn from execution: {e}")
+            else:
+                logging.info("⏭️  Test PASSED but skipping pattern learning - no user query provided")
+        else:
+            logging.info(f"⏭️  Skipping pattern learning - test status: {result.get('test_status', 'unknown')}")
 
     except (ConnectionError, RuntimeError, Exception) as e:
         logging.error(f"An error occurred during Docker execution: {e}")
@@ -552,6 +589,36 @@ async def stream_generate_and_run(user_query: str, model_provider: str, model_na
         logging.info(f"🚀 Executing test: {test_filename}")
         result = run_test_in_container(client, run_id, test_filename)
         yield f"data: {json.dumps({'stage': 'execution', **result})}\n\n"
+        
+        # Pattern learning: ONLY learn from PASSED tests
+        # This ensures we only learn from validated, working code
+        if result.get('test_status') == 'passed':
+            try:
+                from src.backend.core.config import settings
+                if settings.OPTIMIZATION_ENABLED:
+                    # Initialize optimization components to learn from this successful execution
+                    from src.backend.crew_ai.optimization import SmartKeywordProvider, QueryPatternMatcher, KeywordVectorStore
+                    from src.backend.crew_ai.library_context import get_library_context
+                    
+                    logging.info("📚 Test PASSED - Learning from successful execution...")
+                    
+                    # Initialize components
+                    library_context = get_library_context(settings.ROBOT_LIBRARY)
+                    chroma_store = KeywordVectorStore(persist_directory=settings.OPTIMIZATION_CHROMA_DB_PATH)
+                    pattern_matcher = QueryPatternMatcher(db_path=settings.OPTIMIZATION_PATTERN_DB_PATH, chroma_store=chroma_store)
+                    smart_provider = SmartKeywordProvider(
+                        library_context=library_context,
+                        pattern_matcher=pattern_matcher,
+                        vector_store=chroma_store
+                    )
+                    
+                    # Learn from the successful execution
+                    smart_provider.learn_from_execution(user_query, robot_code)
+                    logging.info("✅ Pattern learning completed - learned from PASSED test")
+            except Exception as e:
+                logging.warning(f"⚠️ Failed to learn from execution: {e}")
+        else:
+            logging.info(f"⏭️  Skipping pattern learning - test status: {result.get('test_status', 'unknown')}")
 
     except (ConnectionError, RuntimeError, Exception) as e:
         logging.error(f"An error occurred during Docker execution: {e}")
diff --git a/src/frontend/script.js b/src/frontend/script.js
index 6964cc4..3d6c2be 100644
--- a/src/frontend/script.js
+++ b/src/frontend/script.js
@@ -23,6 +23,9 @@ document.addEventListener('DOMContentLoaded', () => {
     let hasGeneratedCode = false;
     let hasExecutedCode = false;
     
+    // Store the original user query for pattern learning
+    let currentUserQuery = null;
+    
     // Track manual collapse/expand state
     let generationLogsManualState = null; // null = auto, true = expanded, false = collapsed
     let executionLogsManualState = null; // null = auto, true = expanded, false = collapsed
@@ -381,6 +384,9 @@ document.addEventListener('DOMContentLoaded', () => {
         generationLogsManualState = null;
         executionLogsManualState = null;
         
+        // Clear stored user query
+        currentUserQuery = null;
+        
         // Hide both log sections
         generationLogsSection.style.display = 'none';
         executionLogsSection.style.display = 'none';
@@ -527,6 +533,9 @@ document.addEventListener('DOMContentLoaded', () => {
             }
         }
         
+        // Store the user query for pattern learning when executing
+        currentUserQuery = query;
+        
         updateButtonState(UIState.GENERATING);
         clearCode();
         generationLogsEl.innerHTML = '';
@@ -636,7 +645,8 @@ document.addEventListener('DOMContentLoaded', () => {
 
         try {
             const requestPayload = {
-                robot_code: code
+                robot_code: code,
+                user_query: currentUserQuery  // Pass the original query for pattern learning
             };
 
             const response = await fetch('/execute-test', {