diff --git a/cmd/prism-loadtest/cmd/serve.go b/cmd/prism-loadtest/cmd/serve.go
new file mode 100644
index 00000000..acbc42db
--- /dev/null
+++ b/cmd/prism-loadtest/cmd/serve.go
@@ -0,0 +1,103 @@
+package cmd
+
+import (
+	"context"
+	"fmt"
+	"os"
+	"os/signal"
+	"syscall"
+	"time"
+
+	"github.com/spf13/cobra"
+
+	"github.com/jrepp/prism-data-layer/cmd/prism-loadtest/server"
+)
+
+var (
+	servePort int // port the server is created with; bound to the --port flag (default 8091) in init
+)
+
+var serveCmd = &cobra.Command{ // "serve" subcommand; attached to rootCmd in init and executed by runServe
+	Use:   "serve",
+	Short: "Run prism-loadtest as a server with HTTP API and WebSocket streaming",
+	Long: `Start prism-loadtest in server mode, exposing:
+  - HTTP API for starting/stopping load tests
+  - WebSocket endpoint for real-time metrics streaming
+  - Embedded dashboard for visualization
+
+The server allows remote control of load tests and provides real-time
+metrics via WebSocket for D3-based visualizations.
+
+Example:
+  # Start server on default port (8091)
+  prism-loadtest serve
+
+  # Start server on custom port
+  prism-loadtest serve --port 9000
+
+  # Access dashboard
+  open http://localhost:8091/dashboard
+
+API Endpoints:
+  POST   /api/loadtest/start      - Start a new load test
+  POST   /api/loadtest/stop/:id   - Stop a running test
+  GET    /api/loadtest/status/:id - Get test status
+  GET    /api/loadtest/list       - List all tests
+  WS     /ws/metrics/:id          - Stream metrics for test
+  GET    /dashboard               - Embedded dashboard UI
+`,
+	RunE: runServe,
+}
+
+func init() {
+	serveCmd.Flags().IntVar(&servePort, "port", 8091, "HTTP server port") // --port, defaulting to 8091
+	rootCmd.AddCommand(serveCmd)
+}
+
+// runServe starts the load-test server, then blocks until it fails or SIGINT/SIGTERM arrives and shuts it down within 10s.
+func runServe(cmd *cobra.Command, args []string) error {
+	fmt.Printf("Starting prism-loadtest server on port %d...\n", servePort)
+	fmt.Printf("Dashboard: http://localhost:%d/dashboard\n", servePort)
+	fmt.Printf("API:       http://localhost:%d/api/loadtest/...\n", servePort)
+	fmt.Printf("WebSocket: ws://localhost:%d/ws/metrics/:testId\n\n", servePort)
+
+	// Backend settings come from package-level variables declared outside this function.
+	backendConfig := server.BackendConfig{
+		RedisAddr:     redisAddr,
+		RedisPassword: redisPassword,
+		RedisDB:       redisDB,
+		NATSServers:   natsServers,
+	}
+	srv := server.NewServer(servePort, backendConfig)
+
+	// Run the server in the background; the buffer lets the goroutine finish even if nobody reads the error.
+	errChan := make(chan error, 1)
+	go func() {
+		if err := srv.Start(); err != nil {
+			errChan <- err
+		}
+	}()
+
+	// Wait for interrupt signal
+	sigChan := make(chan os.Signal, 1)
+	signal.Notify(sigChan, syscall.SIGINT, syscall.SIGTERM)
+
+	select {
+	case err := <-errChan:
+		return fmt.Errorf("server failed to start: %w", err)
+	case sig := <-sigChan:
+		// Stop intercepting signals so a second Ctrl-C during shutdown ends the process immediately.
+		signal.Stop(sigChan)
+		fmt.Printf("\nReceived signal %v, shutting down...\n", sig)
+	}
+
+	// Graceful shutdown
+	ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second)
+	defer cancel()
+
+	if err := srv.Shutdown(ctx); err != nil {
+		return fmt.Errorf("server shutdown failed: %w", err)
+	}
+	fmt.Println("Server stopped gracefully")
+	return nil
+}
diff --git a/cmd/prism-loadtest/server/dashboard.go b/cmd/prism-loadtest/server/dashboard.go
new file mode 100644
index 00000000..0748902e
--- /dev/null
+++ b/cmd/prism-loadtest/server/dashboard.go
@@ -0,0 +1,393 @@
+package server
+
+// dashboardHTML is the embedded dashboard
+const dashboardHTML = `<!DOCTYPE html>
+<html lang="en">
+<head>
+    <meta charset="UTF-8">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <title>Prism Load Test Dashboard</title>
+    <script src="https://d3js.org/d3.v7.min.js"></script>
+    <style>
+        * { margin: 0; padding: 0; box-sizing: border-box; }
+        body {
+            font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif;
+            background: #0a0a0a;
+            color: #e0e0e0;
+            padding: 20px;
+        }
+        .header {
+            text-align: center;
+            margin-bottom: 30px;
+            padding: 20px;
+            background: linear-gradient(135deg, #1e3a8a 0%, #3b82f6 100%);
+            border-radius: 10px;
+        }
+        h1 { color: #ffffff; font-size: 2.5em; margin-bottom: 10px; }
+        .subtitle { color: #cbd5e1; font-size: 1.2em; }
+        .controls {
+            display: grid;
+            grid-template-columns: repeat(auto-fit, minmax(200px, 1fr));
+            gap: 15px;
+            margin-bottom: 30px;
+            padding: 20px;
+            background: #1a1a1a;
+            border-radius: 10px;
+        }
+        .control-group {
+            display: flex;
+            flex-direction: column;
+            gap: 8px;
+        }
+        label {
+            font-size: 0.9em;
+            color: #94a3b8;
+            text-transform: uppercase;
+            letter-spacing: 0.5px;
+        }
+        input, select {
+            padding: 10px;
+            background: #2a2a2a;
+            border: 1px solid #404040;
+            border-radius: 5px;
+            color: #e0e0e0;
+            font-size: 1em;
+        }
+        button {
+            padding: 10px 25px;
+            background: #3b82f6;
+            color: white;
+            border: none;
+            border-radius: 5px;
+            cursor: pointer;
+            font-size: 1em;
+            font-weight: 600;
+            transition: all 0.3s;
+        }
+        button:hover { background: #2563eb; transform: translateY(-2px); }
+        button:disabled { background: #4a4a4a; cursor: not-allowed; transform: none; }
+        button.stop { background: #ef4444; }
+        button.stop:hover { background: #dc2626; }
+        .status-bar {
+            padding: 15px 20px;
+            background: #1a1a1a;
+            border-radius: 10px;
+            margin-bottom: 30px;
+            display: flex;
+            justify-content: space-between;
+            align-items: center;
+        }
+        .status-indicator { display: flex; align-items: center; gap: 10px; }
+        .status-dot {
+            width: 12px;
+            height: 12px;
+            border-radius: 50%;
+            background: #6b7280;
+        }
+        .status-dot.connected {
+            background: #10b981;
+            animation: pulse 2s infinite;
+        }
+        @keyframes pulse {
+            0%, 100% { opacity: 1; }
+            50% { opacity: 0.5; }
+        }
+        .metrics-cards {
+            display: grid;
+            grid-template-columns: repeat(auto-fit, minmax(200px, 1fr));
+            gap: 15px;
+            margin-bottom: 20px;
+        }
+        .metric-card {
+            background: #1a1a1a;
+            padding: 20px;
+            border-radius: 10px;
+            text-align: center;
+            border: 1px solid #2a2a2a;
+        }
+        .metric-label {
+            color: #94a3b8;
+            font-size: 0.9em;
+            margin-bottom: 10px;
+            text-transform: uppercase;
+            letter-spacing: 0.5px;
+        }
+        .metric-value {
+            color: #ffffff;
+            font-size: 2.5em;
+            font-weight: 700;
+        }
+        .metric-value.success { color: #10b981; }
+        .metric-value.error { color: #ef4444; }
+        .metric-value.info { color: #3b82f6; }
+        .charts {
+            display: grid;
+            grid-template-columns: repeat(auto-fit, minmax(500px, 1fr));
+            gap: 20px;
+        }
+        .chart-card {
+            background: #1a1a1a;
+            border-radius: 10px;
+            padding: 20px;
+            border: 1px solid #2a2a2a;
+        }
+        .chart-title { font-size: 1.2em; font-weight: 600; margin-bottom: 15px; }
+        .chart { width: 100%; height: 300px; }
+        .line { fill: none; stroke-width: 2px; }
+        .line-throughput { stroke: #3b82f6; }
+        .line-p50 { stroke: #10b981; }
+        .line-p95 { stroke: #f59e0b; }
+        .line-p99 { stroke: #ef4444; }
+        .axis path, .axis line { stroke: #404040; }
+        .axis text { fill: #94a3b8; font-size: 11px; }
+    </style>
+</head>
+<body>
+    <div class="header">
+        <h1>🚀 Prism Load Test Dashboard</h1>
+        <div class="subtitle">Real-Time Performance Monitoring</div>
+    </div>
+
+    <div class="controls">
+        <div class="control-group">
+            <label>Duration</label>
+            <input type="text" id="duration" value="60s">
+        </div>
+        <div class="control-group">
+            <label>Rate (req/sec)</label>
+            <input type="number" id="rate" value="100" min="1" max="10000">
+        </div>
+        <div class="control-group">
+            <label>Register %</label>
+            <input type="number" id="registerPct" value="50" min="0" max="100">
+        </div>
+        <div class="control-group">
+            <label>Enumerate %</label>
+            <input type="number" id="enumeratePct" value="30" min="0" max="100">
+        </div>
+        <div class="control-group">
+            <label>Multicast %</label>
+            <input type="number" id="multicastPct" value="20" min="0" max="100">
+        </div>
+        <div class="control-group" style="justify-content: flex-end;">
+            <button id="startBtn" onclick="startTest()">▶ Start Test</button>
+        </div>
+        <div class="control-group" style="justify-content: flex-end;">
+            <button id="stopBtn" onclick="stopTest()" class="stop" disabled>⏹ Stop Test</button>
+        </div>
+    </div>
+
+    <div class="status-bar">
+        <div class="status-indicator">
+            <div class="status-dot" id="statusDot"></div>
+            <span id="statusText">Disconnected</span>
+        </div>
+        <div id="testInfo" style="color: #94a3b8;"></div>
+    </div>
+
+    <div class="metrics-cards">
+        <div class="metric-card">
+            <div class="metric-label">Total Requests</div>
+            <div class="metric-value info" id="totalRequests">0</div>
+        </div>
+        <div class="metric-card">
+            <div class="metric-label">Throughput</div>
+            <div class="metric-value info" id="throughput">0</div>
+            <div style="font-size: 0.9em; color: #6b7280;">req/s</div>
+        </div>
+        <div class="metric-card">
+            <div class="metric-label">Success Rate</div>
+            <div class="metric-value success" id="successRate">100%</div>
+        </div>
+        <div class="metric-card">
+            <div class="metric-label">P50 Latency</div>
+            <div class="metric-value" id="latencyP50">0</div>
+            <div style="font-size: 0.9em; color: #6b7280;">ms</div>
+        </div>
+    </div>
+
+    <div class="charts">
+        <div class="chart-card">
+            <div class="chart-title">Throughput Over Time</div>
+            <div class="chart" id="throughputChart"></div>
+        </div>
+        <div class="chart-card">
+            <div class="chart-title">Latency Percentiles</div>
+            <div class="chart" id="latencyChart"></div>
+        </div>
+    </div>
+
+    <script>
+        let currentTestId = null; // id of the test started from this page, taken from the /api/loadtest/start reply
+        let ws = null; // WebSocket opened by connectWebSocket for the current test
+        let throughputData = []; // rolling series drawn by the throughput chart
+        let latencyData = []; // rolling series drawn by the latency chart
+
+        // Chart geometry: each SVG is 500x300 pixels; width and height are the plot area inside the margins.
+        const margin = {top: 20, right: 30, bottom: 30, left: 60};
+        const width = 500 - margin.left - margin.right;
+        const height = 300 - margin.top - margin.bottom;
+
+        // Builds an empty SVG chart inside the element with id containerId and labels its y axis with yLabel.
+        function createChart(containerId, yLabel) {
+            const svg = d3.select('#' + containerId)
+                .append('svg')
+                .attr('width', width + margin.left + margin.right)
+                .attr('height', height + margin.top + margin.bottom)
+                .append('g')
+                .attr('transform', 'translate(' + margin.left + ',' + margin.top + ')');
+            // Only the pixel ranges are set here; updateChart assigns the domains once data arrives.
+            const x = d3.scaleTime().range([0, width]);
+            const y = d3.scaleLinear().range([height, 0]);
+            // Empty axis groups; updateChart renders the axes into them on every refresh.
+            const xAxis = svg.append('g')
+                .attr('class', 'axis')
+                .attr('transform', 'translate(0,' + height + ')');
+            const yAxis = svg.append('g').attr('class', 'axis');
+            // Y-axis caption, rotated and centred along the axis.
+            svg.append('text')
+                .attr('transform', 'rotate(-90)')
+                .attr('y', -45)
+                .attr('x', -height / 2)
+                .attr('text-anchor', 'middle')
+                .style('fill', '#94a3b8')
+                .style('font-size', '12px')
+                .text(yLabel);
+            return {svg, x, y, xAxis, yAxis};
+        }
+
+        const throughputChart = createChart('throughputChart', 'req/sec');
+        const latencyChart = createChart('latencyChart', 'ms');
+
+        async function startTest() {
+            const config = {
+                mix: 'mixed',
+                duration: document.getElementById('duration').value,
+                rate: parseInt(document.getElementById('rate').value),
+                register_pct: parseInt(document.getElementById('registerPct').value),
+                enumerate_pct: parseInt(document.getElementById('enumeratePct').value),
+                multicast_pct: parseInt(document.getElementById('multicastPct').value)
+            };
+
+            try {
+                const response = await fetch('/api/loadtest/start', {
+                    method: 'POST',
+                    headers: {'Content-Type': 'application/json'},
+                    body: JSON.stringify(config)
+                });
+
+                const data = await response.json();
+                currentTestId = data.test_id;
+
+                document.getElementById('testInfo').textContent = 'Test: ' + currentTestId;
+                document.getElementById('startBtn').disabled = true;
+                document.getElementById('stopBtn').disabled = false;
+
+                // Clear data
+                throughputData = [];
+                latencyData = [];
+
+                // Connect WebSocket
+                connectWebSocket(currentTestId);
+
+            } catch (error) {
+                console.error('Failed to start test:', error);
+                alert('Failed to start test: ' + error.message);
+            }
+        }
+
+        // Asks the server to stop the current test; does nothing when no test has been started from this page.
+        async function stopTest() {
+            if (!currentTestId) return;
+            try {
+                await fetch('/api/loadtest/stop/' + currentTestId, {method: 'POST'});
+                document.getElementById('stopBtn').disabled = true;
+            } catch (error) {
+                console.error('Failed to stop test:', error);
+            }
+        }
+
+        // Opens the metrics stream for testId on the page's own host, using wss: when the page was loaded over https:.
+        function connectWebSocket(testId) {
+            const protocol = window.location.protocol === 'https:' ? 'wss:' : 'ws:';
+            ws = new WebSocket(protocol + '//' + window.location.host + '/ws/metrics/' + testId);
+            ws.onopen = () => {
+                document.getElementById('statusDot').classList.add('connected');
+                document.getElementById('statusText').textContent = 'Connected';
+            };
+            // Every message is one JSON metrics snapshot.
+            ws.onmessage = (event) => {
+                const metrics = JSON.parse(event.data);
+                updateMetrics(metrics);
+            };
+            // A closed socket resets the controls so a new test can be started.
+            ws.onclose = () => {
+                document.getElementById('statusDot').classList.remove('connected');
+                document.getElementById('statusText').textContent = 'Disconnected';
+                document.getElementById('startBtn').disabled = false;
+                document.getElementById('stopBtn').disabled = true;
+            };
+        }
+
+        // Applies one metrics snapshot: refreshes the summary cards, appends a chart point and redraws both charts.
+        function updateMetrics(metrics) {
+            document.getElementById('totalRequests').textContent = metrics.total_requests || 0;
+            document.getElementById('throughput').textContent = (metrics.throughput || 0).toFixed(1);
+            document.getElementById('latencyP50').textContent = (metrics.latency_p50 || 0).toFixed(2);
+            // Recomputed from the two counters; the message's own success_rate field is not read here.
+            const successRate = metrics.total_requests > 0
+                ? ((metrics.total_requests - metrics.failed_requests) / metrics.total_requests * 100).toFixed(1)
+                : 100;
+            document.getElementById('successRate').textContent = successRate + '%';
+
+            // Add to time series; the same point object is pushed onto both series
+            const dataPoint = {
+                timestamp: new Date(metrics.timestamp),
+                throughput: metrics.throughput || 0,
+                latency_p50: metrics.latency_p50 || 0,
+                latency_p95: metrics.latency_p95 || 0,
+                latency_p99: metrics.latency_p99 || 0
+            };
+
+            throughputData.push(dataPoint);
+            latencyData.push(dataPoint);
+
+            // Keep last 60 points
+            if (throughputData.length > 60) throughputData.shift();
+            if (latencyData.length > 60) latencyData.shift();
+            updateChart(throughputChart, throughputData, ['throughput']);
+            updateChart(latencyChart, latencyData, ['latency_p50', 'latency_p95', 'latency_p99']);
+        }
+
+        function updateChart(chart, data, metrics) {
+            if (!data || data.length === 0) return;
+
+            chart.x.domain(d3.extent(data, d => d.timestamp));
+            const yMax = d3.max(data, d => Math.max(...metrics.map(m => d[m] || 0)));
+            chart.y.domain([0, yMax * 1.1]);
+
+            chart.xAxis.call(d3.axisBottom(chart.x).ticks(6).tickFormat(d3.timeFormat('%H:%M:%S')));
+            chart.yAxis.call(d3.axisLeft(chart.y).ticks(5));
+
+            metrics.forEach(metric => {
+                const className = 'line-' + metric.replace('_', '-');
+                chart.svg.selectAll('.' + className).remove();
+
+                const line = d3.line()
+                    .x(d => chart.x(d.timestamp))
+                    .y(d => chart.y(d[metric] || 0))
+                    .curve(d3.curveMonotoneX);
+
+                chart.svg.append('path')
+                    .datum(data)
+                    .attr('class', 'line ' + className)
+                    .attr('d', line);
+            });
+        }
+
+        window.addEventListener('beforeunload', () => {
+            if (ws) ws.close();
+        });
+    </script>
+</body>
+</html>`
diff --git a/cmd/prism-loadtest/server/executor.go b/cmd/prism-loadtest/server/executor.go
new file mode 100644
index 00000000..40c7d7f0
--- /dev/null
+++ b/cmd/prism-loadtest/server/executor.go
@@ -0,0 +1,414 @@
+package server
+
+import (
+	"context"
+	"encoding/json"
+	"fmt"
+	"math/rand"
+	"sync"
+	"sync/atomic"
+	"time"
+
+	"github.com/gorilla/websocket"
+	"golang.org/x/time/rate"
+
+	"github.com/jrepp/prism-data-layer/patterns/multicast_registry"
+	"github.com/jrepp/prism-data-layer/patterns/multicast_registry/backends"
+)
+
+// TestExecutor runs one load test and streams aggregated metrics to the WebSocket clients added via AddClient.
+type TestExecutor struct {
+	testID        string
+	config        TestConfig
+	backendConfig BackendConfig
+	status        string
+	startedAt     time.Time
+	stoppedAt     *time.Time
+
+	// Per-operation outcome and latency collectors; collectMetrics merges them into one snapshot
+	registerMetrics  *MetricsCollector
+	enumerateMetrics *MetricsCollector
+	multicastMetrics *MetricsCollector
+
+	// Counts of operations launched per type; identityCounter numbers the identities that register creates
+	registerCount   atomic.Int64
+	enumerateCount  atomic.Int64
+	multicastCount  atomic.Int64
+	identityCounter atomic.Int64
+
+	// WebSocket clients; clientsMu guards the slice and is held while broadcast writes to each connection
+	clients   []*websocket.Conn
+	clientsMu sync.RWMutex
+
+	// Control: Stop closes stopChan at most once (stopped is the latch); mu guards status and stoppedAt
+	stopChan chan struct{}
+	stopped  atomic.Bool
+	mu       sync.RWMutex
+}
+
+// MetricsMessage is the JSON snapshot sent to WebSocket clients: Throughput is total requests per second since the test started, latencies are in milliseconds, and SuccessRate is a percentage.
+type MetricsMessage struct {
+	Timestamp      time.Time `json:"timestamp"`
+	Throughput     float64   `json:"throughput"`
+	LatencyP50     float64   `json:"latency_p50"`
+	LatencyP95     float64   `json:"latency_p95"`
+	LatencyP99     float64   `json:"latency_p99"`
+	SuccessRate    float64   `json:"success_rate"`
+	TotalRequests  int64     `json:"total_requests"`
+	FailedRequests int64     `json:"failed_requests"`
+}
+
+// NewTestExecutor builds an executor for testID that begins in the "running" state, stamped with the current time.
+func NewTestExecutor(testID string, config TestConfig, backendConfig BackendConfig) *TestExecutor {
+	exec := new(TestExecutor)
+	exec.testID = testID
+	exec.config = config
+	exec.backendConfig = backendConfig
+	exec.status = "running"
+	exec.startedAt = time.Now()
+	exec.registerMetrics = NewMetricsCollector()
+	exec.enumerateMetrics = NewMetricsCollector()
+	exec.multicastMetrics = NewMetricsCollector()
+	exec.stopChan = make(chan struct{})
+	exec.clients = make([]*websocket.Conn, 0)
+	return exec
+}
+
+// Run executes the test until its duration elapses or Stop is called, then records "completed" or "failed" and closes all clients.
+func (e *TestExecutor) Run() {
+	failed := false // set on setup errors so the finalizer below reports "failed" instead of "completed"
+	defer func() {
+		e.mu.Lock()
+		e.status = "completed"
+		if failed {
+			e.status = "failed"
+		}
+		now := time.Now()
+		e.stoppedAt = &now
+		e.mu.Unlock()
+
+		// Close all WebSocket connections
+		e.closeAllClients()
+	}()
+
+	// Parse duration
+	duration, err := time.ParseDuration(e.config.Duration)
+	if err != nil {
+		fmt.Printf("Test %s: invalid duration %q: %v\n", e.testID, e.config.Duration, err)
+		failed = true
+		return
+	}
+
+	// Setup coordinator
+	coordinator, err := e.setupCoordinator()
+	if err != nil {
+		fmt.Printf("Failed to setup coordinator: %v\n", err)
+		failed = true
+		return
+	}
+	defer coordinator.Close()
+
+	// The timeout context bounds the whole test; workers and the broadcaster share it
+	ctx, cancel := context.WithTimeout(context.Background(), duration)
+	defer cancel()
+
+	// Start metrics broadcaster; it exits when ctx ends or Stop closes stopChan
+	go e.broadcastMetrics(ctx)
+
+	// Run load test (blocks until the test ends and in-flight workers have finished)
+	e.runLoadTest(ctx, coordinator)
+	fmt.Printf("Test %s completed\n", e.testID)
+}
+
+// runLoadTest issues rate-limited operations until ctx ends or Stop is called, then waits for in-flight workers.
+func (e *TestExecutor) runLoadTest(ctx context.Context, coordinator *multicast_registry.Coordinator) {
+	pacer := rate.NewLimiter(rate.Limit(e.config.Rate), e.config.Rate)
+	dice := rand.New(rand.NewSource(time.Now().UnixNano()))
+
+	// Whatever ends the loop, in-flight workers are drained before returning.
+	var inFlight sync.WaitGroup
+	defer inFlight.Wait()
+
+	for {
+		// Non-blocking poll: leave as soon as the context is done or Stop has closed stopChan.
+		select {
+		case <-ctx.Done():
+			return
+		case <-e.stopChan:
+			return
+		default:
+		}
+
+		// Rate limit
+		if pacer.Wait(ctx) != nil {
+			return
+		}
+
+		// Map a roll in [0,100) onto the configured mix; rolls past register+enumerate become multicasts.
+		var operation string
+		switch roll := dice.Intn(100); {
+		case roll < e.config.RegisterPct:
+			operation = "register"
+		case roll < e.config.RegisterPct+e.config.EnumeratePct:
+			operation = "enumerate"
+		default:
+			operation = "multicast"
+		}
+
+		// Launch worker
+		inFlight.Add(1)
+		go func(op string) {
+			defer inFlight.Done()
+
+			// The per-type counter is bumped before the operation is issued.
+			switch op {
+			case "register":
+				e.registerCount.Add(1)
+				e.executeRegister(ctx, coordinator)
+			case "enumerate":
+				e.enumerateCount.Add(1)
+				e.executeEnumerate(ctx, coordinator)
+			case "multicast":
+				e.multicastCount.Add(1)
+				e.executeMulticast(ctx, coordinator)
+			}
+		}(operation)
+	}
+}
+
+// executeRegister registers a freshly numbered identity with a 300s TTL and records the outcome and latency.
+func (e *TestExecutor) executeRegister(ctx context.Context, coordinator *multicast_registry.Coordinator) {
+	seq := e.identityCounter.Add(1)
+	identity := fmt.Sprintf("loadtest-user-%d", seq)
+	metadata := map[string]any{
+		"status":    "online",
+		"loadtest":  true,
+		"timestamp": time.Now().Unix(),
+		"worker_id": seq % 100,
+	}
+
+	// Only the coordinator call itself is timed.
+	began := time.Now()
+	err := coordinator.Register(ctx, identity, metadata, 300*time.Second)
+	elapsed := time.Since(began)
+
+	if err != nil {
+		e.registerMetrics.RecordFailure()
+		return
+	}
+	e.registerMetrics.RecordSuccess(elapsed)
+}
+
+// executeEnumerate enumerates identities filtered on status "online" and records the outcome and latency.
+func (e *TestExecutor) executeEnumerate(ctx context.Context, coordinator *multicast_registry.Coordinator) {
+	onlineOnly := multicast_registry.NewFilter(map[string]any{"status": "online"})
+
+	// The enumerated result is discarded; only the outcome and the call's duration are recorded.
+	began := time.Now()
+	_, err := coordinator.Enumerate(ctx, onlineOnly)
+	elapsed := time.Since(began)
+
+	if err != nil {
+		e.enumerateMetrics.RecordFailure()
+		return
+	}
+
+	e.enumerateMetrics.RecordSuccess(elapsed)
+}
+
+// executeMulticast multicasts a small JSON payload using a status "online" filter and records the outcome and latency.
+func (e *TestExecutor) executeMulticast(ctx context.Context, coordinator *multicast_registry.Coordinator) {
+	onlineOnly := multicast_registry.NewFilter(map[string]any{"status": "online"})
+	// The payload is stamped with the current Unix time.
+	payload := fmt.Appendf(nil, `{"type":"loadtest","timestamp":%d}`, time.Now().Unix())
+
+	// The multicast result is discarded; only the outcome and the call's duration are recorded.
+	began := time.Now()
+	_, err := coordinator.Multicast(ctx, onlineOnly, payload)
+	elapsed := time.Since(began)
+
+	if err != nil {
+		e.multicastMetrics.RecordFailure()
+		return
+	}
+
+	e.multicastMetrics.RecordSuccess(elapsed)
+}
+
+// setupCoordinator builds a coordinator backed by a Redis registry backend and a NATS messaging backend.
+func (e *TestExecutor) setupCoordinator() (*multicast_registry.Coordinator, error) {
+	// Start from the package defaults, then apply the load-test settings.
+	cfg := multicast_registry.DefaultConfig()
+	cfg.DefaultTTL = 300 * time.Second
+	cfg.MaxIdentities = 1000000 // Allow large number for load testing
+
+	// Create Redis registry backend
+	registry, err := backends.NewRedisRegistryBackend(
+		e.backendConfig.RedisAddr,
+		e.backendConfig.RedisPassword,
+		e.backendConfig.RedisDB,
+		"loadtest:",
+	)
+	if err != nil {
+		return nil, fmt.Errorf("failed to create Redis backend: %w", err)
+	}
+
+	// Create NATS messaging backend; on failure the registry backend opened above is closed.
+	messaging, err := backends.NewNATSMessagingBackend(e.backendConfig.NATSServers)
+	if err != nil {
+		registry.Close()
+		return nil, fmt.Errorf("failed to create NATS backend: %w", err)
+	}
+
+	// Create coordinator; on failure both backends are closed before returning.
+	coordinator, err := multicast_registry.NewCoordinator(cfg, registry, messaging, nil)
+	if err != nil {
+		registry.Close()
+		messaging.Close()
+		return nil, fmt.Errorf("failed to create coordinator: %w", err)
+	}
+
+	return coordinator, nil
+}
+
+// broadcastMetrics sends a metrics snapshot to the WebSocket clients once per second until ctx ends or Stop is called.
+func (e *TestExecutor) broadcastMetrics(ctx context.Context) {
+	tick := time.NewTicker(time.Second)
+	defer tick.Stop()
+
+	for {
+		select {
+		case <-tick.C:
+			// Take a snapshot and fan it out in one step.
+			e.broadcast(e.collectMetrics())
+		case <-e.stopChan:
+			return
+		case <-ctx.Done():
+			return
+		}
+	}
+}
+
+// collectMetrics aggregates current metrics
+func (e *TestExecutor) collectMetrics() MetricsMessage {
+	// Combine metrics from all operations
+	combined := NewMetricsCollector()
+
+	e.registerMetrics.Mu.Lock()
+	combined.TotalRequests += e.registerMetrics.TotalRequests
+	combined.SuccessfulReqs += e.registerMetrics.SuccessfulReqs
+	combined.FailedReqs += e.registerMetrics.FailedReqs
+	combined.TotalLatencyNs += e.registerMetrics.TotalLatencyNs
+	for bucket, count := range e.registerMetrics.LatencyBuckets {
+		combined.LatencyBuckets[bucket] += count
+	}
+	e.registerMetrics.Mu.Unlock()
+
+	e.enumerateMetrics.Mu.Lock()
+	combined.TotalRequests += e.enumerateMetrics.TotalRequests
+	combined.SuccessfulReqs += e.enumerateMetrics.SuccessfulReqs
+	combined.FailedReqs += e.enumerateMetrics.FailedReqs
+	combined.TotalLatencyNs += e.enumerateMetrics.TotalLatencyNs
+	for bucket, count := range e.enumerateMetrics.LatencyBuckets {
+		combined.LatencyBuckets[bucket] += count
+	}
+	e.enumerateMetrics.Mu.Unlock()
+
+	e.multicastMetrics.Mu.Lock()
+	combined.TotalRequests += e.multicastMetrics.TotalRequests
+	combined.SuccessfulReqs += e.multicastMetrics.SuccessfulReqs
+	combined.FailedReqs += e.multicastMetrics.FailedReqs
+	combined.TotalLatencyNs += e.multicastMetrics.TotalLatencyNs
+	for bucket, count := range e.multicastMetrics.LatencyBuckets {
+		combined.LatencyBuckets[bucket] += count
+	}
+	e.multicastMetrics.Mu.Unlock()
+
+	// Calculate metrics
+	elapsed := time.Since(e.startedAt)
+	throughput := float64(combined.TotalRequests) / elapsed.Seconds()
+	successRate := float64(100)
+	if combined.TotalRequests > 0 {
+		successRate = float64(combined.SuccessfulReqs) / float64(combined.TotalRequests) * 100
+	}
+
+	p50, p95, p99 := combined.CalculatePercentiles()
+
+	return MetricsMessage{
+		Timestamp:      time.Now(),
+		Throughput:     throughput,
+		LatencyP50:     float64(p50.Microseconds()) / 1000.0, // Convert to ms
+		LatencyP95:     float64(p95.Microseconds()) / 1000.0,
+		LatencyP99:     float64(p99.Microseconds()) / 1000.0,
+		SuccessRate:    successRate,
+		TotalRequests:  combined.TotalRequests,
+		FailedRequests: combined.FailedReqs,
+	}
+}
+
+// broadcast sends metrics to all connected WebSocket clients
+func (e *TestExecutor) broadcast(metrics MetricsMessage) {
+	e.clientsMu.Lock()
+	defer e.clientsMu.Unlock()
+
+	if len(e.clients) == 0 {
+		return
+	}
+
+	data, err := json.Marshal(metrics)
+	if err != nil {
+		return
+	}
+
+	// Send to all clients, removing dead ones
+	activeClients := make([]*websocket.Conn, 0, len(e.clients))
+	for _, client := range e.clients {
+		if err := client.WriteMessage(websocket.TextMessage, data); err != nil {
+			// Remove dead client
+			client.Close()
+		} else {
+			activeClients = append(activeClients, client)
+		}
+	}
+	e.clients = activeClients
+}
+
+// AddClient registers conn so that subsequent broadcasts are written to it.
+func (e *TestExecutor) AddClient(conn *websocket.Conn) {
+	e.clientsMu.Lock()
+	e.clients = append(e.clients, conn)
+	e.clientsMu.Unlock()
+}
+
+// closeAllClients closes every registered WebSocket connection and empties the client list.
+func (e *TestExecutor) closeAllClients() {
+	e.clientsMu.Lock()
+	defer e.clientsMu.Unlock()
+
+	for i := range e.clients {
+		e.clients[i].Close()
+	}
+	e.clients = nil
+}
+
+// Stop asks the test to end by closing stopChan; repeated calls are no-ops.
+func (e *TestExecutor) Stop() {
+	// Only the caller that flips stopped from false to true closes the channel.
+	if e.stopped.CompareAndSwap(false, true) {
+		close(e.stopChan)
+	}
+}
+
+// GetInfo returns test information
+func (e *TestExecutor) GetInfo() TestInfo {
+	e.mu.RLock()
+	defer e.mu.RUnlock()
+
+	return TestInfo{
+		TestID:    e.testID,
+		Status:    e.status,
+		StartedAt: e.startedAt,
+		StoppedAt: e.stoppedAt,
+		Config:    e.config,
+	}
+}
diff --git a/cmd/prism-loadtest/server/server.go b/cmd/prism-loadtest/server/server.go
new file mode 100644
index 00000000..138126dc
--- /dev/null
+++ b/cmd/prism-loadtest/server/server.go
@@ -0,0 +1,292 @@
+package server
+
+import (
+	"context"
+	"encoding/json"
+	"fmt"
+	"net/http"
+	"sync"
+	"time"
+
+	"github.com/gorilla/mux"
+	"github.com/gorilla/websocket"
+)
+
+// Server manages the HTTP API and WebSocket connections for load testing.
+type Server struct {
+	port          int                      // TCP port the HTTP server listens on
+	backendConfig BackendConfig            // handed to every TestExecutor created by handleStartTest
+	httpServer    *http.Server             // nil until Start is called
+	router        *mux.Router              // routes are registered in setupRoutes
+	tests         map[string]*TestExecutor // executors keyed by test ID
+	testsMu       sync.RWMutex             // guards tests
+	upgrader      websocket.Upgrader       // upgrades /ws/metrics requests to WebSocket
+}
+
+// BackendConfig holds configuration for backend connections.
+type BackendConfig struct {
+	RedisAddr     string   // presumably host:port of the Redis server — confirm against the executor
+	RedisPassword string   // presumably empty when Redis auth is disabled — confirm
+	RedisDB       int      // NOTE(review): looks like the Redis logical database index — confirm
+	NATSServers   []string // NOTE(review): looks like a list of NATS server URLs — confirm
+}
+
+// TestConfig is the JSON request body accepted by the start endpoint.
+type TestConfig struct {
+	Mix          string `json:"mix"`           // workload mix: "mixed", "register", etc.; "" defaults to "mixed"
+	Duration     string `json:"duration"`      // duration string such as "60s" or "5m"; "" defaults to "60s"
+	Rate         int    `json:"rate"`          // target requests per second; 0 defaults to 100
+	RegisterPct  int    `json:"register_pct"`  // 0-100
+	EnumeratePct int    `json:"enumerate_pct"` // 0-100
+	MulticastPct int    `json:"multicast_pct"` // 0-100
+}
+
+// TestInfo is the JSON description of a test returned by the API handlers.
+type TestInfo struct {
+	TestID    string     `json:"test_id"`              // ID assigned by handleStartTest
+	Status    string     `json:"status"`               // e.g. "running"
+	StartedAt time.Time  `json:"started_at"`           // when the test was started
+	StoppedAt *time.Time `json:"stopped_at,omitempty"` // nil (omitted from JSON) while unset
+	Config    TestConfig `json:"config"`               // configuration the test runs with
+}
+
+// NewServer builds a Server for the given port and backend configuration with a
+// fresh router and an empty test registry, then registers all HTTP routes.
+// The WebSocket upgrader accepts requests from any Origin.
+func NewServer(port int, backendConfig BackendConfig) *Server {
+	// Allow all origins for now
+	allowAnyOrigin := func(*http.Request) bool { return true }
+
+	srv := &Server{
+		port:          port,
+		backendConfig: backendConfig,
+		router:        mux.NewRouter(),
+		tests:         map[string]*TestExecutor{},
+		upgrader:      websocket.Upgrader{CheckOrigin: allowAnyOrigin},
+	}
+	srv.setupRoutes()
+	return srv
+}
+
+// setupRoutes installs the middleware chain and registers the load-test API,
+// WebSocket, and dashboard handlers on the server's router.
+func (s *Server) setupRoutes() {
+	// CORS headers are applied first, then request logging.
+	s.router.Use(corsMiddleware, loggingMiddleware)
+
+	// REST API. OPTIONS is accepted on every endpoint so that CORS preflight
+	// requests match a route and reach corsMiddleware.
+	api := s.router.PathPrefix("/api/loadtest").Subrouter()
+	api.HandleFunc("/start", s.handleStartTest).Methods(http.MethodPost, http.MethodOptions)
+	api.HandleFunc("/stop/{testId}", s.handleStopTest).Methods(http.MethodPost, http.MethodOptions)
+	api.HandleFunc("/status/{testId}", s.handleGetStatus).Methods(http.MethodGet, http.MethodOptions)
+	api.HandleFunc("/list", s.handleListTests).Methods(http.MethodGet, http.MethodOptions)
+
+	// Metrics stream; this route carries no method restriction.
+	s.router.HandleFunc("/ws/metrics/{testId}", s.handleWebSocket)
+	// The dashboard is served at both /dashboard and the site root.
+	s.router.HandleFunc("/dashboard", s.handleDashboard).Methods(http.MethodGet)
+	s.router.HandleFunc("/", s.handleDashboard).Methods(http.MethodGet)
+}
+
+// handleStartTest decodes a TestConfig from the JSON request body, fills in
+// defaults for omitted fields, registers a new TestExecutor under a generated
+// ID, starts it in a background goroutine, and replies 201 with its TestInfo.
+// Malformed JSON or a negative rate is rejected with 400 invalid_request.
+func (s *Server) handleStartTest(w http.ResponseWriter, r *http.Request) {
+	var config TestConfig
+	if err := json.NewDecoder(r.Body).Decode(&config); err != nil {
+		sendError(w, "invalid_request", "Failed to parse request body", http.StatusBadRequest)
+		return
+	}
+	// A negative rate can never be honoured; reject it here rather than hand
+	// it to the background goroutine, where no error can reach the client.
+	if config.Rate < 0 {
+		sendError(w, "invalid_request", "rate must not be negative", http.StatusBadRequest)
+		return
+	}
+
+	// Apply defaults for fields the client left unset
+	if config.Mix == "" {
+		config.Mix = "mixed"
+	}
+	if config.Duration == "" {
+		config.Duration = "60s"
+	}
+	if config.Rate == 0 {
+		config.Rate = 100
+	}
+
+	// Generate test ID with nanosecond precision to avoid collisions
+	testID := fmt.Sprintf("test-%d", time.Now().UnixNano())
+	executor := NewTestExecutor(testID, config, s.backendConfig)
+
+	s.testsMu.Lock()
+	s.tests[testID] = executor
+	s.testsMu.Unlock()
+
+	// Run in the background so the response is not held until the test ends
+	go executor.Run()
+
+	// Reply with a freshly built TestInfo that reports the test as running
+	info := TestInfo{TestID: testID, Status: "running", StartedAt: time.Now(), Config: config}
+	sendJSON(w, info, http.StatusCreated)
+}
+
+// handleStopTest stops the test named by the {testId} path variable and
+// responds with its TestInfo, or 404 not_found when no such test is registered.
+func (s *Server) handleStopTest(w http.ResponseWriter, r *http.Request) {
+	id := mux.Vars(r)["testId"]
+
+	s.testsMu.RLock()
+	target, found := s.tests[id]
+	s.testsMu.RUnlock()
+
+	if !found {
+		sendError(w, "not_found", "Test not found", http.StatusNotFound)
+		return
+	}
+
+	// Stop only closes the stop channel, so the snapshot read right after it
+	// may presumably still carry the previous status.
+	target.Stop()
+	sendJSON(w, target.GetInfo(), http.StatusOK)
+}
+
+// handleGetStatus responds with the TestInfo of the test named by the {testId}
+// path variable, or 404 not_found when no such test is registered.
+func (s *Server) handleGetStatus(w http.ResponseWriter, r *http.Request) {
+	id := mux.Vars(r)["testId"]
+
+	// Hold the read lock only for the map lookup, not while writing the reply.
+	s.testsMu.RLock()
+	target, found := s.tests[id]
+	s.testsMu.RUnlock()
+
+	if found {
+		sendJSON(w, target.GetInfo(), http.StatusOK)
+		return
+	}
+	// Unknown test ID
+	sendError(w, "not_found", "Test not found", http.StatusNotFound)
+}
+
+// handleListTests responds with a JSON array holding the TestInfo of every
+// registered test, in unspecified (map) order; an empty registry yields [].
+func (s *Server) handleListTests(w http.ResponseWriter, r *http.Request) {
+	// Snapshot under the read lock, but write the response after releasing it.
+	s.testsMu.RLock()
+	tests := make([]TestInfo, 0, len(s.tests))
+	for _, executor := range s.tests {
+		tests = append(tests, executor.GetInfo())
+	}
+	s.testsMu.RUnlock()
+	sendJSON(w, tests, http.StatusOK)
+}
+
+// handleWebSocket upgrades the request and subscribes the connection to the
+// metrics of the {testId} test; an unknown test gets a 404 before any upgrade.
+func (s *Server) handleWebSocket(w http.ResponseWriter, r *http.Request) {
+	testID := mux.Vars(r)["testId"]
+	s.testsMu.RLock()
+	executor, ok := s.tests[testID]
+	s.testsMu.RUnlock()
+	if !ok {
+		http.Error(w, "Test not found", http.StatusNotFound)
+		return
+	}
+	conn, err := s.upgrader.Upgrade(w, r, nil) // replies with an HTTP error itself on failure
+	if err != nil {
+		fmt.Printf("WebSocket upgrade failed: %v\n", err)
+		return
+	}
+	executor.AddClient(conn)
+	go func() { // drain inbound frames so close/ping control messages are processed
+		var readErr error
+		for readErr == nil {
+			_, _, readErr = conn.NextReader()
+		}
+		conn.Close() // peer is gone or the connection was closed elsewhere
+	}()
+	fmt.Printf("WebSocket client connected for test %s\n", testID)
+}
+
+// handleDashboard serves the embedded dashboard HTML; a failed write is ignored.
+func (s *Server) handleDashboard(w http.ResponseWriter, r *http.Request) {
+	w.Header().Set("Content-Type", "text/html")
+	_, _ = w.Write([]byte(dashboardHTML))
+}
+
+// Start builds the http.Server for the configured port and blocks serving
+// requests until ListenAndServe returns; its error is returned unchanged.
+func (s *Server) Start() error {
+	srv := &http.Server{
+		Addr:         fmt.Sprintf(":%d", s.port),
+		Handler:      s.router,
+		ReadTimeout:  15 * time.Second,
+		WriteTimeout: 15 * time.Second,
+		IdleTimeout:  60 * time.Second,
+	}
+	s.httpServer = srv // stored so Shutdown can reach it
+
+	fmt.Printf("Server listening on %s\n", srv.Addr)
+	return srv.ListenAndServe()
+}
+
+// Shutdown stops every registered test and then shuts down the HTTP server,
+// if Start created one, passing ctx through to http.Server.Shutdown.
+func (s *Server) Shutdown(ctx context.Context) error {
+	// Signal all executors before the HTTP server is shut down.
+	s.testsMu.Lock()
+	for id := range s.tests {
+		s.tests[id].Stop()
+	}
+	s.testsMu.Unlock()
+
+	if s.httpServer == nil {
+		return nil // Start was never called
+	}
+	return s.httpServer.Shutdown(ctx)
+}
+
+// sendJSON writes data as a JSON body with the given status code. The status
+// line is already sent when encoding runs, so a failure can only be logged.
+func sendJSON(w http.ResponseWriter, data interface{}, statusCode int) {
+	w.Header().Set("Content-Type", "application/json")
+	w.WriteHeader(statusCode)
+	if err := json.NewEncoder(w).Encode(data); err != nil {
+		fmt.Printf("sendJSON: encode response: %v\n", err)
+	}
+}
+
+// sendError replies with status code and a JSON body of the form
+// {"error": errorType, "message": message, "code": code}.
+func sendError(w http.ResponseWriter, errorType, message string, code int) {
+	body := map[string]interface{}{"error": errorType, "message": message, "code": code}
+	sendJSON(w, body, code)
+}
+
+// corsMiddleware sets permissive CORS headers on every response and answers
+// OPTIONS requests with 200 without invoking the next handler.
+func corsMiddleware(next http.Handler) http.Handler {
+	return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
+		hdr := w.Header()
+		hdr.Set("Access-Control-Allow-Origin", "*")
+		hdr.Set("Access-Control-Allow-Methods", "GET, POST, OPTIONS")
+		hdr.Set("Access-Control-Allow-Headers", "Content-Type")
+		if r.Method != http.MethodOptions {
+			next.ServeHTTP(w, r)
+			return
+		}
+		w.WriteHeader(http.StatusOK)
+	})
+}
+
+// loggingMiddleware prints each request's method, path, and handling time.
+func loggingMiddleware(next http.Handler) http.Handler {
+	return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
+		began := time.Now()
+		next.ServeHTTP(w, r)
+		fmt.Printf("%s %s %v\n", r.Method, r.URL.Path, time.Since(began))
+	})
+}