diff --git a/internal/launcher/connection_pool.go b/internal/launcher/connection_pool.go
index 68ff9a94..a4d2cedb 100644
--- a/internal/launcher/connection_pool.go
+++ b/internal/launcher/connection_pool.go
@@ -20,12 +20,12 @@ type ConnectionKey struct {
 
 // ConnectionMetadata tracks information about a pooled connection
 type ConnectionMetadata struct {
-	Connection  *mcp.Connection
-	CreatedAt   time.Time
-	LastUsedAt  time.Time
+	Connection   *mcp.Connection
+	CreatedAt    time.Time
+	LastUsedAt   time.Time
 	RequestCount int
-	ErrorCount  int
-	State       ConnectionState
+	ErrorCount   int
+	State        ConnectionState
 }
 
 // ConnectionState represents the state of a pooled connection
@@ -39,21 +39,22 @@ const (
 
 // Default configuration values
 const (
-	DefaultIdleTimeout    = 30 * time.Minute
+	DefaultIdleTimeout     = 30 * time.Minute
 	DefaultCleanupInterval = 5 * time.Minute
 	DefaultMaxErrorCount   = 10
 )
 
 // SessionConnectionPool manages connections keyed by (backend, session)
 type SessionConnectionPool struct {
-	connections      map[ConnectionKey]*ConnectionMetadata
-	mu               sync.RWMutex
-	ctx              context.Context
-	idleTimeout      time.Duration
-	cleanupInterval  time.Duration
-	maxErrorCount    int
-	cleanupTicker    *time.Ticker
-	cleanupDone      chan bool
+	connections     map[ConnectionKey]*ConnectionMetadata
+	mu              sync.RWMutex
+	ctx             context.Context
+	cancel          context.CancelFunc // cancel function to stop cleanup goroutine
+	idleTimeout     time.Duration
+	cleanupInterval time.Duration
+	maxErrorCount   int
+	cleanupTicker   *time.Ticker
+	cleanupDone     chan bool
 }
 
 // PoolConfig configures the connection pool
@@ -76,26 +77,31 @@ func NewSessionConnectionPool(ctx context.Context) *SessionConnectionPool {
 func NewSessionConnectionPoolWithConfig(ctx context.Context, config PoolConfig) *SessionConnectionPool {
 	logPool.Printf("Creating new session connection pool: idleTimeout=%v, cleanupInterval=%v, maxErrors=%d",
 		config.IdleTimeout, config.CleanupInterval, config.MaxErrorCount)
-	
+
+	// Create a cancellable context derived from the parent context
+	// This allows Stop() to signal the cleanup goroutine to exit
+	poolCtx, cancel := context.WithCancel(ctx)
+
 	pool := &SessionConnectionPool{
 		connections:     make(map[ConnectionKey]*ConnectionMetadata),
-		ctx:             ctx,
+		ctx:             poolCtx,
+		cancel:          cancel,
 		idleTimeout:     config.IdleTimeout,
 		cleanupInterval: config.CleanupInterval,
 		maxErrorCount:   config.MaxErrorCount,
 		cleanupDone:     make(chan bool),
 	}
-	
+
 	// Start cleanup goroutine
 	pool.startCleanup()
-	
+
 	return pool
 }
 
 // startCleanup starts the periodic cleanup goroutine
 func (p *SessionConnectionPool) startCleanup() {
 	p.cleanupTicker = time.NewTicker(p.cleanupInterval)
-	
+
 	go func() {
 		logPool.Print("Cleanup goroutine started")
 		for {
@@ -116,48 +122,48 @@ func (p *SessionConnectionPool) startCleanup() {
 func (p *SessionConnectionPool) cleanupIdleConnections() {
 	p.mu.Lock()
 	defer p.mu.Unlock()
-	
+
 	now := time.Now()
 	removed := 0
-	
+
 	for key, metadata := range p.connections {
 		shouldRemove := false
 		reason := ""
-		
+
 		// Check if idle for too long
 		if now.Sub(metadata.LastUsedAt) > p.idleTimeout {
 			shouldRemove = true
 			reason = "idle timeout"
 		}
-		
+
 		// Check if too many errors
 		if metadata.ErrorCount >= p.maxErrorCount {
 			shouldRemove = true
 			reason = "too many errors"
 		}
-		
+
 		// Check if already closed
 		if metadata.State == ConnectionStateClosed {
 			shouldRemove = true
 			reason = "already closed"
 		}
-		
+
 		if shouldRemove {
 			logPool.Printf("Cleaning up connection: backend=%s, session=%s, reason=%s, idle=%v, errors=%d",
 				key.BackendID, key.SessionID, reason, now.Sub(metadata.LastUsedAt), metadata.ErrorCount)
-			
+
 			// Close the connection if still active
 			if metadata.Connection != nil && metadata.State != ConnectionStateClosed {
 				// Note: mcp.Connection doesn't have a Close method in current implementation
 				// but we mark it as closed
 				metadata.State = ConnectionStateClosed
 			}
-			
+
 			delete(p.connections, key)
 			removed++
 		}
 	}
-	
+
 	if removed > 0 {
 		logPool.Printf("Cleanup complete: removed %d idle/failed connections, active=%d", removed, len(p.connections))
 	}
@@ -166,30 +172,35 @@ func (p *SessionConnectionPool) cleanupIdleConnections() {
 // Stop gracefully shuts down the connection pool
 func (p *SessionConnectionPool) Stop() {
 	logPool.Print("Stopping connection pool")
-	
-	// Stop cleanup goroutine
+
+	// Stop cleanup goroutine by cancelling the context
+	if p.cancel != nil {
+		p.cancel()
+	}
+
+	// Stop cleanup ticker
 	if p.cleanupTicker != nil {
 		p.cleanupTicker.Stop()
 	}
-	
-	// Wait for cleanup to finish
+
+	// Wait for cleanup goroutine to finish (should be immediate now that context is cancelled)
 	select {
 	case <-p.cleanupDone:
 		logPool.Print("Cleanup goroutine stopped")
-	case <-time.After(5 * time.Second):
+	case <-time.After(1 * time.Second):
 		logPool.Print("Cleanup goroutine stop timeout")
 	}
-	
+
 	// Close all connections
 	p.mu.Lock()
 	defer p.mu.Unlock()
-	
+
 	for key, metadata := range p.connections {
 		logPool.Printf("Closing connection: backend=%s, session=%s", key.BackendID, key.SessionID)
 		metadata.State = ConnectionStateClosed
 		delete(p.connections, key)
 	}
-	
+
 	logPool.Print("Connection pool stopped")
 }
 
@@ -200,7 +211,7 @@ func (p *SessionConnectionPool) Get(backendID, sessionID string) (*mcp.Connectio
 
 	key := ConnectionKey{BackendID: backendID, SessionID: sessionID}
 	metadata, exists := p.connections[key]
-	
+
 	if !exists {
 		logPool.Printf("Connection not found: backend=%s, session=%s", backendID, sessionID)
 		return nil, false
@@ -211,9 +222,9 @@ func (p *SessionConnectionPool) Get(backendID, sessionID string) (*mcp.Connectio
 		return nil, false
 	}
 
-	logPool.Printf("Reusing connection: backend=%s, session=%s, requests=%d", 
+	logPool.Printf("Reusing connection: backend=%s, session=%s, requests=%d",
 		backendID, sessionID, metadata.RequestCount)
-	
+
 	// Update last used time and state (need write lock for this)
 	p.mu.RUnlock()
 	p.mu.Lock()
@@ -232,7 +243,7 @@ func (p *SessionConnectionPool) Set(backendID, sessionID string, conn *mcp.Conne
 	defer p.mu.Unlock()
 
 	key := ConnectionKey{BackendID: backendID, SessionID: sessionID}
-	
+
 	// Check if connection already exists
 	if existing, exists := p.connections[key]; exists {
 		logPool.Printf("Updating existing connection: backend=%s, session=%s", backendID, sessionID)
@@ -262,7 +273,7 @@ func (p *SessionConnectionPool) Delete(backendID, sessionID string) {
 	defer p.mu.Unlock()
 
 	key := ConnectionKey{BackendID: backendID, SessionID: sessionID}
-	
+
 	if metadata, exists := p.connections[key]; exists {
 		metadata.State = ConnectionStateClosed
 		delete(p.connections, key)
@@ -295,7 +306,7 @@ func (p *SessionConnectionPool) RecordError(backendID, sessionID string) {
 	key := ConnectionKey{BackendID: backendID, SessionID: sessionID}
 	if metadata, exists := p.connections[key]; exists {
 		metadata.ErrorCount++
-		logPool.Printf("Recorded error for connection: backend=%s, session=%s, errors=%d", 
+		logPool.Printf("Recorded error for connection: backend=%s, session=%s, errors=%d",
 			backendID, sessionID, metadata.ErrorCount)
 	}
 }
diff --git a/internal/launcher/connection_pool_test.go b/internal/launcher/connection_pool_test.go
index 810b1403..b99986b9 100644
--- a/internal/launcher/connection_pool_test.go
+++ b/internal/launcher/connection_pool_test.go
@@ -13,7 +13,7 @@ import (
 func TestNewSessionConnectionPool(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
-	
+
 	require.NotNil(t, pool)
 	assert.NotNil(t, pool.connections)
 	assert.Equal(t, 0, pool.Size())
@@ -22,21 +22,21 @@ func TestNewSessionConnectionPool(t *testing.T) {
 func TestConnectionPoolSetAndGet(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
-	
+
 	// Create a mock connection
 	mockConn := &mcp.Connection{}
-	
+
 	// Set a connection
 	pool.Set("backend1", "session1", mockConn)
-	
+
 	// Verify size
 	assert.Equal(t, 1, pool.Size())
-	
+
 	// Get the connection
 	conn, exists := pool.Get("backend1", "session1")
 	assert.True(t, exists)
 	assert.Equal(t, mockConn, conn)
-	
+
 	// Verify metadata was created
 	metadata, found := pool.GetMetadata("backend1", "session1")
 	assert.True(t, found)
@@ -48,7 +48,7 @@ func TestConnectionPoolSetAndGet(t *testing.T) {
 func TestConnectionPoolGetNonExistent(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
-	
+
 	// Try to get non-existent connection
 	conn, exists := pool.Get("backend1", "session1")
 	assert.False(t, exists)
@@ -58,17 +58,17 @@ func TestConnectionPoolGetNonExistent(t *testing.T) {
 func TestConnectionPoolDelete(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
-	
+
 	mockConn := &mcp.Connection{}
 	pool.Set("backend1", "session1", mockConn)
-	
+
 	assert.Equal(t, 1, pool.Size())
-	
+
 	// Delete the connection
 	pool.Delete("backend1", "session1")
-	
+
 	assert.Equal(t, 0, pool.Size())
-	
+
 	// Verify it's no longer accessible
 	conn, exists := pool.Get("backend1", "session1")
 	assert.False(t, exists)
@@ -78,27 +78,27 @@ func TestConnectionPoolDelete(t *testing.T) {
 func TestConnectionPoolMultipleConnections(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
-	
+
 	conn1 := &mcp.Connection{}
 	conn2 := &mcp.Connection{}
 	conn3 := &mcp.Connection{}
-	
+
 	// Add multiple connections with different backend/session combinations
 	pool.Set("backend1", "session1", conn1)
 	pool.Set("backend1", "session2", conn2)
 	pool.Set("backend2", "session1", conn3)
-	
+
 	assert.Equal(t, 3, pool.Size())
-	
+
 	// Verify each connection is retrievable
 	c1, exists := pool.Get("backend1", "session1")
 	assert.True(t, exists)
 	assert.Equal(t, conn1, c1)
-	
+
 	c2, exists := pool.Get("backend1", "session2")
 	assert.True(t, exists)
 	assert.Equal(t, conn2, c2)
-	
+
 	c3, exists := pool.Get("backend2", "session1")
 	assert.True(t, exists)
 	assert.Equal(t, conn3, c3)
@@ -107,54 +107,54 @@ func TestConnectionPoolMultipleConnections(t *testing.T) {
 func TestConnectionPoolUpdateExisting(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
-	
+
 	conn1 := &mcp.Connection{}
 	conn2 := &mcp.Connection{}
-	
+
 	// Set initial connection
 	pool.Set("backend1", "session1", conn1)
-	
+
 	// Get metadata
 	metadata1, _ := pool.GetMetadata("backend1", "session1")
 	createdAt1 := metadata1.CreatedAt
 	lastUsed1 := metadata1.LastUsedAt
-	
+
 	// Wait a bit to ensure time difference
 	time.Sleep(10 * time.Millisecond)
-	
+
 	// Update with new connection
 	pool.Set("backend1", "session1", conn2)
-	
+
 	// Verify size didn't change
 	assert.Equal(t, 1, pool.Size())
-	
+
 	// Verify connection was updated
 	conn, exists := pool.Get("backend1", "session1")
 	assert.True(t, exists)
 	assert.Equal(t, conn2, conn)
-	
+
 	// Verify metadata
 	metadata2, _ := pool.GetMetadata("backend1", "session1")
-	assert.Equal(t, createdAt1, metadata2.CreatedAt) // Created time should remain same
+	assert.Equal(t, createdAt1, metadata2.CreatedAt)                                               // Created time should remain same
 	assert.True(t, metadata2.LastUsedAt.After(lastUsed1) || metadata2.LastUsedAt.Equal(lastUsed1)) // Last used should update or be equal
 }
 
 func TestConnectionPoolRequestCount(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
-	
+
 	mockConn := &mcp.Connection{}
 	pool.Set("backend1", "session1", mockConn)
-	
+
 	// Get metadata before any Get calls
 	metadata, _ := pool.GetMetadata("backend1", "session1")
 	assert.Equal(t, 0, metadata.RequestCount)
-	
+
 	// Call Get multiple times
 	pool.Get("backend1", "session1")
 	pool.Get("backend1", "session1")
 	pool.Get("backend1", "session1")
-	
+
 	// Verify request count increased
 	metadata, _ = pool.GetMetadata("backend1", "session1")
 	assert.Equal(t, 3, metadata.RequestCount)
@@ -163,18 +163,18 @@ func TestConnectionPoolRequestCount(t *testing.T) {
 func TestConnectionPoolRecordError(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
-	
+
 	mockConn := &mcp.Connection{}
 	pool.Set("backend1", "session1", mockConn)
-	
+
 	// Initial error count should be 0
 	metadata, _ := pool.GetMetadata("backend1", "session1")
 	assert.Equal(t, 0, metadata.ErrorCount)
-	
+
 	// Record errors
 	pool.RecordError("backend1", "session1")
 	pool.RecordError("backend1", "session1")
-	
+
 	// Verify error count increased
 	metadata, _ = pool.GetMetadata("backend1", "session1")
 	assert.Equal(t, 2, metadata.ErrorCount)
@@ -183,18 +183,18 @@ func TestConnectionPoolRecordError(t *testing.T) {
 func TestConnectionPoolList(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
-	
+
 	// Empty pool
 	keys := pool.List()
 	assert.Empty(t, keys)
-	
+
 	// Add connections
 	pool.Set("backend1", "session1", &mcp.Connection{})
 	pool.Set("backend2", "session2", &mcp.Connection{})
-	
+
 	keys = pool.List()
 	assert.Len(t, keys, 2)
-	
+
 	// Verify keys are present (order may vary)
 	keyStrings := make([]string, len(keys))
 	for i, key := range keys {
@@ -209,17 +209,17 @@ func TestConnectionKeyString(t *testing.T) {
 		BackendID: "test-backend",
 		SessionID: "test-session",
 	}
-	
+
 	assert.Equal(t, "test-backend/test-session", key.String())
 }
 
 func TestConnectionPoolConcurrency(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
-	
+
 	mockConn := &mcp.Connection{}
 	pool.Set("backend1", "session1", mockConn)
-	
+
 	// Run concurrent Get operations
 	done := make(chan bool)
 	for i := 0; i < 10; i++ {
@@ -230,12 +230,12 @@ func TestConnectionPoolConcurrency(t *testing.T) {
 			done <- true
 		}()
 	}
-	
+
 	// Wait for all goroutines
 	for i := 0; i < 10; i++ {
 		<-done
 	}
-	
+
 	// Verify metadata (should be 1000 requests)
 	metadata, exists := pool.GetMetadata("backend1", "session1")
 	assert.True(t, exists)
@@ -245,10 +245,10 @@ func TestConnectionPoolConcurrency(t *testing.T) {
 func TestConnectionPoolDeleteNonExistent(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
-	
+
 	// Delete non-existent connection (should not panic)
 	pool.Delete("backend1", "session1")
-	
+
 	assert.Equal(t, 0, pool.Size())
 }
 
@@ -256,17 +256,17 @@ func TestConnectionStateTransitions(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
 	defer pool.Stop()
-	
+
 	mockConn := &mcp.Connection{}
 	pool.Set("backend1", "session1", mockConn)
-	
+
 	// Initial state should be Active
 	metadata, _ := pool.GetMetadata("backend1", "session1")
 	assert.Equal(t, ConnectionStateActive, metadata.State)
-	
+
 	// Delete marks as Closed and removes
 	pool.Delete("backend1", "session1")
-	
+
 	// After delete, connection should not exist
 	_, exists := pool.GetMetadata("backend1", "session1")
 	assert.False(t, exists)
@@ -276,7 +276,7 @@ func TestPoolConfigDefaults(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
 	defer pool.Stop()
-	
+
 	assert.NotNil(t, pool)
 	assert.Equal(t, DefaultIdleTimeout, pool.idleTimeout)
 	assert.Equal(t, DefaultCleanupInterval, pool.cleanupInterval)
@@ -292,7 +292,7 @@ func TestPoolConfigCustom(t *testing.T) {
 	}
 	pool := NewSessionConnectionPoolWithConfig(ctx, config)
 	defer pool.Stop()
-	
+
 	assert.Equal(t, config.IdleTimeout, pool.idleTimeout)
 	assert.Equal(t, config.CleanupInterval, pool.cleanupInterval)
 	assert.Equal(t, config.MaxErrorCount, pool.maxErrorCount)
@@ -307,16 +307,16 @@ func TestConnectionIdleCleanup(t *testing.T) {
 	}
 	pool := NewSessionConnectionPoolWithConfig(ctx, config)
 	defer pool.Stop()
-	
+
 	mockConn := &mcp.Connection{}
 	pool.Set("backend1", "session1", mockConn)
-	
+
 	// Connection should exist initially
 	assert.Equal(t, 1, pool.Size())
-	
+
 	// Wait for idle timeout + cleanup interval
 	time.Sleep(100 * time.Millisecond)
-	
+
 	// Connection should be cleaned up
 	assert.Equal(t, 0, pool.Size())
 }
@@ -330,21 +330,21 @@ func TestConnectionErrorCleanup(t *testing.T) {
 	}
 	pool := NewSessionConnectionPoolWithConfig(ctx, config)
 	defer pool.Stop()
-	
+
 	mockConn := &mcp.Connection{}
 	pool.Set("backend1", "session1", mockConn)
-	
+
 	// Record multiple errors
 	pool.RecordError("backend1", "session1")
 	pool.RecordError("backend1", "session1")
 	pool.RecordError("backend1", "session1")
-	
+
 	// Connection should still exist
 	assert.Equal(t, 1, pool.Size())
-	
+
 	// Wait for cleanup
 	time.Sleep(50 * time.Millisecond)
-	
+
 	// Connection should be cleaned up due to errors
 	assert.Equal(t, 0, pool.Size())
 }
@@ -352,16 +352,16 @@ func TestConnectionErrorCleanup(t *testing.T) {
 func TestPoolStop(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
-	
+
 	// Add some connections
 	pool.Set("backend1", "session1", &mcp.Connection{})
 	pool.Set("backend2", "session2", &mcp.Connection{})
-	
+
 	assert.Equal(t, 2, pool.Size())
-	
+
 	// Stop the pool
 	pool.Stop()
-	
+
 	// All connections should be removed
 	assert.Equal(t, 0, pool.Size())
 }
@@ -370,14 +370,14 @@ func TestConnectionStateActive(t *testing.T) {
 	ctx := context.Background()
 	pool := NewSessionConnectionPool(ctx)
 	defer pool.Stop()
-	
+
 	mockConn := &mcp.Connection{}
 	pool.Set("backend1", "session1", mockConn)
-	
+
 	// After Set, state should be Active
 	metadata, _ := pool.GetMetadata("backend1", "session1")
 	assert.Equal(t, ConnectionStateActive, metadata.State)
-	
+
 	// After Get, state should remain Active
 	pool.Get("backend1", "session1")
 	metadata, _ = pool.GetMetadata("backend1", "session1")
@@ -393,16 +393,16 @@ func TestConnectionCleanupWithActivity(t *testing.T) {
 	}
 	pool := NewSessionConnectionPoolWithConfig(ctx, config)
 	defer pool.Stop()
-	
+
 	mockConn := &mcp.Connection{}
 	pool.Set("backend1", "session1", mockConn)
-	
+
 	// Keep connection active by using it
 	for i := 0; i < 5; i++ {
 		time.Sleep(40 * time.Millisecond)
 		pool.Get("backend1", "session1") // This updates LastUsedAt
 	}
-	
+
 	// Connection should still exist because it was active
 	assert.Equal(t, 1, pool.Size())
 }
diff --git a/internal/launcher/launcher.go b/internal/launcher/launcher.go
index 252163f1..729a44b7 100644
--- a/internal/launcher/launcher.go
+++ b/internal/launcher/launcher.go
@@ -21,8 +21,8 @@ var logLauncher = logger.New("launcher:launcher")
 type Launcher struct {
 	ctx                context.Context
 	config             *config.Config
-	connections        map[string]*mcp.Connection  // Single connections per backend (stateless/HTTP)
-	sessionPool        *SessionConnectionPool       // Session-aware connections (stateful/stdio)
+	connections        map[string]*mcp.Connection // Single connections per backend (stateless/HTTP)
+	sessionPool        *SessionConnectionPool     // Session-aware connections (stateful/stdio)
 	mu                 sync.RWMutex
 	runningInContainer bool
 }
@@ -194,7 +194,7 @@ func GetOrLaunchForSession(l *Launcher, serverID, sessionID string) (*mcp.Connec
 	l.mu.RLock()
 	serverCfg, ok := l.config.Servers[serverID]
 	l.mu.RUnlock()
-	
+
 	if !ok {
 		logger.LogError("backend", "Backend server not found in config: %s", serverID)
 		return nil, fmt.Errorf("server '%s' not found in config", serverID)
@@ -317,7 +317,7 @@ func (l *Launcher) Close() {
 		conn.Close()
 	}
 	l.connections = make(map[string]*mcp.Connection)
-	
+
 	// Stop session pool and close all session connections
 	if l.sessionPool != nil {
 		logLauncher.Printf("Stopping session connection pool")
diff --git a/internal/launcher/launcher_test.go b/internal/launcher/launcher_test.go
index 69f9207c..164c01bc 100644
--- a/internal/launcher/launcher_test.go
+++ b/internal/launcher/launcher_test.go
@@ -451,26 +451,26 @@ func TestClose(t *testing.T) {
 }
 
 func TestGetOrLaunchForSession_HTTPBackend(t *testing.T) {
-// HTTP backends should use regular GetOrLaunch (stateless)
-mockServer := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
-response := map[string]interface{}{
-"jsonrpc": "2.0",
-"id":      1,
-"result": map[string]interface{}{
-"protocolVersion": "2024-11-05",
-"capabilities":    map[string]interface{}{},
-"serverInfo": map[string]interface{}{
-"name":    "http-test",
-"version": "1.0.0",
-},
-},
-}
-w.Header().Set("Content-Type", "application/json")
-json.NewEncoder(w).Encode(response)
-}))
-defer mockServer.Close()
+	// HTTP backends should use regular GetOrLaunch (stateless)
+	mockServer := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
+		response := map[string]interface{}{
+			"jsonrpc": "2.0",
+			"id":      1,
+			"result": map[string]interface{}{
+				"protocolVersion": "2024-11-05",
+				"capabilities":    map[string]interface{}{},
+				"serverInfo": map[string]interface{}{
+					"name":    "http-test",
+					"version": "1.0.0",
+				},
+			},
+		}
+		w.Header().Set("Content-Type", "application/json")
+		json.NewEncoder(w).Encode(response)
+	}))
+	defer mockServer.Close()
 
-jsonConfig := fmt.Sprintf(`{
+	jsonConfig := fmt.Sprintf(`{
 "mcpServers": {
 "http-backend": {
 "type": "http",
@@ -484,53 +484,53 @@ jsonConfig := fmt.Sprintf(`{
 }
 }`, mockServer.URL)
 
-cfg := loadConfigFromJSON(t, jsonConfig)
-ctx := context.Background()
-l := New(ctx, cfg)
-defer l.Close()
+	cfg := loadConfigFromJSON(t, jsonConfig)
+	ctx := context.Background()
+	l := New(ctx, cfg)
+	defer l.Close()
 
-// Get connection for two different sessions
-conn1, err := GetOrLaunchForSession(l, "http-backend", "session1")
-require.NoError(t, err)
-require.NotNil(t, conn1)
+	// Get connection for two different sessions
+	conn1, err := GetOrLaunchForSession(l, "http-backend", "session1")
+	require.NoError(t, err)
+	require.NotNil(t, conn1)
 
-conn2, err := GetOrLaunchForSession(l, "http-backend", "session2")
-require.NoError(t, err)
-require.NotNil(t, conn2)
+	conn2, err := GetOrLaunchForSession(l, "http-backend", "session2")
+	require.NoError(t, err)
+	require.NotNil(t, conn2)
 
-// For HTTP backends, both should return the same connection (stateless)
-assert.Equal(t, conn1, conn2, "HTTP backends should reuse same connection")
+	// For HTTP backends, both should return the same connection (stateless)
+	assert.Equal(t, conn1, conn2, "HTTP backends should reuse same connection")
 
-// Should be in regular connections map, not session pool
-assert.Equal(t, 1, len(l.connections), "Should have one connection in regular map")
-assert.Equal(t, 0, l.sessionPool.Size(), "Session pool should be empty for HTTP")
+	// Should be in regular connections map, not session pool
+	assert.Equal(t, 1, len(l.connections), "Should have one connection in regular map")
+	assert.Equal(t, 0, l.sessionPool.Size(), "Session pool should be empty for HTTP")
 }
 
 func TestGetOrLaunchForSession_SessionReuse(t *testing.T) {
-// Note: We can't fully test stdio backends without actual processes
-// This test verifies the session pool is consulted
-ctx := context.Background()
-cfg := &config.Config{
-Servers: map[string]*config.ServerConfig{},
-}
-l := New(ctx, cfg)
-defer l.Close()
+	// Note: We can't fully test stdio backends without actual processes
+	// This test verifies the session pool is consulted
+	ctx := context.Background()
+	cfg := &config.Config{
+		Servers: map[string]*config.ServerConfig{},
+	}
+	l := New(ctx, cfg)
+	defer l.Close()
 
-// Verify session pool was created
-assert.NotNil(t, l.sessionPool, "Session pool should be initialized")
+	// Verify session pool was created
+	assert.NotNil(t, l.sessionPool, "Session pool should be initialized")
 }
 
 func TestGetOrLaunchForSession_InvalidServer(t *testing.T) {
-ctx := context.Background()
-cfg := &config.Config{
-Servers: map[string]*config.ServerConfig{},
-}
-l := New(ctx, cfg)
-defer l.Close()
-
-// Try to get connection for non-existent server
-conn, err := GetOrLaunchForSession(l, "nonexistent", "session1")
-assert.Error(t, err)
-assert.Nil(t, conn)
-assert.Contains(t, err.Error(), "not found in config")
+	ctx := context.Background()
+	cfg := &config.Config{
+		Servers: map[string]*config.ServerConfig{},
+	}
+	l := New(ctx, cfg)
+	defer l.Close()
+
+	// Try to get connection for non-existent server
+	conn, err := GetOrLaunchForSession(l, "nonexistent", "session1")
+	assert.Error(t, err)
+	assert.Nil(t, conn)
+	assert.Contains(t, err.Error(), "not found in config")
 }
diff --git a/internal/mcp/connection.go b/internal/mcp/connection.go
index d6b457b2..a8c85875 100644
--- a/internal/mcp/connection.go
+++ b/internal/mcp/connection.go
@@ -81,6 +81,11 @@ func newMCPClient() *sdk.Client {
 
 // newHTTPConnection creates a new HTTP Connection struct with common fields
 func newHTTPConnection(ctx context.Context, cancel context.CancelFunc, client *sdk.Client, session *sdk.ClientSession, url string, headers map[string]string, httpClient *http.Client, transportType HTTPTransportType) *Connection {
+	// Extract session ID from SDK session if available
+	var sessionID string
+	if session != nil {
+		sessionID = session.ID()
+	}
 	return &Connection{
 		client:            client,
 		session:           session,
@@ -91,6 +96,7 @@ func newHTTPConnection(ctx context.Context, cancel context.CancelFunc, client *s
 		headers:           headers,
 		httpClient:        httpClient,
 		httpTransportType: transportType,
+		httpSessionID:     sessionID,
 	}
 }
 
diff --git a/internal/mcp/http_connection_test.go b/internal/mcp/http_connection_test.go
index 09ab72bb..85d04bfa 100644
--- a/internal/mcp/http_connection_test.go
+++ b/internal/mcp/http_connection_test.go
@@ -69,25 +69,17 @@ func TestNewHTTPConnection_WithCustomHeaders(t *testing.T) {
 	assert.Equal(1, serverCallCount, "Should only attempt plain JSON transport with custom headers")
 }
 
-// TestNewHTTPConnection_WithoutHeaders_FallbackSequence tests the full fallback
-// sequence: streamable → SSE → plain JSON when no custom headers are provided
+// TestNewHTTPConnection_WithoutHeaders_FallbackSequence tests connection without custom headers.
+// When no custom headers are provided, the code tries transports in order:
+// streamable → SSE → plain JSON. If the server responds with valid JSON-RPC
+// responses, the streamable transport succeeds since it's tried first.
 func TestNewHTTPConnection_WithoutHeaders_FallbackSequence(t *testing.T) {
 	require := require.New(t)
 
-	// Track which paths the server handled
-	type requestInfo struct {
-		path   string
-		method string
-	}
-	requests := []requestInfo{}
-
-	// Create test server that rejects streamable and SSE endpoints
+	// Create test server that responds to all requests with valid JSON-RPC
 	testServer := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
-		requests = append(requests, requestInfo{path: r.URL.Path, method: r.Method})
-
-		// Reject all requests initially (to force fallback)
-		// But for plain JSON (POST to root), return success
-		if r.Method == "POST" && r.URL.Path == "/" {
+		// Accept all POST requests with valid JSON-RPC response
+		if r.Method == "POST" {
 			response := map[string]interface{}{
 				"jsonrpc": "2.0",
 				"id":      1,
@@ -100,26 +92,33 @@ func TestNewHTTPConnection_WithoutHeaders_FallbackSequence(t *testing.T) {
 				},
 			}
 			w.Header().Set("Content-Type", "application/json")
-			w.Header().Set("Mcp-Session-Id", "fallback-session")
+			w.Header().Set("Mcp-Session-Id", "test-session")
 			w.WriteHeader(http.StatusOK)
 			json.NewEncoder(w).Encode(response)
 			return
 		}
 
+		// Accept GET requests for SSE stream (streamable transport may need this)
+		if r.Method == "GET" {
+			w.Header().Set("Content-Type", "text/event-stream")
+			w.WriteHeader(http.StatusOK)
+			return
+		}
+
 		// Reject other requests
 		w.WriteHeader(http.StatusNotFound)
 	}))
 	defer testServer.Close()
 
-	// Create connection without custom headers (triggers fallback sequence)
+	// Create connection without custom headers - streamable transport should succeed first
 	conn, err := NewHTTPConnection(context.Background(), testServer.URL, nil)
-	require.NoError(err, "Connection should eventually succeed with plain JSON")
+	require.NoError(err, "Connection should succeed")
 	require.NotNil(conn)
 	defer conn.Close()
 
-	// Verify we fell back to plain JSON transport
-	require.Equal(HTTPTransportPlainJSON, conn.httpTransportType)
-	require.Equal("fallback-session", conn.httpSessionID)
+	// Streamable transport is tried first and should succeed since server responds correctly
+	require.Equal(HTTPTransportStreamable, conn.httpTransportType)
+	require.Equal("test-session", conn.httpSessionID)
 }
 
 // TestNewHTTPConnection_AllTransportsFail tests the case where all transports fail
@@ -401,18 +400,14 @@ func TestNewHTTPConnection_HeadersPropagation(t *testing.T) {
 	}
 }
 
-// TestNewHTTPConnection_EmptyHeaders tests connection with empty header map
+// TestNewHTTPConnection_EmptyHeaders tests connection with empty header map.
+// Empty headers behave the same as nil headers - streamable transport is tried first.
 func TestNewHTTPConnection_EmptyHeaders(t *testing.T) {
 	require := require.New(t)
 
-	// Track transport attempts
-	attemptedTransports := []string{}
-
 	testServer := httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
-		// Track what was attempted
-		if r.Method == "POST" && r.URL.Path == "/" {
-			attemptedTransports = append(attemptedTransports, "plain-json")
-
+		// Accept POST requests with valid JSON-RPC response
+		if r.Method == "POST" {
 			response := map[string]interface{}{
 				"jsonrpc": "2.0",
 				"id":      1,
@@ -422,24 +417,31 @@ func TestNewHTTPConnection_EmptyHeaders(t *testing.T) {
 				},
 			}
 			w.Header().Set("Content-Type", "application/json")
+			w.Header().Set("Mcp-Session-Id", "empty-headers-session")
 			w.WriteHeader(http.StatusOK)
 			json.NewEncoder(w).Encode(response)
 			return
 		}
 
-		// Reject other transport attempts
+		// Accept GET for SSE stream
+		if r.Method == "GET" {
+			w.Header().Set("Content-Type", "text/event-stream")
+			w.WriteHeader(http.StatusOK)
+			return
+		}
+
 		w.WriteHeader(http.StatusNotFound)
 	}))
 	defer testServer.Close()
 
-	// Create connection with empty headers (should try SDK transports first)
+	// Create connection with empty headers - should try SDK transports first
 	conn, err := NewHTTPConnection(context.Background(), testServer.URL, map[string]string{})
 	require.NoError(err, "Should succeed with empty headers")
 	require.NotNil(conn)
 	defer conn.Close()
 
-	// Should eventually fall back to plain JSON
-	assert.Equal(t, HTTPTransportPlainJSON, conn.httpTransportType)
+	// Streamable transport is tried first and should succeed
+	assert.Equal(t, HTTPTransportStreamable, conn.httpTransportType)
 }
 
 // TestNewHTTPConnection_NilHeaders tests connection with nil header map
diff --git a/internal/server/routed.go b/internal/server/routed.go
index 9fd33ccb..5d55b5da 100644
--- a/internal/server/routed.go
+++ b/internal/server/routed.go
@@ -36,7 +36,7 @@ func newFilteredServerCache() *filteredServerCache {
 // getOrCreate returns a cached server or creates a new one
 func (c *filteredServerCache) getOrCreate(backendID, sessionID string, creator func() *sdk.Server) *sdk.Server {
 	key := fmt.Sprintf("%s/%s", backendID, sessionID)
-	
+
 	// Try read lock first
 	c.mu.RLock()
 	if server, exists := c.servers[key]; exists {
@@ -46,18 +46,18 @@ func (c *filteredServerCache) getOrCreate(backendID, sessionID string, creator f
 		return server
 	}
 	c.mu.RUnlock()
-	
+
 	// Need to create, acquire write lock
 	c.mu.Lock()
 	defer c.mu.Unlock()
-	
+
 	// Double-check after acquiring write lock
 	if server, exists := c.servers[key]; exists {
 		logRouted.Printf("Filtered server created by another goroutine: backend=%s, session=%s", backendID, sessionID)
 		log.Printf("[CACHE] Filtered server created by another goroutine: backend=%s, session=%s", backendID, sessionID)
 		return server
 	}
-	
+
 	// Create new server
 	logRouted.Printf("Creating new filtered server: backend=%s, session=%s", backendID, sessionID)
 	log.Printf("[CACHE] Creating new filtered server: backend=%s, session=%s", backendID, sessionID)
@@ -157,10 +157,13 @@ func CreateHTTPServerForRoutedMode(addr string, unifiedServer *UnifiedServer, ap
 			Stateless: false,
 		})
 
+		// Wrap SDK handler with detailed logging for JSON-RPC translation debugging
+		loggedHandler := WithSDKLogging(routeHandler, "routed:"+backendID)
+
 		// Apply auth middleware if API key is configured (spec 7.1)
-		var finalHandler http.Handler = routeHandler
+		finalHandler := loggedHandler
 		if apiKey != "" {
-			finalHandler = authMiddleware(apiKey, routeHandler.ServeHTTP)
+			finalHandler = authMiddleware(apiKey, loggedHandler.ServeHTTP)
 		}
 
 		// Mount the handler at both /mcp/<server> and /mcp/<server>/
diff --git a/internal/server/sdk_logging.go b/internal/server/sdk_logging.go
new file mode 100644
index 00000000..9332ac36
--- /dev/null
+++ b/internal/server/sdk_logging.go
@@ -0,0 +1,181 @@
+package server
+
+import (
+	"bytes"
+	"encoding/json"
+	"io"
+	"net/http"
+	"strings"
+	"time"
+
+	"github.com/githubnext/gh-aw-mcpg/internal/logger"
+)
+
+var logSDK = logger.New("server:sdk-frontend")
+
+// JSONRPCRequest represents an incoming JSON-RPC request
+type JSONRPCRequest struct {
+	JSONRPC string          `json:"jsonrpc"`
+	ID      interface{}     `json:"id,omitempty"`
+	Method  string          `json:"method"`
+	Params  json.RawMessage `json:"params,omitempty"`
+}
+
+// JSONRPCResponse represents a JSON-RPC response
+type JSONRPCResponse struct {
+	JSONRPC string          `json:"jsonrpc"`
+	ID      interface{}     `json:"id,omitempty"`
+	Result  json.RawMessage `json:"result,omitempty"`
+	Error   *JSONRPCError   `json:"error,omitempty"`
+}
+
+// JSONRPCError represents a JSON-RPC error
+type JSONRPCError struct {
+	Code    int             `json:"code"`
+	Message string          `json:"message"`
+	Data    json.RawMessage `json:"data,omitempty"`
+}
+
+// sdkLoggingResponseWriter captures response for logging
+type sdkLoggingResponseWriter struct {
+	http.ResponseWriter
+	body       bytes.Buffer
+	statusCode int
+}
+
+func (w *sdkLoggingResponseWriter) WriteHeader(statusCode int) {
+	w.statusCode = statusCode
+	w.ResponseWriter.WriteHeader(statusCode)
+}
+
+func (w *sdkLoggingResponseWriter) Write(b []byte) (int, error) {
+	w.body.Write(b)
+	return w.ResponseWriter.Write(b)
+}
+
+// WithSDKLogging wraps an SDK StreamableHTTPHandler to log JSON-RPC translation results
+// This captures the request/response at the HTTP boundary to understand what the SDK
+// sees and what it returns, particularly for debugging protocol state issues
+func WithSDKLogging(handler http.Handler, mode string) http.Handler {
+	return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
+		startTime := time.Now()
+
+		// Extract session info for logging context
+		authHeader := r.Header.Get("Authorization")
+		sessionID := extractSessionID(authHeader)
+		mcpSessionID := r.Header.Get("Mcp-Session-Id")
+
+		// Log incoming request
+		logSDK.Printf(">>> SDK Request [%s] session=%s mcp-session=%s method=%s path=%s",
+			mode, truncateSession(sessionID), truncateSession(mcpSessionID), r.Method, r.URL.Path)
+
+		// Capture and log request body for POST requests
+		var requestBody []byte
+		var jsonrpcReq JSONRPCRequest
+		if r.Method == "POST" && r.Body != nil {
+			var err error
+			requestBody, err = io.ReadAll(r.Body)
+			if err == nil && len(requestBody) > 0 {
+				// Restore body for the actual handler
+				r.Body = io.NopCloser(bytes.NewBuffer(requestBody))
+
+				// Parse JSON-RPC request
+				if err := json.Unmarshal(requestBody, &jsonrpcReq); err == nil {
+					logSDK.Printf("    JSON-RPC Request: method=%s id=%v", jsonrpcReq.Method, jsonrpcReq.ID)
+					logger.LogDebug("sdk-frontend", "JSON-RPC request parsed: mode=%s, method=%s, id=%v, session=%s",
+						mode, jsonrpcReq.Method, jsonrpcReq.ID, truncateSession(sessionID))
+				} else {
+					logSDK.Printf("    Failed to parse JSON-RPC request: %v", err)
+					logSDK.Printf("    Raw body: %s", string(requestBody))
+				}
+			}
+		}
+
+		// Wrap response writer to capture output
+		lw := &sdkLoggingResponseWriter{
+			ResponseWriter: w,
+			statusCode:     http.StatusOK,
+		}
+
+		// Call the actual SDK handler
+		handler.ServeHTTP(lw, r)
+
+		duration := time.Since(startTime)
+
+		// Parse and log response
+		responseBody := lw.body.Bytes()
+		if len(responseBody) > 0 {
+			// Try to parse as JSON-RPC response
+			var jsonrpcResp JSONRPCResponse
+			if err := json.Unmarshal(responseBody, &jsonrpcResp); err == nil {
+				if jsonrpcResp.Error != nil {
+					// Error response - this is what we're particularly interested in
+					logSDK.Printf("<<< SDK Response [%s] ERROR status=%d duration=%v",
+						mode, lw.statusCode, duration)
+					logSDK.Printf("    JSON-RPC Error: code=%d message=%q",
+						jsonrpcResp.Error.Code, jsonrpcResp.Error.Message)
+
+					// Log detailed error info for protocol state issues
+					if strings.Contains(jsonrpcResp.Error.Message, "session initialization") ||
+						strings.Contains(jsonrpcResp.Error.Message, "invalid during") {
+						logSDK.Printf("    ⚠️  PROTOCOL STATE ERROR DETECTED")
+						logSDK.Printf("    Request method was: %s", jsonrpcReq.Method)
+						logSDK.Printf("    Session ID: %s", truncateSession(sessionID))
+						logSDK.Printf("    MCP-Session-Id header: %s", truncateSession(mcpSessionID))
+						logSDK.Printf("    This error indicates SDK's StreamableHTTPHandler created fresh protocol state")
+
+						logger.LogWarn("sdk-frontend",
+							"Protocol state error: mode=%s, method=%s, session=%s, mcp_session=%s, error=%q",
+							mode, jsonrpcReq.Method, truncateSession(sessionID),
+							truncateSession(mcpSessionID), jsonrpcResp.Error.Message)
+					} else {
+						logger.LogError("sdk-frontend",
+							"JSON-RPC error: mode=%s, method=%s, code=%d, message=%q",
+							mode, jsonrpcReq.Method, jsonrpcResp.Error.Code, jsonrpcResp.Error.Message)
+					}
+				} else {
+					// Success response
+					logSDK.Printf("<<< SDK Response [%s] SUCCESS status=%d duration=%v",
+						mode, lw.statusCode, duration)
+					logSDK.Printf("    JSON-RPC Response id=%v has result=%v",
+						jsonrpcResp.ID, jsonrpcResp.Result != nil)
+
+					logger.LogDebug("sdk-frontend",
+						"JSON-RPC success: mode=%s, method=%s, id=%v, duration=%v",
+						mode, jsonrpcReq.Method, jsonrpcResp.ID, duration)
+				}
+			} else {
+				// Could be SSE stream or other format
+				logSDK.Printf("<<< SDK Response [%s] status=%d duration=%v (non-JSON or stream)",
+					mode, lw.statusCode, duration)
+				if len(responseBody) < 500 {
+					logSDK.Printf("    Raw response: %s", string(responseBody))
+				} else {
+					logSDK.Printf("    Raw response (truncated): %s...", string(responseBody[:500]))
+				}
+			}
+		} else {
+			logSDK.Printf("<<< SDK Response [%s] status=%d duration=%v (empty body)",
+				mode, lw.statusCode, duration)
+		}
+	})
+}
+
+// extractSessionID extracts session ID from Authorization header
+func extractSessionID(authHeader string) string {
+	if strings.HasPrefix(authHeader, "Bearer ") {
+		return strings.TrimSpace(strings.TrimPrefix(authHeader, "Bearer "))
+	}
+	return authHeader
+}
+
+// truncateSession returns a truncated session ID for logging (first 8 chars)
+func truncateSession(s string) string {
+	if s == "" {
+		return "(none)"
+	}
+	if len(s) <= 8 {
+		return s
+	}
+	return s[:8] + "..."
+}
diff --git a/internal/server/transport.go b/internal/server/transport.go
index 8947caf2..49595730 100644
--- a/internal/server/transport.go
+++ b/internal/server/transport.go
@@ -153,10 +153,13 @@ func CreateHTTPServerForMCP(addr string, unifiedServer *UnifiedServer, apiKey st
 		Stateless: false, // Support stateful sessions
 	})
 
+	// Wrap SDK handler with detailed logging for JSON-RPC translation debugging
+	loggedHandler := WithSDKLogging(streamableHandler, "unified")
+
 	// Apply auth middleware if API key is configured (spec 7.1)
-	var finalHandler http.Handler = streamableHandler
+	finalHandler := loggedHandler
 	if apiKey != "" {
-		finalHandler = authMiddleware(apiKey, streamableHandler.ServeHTTP)
+		finalHandler = authMiddleware(apiKey, loggedHandler.ServeHTTP)
 	}
 
 	// Mount handler at /mcp endpoint (logging is done in the callback above)
diff --git a/internal/server/unified_test.go b/internal/server/unified_test.go
index a6e37379..a00299aa 100644
--- a/internal/server/unified_test.go
+++ b/internal/server/unified_test.go
@@ -374,11 +374,11 @@ func TestGetSessionID_EdgeCases(t *testing.T) {
 		{
 			name:   "empty string session ID",
 			ctx:    ctx,
-			wantID: "",
+			wantID: "default",
 			setupFunc: func(c context.Context) context.Context {
 				return context.WithValue(c, SessionIDContextKey, "")
 			},
-			description: "should preserve empty string session ID",
+			description: "empty string session ID should return default since empty is not a valid session ID",
 		},
 		{
 			name:   "whitespace session ID",