lsp: add tiny LRU cache for last 10 completions; ignore trailing whitespace in cache key; log cache hits; report busy with isIncomplete to prompt client retry

author: Paul Buetow <paul@buetow.org> 2025-08-20 00:10:15 +0300
committer: Paul Buetow <paul@buetow.org> 2025-08-20 00:10:15 +0300
commit: 9751271505527047ad6fd992534735dbbe4de1ff (patch)
tree: f43d42d18a7adb1b8909f8877290fe5fcf8662b9
parent: 507b84f2442eecf7422738b66dc29417870cda52 (diff)
4 files changed, 177 insertions, 26 deletions
diff --git a/internal/lsp/completion_cache_test.go b/internal/lsp/completion_cache_test.go
new file mode 100644
index 0000000..0207a9f
--- /dev/null
+++ b/internal/lsp/completion_cache_test.go
@@ -0,0 +1,42 @@
+package lsp
+
+import (
+    "bytes"
+    "log"
+    "strings"
+    "testing"
+
+    "hexai/internal/logging"
+)
+
+func TestCompletionCache_IgnoresWhitespaceBeforeCursor(t *testing.T) {
+    var buf bytes.Buffer
+    logger := log.New(&buf, "", 0)
+    s := NewServer(bytes.NewBuffer(nil), &buf, logger, ServerOptions{})
+    logging.Bind(logger)
+    s.triggerChars = []string{" ", "."}
+    fake := &countingLLM{}
+    s.llmClient = fake
+
+    // First request with trailing spaces before cursor
+    line := "foo   "
+    p := CompletionParams{ Position: Position{ Line: 0, Character: len(line) }, TextDocument: TextDocumentIdentifier{URI: "file://x.go"} }
+    items, ok, _ := s.tryLLMCompletion(p, "", line, "", "", "", false, "")
+    if !ok || len(items) == 0 || fake.calls != 1 {
+        t.Fatalf("expected first call to invoke LLM; ok=%v len=%d calls=%d", ok, len(items), fake.calls)
+    }
+
+    // Same logical context but with a different amount of trailing whitespace
+    line2 := "foo             "
+    p2 := CompletionParams{ Position: Position{ Line: 0, Character: len(line2) }, TextDocument: TextDocumentIdentifier{URI: "file://x.go"} }
+    items2, ok2, _ := s.tryLLMCompletion(p2, "", line2, "", "", "", false, "")
+    if !ok2 || len(items2) == 0 {
+        t.Fatalf("expected cache hit to still return items")
+    }
+    if fake.calls != 1 {
+        t.Fatalf("expected cache hit to avoid LLM call; calls=%d", fake.calls)
+    }
+    if !strings.Contains(buf.String(), "completion cache hit") {
+        t.Fatalf("expected log to contain cache hit message, got: %s", buf.String())
+    }
+}
diff --git a/internal/lsp/completion_throttle_test.go b/internal/lsp/completion_throttle_test.go
index 9bd6e54..46975a0 100644
--- a/internal/lsp/completion_throttle_test.go
+++ b/internal/lsp/completion_throttle_test.go
@@ -41,9 +41,12 @@ func TestTryLLMCompletion_BusySkipsConcurrent(t *testing.T) {
     // Simulate another LLM request in flight
     s.llmBusy = true
     p := CompletionParams{ Position: Position{ Line: 0, Character: 4 }, TextDocument: TextDocumentIdentifier{URI: "file://x.go"} }
-    items, ok := s.tryLLMCompletion(p, "", "foo.", "", "", "", false, "")
-    if !ok {
-        t.Fatalf("expected ok=true when busy guard skips")
+    items, ok, busy := s.tryLLMCompletion(p, "", "foo.", "", "", "", false, "")
+    if ok {
+        t.Fatalf("expected ok=false when busy guard triggers")
+    }
+    if !busy {
+        t.Fatalf("expected busy=true when another request in flight")
     }
     if len(items) != 0 {
         t.Fatalf("expected zero items when busy, got %d", len(items))
@@ -59,7 +62,7 @@ func TestTryLLMCompletion_MinPrefixSkipsEarly(t *testing.T) {
     s.llmClient = fake
     // No trigger character -> skip regardless of prefix
     p := CompletionParams{ Position: Position{ Line: 0, Character: 1 }, TextDocument: TextDocumentIdentifier{URI: "file://x.go"} }
-    items, ok := s.tryLLMCompletion(p, "", "a", "", "", "", false, "")
+    items, ok, _ := s.tryLLMCompletion(p, "", "a", "", "", "", false, "")
     if !ok {
         t.Fatalf("expected ok=true when skipped by min-prefix heuristic")
     }
@@ -76,11 +79,11 @@ func TestTryLLMCompletion_RequiresTriggerChar(t *testing.T) {
     fake := &countingLLM{}
     s.llmClient = fake
     // With trigger character '.' directly before cursor -> allowed
-    items, ok := s.tryLLMCompletion(CompletionParams{ Position: Position{ Line: 0, Character: 1 }, TextDocument: TextDocumentIdentifier{URI: "file://x.go"} }, "", ".", "", "", "", false, "")
+    items, ok, _ := s.tryLLMCompletion(CompletionParams{ Position: Position{ Line: 0, Character: 1 }, TextDocument: TextDocumentIdentifier{URI: "file://x.go"} }, "", ".", "", "", "", false, "")
     if !ok || len(items) == 0 || fake.calls == 0 { t.Fatalf("expected allowed with '.' trigger") }
     // Without trigger -> skipped
     fake.calls = 0
-    items, ok = s.tryLLMCompletion(CompletionParams{ Position: Position{ Line: 0, Character: 1 }, TextDocument: TextDocumentIdentifier{URI: "file://y.go"} }, "", "a", "", "", "", false, "")
+    items, ok, _ = s.tryLLMCompletion(CompletionParams{ Position: Position{ Line: 0, Character: 1 }, TextDocument: TextDocumentIdentifier{URI: "file://y.go"} }, "", "a", "", "", "", false, "")
     if !ok || len(items) != 0 || fake.calls != 0 { t.Fatalf("expected skip without trigger; ok=%v len=%d calls=%d", ok, len(items), fake.calls) }
 }
 
@@ -90,7 +93,7 @@ func TestTryLLMCompletion_AllowsSpaceTrigger(t *testing.T) {
     s.llmClient = fake
     line := "type Matrix "
     p := CompletionParams{ Position: Position{ Line: 0, Character: len(line) }, TextDocument: TextDocumentIdentifier{URI: "file://x.go"} }
-    items, ok := s.tryLLMCompletion(p, "", line, "", "", "", false, "")
+    items, ok, _ := s.tryLLMCompletion(p, "", line, "", "", "", false, "")
     if !ok || len(items) == 0 || fake.calls == 0 {
         t.Fatalf("expected allowed with space trigger; ok=%v len=%d calls=%d", ok, len(items), fake.calls)
     }
diff --git a/internal/lsp/handlers.go b/internal/lsp/handlers.go
index ee7c33a..0ccc072 100644
--- a/internal/lsp/handlers.go
+++ b/internal/lsp/handlers.go
@@ -477,11 +477,17 @@ func (s *Server) handleCompletion(req Request) {
 		if s.llmClient != nil {
 			newFunc := s.isDefiningNewFunction(p.TextDocument.URI, p.Position)
 			extra, has := s.buildAdditionalContext(newFunc, p.TextDocument.URI, p.Position)
-			items, ok := s.tryLLMCompletion(p, above, current, below, funcCtx, docStr, has, extra)
-			if ok {
-				s.reply(req.ID, CompletionList{IsIncomplete: false, Items: items}, nil)
-				return
-			}
+            items, ok, busy := s.tryLLMCompletion(p, above, current, below, funcCtx, docStr, has, extra)
+            if ok {
+                s.reply(req.ID, CompletionList{IsIncomplete: false, Items: items}, nil)
+                return
+            }
+            if busy {
+                // Inform client that results are incomplete so it may try again shortly.
+                logging.Logf("lsp ", "completion busy uri=%s line=%d char=%d returning isIncomplete", p.TextDocument.URI, p.Position.Line, p.Position.Character)
+                s.reply(req.ID, CompletionList{IsIncomplete: true, Items: []CompletionItem{}}, nil)
+                return
+            }
 		}
 	}
 	items := s.fallbackCompletionItems(docStr)
@@ -505,17 +511,27 @@ func (s *Server) logCompletionContext(p CompletionParams, above, current, below,
 		p.TextDocument.URI, p.Position.Line, p.Position.Character, trimLen(above), trimLen(current), trimLen(below), trimLen(funcCtx))
 }
 
-func (s *Server) tryLLMCompletion(p CompletionParams, above, current, below, funcCtx, docStr string, hasExtra bool, extraText string) ([]CompletionItem, bool) {
+func (s *Server) tryLLMCompletion(p CompletionParams, above, current, below, funcCtx, docStr string, hasExtra bool, extraText string) ([]CompletionItem, bool, bool) {
     ctx, cancel := context.WithTimeout(context.Background(), 6*time.Second)
     defer cancel()
 
     // Only invoke LLM when triggered by one of our trigger characters.
     if !s.isTriggerEvent(p, current) {
         logging.Logf("lsp ", "%scompletion skip=no-trigger line=%d char=%d current=%q%s", logging.AnsiYellow, p.Position.Line, p.Position.Character, trimLen(current), logging.AnsiBase)
-        return []CompletionItem{}, true
+        return []CompletionItem{}, true, false
     }
 
     inParams := inParamList(current, p.Position.Character)
+
+    // Build a cache key for this completion context (ignore trailing whitespace
+    // before the cursor when forming the key) and try cache before any LLM call.
+    key := s.completionCacheKey(p, above, current, below, funcCtx, inParams, hasExtra, extraText)
+    if cleaned, ok := s.completionCacheGet(key); ok && strings.TrimSpace(cleaned) != "" {
+        logging.Logf("lsp ", "completion cache hit uri=%s line=%d char=%d preview=%s%s%s",
+            p.TextDocument.URI, p.Position.Line, p.Position.Character,
+            logging.AnsiGreen, logging.PreviewForLog(cleaned), logging.AnsiBase)
+        return s.makeCompletionItems(cleaned, inParams, current, p, docStr), true, false
+    }
     // Heuristic 1: Require a minimal typed identifier prefix to avoid early triggers,
     // but allow immediate completion after structural trigger chars like '.', ':', '/'.
     if !inParams {
@@ -543,14 +559,14 @@ func (s *Server) tryLLMCompletion(p CompletionParams, above, current, below, fun
             start := computeWordStart(current, j)
             if j-start < 1 { // require at least 1 identifier char
                 logging.Logf("lsp ", "%scompletion skip=short-prefix line=%d char=%d current=%q%s", logging.AnsiYellow, p.Position.Line, p.Position.Character, trimLen(current), logging.AnsiBase)
-                return []CompletionItem{}, true
+                return []CompletionItem{}, true, false
             }
         }
     }
     // Concurrency guard: if another LLM request is running, skip this one.
     if !s.tryStartLLM() {
         logging.Logf("lsp ", "%scompletion skip=busy another LLM request in flight%s", logging.AnsiYellow, logging.AnsiBase)
-        return []CompletionItem{}, true
+        return []CompletionItem{}, false, true
     }
 	sysPrompt, userPrompt := buildPrompts(inParams, p, above, current, below, funcCtx)
 	messages := []llm.Message{
@@ -579,7 +595,7 @@ func (s *Server) tryLLMCompletion(p CompletionParams, above, current, below, fun
 		logging.Logf("lsp ", "llm completion error: %v", err)
 		// Log updated averages after this request (even if failed)
 		s.logLLMStats()
-		return nil, false
+        return nil, false, false
 	}
 	// Update response counters (received)
 	s.incRecvCounters(len(text))
@@ -595,14 +611,100 @@ func (s *Server) tryLLMCompletion(p CompletionParams, above, current, below, fun
             }
         }
     }
-	if cleaned != "" {
-		cleaned = stripDuplicateAssignmentPrefix(current[:p.Position.Character], cleaned)
-	}
-	if cleaned == "" {
-		return nil, false
-	}
+    if cleaned != "" {
+        cleaned = stripDuplicateAssignmentPrefix(current[:p.Position.Character], cleaned)
+    }
+    if cleaned == "" {
+        return nil, false, false
+    }
 
-	return s.makeCompletionItems(cleaned, inParams, current, p, docStr), true
+    // Store successful completion in cache
+    s.completionCachePut(key, cleaned)
+
+    return s.makeCompletionItems(cleaned, inParams, current, p, docStr), true, false
+}
+
+// --- small completion cache (last ~10 entries) ---
+
+func (s *Server) completionCacheKey(p CompletionParams, above, current, below, funcCtx string, inParams bool, hasExtra bool, extraText string) string {
+    // Normalize left-of-cursor by trimming trailing spaces/tabs
+    idx := p.Position.Character
+    if idx > len(current) { idx = len(current) }
+    left := strings.TrimRight(current[:idx], " \t")
+    right := ""
+    if idx < len(current) { right = current[idx:] }
+    prov := ""
+    model := ""
+    if s.llmClient != nil {
+        prov = s.llmClient.Name()
+        model = s.llmClient.DefaultModel()
+    }
+    temp := ""
+    if s.codingTemperature != nil { temp = fmt.Sprintf("%.3f", *s.codingTemperature) }
+    extra := ""
+    if hasExtra {
+        extra = strings.TrimSpace(extraText)
+    }
+    // Compose a key from essential context parts
+    return strings.Join([]string{
+        "v1", // version for future-proofing
+        prov,
+        model,
+        temp,
+        p.TextDocument.URI,
+        fmt.Sprintf("%d:%d", p.Position.Line, p.Position.Character),
+        above,
+        left,
+        right,
+        below,
+        funcCtx,
+        fmt.Sprintf("params=%t", inParams),
+        extra,
+    }, "\x1f") // use unit separator to avoid collisions
+}
+
+func (s *Server) completionCacheGet(key string) (string, bool) {
+    s.mu.Lock()
+    defer s.mu.Unlock()
+    v, ok := s.compCache[key]
+    if !ok {
+        return "", false
+    }
+    // move to most-recent
+    s.compCacheTouchLocked(key)
+    return v, true
+}
+
+func (s *Server) completionCachePut(key, value string) {
+    s.mu.Lock()
+    defer s.mu.Unlock()
+    if _, exists := s.compCache[key]; !exists {
+        s.compCacheOrder = append(s.compCacheOrder, key)
+        s.compCache[key] = value
+        if len(s.compCacheOrder) > 10 {
+            // evict oldest
+            old := s.compCacheOrder[0]
+            s.compCacheOrder = s.compCacheOrder[1:]
+            delete(s.compCache, old)
+        }
+        return
+    }
+    // update existing and mark most-recent
+    s.compCache[key] = value
+    s.compCacheTouchLocked(key)
+}
+
+func (s *Server) compCacheTouchLocked(key string) {
+    // assumes s.mu is held
+    // remove any existing occurrence of key in order slice
+    idx := -1
+    for i, k := range s.compCacheOrder {
+        if k == key { idx = i; break }
+    }
+    if idx >= 0 {
+        s.compCacheOrder = append(append([]string{}, s.compCacheOrder[:idx]...), s.compCacheOrder[idx+1:]...)
+    }
+    s.compCacheOrder = append(s.compCacheOrder, key)
 }
 
 // isTriggerEvent returns true when the completion request appears to be caused
diff --git a/internal/lsp/server.go b/internal/lsp/server.go
index 2c4daa9..e1c9eaa 100644
--- a/internal/lsp/server.go
+++ b/internal/lsp/server.go
@@ -38,8 +38,11 @@ type Server struct {
 	llmReqTotal       int64
 	llmSentBytesTotal int64
 	llmRespTotal      int64
-	llmRespBytesTotal int64
-	startTime         time.Time
+    llmRespBytesTotal int64
+    startTime         time.Time
+    // Small LRU cache for recent code completion outputs (keyed by context)
+    compCache      map[string]string
+    compCacheOrder []string // most-recent at end; cap ~10
 }
 
 // ServerOptions collects configuration for NewServer to avoid long parameter lists.
@@ -87,6 +90,7 @@ func NewServer(r io.Reader, w io.Writer, logger *log.Logger, opts ServerOptions)
         s.triggerChars = append([]string{}, opts.TriggerCharacters...)
     }
     s.codingTemperature = opts.CodingTemperature
+    s.compCache = make(map[string]string)
     return s
 }
author	Paul Buetow <paul@buetow.org>	2025-08-20 00:10:15 +0300
committer	Paul Buetow <paul@buetow.org>	2025-08-20 00:10:15 +0300
commit	9751271505527047ad6fd992534735dbbe4de1ff (patch)
tree	f43d42d18a7adb1b8909f8877290fe5fcf8662b9
parent	507b84f2442eecf7422738b66dc29417870cda52 (diff)