fix(provider): fix output parsing and separate stderr from stdout

stn1slv · stn1slv · commit ed50c90270e0 · 2026-04-05T16:50:08.000+02:00
- Extract parseOutputLines() helper into common.go, shared by both
  Anthropic and Gemini providers, replacing four copies of identical logic
- Fix multi-digit numbered list stripping (e.g. the "10. " prefix of "10. message" was not removed)
- Separate stderr from stdout in CLI exec; only stdout is parsed for
  messages, stderr is included in error output on failure
- Add table-driven tests covering all parsing edge cases
diff --git a/internal/provider/anthropic.go b/internal/provider/anthropic.go
@@ -54,79 +54,12 @@ func (a *AnthropicProvider) GenerateCommitMessages(ctx context.Context, diff str
 	fullPrompt := fmt.Sprintf("%s\n\nUser request: %s\n\nIMPORTANT: Generate exactly %d commit messages, one per line. Do not include any other text, explanations, or formatting - just the commit messages.",
 		systemMsg, userPrompt, a.numSuggestions)
 
-	// Execute claude CLI with haiku model
-	// Using -p flag for print mode and --model for model selection
-	// Pipe prompt via stdin to avoid Windows command line length limits (8191 chars)
-	cmd := exec.CommandContext(ctx, "claude", "--model", a.model, "-p", "-")
-
-	stdin, err := cmd.StdinPipe()
+	output, err := a.runCLI(ctx, fullPrompt)
 	if err != nil {
-		return nil, fmt.Errorf("error creating stdin pipe: %w", err)
-	}
-
-	var outputBuf strings.Builder
-	cmd.Stdout = &outputBuf
-	cmd.Stderr = &outputBuf
-
-	if err := cmd.Start(); err != nil {
-		return nil, fmt.Errorf("error starting claude CLI: %w", err)
-	}
-
-	_, writeErr := stdin.Write([]byte(fullPrompt))
-	stdin.Close()
-
-	waitErr := cmd.Wait()
-
-	if writeErr != nil {
-		return nil, fmt.Errorf("error writing to claude CLI stdin: %w", writeErr)
-	}
-
-	if waitErr != nil {
-		return nil, fmt.Errorf("error executing claude CLI: %w\nOutput: %s", waitErr, outputBuf.String())
-	}
-
-	output := []byte(outputBuf.String())
-
-	// Parse the output - split by newlines and clean
-	content := string(output)
-	lines := strings.Split(content, "\n")
-
-	var commitMessages []string
-	for _, line := range lines {
-		trimmed := strings.TrimSpace(line)
-		// Skip empty lines and lines that look like explanatory text
-		if trimmed == "" {
-			continue
-		}
-		// Skip lines that are clearly not commit messages (too long, contain certain patterns)
-		if len(trimmed) > 200 {
-			continue
-		}
-		// Skip markdown formatting or numbered lists
-		if strings.HasPrefix(trimmed, "#") || strings.HasPrefix(trimmed, "-") || strings.HasPrefix(trimmed, "*") {
-			// Try to extract the actual commit message
-			parts := strings.SplitN(trimmed, " ", 2)
-			if len(parts) == 2 {
-				trimmed = strings.TrimSpace(parts[1])
-			}
-		}
-		// Remove numbered list formatting like "1. " or "1) "
-		if len(trimmed) > 3 {
-			if (trimmed[0] >= '0' && trimmed[0] <= '9') && (trimmed[1] == '.' || trimmed[1] == ')') {
-				trimmed = strings.TrimSpace(trimmed[2:])
-			}
-		}
-
-		if trimmed != "" {
-			commitMessages = append(commitMessages, trimmed)
-		}
-
-		// Stop once we have enough messages
-		if len(commitMessages) >= a.numSuggestions {
-			break
-		}
+		return nil, err
 	}
 
+	commitMessages := parseOutputLines(output, a.numSuggestions)
 	if len(commitMessages) == 0 {
 		return nil, fmt.Errorf("no valid commit messages generated from Claude output")
 	}
@@ -163,77 +96,50 @@ func (a *AnthropicProvider) GeneratePRTitles(ctx context.Context, diff string) (
 	fullPrompt := fmt.Sprintf("%s\n\nUser request: %s\n\nIMPORTANT: Generate exactly %d pull request titles, one per line. Do not include any other text, explanations, or formatting - just the PR titles.",
 		systemMsg, userPrompt, a.numSuggestions)
 
+	output, err := a.runCLI(ctx, fullPrompt)
+	if err != nil {
+		return nil, err
+	}
+
+	prTitles := parseOutputLines(output, a.numSuggestions)
+	if len(prTitles) == 0 {
+		return nil, fmt.Errorf("no valid PR titles generated from Claude output")
+	}
+
+	return prTitles, nil
+}
+
+// runCLI writes prompt to the claude CLI's stdin, waits for exit, and returns stdout; stderr only appears in the returned error.
+func (a *AnthropicProvider) runCLI(ctx context.Context, prompt string) (string, error) {
+	// Using -p flag for print mode and --model for model selection
 	// Pipe prompt via stdin to avoid Windows command line length limits (8191 chars)
 	cmd := exec.CommandContext(ctx, "claude", "--model", a.model, "-p", "-")
 
 	stdin, err := cmd.StdinPipe()
 	if err != nil {
-		return nil, fmt.Errorf("error creating stdin pipe: %w", err)
+		return "", fmt.Errorf("error creating stdin pipe: %w", err)
 	}
 
-	var outputBuf strings.Builder
-	cmd.Stdout = &outputBuf
-	cmd.Stderr = &outputBuf
+	var stdoutBuf, stderrBuf strings.Builder
+	cmd.Stdout = &stdoutBuf
+	cmd.Stderr = &stderrBuf // kept out of stdoutBuf so diagnostics are never returned as output
 
 	if err := cmd.Start(); err != nil {
-		return nil, fmt.Errorf("error starting claude CLI: %w", err)
+		return "", fmt.Errorf("error starting claude CLI: %w", err)
 	}
 
-	_, writeErr := stdin.Write([]byte(fullPrompt))
+	_, writeErr := stdin.Write([]byte(prompt))
 	stdin.Close()
 
 	waitErr := cmd.Wait()
 
 	if writeErr != nil {
-		return nil, fmt.Errorf("error writing to claude CLI stdin: %w", writeErr)
+		return "", fmt.Errorf("error writing to claude CLI stdin: %w", writeErr) // NOTE(review): checked before waitErr, so a failed write hides the CLI's stderr
 	}
 
 	if waitErr != nil {
-		return nil, fmt.Errorf("error executing claude CLI: %w\nOutput: %s", waitErr, outputBuf.String())
-	}
-
-	output := []byte(outputBuf.String())
-
-	// Parse the output - same logic as commit message generation
-	content := string(output)
-	lines := strings.Split(content, "\n")
-
-	var prTitles []string
-	for _, line := range lines {
-		trimmed := strings.TrimSpace(line)
-		if trimmed == "" {
-			continue
-		}
-		if len(trimmed) > 200 {
-			continue
-		}
-		// Skip markdown formatting or numbered lists
-		if strings.HasPrefix(trimmed, "#") || strings.HasPrefix(trimmed, "-") || strings.HasPrefix(trimmed, "*") {
-			parts := strings.SplitN(trimmed, " ", 2)
-			if len(parts) == 2 {
-				trimmed = strings.TrimSpace(parts[1])
-			}
-		}
-		// Remove numbered list formatting like "1. " or "1) "
-		if len(trimmed) > 3 {
-			if (trimmed[0] >= '0' && trimmed[0] <= '9') && (trimmed[1] == '.' || trimmed[1] == ')') {
-				trimmed = strings.TrimSpace(trimmed[2:])
-			}
-		}
-
-		if trimmed != "" {
-			prTitles = append(prTitles, trimmed)
-		}
-
-		// Stop once we have enough titles
-		if len(prTitles) >= a.numSuggestions {
-			break
-		}
-	}
-
-	if len(prTitles) == 0 {
-		return nil, fmt.Errorf("no valid PR titles generated from Claude output")
+		return "", fmt.Errorf("error executing claude CLI: %w\nStderr: %s", waitErr, stderrBuf.String())
 	}
 
-	return prTitles, nil
+	return stdoutBuf.String(), nil
 }
diff --git a/internal/provider/common.go b/internal/provider/common.go
@@ -4,10 +4,50 @@ import (
 	"context"
 	"fmt"
 	"strings"
+	"unicode"
 
 	"github.com/openai/openai-go"
 )
 
+// parseOutputLines splits raw LLM output on newlines and returns the cleaned lines:
+// blank lines and lines over 200 bytes are skipped, then a leading "#"/"-"/"*" token
+// and a leading "<digits>." or "<digits>)" prefix are removed. Collection stops at maxLines.
+func parseOutputLines(raw string, maxLines int) []string {
+	lines := strings.Split(raw, "\n")
+
+	var result []string
+	for _, line := range lines {
+		trimmed := strings.TrimSpace(line)
+		if trimmed == "" || len(trimmed) > 200 {
+			continue
+		}
+		// Line starts with '#', '-' or '*': drop everything up to the first space (the marker token)
+		if strings.HasPrefix(trimmed, "#") || strings.HasPrefix(trimmed, "-") || strings.HasPrefix(trimmed, "*") {
+			parts := strings.SplitN(trimmed, " ", 2)
+			if len(parts) == 2 { // no space: line is kept as-is; NOTE(review): "-fix: x" would lose "-fix:" as well
+				trimmed = strings.TrimSpace(parts[1])
+			}
+		}
+		// Strip a numbered-list prefix of any digit count, e.g. "1. " or "10) "; "3rd ..." is left alone
+		if len(trimmed) > 0 && trimmed[0] >= '0' && trimmed[0] <= '9' {
+			i := 0
+			for i < len(trimmed) && unicode.IsDigit(rune(trimmed[i])) {
+				i++
+			}
+			if i < len(trimmed) && (trimmed[i] == '.' || trimmed[i] == ')') {
+				trimmed = strings.TrimSpace(trimmed[i+1:])
+			}
+		}
+		if trimmed != "" {
+			result = append(result, trimmed)
+		}
+		if len(result) >= maxLines { // runs after the append: with maxLines <= 0 the loop still ends after one candidate line
+			break
+		}
+	}
+	return result
+}
+
 // commonProvider holds the common fields and methods for OpenAI-compatible providers.
 type commonProvider struct {
 	client *openai.Client
diff --git a/internal/provider/common_test.go b/internal/provider/common_test.go
@@ -0,0 +1,108 @@
+package provider
+
+import (
+	"strings"
+	"testing"
+)
+
+func TestParseOutputLines(t *testing.T) { // table-driven cases for parseOutputLines
+	tests := []struct {
+		name     string
+		input    string
+		maxLines int
+		expected []string
+	}{
+		{
+			name:     "plain lines",
+			input:    "feat: add login\nfix: typo in readme\nchore: update deps",
+			maxLines: 10,
+			expected: []string{"feat: add login", "fix: typo in readme", "chore: update deps"},
+		},
+		{
+			name:     "single-digit numbered list with dot",
+			input:    "1. feat: add login\n2. fix: typo\n3. chore: deps",
+			maxLines: 10,
+			expected: []string{"feat: add login", "fix: typo", "chore: deps"},
+		},
+		{
+			name:     "single-digit numbered list with paren",
+			input:    "1) feat: add login\n2) fix: typo",
+			maxLines: 10,
+			expected: []string{"feat: add login", "fix: typo"},
+		},
+		{
+			name:     "multi-digit numbered list",
+			input:    "10. feat: add login\n11. fix: typo\n12. chore: deps",
+			maxLines: 10,
+			expected: []string{"feat: add login", "fix: typo", "chore: deps"},
+		},
+		{
+			name:     "markdown bullet dashes",
+			input:    "- feat: add login\n- fix: typo",
+			maxLines: 10,
+			expected: []string{"feat: add login", "fix: typo"},
+		},
+		{
+			name:     "markdown bullet asterisks",
+			input:    "* feat: add login\n* fix: typo",
+			maxLines: 10,
+			expected: []string{"feat: add login", "fix: typo"},
+		},
+		{
+			name:     "markdown headings stripped",
+			input:    "# feat: add login\n## fix: typo",
+			maxLines: 10,
+			expected: []string{"feat: add login", "fix: typo"},
+		},
+		{
+			name:     "empty lines skipped",
+			input:    "feat: add login\n\n\nfix: typo\n\n",
+			maxLines: 10,
+			expected: []string{"feat: add login", "fix: typo"},
+		},
+		{
+			name:     "lines over 200 chars skipped",
+			input:    "feat: add login\n" + strings.Repeat("x", 201) + "\nfix: typo",
+			maxLines: 10,
+			expected: []string{"feat: add login", "fix: typo"},
+		},
+		{
+			name:     "respects maxLines limit",
+			input:    "line1\nline2\nline3\nline4\nline5",
+			maxLines: 3,
+			expected: []string{"line1", "line2", "line3"},
+		},
+		{
+			name:     "whitespace-only input",
+			input:    "   \n  \n\t\n",
+			maxLines: 10,
+			expected: nil, // only lengths and elements are compared below, so nil stands for "no lines"
+		},
+		{
+			name:     "mixed formatting",
+			input:    "1. feat: login\n- fix: typo\n* chore: deps\n## docs: readme\nplain message",
+			maxLines: 10,
+			expected: []string{"feat: login", "fix: typo", "chore: deps", "docs: readme", "plain message"},
+		},
+		{
+			name:     "number at start but no list separator",
+			input:    "3rd attempt at fixing auth",
+			maxLines: 10,
+			expected: []string{"3rd attempt at fixing auth"},
+		},
+	}
+
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			got := parseOutputLines(tt.input, tt.maxLines)
+			if len(got) != len(tt.expected) { // Fatalf aborts the subtest so the index loop below stays in bounds
+				t.Fatalf("got %d lines %v, want %d lines %v", len(got), got, len(tt.expected), tt.expected)
+			}
+			for i := range got {
+				if got[i] != tt.expected[i] {
+					t.Errorf("line %d: got %q, want %q", i, got[i], tt.expected[i])
+				}
+			}
+		})
+	}
+}
diff --git a/internal/provider/gemini.go b/internal/provider/gemini.go