fix: address swarm review of the inline PR review (PR #18)

From PR #18's own review — the FIRST run with consensus consolidation live (it posted one ranked consensus comment across 7 models instead of 7 walls). - Anchor inline comments to ADDED lines only (parseDiffNewLines no longer records context lines): Gitea reliably accepts comments on added lines, so the all-or-nothing review POST won't be rejected for an off-change anchor. - Span-scan anchoring (anchorLine): a cluster whose min line is just outside the diff still anchors if any line in its [line,maxLine] span is an added line. - Path normalization (normPath) on both diff and finding paths, so "./pkg/x.go" vs "pkg/x.go" vs a "b/"-prefixed diff path all match (and the comment Path is the normalized repo-relative one). - deletePriorReviews: paginate (cap 10 pages) and bail on a non-2xx GET, so a stale marked review past page 1 is still removed and the "replace not stack" guarantee holds better under failure. - mergeIntoCluster backfills an empty title/detail from any report (not only a strictly-higher-severity one). - Rename inlineReviewHTTPTime -> inlineReviewHTTPTimeout (emit.go convention). Graded the run's 36 findings in gadfly-reports (notably a 7/7-consensus deletePriorReviews error-handling finding — the consensus signal working as intended). XSS-framed findings marked false (Gitea sanitizes review markdown); trusted-input and gofmt-clean ones likewise. Tests updated for added-only anchoring + span scan. gofmt/vet/bash -n clean. Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
2026-06-28 21:59:27 -04:00
parent 7577c21039
commit 4ea80cad1f
3 changed files with 131 additions and 59 deletions
@@ -382,6 +382,15 @@ func mergeIntoCluster(c *cluster, f outFinding, model string) {
 	if f.Line > c.maxLine {
 		c.maxLine = f.Line
 	}
 	// Backfill an empty title/detail from any report, regardless of severity, so a
 	// higher-severity-but-terse finding doesn't leave the cluster without context.
 	if strings.TrimSpace(c.title) == "" && strings.TrimSpace(f.Title) != "" {
 		c.title = f.Title
 	}
 	if strings.TrimSpace(c.detail) == "" && strings.TrimSpace(f.Detail) != "" {
 		c.detail = f.Detail
 	}
 	// A strictly-higher-severity report takes over the title/detail.
 	if sevRank(f.Severity) > sevRank(c.severity) {
 		c.severity = f.Severity
 		if strings.TrimSpace(f.Title) != "" {
@@ -33,8 +33,8 @@ const (
 	// maxInlineComments caps how many inline comments one review carries, so a
 	// huge diff can't produce a wall of annotations. Clusters are pre-sorted by
 	// agreement×severity, so the cap keeps the most important.
-	maxInlineComments    = 25
+	maxInlineComments       = 25
-	inlineReviewHTTPTime = 20 * time.Second
+	inlineReviewHTTPTimeout = 20 * time.Second
 )
 // reviewComment is one inline comment in a Gitea pull review. Field names match
@@ -76,7 +76,7 @@ func postInlineReview(clusters []cluster) {
 		return // nothing anchors to a changed line; the consensus comment covers it
 	}
-	client := &http.Client{Timeout: inlineReviewHTTPTime}
+	client := &http.Client{Timeout: inlineReviewHTTPTimeout}
 	base := fmt.Sprintf("%s/pulls/%s/reviews", api, pr)
 	deletePriorReviews(client, base, token) // avoid stacking on re-runs
@@ -92,11 +92,12 @@ func postInlineReview(clusters []cluster) {
 func inlineComments(clusters []cluster, addable map[string]map[int]bool) []reviewComment {
 	var out []reviewComment
 	for _, c := range clusters {
-		lines := addable[c.file]
+		path := normPath(c.file)
-		if lines == nil || c.line <= 0 || !lines[c.line] {
+		anchor := anchorLine(addable[path], c.line, c.maxLine)
 		if anchor == 0 {
 			continue
 		}
-		out = append(out, reviewComment{Path: c.file, NewPosition: c.line, Body: inlineBody(c)})
+		out = append(out, reviewComment{Path: path, NewPosition: anchor, Body: inlineBody(c)})
 		if len(out) >= maxInlineComments {
 			break
 		}
@@ -104,6 +105,25 @@ func inlineComments(clusters []cluster, addable map[string]map[int]bool) []revie
 	return out
 }
 // anchorLine returns the first line in [lo,hi] that is an added line in the diff,
 // or 0 if none. Scanning the cluster's whole span (not just its representative
 // line) anchors a finding whose min line is just outside the diff but whose span
 // still overlaps a changed line.
 func anchorLine(added map[int]bool, lo, hi int) int {
 	if added == nil || lo <= 0 {
 		return 0
 	}
 	if hi < lo { // single-line cluster (maxLine unset)
 		hi = lo
 	}
 	for ln := lo; ln <= hi; ln++ {
 		if added[ln] {
 			return ln
 		}
 	}
 	return 0
 }
 // inlineBody renders one inline comment: severity + title, who flagged it, detail.
 func inlineBody(c cluster) string {
 	var b strings.Builder
@@ -116,11 +136,13 @@ func inlineBody(c cluster) string {
 	return b.String()
 }
-// parseDiffNewLines returns, per file, the set of NEW-file line numbers that are
+// parseDiffNewLines returns, per file, the set of NEW-file line numbers that were
-// present in the unified diff (added '+' or context ' ' lines) — the lines an
+// ADDED in the unified diff — the safest lines for an inline comment to anchor to
-// inline comment can anchor to. Hunk lengths from the @@ header bound each hunk,
+// (Gitea reliably accepts comments on added lines). Context lines are walked to
-// so a content line that happens to start with "+++ " or "@@" is still read as
+// keep the line counter correct but are NOT recorded: anchoring only to added
-// content, not mistaken for a header.
+// lines avoids the all-or-nothing review POST being rejected for an off-change
 // anchor. Hunk lengths from the @@ header bound each hunk, so a content line that
 // happens to start with "+++ " or "@@" is still read as content, not a header.
 func parseDiffNewLines(diff string) map[string]map[int]bool {
 	out := map[string]map[int]bool{}
 	var file string
@@ -130,14 +152,13 @@ func parseDiffNewLines(diff string) map[string]map[int]bool {
 		if inHunk && (newRem > 0 || oldRem > 0) {
 			switch {
 			case strings.HasPrefix(line, "+"):
-				record(out, file, newLine)
+				record(out, file, newLine) // added line — anchorable
 				newLine++
 				newRem--
 			case strings.HasPrefix(line, "-"):
 				oldRem--
 			case strings.HasPrefix(line, "\\"): // "\ No newline at end of file"
-			default: // context line (leading space, or an empty line)
+			default: // context line (leading space, or an empty line): advance, don't record
 				record(out, file, newLine)
 				newLine++
 				newRem--
 				oldRem--
@@ -149,8 +170,7 @@ func parseDiffNewLines(diff string) map[string]map[int]bool {
 		}
 		switch {
 		case strings.HasPrefix(line, "+++ "):
-			p := strings.TrimPrefix(strings.TrimPrefix(line, "+++ "), "b/")
+			file = normPath(strings.TrimPrefix(line, "+++ "))
 			file = strings.TrimSpace(p)
 			if file == "/dev/null" {
 				file = ""
 			}
@@ -170,6 +190,19 @@ func parseDiffNewLines(diff string) map[string]map[int]bool {
 // @@ -<oldStart>[,<oldLen>] +<newStart>[,<newLen>] @@
 var hunkRe = regexp.MustCompile(`^@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@`)
 // normPath trims a unified-diff path down to a repo-relative one: strip a single
 // leading "a/" or "b/" prefix (and any "./"), and surrounding whitespace. Applied
 // to BOTH the diff paths and a finding's file so they match even when a model
 // writes "./pkg/x.go" or the diff carries the "b/" prefix.
 func normPath(p string) string {
 	p = strings.TrimSpace(p)
 	p = strings.TrimPrefix(p, "./")
 	if strings.HasPrefix(p, "a/") || strings.HasPrefix(p, "b/") {
 		p = p[2:]
 	}
 	return p
 }
 func record(out map[string]map[int]bool, file string, line int) {
 	if file == "" {
 		return
@@ -195,33 +228,44 @@ func atoiOr(s string, def int) int {
 // deletePriorReviews removes our previous inline reviews (matched by the body
 // marker) so a re-run replaces rather than stacks. Best-effort and quiet.
 func deletePriorReviews(client *http.Client, base, token string) {
-	req, err := http.NewRequest(http.MethodGet, base+"?limit=50", nil)
+	const perPage = 50
-	if err != nil {
+	for page := 1; page <= 10; page++ { // bound the scan, but page past 50 so a stale marked review isn't missed
-		return
+		req, err := http.NewRequest(http.MethodGet, fmt.Sprintf("%s?limit=%d&page=%d", base, perPage, page), nil)
 	}
 	req.Header.Set("Authorization", "token "+token)
 	resp, err := client.Do(req)
 	if err != nil {
 		return
 	}
 	var reviews []struct {
 		ID   int    `json:"id"`
 		Body string `json:"body"`
 	}
 	_ = json.NewDecoder(resp.Body).Decode(&reviews)
 	resp.Body.Close()
 	for _, r := range reviews {
 		if !strings.Contains(r.Body, inlineReviewMarker) {
 			continue
 		}
 		dreq, err := http.NewRequest(http.MethodDelete, fmt.Sprintf("%s/%d", base, r.ID), nil)
 		if err != nil {
-			continue
+			return
 		}
-		dreq.Header.Set("Authorization", "token "+token)
+		req.Header.Set("Authorization", "token "+token)
-		if dresp, err := client.Do(dreq); err == nil {
+		resp, err := client.Do(req)
-			io.Copy(io.Discard, dresp.Body)
+		if err != nil {
-			dresp.Body.Close()
+			return
 		}
 		if resp.StatusCode < 200 || resp.StatusCode >= 300 {
 			io.Copy(io.Discard, resp.Body)
 			resp.Body.Close()
 			return
 		}
 		var reviews []struct {
 			ID   int    `json:"id"`
 			Body string `json:"body"`
 		}
 		_ = json.NewDecoder(resp.Body).Decode(&reviews)
 		resp.Body.Close()
 		for _, r := range reviews {
 			if !strings.Contains(r.Body, inlineReviewMarker) {
 				continue
 			}
 			dreq, err := http.NewRequest(http.MethodDelete, fmt.Sprintf("%s/%d", base, r.ID), nil)
 			if err != nil {
 				continue
 			}
 			dreq.Header.Set("Authorization", "token "+token)
 			if dresp, err := client.Do(dreq); err == nil {
 				io.Copy(io.Discard, dresp.Body)
 				dresp.Body.Close()
 			}
 		}
 		if len(reviews) < perPage {
 			return // last page
 		}
 	}
 }
@@ -1,6 +1,9 @@
 package main
-import "testing"
+import (
 	"strings"
 	"testing"
 )
 func TestParseDiffNewLines(t *testing.T) {
 	diff := "diff --git a/a.go b/a.go\n" +
@@ -14,18 +17,19 @@ func TestParseDiffNewLines(t *testing.T) {
 		"+new3\n" +
 		" line4\n"
 	got := parseDiffNewLines(diff)
-	want := map[int]bool{1: true, 2: true, 3: true, 4: true} // context+added new-file lines
+	// Only ADDED lines anchor: new2 (line 2) and new3 (line 3). Context lines 1
 	// and 4 are walked for counting but not recorded.
 	want := map[int]bool{2: true, 3: true}
 	if len(got["a.go"]) != len(want) {
-		t.Fatalf("a.go lines = %v, want %v", got["a.go"], want)
+		t.Fatalf("a.go lines = %v, want %v (added-only)", got["a.go"], want)
 	}
 	for ln := range want {
 		if !got["a.go"][ln] {
 			t.Errorf("expected a.go line %d anchorable", ln)
 		}
 	}
-	// The deleted line's old number must NOT be an anchor target beyond the new set.
+	if got["a.go"][1] || got["a.go"][4] {
-	if got["a.go"][5] {
+		t.Error("context lines 1/4 should not be anchorable (added-only)")
 		t.Error("line 5 should not be anchorable")
 	}
 }
@@ -34,8 +38,22 @@ func TestParseDiffNewLinesContentLooksLikeHeader(t *testing.T) {
 	// diff. Hunk-length tracking must read it as content, not a file header.
 	diff := "--- a/x\n+++ b/x\n@@ -1,1 +1,2 @@\n ctx\n+++ weird\n"
 	got := parseDiffNewLines(diff)
-	if !got["x"][1] || !got["x"][2] {
+	if got["x"][1] { // context line, not recorded (added-only)
-		t.Errorf("want lines 1 (ctx) and 2 (added) anchorable, got %v", got["x"])
+		t.Errorf("line 1 is context, should not anchor: %v", got["x"])
 	}
 	if !got["x"][2] { // the "+++ weird" added line
 		t.Errorf("want added line 2 anchorable, got %v", got["x"])
 	}
 }
 func TestAnchorLineScansSpan(t *testing.T) {
 	// A cluster spanning 10..14 whose min line (10) isn't in the diff but whose
 	// span includes added line 14 must anchor to 14, not be dropped.
 	added := map[string]map[int]bool{"a.go": {14: true}}
 	clusters := []cluster{{file: "a.go", line: 10, maxLine: 14, severity: "high", title: "t", models: set("m1"), lenses: set("x")}}
 	cs := inlineComments(clusters, added)
 	if len(cs) != 1 || cs[0].NewPosition != 14 {
 		t.Fatalf("want anchor at 14 via span scan, got %+v", cs)
 	}
 }
@@ -51,6 +69,16 @@ func TestParseDiffNewLinesMultiFile(t *testing.T) {
 	}
 }
 func TestInlineCommentsNormalizesPaths(t *testing.T) {
 	// Diff path "b/pkg/x.go" -> "pkg/x.go"; a finding written as "./pkg/x.go" must
 	// still anchor (both normalize to the same repo-relative path).
 	addable := parseDiffNewLines("--- a/pkg/x.go\n+++ b/pkg/x.go\n@@ -0,0 +1,1 @@\n+bug\n")
 	clusters := []cluster{{file: "./pkg/x.go", line: 1, severity: "high", title: "t", models: set("m1"), lenses: set("x")}}
 	if cs := inlineComments(clusters, addable); len(cs) != 1 || cs[0].Path != "pkg/x.go" {
 		t.Errorf("path normalization failed to anchor: %+v", cs)
 	}
 }
 func TestInlineCommentsFiltersToDiffLines(t *testing.T) {
 	addable := map[string]map[int]bool{"a.go": {10: true, 11: true}}
 	clusters := []cluster{
@@ -65,7 +93,7 @@ func TestInlineCommentsFiltersToDiffLines(t *testing.T) {
 	if cs[0].Path != "a.go" || cs[0].NewPosition != 10 {
 		t.Errorf("wrong anchor: %+v", cs[0])
 	}
-	if !containsStr(cs[0].Body, "anchored") || !containsStr(cs[0].Body, "2 model") {
+	if !strings.Contains(cs[0].Body, "anchored") || !strings.Contains(cs[0].Body, "2 model") {
 		t.Errorf("inline body missing title/agreement: %q", cs[0].Body)
 	}
 }
@@ -77,12 +105,3 @@ func set(xs ...string) map[string]bool {
 	}
 	return m
 }
 func containsStr(s, sub string) bool {
 	for i := 0; i+len(sub) <= len(s); i++ {
 		if s[i:i+len(sub)] == sub {
 			return true
 		}
 	}
 	return false
 }