aboutsummaryrefslogtreecommitdiff
path: root/diff/lines/diff_test.go
diff options
context:
space:
mode:
authorGravatar Runxi Yu2026-02-21 13:25:21 +0800
committerGravatar Runxi Yu2026-02-21 13:25:21 +0800
commitb01bc1a344c47ded15342f7872832daa1bf5cfce (patch)
tree2cce3baa4881debff633ac0daf093a74e10bbded /diff/lines/diff_test.go
parentSTRUCTURE: Remove (diff)
signatureNo signature
diff/lines: Line-based diffs via Myers
Diffstat (limited to 'diff/lines/diff_test.go')
-rw-r--r--diff/lines/diff_test.go326
1 files changed, 326 insertions, 0 deletions
diff --git a/diff/lines/diff_test.go b/diff/lines/diff_test.go
new file mode 100644
index 00000000..9f0d1ab8
--- /dev/null
+++ b/diff/lines/diff_test.go
@@ -0,0 +1,326 @@
+package lines
+
+import (
+ "bytes"
+ "strconv"
+ "strings"
+ "testing"
+)
+
+func TestDiff(t *testing.T) { // TestDiff is table-driven: each case runs Diff on oldInput/newInput and requires the returned chunks to match expected exactly, in order.
+ t.Parallel() // lets TestDiff run alongside other parallel tests
+
+ tests := []struct { // one entry per scenario
+ name string // subtest name passed to t.Run
+ oldInput string // converted to []byte and passed as Diff's first argument
+ newInput string // converted to []byte and passed as Diff's second argument
+ expected []Chunk // chunks Diff must return, in this order
+ }{
+ {
+ name: "empty inputs produce no chunks",
+ oldInput: "",
+ newInput: "",
+ expected: []Chunk{}, // only the length is compared below, so a nil result passes as well
+ },
+ {
+ name: "only additions",
+ oldInput: "",
+ newInput: "alpha\nbeta\n",
+ expected: []Chunk{
+ {Kind: ChunkKindAdded, Data: []byte("alpha\nbeta\n")},
+ },
+ },
+ {
+ name: "only deletions",
+ oldInput: "alpha\nbeta\n",
+ newInput: "",
+ expected: []Chunk{
+ {Kind: ChunkKindDeleted, Data: []byte("alpha\nbeta\n")},
+ },
+ },
+ {
+ name: "unchanged content is grouped",
+ oldInput: "same\nlines\n",
+ newInput: "same\nlines\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("same\nlines\n")},
+ },
+ },
+ {
+ name: "insertion in the middle",
+ oldInput: "a\nb\nc\n",
+ newInput: "a\nb\nX\nc\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("a\nb\n")},
+ {Kind: ChunkKindAdded, Data: []byte("X\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("c\n")},
+ },
+ },
+ {
+ name: "replacement without trailing newline", // same scenario shape as "adding trailing newline to last line" further down
+ oldInput: "first\nsecond",
+ newInput: "first\nsecond\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("first\n")},
+ {Kind: ChunkKindDeleted, Data: []byte("second")},
+ {Kind: ChunkKindAdded, Data: []byte("second\n")},
+ },
+ },
+ {
+ name: "line replacement",
+ oldInput: "a\nb\nc\n",
+ newInput: "a\nB\nc\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("a\n")},
+ {Kind: ChunkKindDeleted, Data: []byte("b\n")},
+ {Kind: ChunkKindAdded, Data: []byte("B\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("c\n")},
+ },
+ },
+ {
+ name: "swap adjacent lines", // the mirror script (add B, keep A, delete B) is equally short, so this case pins Diff's tie-break
+ oldInput: "A\nB\n",
+ newInput: "B\nA\n",
+ expected: []Chunk{
+ {Kind: ChunkKindDeleted, Data: []byte("A\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("B\n")},
+ {Kind: ChunkKindAdded, Data: []byte("A\n")},
+ },
+ },
+ {
+ name: "indentation change is a full line replacement",
+ oldInput: "func main() {\n\treturn\n}\n",
+ newInput: "func main() {\n return\n}\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("func main() {\n")},
+ {Kind: ChunkKindDeleted, Data: []byte("\treturn\n")},
+ {Kind: ChunkKindAdded, Data: []byte(" return\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("}\n")},
+ },
+ },
+ {
+ name: "commenting out lines",
+ oldInput: "code\n",
+ newInput: "// code\n",
+ expected: []Chunk{
+ {Kind: ChunkKindDeleted, Data: []byte("code\n")},
+ {Kind: ChunkKindAdded, Data: []byte("// code\n")},
+ },
+ },
+ {
+ name: "reducing repeating lines",
+ oldInput: "log\nlog\nlog\n",
+ newInput: "log\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("log\n")},
+ {Kind: ChunkKindDeleted, Data: []byte("log\nlog\n")},
+ },
+ },
+ {
+ name: "expanding repeating lines",
+ oldInput: "tick\n",
+ newInput: "tick\ntick\ntick\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("tick\n")},
+ {Kind: ChunkKindAdded, Data: []byte("tick\ntick\n")},
+ },
+ },
+ {
+ name: "interleaved modifications",
+ oldInput: "keep\nchange\nkeep\nchange\n",
+ newInput: "keep\nfixed\nkeep\nfixed\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("keep\n")},
+ {Kind: ChunkKindDeleted, Data: []byte("change\n")},
+ {Kind: ChunkKindAdded, Data: []byte("fixed\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("keep\n")},
+ {Kind: ChunkKindDeleted, Data: []byte("change\n")},
+ {Kind: ChunkKindAdded, Data: []byte("fixed\n")},
+ },
+ },
+ {
+ name: "large common header and footer",
+ oldInput: "header\nheader\nheader\nOLD\nfooter\nfooter\n",
+ newInput: "header\nheader\nheader\nNEW\nfooter\nfooter\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("header\nheader\nheader\n")},
+ {Kind: ChunkKindDeleted, Data: []byte("OLD\n")},
+ {Kind: ChunkKindAdded, Data: []byte("NEW\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("footer\nfooter\n")},
+ },
+ },
+ {
+ name: "completely different content",
+ oldInput: "apple\nbanana\n",
+ newInput: "cherry\ndate\n",
+ expected: []Chunk{
+ {Kind: ChunkKindDeleted, Data: []byte("apple\nbanana\n")},
+ {Kind: ChunkKindAdded, Data: []byte("cherry\ndate\n")},
+ },
+ },
+ {
+ name: "unicode and emoji changes",
+ oldInput: "Hello 🌍\nYay\n",
+ newInput: "Hello 🌎\nYay\n",
+ expected: []Chunk{
+ {Kind: ChunkKindDeleted, Data: []byte("Hello 🌍\n")},
+ {Kind: ChunkKindAdded, Data: []byte("Hello 🌎\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("Yay\n")},
+ },
+ },
+ {
+ name: "binary data with embedded newlines",
+ oldInput: "\x00\x01\n\x02\x03\n",
+ newInput: "\x00\x01\n\x02\xFF\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("\x00\x01\n")},
+ {Kind: ChunkKindDeleted, Data: []byte("\x02\x03\n")},
+ {Kind: ChunkKindAdded, Data: []byte("\x02\xFF\n")},
+ },
+ },
+ {
+ name: "adding trailing newline to last line",
+ oldInput: "Line 1\nLine 2",
+ newInput: "Line 1\nLine 2\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("Line 1\n")},
+ {Kind: ChunkKindDeleted, Data: []byte("Line 2")},
+ {Kind: ChunkKindAdded, Data: []byte("Line 2\n")},
+ },
+ },
+ {
+ name: "removing trailing newline",
+ oldInput: "A\nB\n",
+ newInput: "A\nB",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("A\n")},
+ {Kind: ChunkKindDeleted, Data: []byte("B\n")},
+ {Kind: ChunkKindAdded, Data: []byte("B")},
+ },
+ },
+ {
+ name: "inserting blank lines",
+ oldInput: "A\nB\n",
+ newInput: "A\n\n\nB\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("A\n")},
+ {Kind: ChunkKindAdded, Data: []byte("\n\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("B\n")},
+ },
+ },
+ {
+ name: "collapsing blank lines",
+ oldInput: "A\n\n\n\nB\n",
+ newInput: "A\nB\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("A\n")},
+ {Kind: ChunkKindDeleted, Data: []byte("\n\n\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("B\n")},
+ },
+ },
+ {
+ name: "case sensitivity check",
+ oldInput: "FOO\nbar\n",
+ newInput: "foo\nbar\n",
+ expected: []Chunk{
+ {Kind: ChunkKindDeleted, Data: []byte("FOO\n")},
+ {Kind: ChunkKindAdded, Data: []byte("foo\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("bar\n")},
+ },
+ },
+ {
+ name: "partial line match is full mismatch",
+ oldInput: "The quick brown fox\n",
+ newInput: "The quick brown fox jumps\n",
+ expected: []Chunk{
+ {Kind: ChunkKindDeleted, Data: []byte("The quick brown fox\n")},
+ {Kind: ChunkKindAdded, Data: []byte("The quick brown fox jumps\n")},
+ },
+ },
+ {
+ name: "inserting middle content",
+ oldInput: "Top\nBottom\n",
+ newInput: "Top\nMiddle\nBottom\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("Top\n")},
+ {Kind: ChunkKindAdded, Data: []byte("Middle\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("Bottom\n")},
+ },
+ },
+ {
+ name: "block move simulated",
+ oldInput: "BlockA\nBlockB\nBlockC\n",
+ newInput: "BlockA\nBlockC\nBlockB\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("BlockA\n")},
+ {Kind: ChunkKindDeleted, Data: []byte("BlockB\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("BlockC\n")},
+ {Kind: ChunkKindAdded, Data: []byte("BlockB\n")},
+ },
+ },
+ {
+ name: "alternating additions",
+ oldInput: "A\nB\nC\n",
+ newInput: "A\n1\nB\n2\nC\n",
+ expected: []Chunk{
+ {Kind: ChunkKindUnchanged, Data: []byte("A\n")},
+ {Kind: ChunkKindAdded, Data: []byte("1\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("B\n")},
+ {Kind: ChunkKindAdded, Data: []byte("2\n")},
+ {Kind: ChunkKindUnchanged, Data: []byte("C\n")},
+ },
+ },
+ }
+
+ for _, tt := range tests { // one subtest per table entry
+ t.Run(tt.name, func(t *testing.T) {
+ t.Parallel() // NOTE(review): the closure reads tt after the loop moves on; safe only with per-iteration loop variables (Go 1.22+) — confirm the module's go version
+
+ chunks, err := Diff([]byte(tt.oldInput), []byte(tt.newInput))
+ if err != nil { // no case in the table expects an error
+ t.Fatalf("Diff returned error: %v", err)
+ }
+
+ if len(chunks) != len(tt.expected) { // checked first so chunks[i] below cannot index out of range
+ t.Fatalf("expected %d chunks, got %d: %s", len(tt.expected), len(chunks), formatChunks(chunks))
+ }
+
+ for i := range tt.expected { // compare position by position; the first mismatch stops the subtest
+ if chunks[i].Kind != tt.expected[i].Kind {
+ t.Fatalf("chunk %d kind mismatch: got %v, want %v; chunks: %s", i, chunks[i].Kind, tt.expected[i].Kind, formatChunks(chunks))
+ }
+ if !bytes.Equal(chunks[i].Data, tt.expected[i].Data) { // byte-wise comparison; only Kind and Data are checked
+ t.Fatalf("chunk %d data mismatch: got %q, want %q; chunks: %s", i, string(chunks[i].Data), string(tt.expected[i].Data), formatChunks(chunks))
+ }
+ }
+ })
+ }
+}
+
+func formatChunks(chunks []Chunk) string {
+ var b strings.Builder
+ b.WriteByte('[')
+ for i, chunk := range chunks {
+ if i > 0 {
+ b.WriteString(", ")
+ }
+ b.WriteString(chunkKindName(chunk.Kind))
+ b.WriteByte(':')
+ b.WriteString(strconv.Quote(string(chunk.Data)))
+ }
+ b.WriteByte(']')
+ return b.String()
+}
+
+// chunkKindName maps kind to a one-letter tag: "U", "D", "A", or "?" if unknown.
+func chunkKindName(kind ChunkKind) string {
+	tags := map[ChunkKind]string{
+		ChunkKindUnchanged: "U",
+		ChunkKindDeleted:   "D",
+		ChunkKindAdded:     "A",
+	}
+	if tag, ok := tags[kind]; ok {
+		return tag
+	}
+	return "?"
+}