-
Notifications
You must be signed in to change notification settings - Fork 8
/
Copy pathcody-diff.el
116 lines (99 loc) · 4.4 KB
/
cody-diff.el
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
;;; cody-diff.el -- Provides Myers diff functionality -*- lexical-binding: t; -*-
;; Copyright (C) 2024 Sourcegraph, Inc.
;; Version: 0.1
;; Author: Steve Yegge <steve.yegge@gmail.com>
;; URL: https://github.com/sourcegraph/emacs-cody
;;; Commentary:
;; This provides a very quick-and-dirty list differ. It is intended
;; only for diffing within relatively short single sequences of under a
;; few hundred characters, for code autocompletion use cases.
;;; Code:
(eval-when-compile (require 'cl-lib))
(defvar cody--list-diff-cache (make-hash-table :test 'equal)
"Memoization cache for `cody--list-diff'.")
(defun cody-diff-lists (a b)
"Compute Myers diff of lists A and B.
Returns a list of `patches' consisting of either atoms, which are
unchanged regions, deletions of the form (- atom atom? ...), and
insertions of the form (+ atom atom? ...)."
(clrhash cody--list-diff-cache)
(let ((max-lisp-eval-depth 25000)) ; allow deeper recursion
(cody--diff-worker a b)))
(defun cody-diff-strings (a b)
"Compute Myers diff at character level on two strings A and B.
Returns same as `cody-diff-lists' except with single-character
strings as the atoms in the patch."
(cody-diff-lists (mapcar #'string (string-to-list a))
(mapcar #'string (string-to-list b))))
(defun cody-diff-strings-with-positions (a b start-pos)
"Postprocesses the `cody-diff-strings' output for display.
A is the buffer string at START-POS being compared with B.
Removes all unchanged characters, and prepends the buffer position
to each diff chunk. Return value is a list whose elements represent
insertions of the form `(POS . STRING)'.
Returns nil if there are any deletions or overwrites in the diff."
(cody--diff-get-patch-insertions (cody-diff-strings a b)
start-pos))
(defun cody--diff-get-patch-insertions (patch start-pos)
"Convert PATCH, a list of patch chunks, into position-based inserts.
START-POS is the buffer position corresponding to the beginning of the
code rewrites for the line, and may be at the beginning of the current
line, before point, but not before `line-beginning-position'.
The Myers diff algorithm returns patches that take the form of a
list of chunks which are either atoms representing unchanged
characters, or flat lists representing insertions (car is `+'),
with no support currently for deletions.
Example:
(C B (+ A) B A (+ C))
We rewrite this list to compute the character position of each
insertion, discarding the unchanged characters, which are used to
count the buffer position for each patch chunk.
If any element of the passed PATCH is a deletion such as `(- A B)',
this function returns nil."
(cl-loop with pos = start-pos
and inserts = nil
for chunk in patch
do (pcase chunk
(`(+ . ,ins)
(let ((insertion-str (apply 'concat ins)))
(push (cons pos insertion-str) inserts)
(cl-incf pos (length insertion-str))))
(`(- . ,_) (cl-return nil)) ; Return nil immediately if a deletion is found
(_ (cl-incf pos))) ; Handle unchanged characters
finally return (nreverse inserts)))
;; Implementation courtesy of Michael Bauer <perma-curious@posteo.de>,
;; http://perma-curious.eu/post-elisp-diff/, who has graciously given his
;; permission to use it.
(defun cody--diff-worker (a b)
"Diff A and B.
Recursively computes the longest common subsequence and while
doing so assembles the returned diff."
;; f:first r:rest
(with-memoization (gethash (cons a b) cody--list-diff-cache)
(cl-labels
((choose (a b)
;; choose diff with longer lcs
(let ((la (seq-count #'atom a))
(lb (seq-count #'atom b)))
(if (> la lb) a b)))
(merge (x)
;; merge consecutive add or rem
(pcase x
(`((,op ,f) (,op . ,r) . ,d)
`((,op ,f . ,r) . ,d))
(d d))))
(cond
((and a b)
(pcase-let ((`(,af . ,ar) a)
(`(,bf . ,br) b))
(if (equal af bf)
;; same
(cons af (cody--diff-worker ar br))
;; different
(merge (choose (cons (list '+ bf) (cody--diff-worker a br))
(cons (list '- af) (cody--diff-worker ar b)))))))
;; rest
(a `((- . ,a)))
(b `((+ . ,b)))))))
(provide 'cody-diff)
;;; cody-diff.el ends here