blob: 65316147c7e3efc7625959c1d80071b2e863a9a9 [file] [log] [blame]
Austin Engcc2516a2023-10-17 20:57:54 +00001// Copyright 2021 The Dawn & Tint Authors
Ben Clayton4485fcd2021-04-16 08:58:44 +00002//
Austin Engcc2516a2023-10-17 20:57:54 +00003// Redistribution and use in source and binary forms, with or without
4// modification, are permitted provided that the following conditions are met:
Ben Clayton4485fcd2021-04-16 08:58:44 +00005//
Austin Engcc2516a2023-10-17 20:57:54 +00006// 1. Redistributions of source code must retain the above copyright notice, this
7// list of conditions and the following disclaimer.
Ben Clayton4485fcd2021-04-16 08:58:44 +00008//
Austin Engcc2516a2023-10-17 20:57:54 +00009// 2. Redistributions in binary form must reproduce the above copyright notice,
10// this list of conditions and the following disclaimer in the documentation
11// and/or other materials provided with the distribution.
12//
13// 3. Neither the name of the copyright holder nor the names of its
14// contributors may be used to endorse or promote products derived from
15// this software without specific prior written permission.
16//
17// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
18// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
20// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
21// FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22// DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
23// SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
24// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
25// OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
26// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
Ben Clayton4485fcd2021-04-16 08:58:44 +000027
28package substr
29
30import (
31 diff "github.com/sergi/go-diff/diffmatchpatch"
32)
33
34// Fix attempts to reconstruct substr by comparing it to body.
35// substr is a fuzzy substring of body.
36// Fix returns a new exact substring of body, by calculating a diff of the text.
37// If no match could be made, Fix() returns an empty string.
38func Fix(body, substr string) string {
39 dmp := diff.New()
40
41 diffs := dmp.DiffMain(body, substr, false)
42 if len(diffs) == 0 {
43 return ""
44 }
45
46 front := func() diff.Diff { return diffs[0] }
47 back := func() diff.Diff { return diffs[len(diffs)-1] }
48
49 start, end := 0, len(body)
50
51 // Trim edits that remove text from body start
52 for len(diffs) > 0 && front().Type == diff.DiffDelete {
53 start += len(front().Text)
54 diffs = diffs[1:]
55 }
56
57 // Trim edits that remove text from body end
58 for len(diffs) > 0 && back().Type == diff.DiffDelete {
59 end -= len(back().Text)
60 diffs = diffs[:len(diffs)-1]
61 }
62
63 // New substring is the span for the remainder of the edits
64 return body[start:end]
65}