mirror of https://github.com/go-gitea/gitea
Some refactor on git diff and ignore getting commit information failed on migrating pull request review comments (#9996)
* Some refactor on git diff and ignore getting commit information failed on migrating pull request review comments * fix test * fix lint * Change error log to warnpull/9997/head^2
parent
1019913eab
commit
e8860ef4f9
@ -0,0 +1,260 @@ |
||||
// Copyright 2020 The Gitea Authors. All rights reserved.
|
||||
// Use of this source code is governed by a MIT-style
|
||||
// license that can be found in the LICENSE file.
|
||||
|
||||
package git |
||||
|
||||
import ( |
||||
"bufio" |
||||
"bytes" |
||||
"context" |
||||
"fmt" |
||||
"io" |
||||
"os/exec" |
||||
"regexp" |
||||
"strconv" |
||||
"strings" |
||||
|
||||
"code.gitea.io/gitea/modules/process" |
||||
) |
||||
|
||||
// RawDiffType type of a raw diff.
|
||||
type RawDiffType string |
||||
|
||||
// RawDiffType possible values.
|
||||
const ( |
||||
RawDiffNormal RawDiffType = "diff" |
||||
RawDiffPatch RawDiffType = "patch" |
||||
) |
||||
|
||||
// GetRawDiff dumps diff results of repository in given commit ID to io.Writer.
|
||||
func GetRawDiff(repoPath, commitID string, diffType RawDiffType, writer io.Writer) error { |
||||
return GetRawDiffForFile(repoPath, "", commitID, diffType, "", writer) |
||||
} |
||||
|
||||
// GetRawDiffForFile dumps diff results of file in given commit ID to io.Writer.
|
||||
func GetRawDiffForFile(repoPath, startCommit, endCommit string, diffType RawDiffType, file string, writer io.Writer) error { |
||||
repo, err := OpenRepository(repoPath) |
||||
if err != nil { |
||||
return fmt.Errorf("OpenRepository: %v", err) |
||||
} |
||||
defer repo.Close() |
||||
|
||||
return GetRepoRawDiffForFile(repo, startCommit, endCommit, diffType, file, writer) |
||||
} |
||||
|
||||
// GetRepoRawDiffForFile dumps diff results of file in given commit ID to io.Writer according given repository
|
||||
func GetRepoRawDiffForFile(repo *Repository, startCommit, endCommit string, diffType RawDiffType, file string, writer io.Writer) error { |
||||
commit, err := repo.GetCommit(endCommit) |
||||
if err != nil { |
||||
return fmt.Errorf("GetCommit: %v", err) |
||||
} |
||||
fileArgs := make([]string, 0) |
||||
if len(file) > 0 { |
||||
fileArgs = append(fileArgs, "--", file) |
||||
} |
||||
// FIXME: graceful: These commands should have a timeout
|
||||
ctx, cancel := context.WithCancel(DefaultContext) |
||||
defer cancel() |
||||
|
||||
var cmd *exec.Cmd |
||||
switch diffType { |
||||
case RawDiffNormal: |
||||
if len(startCommit) != 0 { |
||||
cmd = exec.CommandContext(ctx, GitExecutable, append([]string{"diff", "-M", startCommit, endCommit}, fileArgs...)...) |
||||
} else if commit.ParentCount() == 0 { |
||||
cmd = exec.CommandContext(ctx, GitExecutable, append([]string{"show", endCommit}, fileArgs...)...) |
||||
} else { |
||||
c, _ := commit.Parent(0) |
||||
cmd = exec.CommandContext(ctx, GitExecutable, append([]string{"diff", "-M", c.ID.String(), endCommit}, fileArgs...)...) |
||||
} |
||||
case RawDiffPatch: |
||||
if len(startCommit) != 0 { |
||||
query := fmt.Sprintf("%s...%s", endCommit, startCommit) |
||||
cmd = exec.CommandContext(ctx, GitExecutable, append([]string{"format-patch", "--no-signature", "--stdout", "--root", query}, fileArgs...)...) |
||||
} else if commit.ParentCount() == 0 { |
||||
cmd = exec.CommandContext(ctx, GitExecutable, append([]string{"format-patch", "--no-signature", "--stdout", "--root", endCommit}, fileArgs...)...) |
||||
} else { |
||||
c, _ := commit.Parent(0) |
||||
query := fmt.Sprintf("%s...%s", endCommit, c.ID.String()) |
||||
cmd = exec.CommandContext(ctx, GitExecutable, append([]string{"format-patch", "--no-signature", "--stdout", query}, fileArgs...)...) |
||||
} |
||||
default: |
||||
return fmt.Errorf("invalid diffType: %s", diffType) |
||||
} |
||||
|
||||
stderr := new(bytes.Buffer) |
||||
|
||||
cmd.Dir = repo.Path |
||||
cmd.Stdout = writer |
||||
cmd.Stderr = stderr |
||||
pid := process.GetManager().Add(fmt.Sprintf("GetRawDiffForFile: [repo_path: %s]", repo.Path), cancel) |
||||
defer process.GetManager().Remove(pid) |
||||
|
||||
if err = cmd.Run(); err != nil { |
||||
return fmt.Errorf("Run: %v - %s", err, stderr) |
||||
} |
||||
return nil |
||||
} |
||||
|
||||
// ParseDiffHunkString parse the diffhunk content and return
|
||||
func ParseDiffHunkString(diffhunk string) (leftLine, leftHunk, rightLine, righHunk int) { |
||||
ss := strings.Split(diffhunk, "@@") |
||||
ranges := strings.Split(ss[1][1:], " ") |
||||
leftRange := strings.Split(ranges[0], ",") |
||||
leftLine, _ = strconv.Atoi(leftRange[0][1:]) |
||||
if len(leftRange) > 1 { |
||||
leftHunk, _ = strconv.Atoi(leftRange[1]) |
||||
} |
||||
if len(ranges) > 1 { |
||||
rightRange := strings.Split(ranges[1], ",") |
||||
rightLine, _ = strconv.Atoi(rightRange[0]) |
||||
if len(rightRange) > 1 { |
||||
righHunk, _ = strconv.Atoi(rightRange[1]) |
||||
} |
||||
} else { |
||||
log("Parse line number failed: %v", diffhunk) |
||||
rightLine = leftLine |
||||
righHunk = leftHunk |
||||
} |
||||
return |
||||
} |
||||
|
||||
// Example: @@ -1,8 +1,9 @@ => [..., 1, 8, 1, 9]
|
||||
var hunkRegex = regexp.MustCompile(`^@@ -(?P<beginOld>[0-9]+)(,(?P<endOld>[0-9]+))? \+(?P<beginNew>[0-9]+)(,(?P<endNew>[0-9]+))? @@`) |
||||
|
||||
const cmdDiffHead = "diff --git " |
||||
|
||||
func isHeader(lof string) bool { |
||||
return strings.HasPrefix(lof, cmdDiffHead) || strings.HasPrefix(lof, "---") || strings.HasPrefix(lof, "+++") |
||||
} |
||||
|
||||
// CutDiffAroundLine cuts a diff of a file in way that only the given line + numberOfLine above it will be shown
|
||||
// it also recalculates hunks and adds the appropriate headers to the new diff.
|
||||
// Warning: Only one-file diffs are allowed.
|
||||
func CutDiffAroundLine(originalDiff io.Reader, line int64, old bool, numbersOfLine int) string { |
||||
if line == 0 || numbersOfLine == 0 { |
||||
// no line or num of lines => no diff
|
||||
return "" |
||||
} |
||||
scanner := bufio.NewScanner(originalDiff) |
||||
hunk := make([]string, 0) |
||||
// begin is the start of the hunk containing searched line
|
||||
// end is the end of the hunk ...
|
||||
// currentLine is the line number on the side of the searched line (differentiated by old)
|
||||
// otherLine is the line number on the opposite side of the searched line (differentiated by old)
|
||||
var begin, end, currentLine, otherLine int64 |
||||
var headerLines int |
||||
for scanner.Scan() { |
||||
lof := scanner.Text() |
||||
// Add header to enable parsing
|
||||
if isHeader(lof) { |
||||
hunk = append(hunk, lof) |
||||
headerLines++ |
||||
} |
||||
if currentLine > line { |
||||
break |
||||
} |
||||
// Detect "hunk" with contains commented lof
|
||||
if strings.HasPrefix(lof, "@@") { |
||||
// Already got our hunk. End of hunk detected!
|
||||
if len(hunk) > headerLines { |
||||
break |
||||
} |
||||
// A map with named groups of our regex to recognize them later more easily
|
||||
submatches := hunkRegex.FindStringSubmatch(lof) |
||||
groups := make(map[string]string) |
||||
for i, name := range hunkRegex.SubexpNames() { |
||||
if i != 0 && name != "" { |
||||
groups[name] = submatches[i] |
||||
} |
||||
} |
||||
if old { |
||||
begin, _ = strconv.ParseInt(groups["beginOld"], 10, 64) |
||||
end, _ = strconv.ParseInt(groups["endOld"], 10, 64) |
||||
// init otherLine with begin of opposite side
|
||||
otherLine, _ = strconv.ParseInt(groups["beginNew"], 10, 64) |
||||
} else { |
||||
begin, _ = strconv.ParseInt(groups["beginNew"], 10, 64) |
||||
if groups["endNew"] != "" { |
||||
end, _ = strconv.ParseInt(groups["endNew"], 10, 64) |
||||
} else { |
||||
end = 0 |
||||
} |
||||
// init otherLine with begin of opposite side
|
||||
otherLine, _ = strconv.ParseInt(groups["beginOld"], 10, 64) |
||||
} |
||||
end += begin // end is for real only the number of lines in hunk
|
||||
// lof is between begin and end
|
||||
if begin <= line && end >= line { |
||||
hunk = append(hunk, lof) |
||||
currentLine = begin |
||||
continue |
||||
} |
||||
} else if len(hunk) > headerLines { |
||||
hunk = append(hunk, lof) |
||||
// Count lines in context
|
||||
switch lof[0] { |
||||
case '+': |
||||
if !old { |
||||
currentLine++ |
||||
} else { |
||||
otherLine++ |
||||
} |
||||
case '-': |
||||
if old { |
||||
currentLine++ |
||||
} else { |
||||
otherLine++ |
||||
} |
||||
default: |
||||
currentLine++ |
||||
otherLine++ |
||||
} |
||||
} |
||||
} |
||||
|
||||
// No hunk found
|
||||
if currentLine == 0 { |
||||
return "" |
||||
} |
||||
// headerLines + hunkLine (1) = totalNonCodeLines
|
||||
if len(hunk)-headerLines-1 <= numbersOfLine { |
||||
// No need to cut the hunk => return existing hunk
|
||||
return strings.Join(hunk, "\n") |
||||
} |
||||
var oldBegin, oldNumOfLines, newBegin, newNumOfLines int64 |
||||
if old { |
||||
oldBegin = currentLine |
||||
newBegin = otherLine |
||||
} else { |
||||
oldBegin = otherLine |
||||
newBegin = currentLine |
||||
} |
||||
// headers + hunk header
|
||||
newHunk := make([]string, headerLines) |
||||
// transfer existing headers
|
||||
copy(newHunk, hunk[:headerLines]) |
||||
// transfer last n lines
|
||||
newHunk = append(newHunk, hunk[len(hunk)-numbersOfLine-1:]...) |
||||
// calculate newBegin, ... by counting lines
|
||||
for i := len(hunk) - 1; i >= len(hunk)-numbersOfLine; i-- { |
||||
switch hunk[i][0] { |
||||
case '+': |
||||
newBegin-- |
||||
newNumOfLines++ |
||||
case '-': |
||||
oldBegin-- |
||||
oldNumOfLines++ |
||||
default: |
||||
oldBegin-- |
||||
newBegin-- |
||||
newNumOfLines++ |
||||
oldNumOfLines++ |
||||
} |
||||
} |
||||
// construct the new hunk header
|
||||
newHunk[headerLines] = fmt.Sprintf("@@ -%d,%d +%d,%d @@", |
||||
oldBegin, oldNumOfLines, newBegin, newNumOfLines) |
||||
return strings.Join(newHunk, "\n") |
||||
} |
@ -0,0 +1,82 @@ |
||||
// Copyright 2020 The Gitea Authors. All rights reserved.
|
||||
// Use of this source code is governed by a MIT-style
|
||||
// license that can be found in the LICENSE file.
|
||||
|
||||
package git |
||||
|
||||
import ( |
||||
"strings" |
||||
"testing" |
||||
|
||||
"github.com/stretchr/testify/assert" |
||||
) |
||||
|
||||
const exampleDiff = `diff --git a/README.md b/README.md |
||||
--- a/README.md |
||||
+++ b/README.md |
||||
@@ -1,3 +1,6 @@ |
||||
# gitea-github-migrator |
||||
+ |
||||
+ Build Status |
||||
- Latest Release |
||||
Docker Pulls |
||||
+ cut off |
||||
+ cut off` |
||||
|
||||
func TestCutDiffAroundLine(t *testing.T) { |
||||
result := CutDiffAroundLine(strings.NewReader(exampleDiff), 4, false, 3) |
||||
resultByLine := strings.Split(result, "\n") |
||||
assert.Len(t, resultByLine, 7) |
||||
// Check if headers got transferred
|
||||
assert.Equal(t, "diff --git a/README.md b/README.md", resultByLine[0]) |
||||
assert.Equal(t, "--- a/README.md", resultByLine[1]) |
||||
assert.Equal(t, "+++ b/README.md", resultByLine[2]) |
||||
// Check if hunk header is calculated correctly
|
||||
assert.Equal(t, "@@ -2,2 +3,2 @@", resultByLine[3]) |
||||
// Check if line got transferred
|
||||
assert.Equal(t, "+ Build Status", resultByLine[4]) |
||||
|
||||
// Must be same result as before since old line 3 == new line 5
|
||||
newResult := CutDiffAroundLine(strings.NewReader(exampleDiff), 3, true, 3) |
||||
assert.Equal(t, result, newResult, "Must be same result as before since old line 3 == new line 5") |
||||
|
||||
newResult = CutDiffAroundLine(strings.NewReader(exampleDiff), 6, false, 300) |
||||
assert.Equal(t, exampleDiff, newResult) |
||||
|
||||
emptyResult := CutDiffAroundLine(strings.NewReader(exampleDiff), 6, false, 0) |
||||
assert.Empty(t, emptyResult) |
||||
|
||||
// Line is out of scope
|
||||
emptyResult = CutDiffAroundLine(strings.NewReader(exampleDiff), 434, false, 0) |
||||
assert.Empty(t, emptyResult) |
||||
} |
||||
|
||||
func BenchmarkCutDiffAroundLine(b *testing.B) { |
||||
for n := 0; n < b.N; n++ { |
||||
CutDiffAroundLine(strings.NewReader(exampleDiff), 3, true, 3) |
||||
} |
||||
} |
||||
|
||||
func ExampleCutDiffAroundLine() { |
||||
const diff = `diff --git a/README.md b/README.md |
||||
--- a/README.md |
||||
+++ b/README.md |
||||
@@ -1,3 +1,6 @@ |
||||
# gitea-github-migrator |
||||
+ |
||||
+ Build Status |
||||
- Latest Release |
||||
Docker Pulls |
||||
+ cut off |
||||
+ cut off` |
||||
result := CutDiffAroundLine(strings.NewReader(diff), 4, false, 3) |
||||
println(result) |
||||
} |
||||
|
||||
func TestParseDiffHunkString(t *testing.T) { |
||||
leftLine, leftHunk, rightLine, rightHunk := ParseDiffHunkString("@@ -19,3 +19,5 @@ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER") |
||||
assert.EqualValues(t, 19, leftLine) |
||||
assert.EqualValues(t, 3, leftHunk) |
||||
assert.EqualValues(t, 19, rightLine) |
||||
assert.EqualValues(t, 5, rightHunk) |
||||
} |
Loading…
Reference in new issue