Skip to content

Commit e0cf3d8

Browse files
authored
Migrated Repository will show modifications when possible (#17191)
* Read patches to get history
1 parent ba6efb1 commit e0cf3d8

File tree

5 files changed

+188
-3
lines changed

5 files changed

+188
-3
lines changed

modules/git/repo_compare.go

+61
Original file line numberDiff line numberDiff line change
@@ -6,9 +6,14 @@
66
package git
77

88
import (
9+
"bufio"
910
"bytes"
11+
"errors"
1012
"fmt"
1113
"io"
14+
"io/ioutil"
15+
"os"
16+
"path/filepath"
1217
"regexp"
1318
"strconv"
1419
"strings"
@@ -188,6 +193,8 @@ func GetDiffShortStat(repoPath string, args ...string) (numFiles, totalAdditions
188193
// shortStatFormat matches a summary line of the form
// "N file(s) changed, A insertion(s)(+), D deletion(s)(-)" and captures the
// three numbers. The insertions part and the deletions part are each
// optional, so either count may be missing from a match.
var shortStatFormat = regexp.MustCompile(
189194
`\s*(\d+) files? changed(?:, (\d+) insertions?\(\+\))?(?:, (\d+) deletions?\(-\))?`)
190195

196+
// patchCommits matches text that starts with "From", one whitespace character,
// a run of word characters and another whitespace character, and captures the
// run of word characters - e.g. the commit ID in a patch header line such as
// "From 6e8e2a6f9efd71dbe6917816343ed8415ad696c3 Mon Sep 17 00:00:00 2001".
var patchCommits = regexp.MustCompile(`^From\s(\w+)\s`)
197+
191198
func parseDiffStat(stdout string) (numFiles, totalAdditions, totalDeletions int, err error) {
192199
if len(stdout) == 0 || stdout == "\n" {
193200
return 0, 0, 0, nil
@@ -267,3 +274,57 @@ func (repo *Repository) GetDiffFromMergeBase(base, head string, w io.Writer) err
267274
}
268275
return err
269276
}
277+
278+
// ReadPullHead will fetch a pull ref if possible or return an error
279+
func (repo *Repository) ReadPullHead(prID int64) (commitSHA string, err error) {
280+
headPath := fmt.Sprintf("refs/pull/%d/head", prID)
281+
fullHeadPath := filepath.Join(repo.Path, headPath)
282+
loadHead, err := os.Open(fullHeadPath)
283+
if err != nil {
284+
return "", err
285+
}
286+
defer loadHead.Close()
287+
// Read only the first line of the patch - usually it contains the first commit made in patch
288+
scanner := bufio.NewScanner(loadHead)
289+
scanner.Scan()
290+
commitHead := scanner.Text()
291+
if len(commitHead) != 40 {
292+
return "", errors.New("head file doesn't contain valid commit ID")
293+
}
294+
return commitHead, nil
295+
}
296+
297+
// ReadPatchCommit will check if a diff patch exists and return stats
298+
func (repo *Repository) ReadPatchCommit(prID int64) (commitSHA string, err error) {
299+
// Migrated repositories download patches to "pulls" location
300+
patchFile := fmt.Sprintf("pulls/%d.patch", prID)
301+
loadPatch, err := os.Open(filepath.Join(repo.Path, patchFile))
302+
if err != nil {
303+
return "", err
304+
}
305+
defer loadPatch.Close()
306+
// Read only the first line of the patch - usually it contains the first commit made in patch
307+
scanner := bufio.NewScanner(loadPatch)
308+
scanner.Scan()
309+
// Parse the Patch stats, sometimes Migration returns a 404 for the patch file
310+
commitSHAGroups := patchCommits.FindStringSubmatch(scanner.Text())
311+
if len(commitSHAGroups) != 0 {
312+
commitSHA = commitSHAGroups[1]
313+
} else {
314+
return "", errors.New("patch file doesn't contain valid commit ID")
315+
}
316+
return commitSHA, nil
317+
}
318+
319+
// WritePullHead will populate a PR head retrieved from patch file
320+
func (repo *Repository) WritePullHead(prID int64, commitSHA string) error {
321+
headPath := fmt.Sprintf("refs/pull/%d", prID)
322+
fullHeadPath := filepath.Join(repo.Path, headPath)
323+
// Create missing directory just in case
324+
if err := os.MkdirAll(fullHeadPath, os.ModePerm); err != nil {
325+
return err
326+
}
327+
commitBytes := []byte(commitSHA)
328+
pullPath := filepath.Join(fullHeadPath, "head")
329+
return ioutil.WriteFile(pullPath, commitBytes, os.ModePerm)
330+
}

modules/git/repo_compare_test.go

+49-2
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,7 @@ import (
88
"bytes"
99
"io"
1010
"path/filepath"
11+
"strings"
1112
"testing"
1213

1314
"code.gitea.io/gitea/modules/util"
@@ -18,11 +19,11 @@ import (
1819
func TestGetFormatPatch(t *testing.T) {
1920
bareRepo1Path := filepath.Join(testReposDir, "repo1_bare")
2021
clonedPath, err := cloneRepo(bareRepo1Path, testReposDir, "repo1_TestGetFormatPatch")
21-
assert.NoError(t, err)
2222
defer util.RemoveAll(clonedPath)
23-
repo, err := OpenRepository(clonedPath)
2423
assert.NoError(t, err)
24+
repo, err := OpenRepository(clonedPath)
2525
defer repo.Close()
26+
assert.NoError(t, err)
2627
rd := &bytes.Buffer{}
2728
err = repo.GetPatch("8d92fc95^", "8d92fc95", rd)
2829
assert.NoError(t, err)
@@ -32,3 +33,49 @@ func TestGetFormatPatch(t *testing.T) {
3233
assert.Regexp(t, "^From 8d92fc95", patch)
3334
assert.Contains(t, patch, "Subject: [PATCH] Add file2.txt")
3435
}
36+
37+
func TestReadPatch(t *testing.T) {
38+
// Ensure we can read the patch files
39+
bareRepo1Path := filepath.Join(testReposDir, "repo1_bare")
40+
repo, err := OpenRepository(bareRepo1Path)
41+
defer repo.Close()
42+
assert.NoError(t, err)
43+
// This patch doesn't exist
44+
noFile, err := repo.ReadPatchCommit(0)
45+
assert.Error(t, err)
46+
// This patch is an empty one (sometimes it's a 404)
47+
noCommit, err := repo.ReadPatchCommit(1)
48+
assert.Error(t, err)
49+
// This patch is legit and should return a commit
50+
oldCommit, err := repo.ReadPatchCommit(2)
51+
assert.NoError(t, err)
52+
53+
assert.Empty(t, noFile)
54+
assert.Empty(t, noCommit)
55+
assert.Len(t, oldCommit, 40)
56+
assert.True(t, oldCommit == "6e8e2a6f9efd71dbe6917816343ed8415ad696c3")
57+
}
58+
59+
func TestReadWritePullHead(t *testing.T) {
60+
// Ensure we can write SHA1 head corresponding to PR and open them
61+
bareRepo1Path := filepath.Join(testReposDir, "repo1_bare")
62+
repo, err := OpenRepository(bareRepo1Path)
63+
assert.NoError(t, err)
64+
defer repo.Close()
65+
// Try to open non-existing Pull
66+
_, err = repo.ReadPullHead(0)
67+
assert.Error(t, err)
68+
// Write a fake sha1 with only 40 zeros
69+
newCommit := strings.Repeat("0", 40)
70+
err = repo.WritePullHead(1, newCommit)
71+
assert.NoError(t, err)
72+
headFile := filepath.Join(repo.Path, "refs/pull/1/head")
73+
// Remove file after the test
74+
defer util.Remove(headFile)
75+
assert.FileExists(t, headFile)
76+
// Read the file created
77+
headContents, err := repo.ReadPullHead(1)
78+
assert.NoError(t, err)
79+
assert.Len(t, string(headContents), 40)
80+
assert.True(t, string(headContents) == newCommit)
81+
}

modules/git/tests/repos/repo1_bare/pulls/1.patch

Whitespace-only changes.
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,39 @@
1+
From 6e8e2a6f9efd71dbe6917816343ed8415ad696c3 Mon Sep 17 00:00:00 2001
2+
From: 99rgosse <renaud@mycompany.com>
3+
Date: Fri, 26 Mar 2021 12:44:22 +0000
4+
Subject: [PATCH] Update gitea_import_actions.py
5+
6+
---
7+
gitea_import_actions.py | 6 +++---
8+
1 file changed, 3 insertions(+), 3 deletions(-)
9+
10+
diff --git a/gitea_import_actions.py b/gitea_import_actions.py
11+
index f0d72cd..7b31963 100644
12+
--- a/gitea_import_actions.py
13+
+++ b/gitea_import_actions.py
14+
@@ -3,14 +3,14 @@
15+
# git log --pretty=format:'%H,%at,%s' --date=default > /tmp/commit.log
16+
# to get the commits logfile for a repository
17+
18+
-import mysql.connector as mariadb
19+
+import psycopg2
20+
21+
# set the following variables to fit your need...
22+
USERID = 1
23+
REPOID = 1
24+
BRANCH = "master"
25+
26+
-mydb = mariadb.connect(
27+
+mydb = psycopg2.connect(
28+
host="localhost",
29+
user="user",
30+
passwd="password",
31+
@@ -31,4 +31,4 @@ with open("/tmp/commit.log") as f:
32+
33+
mydb.commit()
34+
35+
-print("actions inserted.")
36+
\ No newline at end of file
37+
+print("actions inserted.")
38+
--
39+
GitLab

routers/web/repo/pull.go

+39-1
Original file line numberDiff line numberDiff line change
@@ -320,8 +320,46 @@ func PrepareMergedViewPullInfo(ctx *context.Context, issue *models.Issue) *git.C
320320
setMergeTarget(ctx, pull)
321321
ctx.Data["HasMerged"] = true
322322

323+
var baseCommit string
324+
// Some migrated PRs have no base SHA and therefore lose their history; try to recover one
325+
if pull.MergeBase == "" {
326+
var commitSHA, parentCommit string
327+
// If there is a head or a patch file, and it is readable, grab info
328+
commitSHA, err := ctx.Repo.GitRepo.ReadPullHead(pull.Index)
329+
if err != nil {
330+
// Head File does not exist, try the patch
331+
commitSHA, err = ctx.Repo.GitRepo.ReadPatchCommit(pull.Index)
332+
if err == nil {
333+
// Recreate pull head in files for next time
334+
if err := ctx.Repo.GitRepo.WritePullHead(pull.Index, commitSHA); err != nil {
335+
log.Error("Could not write head file", err)
336+
}
337+
} else {
338+
// There is no history available
339+
log.Trace("No history file available for PR %d", pull.Index)
340+
}
341+
}
342+
if commitSHA != "" {
343+
// Get immediate parent of the first commit in the patch, grab history back
344+
parentCommit, err = git.NewCommandContext(ctx, "rev-list", "-1", "--skip=1", commitSHA).RunInDir(ctx.Repo.GitRepo.Path)
345+
if err == nil {
346+
parentCommit = strings.TrimSpace(parentCommit)
347+
}
348+
// Special case on Git < 2.25 that doesn't fail on immediate empty history
349+
if err != nil || parentCommit == "" {
350+
log.Info("No known parent commit for PR %d, error: %v", pull.Index, err)
351+
// bring at least partial history if it can work
352+
parentCommit = commitSHA
353+
}
354+
}
355+
baseCommit = parentCommit
356+
} else {
357+
// Keep an empty history or original commit
358+
baseCommit = pull.MergeBase
359+
}
360+
323361
compareInfo, err := ctx.Repo.GitRepo.GetCompareInfo(ctx.Repo.Repository.RepoPath(),
324-
pull.MergeBase, pull.GetGitRefName(), true, false)
362+
baseCommit, pull.GetGitRefName(), true, false)
325363
if err != nil {
326364
if strings.Contains(err.Error(), "fatal: Not a valid object name") || strings.Contains(err.Error(), "unknown revision or path not in the working tree") {
327365
ctx.Data["IsPullRequestBroken"] = true

0 commit comments

Comments
 (0)