1
0
Fork 0
mirror of https://codeberg.org/forgejo/forgejo.git synced 2025-01-14 16:09:01 -05:00
forgejo/models/git_diff.go

301 lines
6.9 KiB
Go
Raw Normal View History

2014-04-12 21:35:36 -04:00
// Copyright 2014 The Gogs Authors. All rights reserved.
// Use of this source code is governed by a MIT-style
// license that can be found in the LICENSE file.
package models
import (
"bufio"
2014-12-09 02:18:25 -05:00
"bytes"
2014-06-19 01:08:03 -04:00
"fmt"
2014-04-12 21:35:36 -04:00
"io"
"os"
"os/exec"
"strings"
"time"
2014-04-12 21:35:36 -04:00
"golang.org/x/net/html/charset"
"golang.org/x/text/transform"
2014-07-26 00:24:27 -04:00
"github.com/Unknwon/com"
2014-12-09 02:18:25 -05:00
"github.com/gogits/gogs/modules/base"
2014-09-12 19:42:11 -04:00
"github.com/gogits/gogs/modules/git"
2014-04-12 21:35:36 -04:00
"github.com/gogits/gogs/modules/log"
2014-06-19 01:08:03 -04:00
"github.com/gogits/gogs/modules/process"
2014-04-12 21:35:36 -04:00
)
// Diff line types, stored in DiffLine.Type.
const (
	// Zero is skipped, so the first real value is 1.
	_ = iota
	// DIFF_LINE_PLAIN marks an unchanged context line (leading ' ').
	DIFF_LINE_PLAIN
	// DIFF_LINE_ADD marks an added line (leading '+').
	DIFF_LINE_ADD
	// DIFF_LINE_DEL marks a removed line (leading '-').
	DIFF_LINE_DEL
	// DIFF_LINE_SECTION marks a hunk header line (leading '@').
	DIFF_LINE_SECTION
)
// Diff file types, stored in DiffFile.Type.
const (
	// DIFF_FILE_ADD marks a newly created file.
	DIFF_FILE_ADD = iota + 1
	// DIFF_FILE_CHANGE marks a modified file; it is also the default type
	// ParsePatch assigns before it has looked at the extended header.
	DIFF_FILE_CHANGE
	// DIFF_FILE_DEL marks a deleted file.
	DIFF_FILE_DEL
	// DIFF_FILE_RENAME marks a file renamed without content changes.
	DIFF_FILE_RENAME
)
// DiffLine is a single line of a diff section.
type DiffLine struct {
	// LeftIdx is the line number in the old file. ParsePatch leaves it
	// zero for added lines and hunk headers.
	LeftIdx int
	// RightIdx is the line number in the new file. ParsePatch leaves it
	// zero for removed lines and hunk headers.
	RightIdx int
	// Type is one of the DIFF_LINE_* constants.
	Type int
	// Content is the raw diff line, including its leading marker
	// character (' ', '+', '-' or '@').
	Content string
}
// GetType returns the line's Type field, which ParsePatch sets to one of
// the DIFF_LINE_* constants.
func (l DiffLine) GetType() int {
	return l.Type
}
// DiffSection is one hunk of a file diff: the hunk header line followed by
// its context, added and removed lines.
type DiffSection struct {
	// Name is not populated by ParsePatch.
	Name string
	// Lines holds the hunk's lines in the order they appear in the diff.
	Lines []*DiffLine
}
type DiffFile struct {
Name string
2015-11-02 19:55:24 -05:00
OldName string
2014-05-13 12:40:32 -04:00
Index int
2014-04-12 21:35:36 -04:00
Addition, Deletion int
Type int
IsCreated bool
IsDeleted bool
2014-04-15 20:01:20 -04:00
IsBin bool
2015-11-02 19:55:24 -05:00
IsRenamed bool
2014-04-12 21:35:36 -04:00
Sections []*DiffSection
}
// Diff is the parsed result of a whole patch.
type Diff struct {
	// TotalAddition is the number of added lines across all files.
	TotalAddition int
	// TotalDeletion is the number of removed lines across all files.
	TotalDeletion int
	// Files lists the changed files in diff order. ParsePatch sets it to
	// nil when the diff exceeds its line limit.
	Files []*DiffFile
}
// NumFiles returns the number of entries in Files.
func (d *Diff) NumFiles() int {
	return len(d.Files)
}
// DIFF_HEAD is the prefix of the header line that starts each file's part
// of a git diff; ParsePatch uses it to detect where a new file begins.
const DIFF_HEAD = "diff --git "
func ParsePatch(pid int64, maxlines int, cmd *exec.Cmd, reader io.Reader) (*Diff, error) {
2014-04-12 21:35:36 -04:00
scanner := bufio.NewScanner(reader)
var (
curFile *DiffFile
curSection = &DiffSection{
Lines: make([]*DiffLine, 0, 10),
}
leftLine, rightLine int
2015-07-29 10:55:01 -04:00
// FIXME: Should use cache in the future.
2014-12-09 02:18:25 -05:00
buf bytes.Buffer
2014-04-12 21:35:36 -04:00
)
diff := &Diff{Files: make([]*DiffFile, 0)}
var i int
for scanner.Scan() {
line := scanner.Text()
2014-04-12 21:35:36 -04:00
if strings.HasPrefix(line, "+++ ") || strings.HasPrefix(line, "--- ") {
continue
}
if line == "" {
continue
}
2014-04-12 21:35:36 -04:00
i = i + 1
// Diff data too large, we only show the first about maxlines lines
2015-10-17 17:25:45 -04:00
if i >= maxlines {
2014-04-12 21:35:36 -04:00
log.Warn("Diff data too large")
2015-10-17 17:25:45 -04:00
diff.Files = nil
return diff, nil
2014-04-12 21:35:36 -04:00
}
2014-04-15 20:01:20 -04:00
switch {
case line[0] == ' ':
2014-04-12 21:35:36 -04:00
diffLine := &DiffLine{Type: DIFF_LINE_PLAIN, Content: line, LeftIdx: leftLine, RightIdx: rightLine}
leftLine++
rightLine++
curSection.Lines = append(curSection.Lines, diffLine)
continue
2014-04-15 20:01:20 -04:00
case line[0] == '@':
2014-04-12 21:35:36 -04:00
curSection = &DiffSection{}
curFile.Sections = append(curFile.Sections, curSection)
ss := strings.Split(line, "@@")
diffLine := &DiffLine{Type: DIFF_LINE_SECTION, Content: line}
curSection.Lines = append(curSection.Lines, diffLine)
// Parse line number.
2015-07-29 10:55:01 -04:00
ranges := strings.Split(ss[1][1:], " ")
2014-07-26 00:24:27 -04:00
leftLine, _ = com.StrTo(strings.Split(ranges[0], ",")[0][1:]).Int()
2015-07-29 10:55:01 -04:00
if len(ranges) > 1 {
rightLine, _ = com.StrTo(strings.Split(ranges[1], ",")[0]).Int()
} else {
log.Warn("Parse line number failed: %v", line)
rightLine = leftLine
}
2014-04-12 21:35:36 -04:00
continue
2014-04-15 20:01:20 -04:00
case line[0] == '+':
2014-04-12 21:35:36 -04:00
curFile.Addition++
diff.TotalAddition++
diffLine := &DiffLine{Type: DIFF_LINE_ADD, Content: line, RightIdx: rightLine}
rightLine++
curSection.Lines = append(curSection.Lines, diffLine)
continue
2014-04-15 20:01:20 -04:00
case line[0] == '-':
2014-04-12 21:35:36 -04:00
curFile.Deletion++
diff.TotalDeletion++
diffLine := &DiffLine{Type: DIFF_LINE_DEL, Content: line, LeftIdx: leftLine}
if leftLine > 0 {
leftLine++
}
curSection.Lines = append(curSection.Lines, diffLine)
2014-04-15 20:01:20 -04:00
case strings.HasPrefix(line, "Binary"):
curFile.IsBin = true
2014-04-12 21:35:36 -04:00
continue
}
// Get new file.
if strings.HasPrefix(line, DIFF_HEAD) {
2015-11-02 19:55:24 -05:00
middle := -1
2015-11-20 01:18:50 -05:00
// Note: In case file name is surrounded by double quotes (it happens only in git-shell).
// e.g. diff --git "a/xxx" "b/xxx"
hasQuote := line[len(DIFF_HEAD)] == '"'
2015-11-02 19:55:24 -05:00
if hasQuote {
middle = strings.Index(line, ` "b/`)
} else {
middle = strings.Index(line, " b/")
}
2014-04-12 21:35:36 -04:00
2015-11-02 19:55:24 -05:00
beg := len(DIFF_HEAD)
a := line[beg+2 : middle]
b := line[middle+3:]
if hasQuote {
2015-11-20 01:18:50 -05:00
a = string(git.UnescapeChars([]byte(a[1 : len(a)-1])))
b = string(git.UnescapeChars([]byte(b[1 : len(b)-1])))
2015-08-20 04:08:26 -04:00
}
2014-04-12 21:35:36 -04:00
curFile = &DiffFile{
2015-11-02 19:55:24 -05:00
Name: a,
2014-05-13 12:40:32 -04:00
Index: len(diff.Files) + 1,
2014-04-12 21:35:36 -04:00
Type: DIFF_FILE_CHANGE,
Sections: make([]*DiffSection, 0, 10),
}
diff.Files = append(diff.Files, curFile)
// Check file diff type.
for scanner.Scan() {
switch {
case strings.HasPrefix(scanner.Text(), "new file"):
curFile.Type = DIFF_FILE_ADD
curFile.IsCreated = true
2014-04-12 21:35:36 -04:00
case strings.HasPrefix(scanner.Text(), "deleted"):
curFile.Type = DIFF_FILE_DEL
curFile.IsDeleted = true
2014-04-12 21:35:36 -04:00
case strings.HasPrefix(scanner.Text(), "index"):
curFile.Type = DIFF_FILE_CHANGE
2015-11-02 19:55:24 -05:00
case strings.HasPrefix(scanner.Text(), "similarity index 100%"):
curFile.Type = DIFF_FILE_RENAME
curFile.IsRenamed = true
curFile.OldName = curFile.Name
curFile.Name = b
2014-04-12 21:35:36 -04:00
}
if curFile.Type > 0 {
break
}
}
}
}
2015-07-29 10:55:01 -04:00
for _, f := range diff.Files {
buf.Reset()
for _, sec := range f.Sections {
for _, l := range sec.Lines {
buf.WriteString(l.Content)
buf.WriteString("\n")
}
}
charsetLabel, err := base.DetectEncoding(buf.Bytes())
if charsetLabel != "UTF-8" && err == nil {
encoding, _ := charset.Lookup(charsetLabel)
if encoding != nil {
d := encoding.NewDecoder()
2014-12-09 02:18:25 -05:00
for _, sec := range f.Sections {
for _, l := range sec.Lines {
if c, _, err := transform.String(d, l.Content); err == nil {
l.Content = c
}
2014-12-09 02:18:25 -05:00
}
}
}
}
}
2014-04-12 21:35:36 -04:00
return diff, nil
}
func GetDiffRange(repoPath, beforeCommitId string, afterCommitId string, maxlines int) (*Diff, error) {
2014-04-12 21:35:36 -04:00
repo, err := git.OpenRepository(repoPath)
if err != nil {
return nil, err
}
2014-08-26 08:20:18 -04:00
commit, err := repo.GetCommit(afterCommitId)
2014-04-12 21:35:36 -04:00
if err != nil {
return nil, err
}
2014-05-28 22:15:15 -04:00
rd, wr := io.Pipe()
var cmd *exec.Cmd
2014-08-26 08:20:18 -04:00
// if "after" commit given
if beforeCommitId == "" {
// First commit of repository.
if commit.ParentCount() == 0 {
cmd = exec.Command("git", "show", afterCommitId)
} else {
c, _ := commit.Parent(0)
2015-11-03 22:49:06 -05:00
cmd = exec.Command("git", "diff", "-M", c.ID.String(), afterCommitId)
2014-08-26 08:20:18 -04:00
}
2014-05-28 22:15:15 -04:00
} else {
2015-11-02 19:55:24 -05:00
cmd = exec.Command("git", "diff", "-M", beforeCommitId, afterCommitId)
2014-04-12 21:35:36 -04:00
}
2014-05-28 22:15:15 -04:00
cmd.Dir = repoPath
cmd.Stdout = wr
cmd.Stdin = os.Stdin
cmd.Stderr = os.Stderr
done := make(chan error)
2014-04-12 21:35:36 -04:00
go func() {
cmd.Start()
done <- cmd.Wait()
2014-04-12 21:35:36 -04:00
wr.Close()
}()
defer rd.Close()
2014-08-26 08:20:18 -04:00
desc := fmt.Sprintf("GetDiffRange(%s)", repoPath)
pid := process.Add(desc, cmd)
go func() {
// In case process became zombie.
select {
case <-time.After(5 * time.Minute):
if errKill := process.Kill(pid); errKill != nil {
2014-07-26 00:24:27 -04:00
log.Error(4, "git_diff.ParsePatch(Kill): %v", err)
}
<-done
// return "", ErrExecTimeout.Error(), ErrExecTimeout
case err = <-done:
process.Remove(pid)
}
}()
return ParsePatch(pid, maxlines, cmd, rd)
2014-04-12 21:35:36 -04:00
}
2014-08-26 08:20:18 -04:00
func GetDiffCommit(repoPath, commitId string, maxlines int) (*Diff, error) {
return GetDiffRange(repoPath, "", commitId, maxlines)
2014-08-26 08:20:18 -04:00
}