2019-02-12 16:07:31 +03:00
// Copyright 2019 The Gitea Authors. All rights reserved.
// Use of this source code is governed by a MIT-style
// license that can be found in the LICENSE file.
2019-04-17 19:06:35 +03:00
package repofiles
2019-02-12 16:07:31 +03:00
import (
"bytes"
"context"
"fmt"
"io"
"os"
2019-04-17 19:06:35 +03:00
"regexp"
2019-02-12 16:07:31 +03:00
"strings"
"time"
"code.gitea.io/gitea/models"
2019-04-17 19:06:35 +03:00
"code.gitea.io/gitea/modules/git"
2019-05-11 18:29:17 +03:00
"code.gitea.io/gitea/modules/log"
2019-02-12 16:07:31 +03:00
"code.gitea.io/gitea/modules/setting"
2019-09-06 05:20:09 +03:00
"code.gitea.io/gitea/services/gitdiff"
2019-02-12 16:07:31 +03:00
)
2019-04-17 19:06:35 +03:00
// TemporaryUploadRepository is a type to wrap our upload repositories as a shallow clone
2019-02-12 16:07:31 +03:00
type TemporaryUploadRepository struct {
repo * models . Repository
2019-04-17 19:06:35 +03:00
gitRepo * git . Repository
2019-02-12 16:07:31 +03:00
basePath string
}
// NewTemporaryUploadRepository creates a new temporary upload repository
func NewTemporaryUploadRepository ( repo * models . Repository ) ( * TemporaryUploadRepository , error ) {
2019-05-11 18:29:17 +03:00
basePath , err := models . CreateTemporaryPath ( "upload" )
if err != nil {
return nil , err
2019-02-12 16:07:31 +03:00
}
t := & TemporaryUploadRepository { repo : repo , basePath : basePath }
return t , nil
}
// Close the repository cleaning up all files
func ( t * TemporaryUploadRepository ) Close ( ) {
2019-11-13 10:01:19 +03:00
defer t . gitRepo . Close ( )
2019-05-11 18:29:17 +03:00
if err := models . RemoveTemporaryPath ( t . basePath ) ; err != nil {
log . Error ( "Failed to remove temporary path %s: %v" , t . basePath , err )
2019-02-12 16:07:31 +03:00
}
}
// Clone the base repository to our path and set branch as the HEAD
func ( t * TemporaryUploadRepository ) Clone ( branch string ) error {
2019-11-11 14:46:28 +03:00
if _ , err := git . NewCommand ( "clone" , "-s" , "--bare" , "-b" , branch , t . repo . RepoPath ( ) , t . basePath ) . Run ( ) ; err != nil {
stderr := err . Error ( )
2019-04-17 19:06:35 +03:00
if matched , _ := regexp . MatchString ( ".*Remote branch .* not found in upstream origin.*" , stderr ) ; matched {
2019-04-19 15:17:27 +03:00
return git . ErrBranchNotExist {
2019-04-17 19:06:35 +03:00
Name : branch ,
}
} else if matched , _ := regexp . MatchString ( ".* repository .* does not exist.*" , stderr ) ; matched {
return models . ErrRepoNotExist {
ID : t . repo . ID ,
UID : t . repo . OwnerID ,
OwnerName : t . repo . OwnerName ,
Name : t . repo . Name ,
}
} else {
return fmt . Errorf ( "Clone: %v %s" , err , stderr )
}
}
gitRepo , err := git . OpenRepository ( t . basePath )
if err != nil {
return err
2019-02-12 16:07:31 +03:00
}
2019-04-17 19:06:35 +03:00
t . gitRepo = gitRepo
2019-02-12 16:07:31 +03:00
return nil
}
// SetDefaultIndex sets the git index to our HEAD
func ( t * TemporaryUploadRepository ) SetDefaultIndex ( ) error {
2019-11-11 14:46:28 +03:00
if _ , err := git . NewCommand ( "read-tree" , "HEAD" ) . RunInDir ( t . basePath ) ; err != nil {
return fmt . Errorf ( "SetDefaultIndex: %v" , err )
2019-02-12 16:07:31 +03:00
}
return nil
}
// LsFiles checks if the given filename arguments are in the index
func ( t * TemporaryUploadRepository ) LsFiles ( filenames ... string ) ( [ ] string , error ) {
stdOut := new ( bytes . Buffer )
stdErr := new ( bytes . Buffer )
cmdArgs := [ ] string { "ls-files" , "-z" , "--" }
for _ , arg := range filenames {
if arg != "" {
cmdArgs = append ( cmdArgs , arg )
}
}
2019-11-11 14:46:28 +03:00
if err := git . NewCommand ( cmdArgs ... ) . RunInDirPipeline ( t . basePath , stdOut , stdErr ) ; err != nil {
log . Error ( "Unable to run git ls-files for temporary repo: %s (%s) Error: %v\nstdout: %s\nstderr: %s" , t . repo . FullName ( ) , t . basePath , err , stdOut . String ( ) , stdErr . String ( ) )
err = fmt . Errorf ( "Unable to run git ls-files for temporary repo of: %s Error: %v\nstdout: %s\nstderr: %s" , t . repo . FullName ( ) , err , stdOut . String ( ) , stdErr . String ( ) )
2019-02-12 16:07:31 +03:00
return nil , err
}
filelist := make ( [ ] string , len ( filenames ) )
for _ , line := range bytes . Split ( stdOut . Bytes ( ) , [ ] byte { '\000' } ) {
filelist = append ( filelist , string ( line ) )
}
2019-11-11 14:46:28 +03:00
return filelist , nil
2019-02-12 16:07:31 +03:00
}
// RemoveFilesFromIndex removes the given files from the index
func ( t * TemporaryUploadRepository ) RemoveFilesFromIndex ( filenames ... string ) error {
stdOut := new ( bytes . Buffer )
stdErr := new ( bytes . Buffer )
stdIn := new ( bytes . Buffer )
for _ , file := range filenames {
if file != "" {
stdIn . WriteString ( "0 0000000000000000000000000000000000000000\t" )
stdIn . WriteString ( file )
stdIn . WriteByte ( '\000' )
}
}
2019-11-11 14:46:28 +03:00
if err := git . NewCommand ( "update-index" , "--remove" , "-z" , "--index-info" ) . RunInDirFullPipeline ( t . basePath , stdOut , stdErr , stdIn ) ; err != nil {
log . Error ( "Unable to update-index for temporary repo: %s (%s) Error: %v\nstdout: %s\nstderr: %s" , t . repo . FullName ( ) , t . basePath , err , stdOut . String ( ) , stdErr . String ( ) )
return fmt . Errorf ( "Unable to update-index for temporary repo: %s Error: %v\nstdout: %s\nstderr: %s" , t . repo . FullName ( ) , err , stdOut . String ( ) , stdErr . String ( ) )
2019-02-12 16:07:31 +03:00
}
2019-11-11 14:46:28 +03:00
return nil
2019-02-12 16:07:31 +03:00
}
// HashObject writes the provided content to the object db and returns its hash
func ( t * TemporaryUploadRepository ) HashObject ( content io . Reader ) ( string , error ) {
2019-11-11 14:46:28 +03:00
stdOut := new ( bytes . Buffer )
stdErr := new ( bytes . Buffer )
2019-02-12 16:07:31 +03:00
2019-11-11 14:46:28 +03:00
if err := git . NewCommand ( "hash-object" , "-w" , "--stdin" ) . RunInDirFullPipeline ( t . basePath , stdOut , stdErr , content ) ; err != nil {
log . Error ( "Unable to hash-object to temporary repo: %s (%s) Error: %v\nstdout: %s\nstderr: %s" , t . repo . FullName ( ) , t . basePath , err , stdOut . String ( ) , stdErr . String ( ) )
return "" , fmt . Errorf ( "Unable to hash-object to temporary repo: %s Error: %v\nstdout: %s\nstderr: %s" , t . repo . FullName ( ) , err , stdOut . String ( ) , stdErr . String ( ) )
2019-02-12 16:07:31 +03:00
}
2019-11-11 14:46:28 +03:00
return strings . TrimSpace ( stdOut . String ( ) ) , nil
2019-02-12 16:07:31 +03:00
}
// AddObjectToIndex adds the provided object hash to the index with the provided mode and path
func ( t * TemporaryUploadRepository ) AddObjectToIndex ( mode , objectHash , objectPath string ) error {
2019-11-11 14:46:28 +03:00
if _ , err := git . NewCommand ( "update-index" , "--add" , "--replace" , "--cacheinfo" , mode , objectHash , objectPath ) . RunInDir ( t . basePath ) ; err != nil {
stderr := err . Error ( )
2019-04-17 19:06:35 +03:00
if matched , _ := regexp . MatchString ( ".*Invalid path '.*" , stderr ) ; matched {
return models . ErrFilePathInvalid {
Message : objectPath ,
Path : objectPath ,
}
}
2019-11-11 14:46:28 +03:00
log . Error ( "Unable to add object to index: %s %s %s in temporary repo %s(%s) Error: %v" , mode , objectHash , objectPath , t . repo . FullName ( ) , t . basePath , err )
return fmt . Errorf ( "Unable to add object to index at %s in temporary repo %s Error: %v" , objectPath , t . repo . FullName ( ) , err )
2019-02-12 16:07:31 +03:00
}
return nil
}
// WriteTree writes the current index as a tree to the object db and returns its hash
func ( t * TemporaryUploadRepository ) WriteTree ( ) ( string , error ) {
2019-11-11 14:46:28 +03:00
stdout , err := git . NewCommand ( "write-tree" ) . RunInDir ( t . basePath )
2019-02-12 16:07:31 +03:00
if err != nil {
2019-11-11 14:46:28 +03:00
log . Error ( "Unable to write tree in temporary repo: %s(%s): Error: %v" , t . repo . FullName ( ) , t . basePath , err )
return "" , fmt . Errorf ( "Unable to write-tree in temporary repo for: %s Error: %v" , t . repo . FullName ( ) , err )
2019-02-12 16:07:31 +03:00
}
2019-11-11 14:46:28 +03:00
return strings . TrimSpace ( stdout ) , nil
2019-04-17 19:06:35 +03:00
}
2019-02-12 16:07:31 +03:00
2019-04-17 19:06:35 +03:00
// GetLastCommit gets the last commit ID SHA of the repo
func ( t * TemporaryUploadRepository ) GetLastCommit ( ) ( string , error ) {
return t . GetLastCommitByRef ( "HEAD" )
}
// GetLastCommitByRef gets the last commit ID SHA of the repo by ref
func ( t * TemporaryUploadRepository ) GetLastCommitByRef ( ref string ) ( string , error ) {
if ref == "" {
ref = "HEAD"
}
2019-11-11 14:46:28 +03:00
stdout , err := git . NewCommand ( "rev-parse" , ref ) . RunInDir ( t . basePath )
2019-04-17 19:06:35 +03:00
if err != nil {
2019-11-11 14:46:28 +03:00
log . Error ( "Unable to get last ref for %s in temporary repo: %s(%s): Error: %v" , ref , t . repo . FullName ( ) , t . basePath , err )
return "" , fmt . Errorf ( "Unable to rev-parse %s in temporary repo for: %s Error: %v" , ref , t . repo . FullName ( ) , err )
2019-04-17 19:06:35 +03:00
}
2019-11-11 14:46:28 +03:00
return strings . TrimSpace ( stdout ) , nil
2019-02-12 16:07:31 +03:00
}
// CommitTree creates a commit from a given tree for the user with provided message
2019-04-17 19:06:35 +03:00
func ( t * TemporaryUploadRepository ) CommitTree ( author , committer * models . User , treeHash string , message string ) ( string , error ) {
2019-12-24 05:33:52 +03:00
return t . CommitTreeWithDate ( author , committer , treeHash , message , time . Now ( ) , time . Now ( ) )
}
// CommitTreeWithDate creates a commit from a given tree for the user with provided message
func ( t * TemporaryUploadRepository ) CommitTreeWithDate ( author , committer * models . User , treeHash string , message string , authorDate , committerDate time . Time ) ( string , error ) {
2019-04-17 19:06:35 +03:00
authorSig := author . NewGitSig ( )
committerSig := committer . NewGitSig ( )
2019-02-12 16:07:31 +03:00
2020-09-05 19:42:58 +03:00
err := git . LoadGitVersion ( )
2019-10-12 03:13:27 +03:00
if err != nil {
return "" , fmt . Errorf ( "Unable to get git version: %v" , err )
}
2019-02-12 16:07:31 +03:00
// Because this may call hooks we should pass in the environment
env := append ( os . Environ ( ) ,
2019-04-17 19:06:35 +03:00
"GIT_AUTHOR_NAME=" + authorSig . Name ,
"GIT_AUTHOR_EMAIL=" + authorSig . Email ,
2019-12-24 05:33:52 +03:00
"GIT_AUTHOR_DATE=" + authorDate . Format ( time . RFC3339 ) ,
"GIT_COMMITTER_DATE=" + committerDate . Format ( time . RFC3339 ) ,
2019-02-12 16:07:31 +03:00
)
2019-10-16 16:42:42 +03:00
2019-10-12 03:13:27 +03:00
messageBytes := new ( bytes . Buffer )
_ , _ = messageBytes . WriteString ( message )
_ , _ = messageBytes . WriteString ( "\n" )
args := [ ] string { "commit-tree" , treeHash , "-p" , "HEAD" }
2019-10-16 16:42:42 +03:00
// Determine if we should sign
2020-09-05 19:42:58 +03:00
if git . CheckGitVersionConstraint ( ">= 1.7.9" ) == nil {
2020-09-19 19:44:55 +03:00
sign , keyID , signer , _ := t . repo . SignCRUDAction ( author , t . basePath , "HEAD" )
2019-10-16 16:42:42 +03:00
if sign {
args = append ( args , "-S" + keyID )
2020-09-19 19:44:55 +03:00
if t . repo . GetTrustModel ( ) == models . CommitterTrustModel || t . repo . GetTrustModel ( ) == models . CollaboratorCommitterTrustModel {
if committerSig . Name != authorSig . Name || committerSig . Email != authorSig . Email {
// Add trailers
_ , _ = messageBytes . WriteString ( "\n" )
_ , _ = messageBytes . WriteString ( "Co-Authored-By: " )
_ , _ = messageBytes . WriteString ( committerSig . String ( ) )
_ , _ = messageBytes . WriteString ( "\n" )
_ , _ = messageBytes . WriteString ( "Co-Committed-By: " )
_ , _ = messageBytes . WriteString ( committerSig . String ( ) )
_ , _ = messageBytes . WriteString ( "\n" )
}
committerSig = signer
}
2020-09-05 19:42:58 +03:00
} else if git . CheckGitVersionConstraint ( ">= 2.0.0" ) == nil {
2019-10-16 16:42:42 +03:00
args = append ( args , "--no-gpg-sign" )
}
2019-10-12 03:13:27 +03:00
}
2020-09-19 19:44:55 +03:00
env = append ( env ,
"GIT_COMMITTER_NAME=" + committerSig . Name ,
"GIT_COMMITTER_EMAIL=" + committerSig . Email ,
)
2019-11-11 14:46:28 +03:00
stdout := new ( bytes . Buffer )
stderr := new ( bytes . Buffer )
if err := git . NewCommand ( args ... ) . RunInDirTimeoutEnvFullPipeline ( env , - 1 , t . basePath , stdout , stderr , messageBytes ) ; err != nil {
log . Error ( "Unable to commit-tree in temporary repo: %s (%s) Error: %v\nStdout: %s\nStderr: %s" ,
t . repo . FullName ( ) , t . basePath , err , stdout , stderr )
return "" , fmt . Errorf ( "Unable to commit-tree in temporary repo: %s Error: %v\nStdout: %s\nStderr: %s" ,
t . repo . FullName ( ) , err , stdout , stderr )
2019-02-12 16:07:31 +03:00
}
2019-11-11 14:46:28 +03:00
return strings . TrimSpace ( stdout . String ( ) ) , nil
2019-02-12 16:07:31 +03:00
}
// Push the provided commitHash to the repository branch by the provided user
func ( t * TemporaryUploadRepository ) Push ( doer * models . User , commitHash string , branch string ) error {
// Because calls hooks we need to pass in the environment
2019-05-11 18:29:17 +03:00
env := models . PushingEnvironment ( doer , t . repo )
2020-03-28 07:13:18 +03:00
if err := git . Push ( t . basePath , git . PushOptions {
Remote : t . repo . RepoPath ( ) ,
Branch : strings . TrimSpace ( commitHash ) + ":refs/heads/" + strings . TrimSpace ( branch ) ,
Env : env ,
} ) ; err != nil {
if git . IsErrPushOutOfDate ( err ) {
return err
} else if git . IsErrPushRejected ( err ) {
rejectErr := err . ( * git . ErrPushRejected )
log . Info ( "Unable to push back to repo from temporary repo due to rejection: %s (%s)\nStdout: %s\nStderr: %s\nError: %v" ,
t . repo . FullName ( ) , t . basePath , rejectErr . StdOut , rejectErr . StdErr , rejectErr . Err )
2020-02-22 16:08:48 +03:00
return err
}
2020-03-28 07:13:18 +03:00
log . Error ( "Unable to push back to repo from temporary repo: %s (%s)\nError: %v" ,
t . repo . FullName ( ) , t . basePath , err )
2019-11-11 14:46:28 +03:00
return fmt . Errorf ( "Unable to push back to repo from temporary repo: %s (%s) Error: %v" ,
t . repo . FullName ( ) , t . basePath , err )
2019-02-12 16:07:31 +03:00
}
return nil
}
// DiffIndex returns a Diff of the current index to the head
2019-11-11 14:46:28 +03:00
func ( t * TemporaryUploadRepository ) DiffIndex ( ) ( * gitdiff . Diff , error ) {
stdoutReader , stdoutWriter , err := os . Pipe ( )
2019-02-12 16:07:31 +03:00
if err != nil {
2019-11-11 14:46:28 +03:00
log . Error ( "Unable to open stdout pipe: %v" , err )
return nil , fmt . Errorf ( "Unable to open stdout pipe: %v" , err )
2019-02-12 16:07:31 +03:00
}
2019-11-11 14:46:28 +03:00
defer func ( ) {
_ = stdoutReader . Close ( )
_ = stdoutWriter . Close ( )
} ( )
stderr := new ( bytes . Buffer )
var diff * gitdiff . Diff
var finalErr error
if err := git . NewCommand ( "diff-index" , "--cached" , "-p" , "HEAD" ) .
2020-01-15 11:32:57 +03:00
RunInDirTimeoutEnvFullPipelineFunc ( nil , 30 * time . Second , t . basePath , stdoutWriter , stderr , nil , func ( ctx context . Context , cancel context . CancelFunc ) error {
2019-11-11 14:46:28 +03:00
_ = stdoutWriter . Close ( )
diff , finalErr = gitdiff . ParsePatch ( setting . Git . MaxGitDiffLines , setting . Git . MaxGitDiffLineCharacters , setting . Git . MaxGitDiffFiles , stdoutReader )
if finalErr != nil {
log . Error ( "ParsePatch: %v" , finalErr )
cancel ( )
}
_ = stdoutReader . Close ( )
2020-01-15 11:32:57 +03:00
return finalErr
2019-11-11 14:46:28 +03:00
} ) ; err != nil {
if finalErr != nil {
log . Error ( "Unable to ParsePatch in temporary repo %s (%s). Error: %v" , t . repo . FullName ( ) , t . basePath , finalErr )
return nil , finalErr
}
log . Error ( "Unable to run diff-index pipeline in temporary repo %s (%s). Error: %v\nStderr: %s" ,
t . repo . FullName ( ) , t . basePath , err , stderr )
return nil , fmt . Errorf ( "Unable to run diff-index pipeline in temporary repo %s. Error: %v\nStderr: %s" ,
t . repo . FullName ( ) , err , stderr )
2019-02-12 16:07:31 +03:00
}
2020-05-26 08:58:07 +03:00
diff . NumFiles , diff . TotalAddition , diff . TotalDeletion , err = git . GetDiffShortStat ( t . basePath , "--cached" , "HEAD" )
if err != nil {
return nil , err
}
2019-02-12 16:07:31 +03:00
return diff , nil
}
// CheckAttribute checks the given attribute of the provided files
func ( t * TemporaryUploadRepository ) CheckAttribute ( attribute string , args ... string ) ( map [ string ] map [ string ] string , error ) {
2020-09-05 19:42:58 +03:00
err := git . LoadGitVersion ( )
2019-10-12 03:13:27 +03:00
if err != nil {
log . Error ( "Error retrieving git version: %v" , err )
return nil , err
}
2019-11-11 14:46:28 +03:00
stdout := new ( bytes . Buffer )
stderr := new ( bytes . Buffer )
2019-02-12 16:07:31 +03:00
2019-10-12 03:13:27 +03:00
cmdArgs := [ ] string { "check-attr" , "-z" , attribute }
// git check-attr --cached first appears in git 1.7.8
2020-09-05 19:42:58 +03:00
if git . CheckGitVersionConstraint ( ">= 1.7.8" ) == nil {
2019-10-12 03:13:27 +03:00
cmdArgs = append ( cmdArgs , "--cached" )
}
cmdArgs = append ( cmdArgs , "--" )
2019-02-12 16:07:31 +03:00
for _ , arg := range args {
if arg != "" {
cmdArgs = append ( cmdArgs , arg )
}
}
2019-11-11 14:46:28 +03:00
if err := git . NewCommand ( cmdArgs ... ) . RunInDirPipeline ( t . basePath , stdout , stderr ) ; err != nil {
log . Error ( "Unable to check-attr in temporary repo: %s (%s) Error: %v\nStdout: %s\nStderr: %s" ,
t . repo . FullName ( ) , t . basePath , err , stdout , stderr )
return nil , fmt . Errorf ( "Unable to check-attr in temporary repo: %s Error: %v\nStdout: %s\nStderr: %s" ,
t . repo . FullName ( ) , err , stdout , stderr )
2019-02-12 16:07:31 +03:00
}
2019-11-11 14:46:28 +03:00
fields := bytes . Split ( stdout . Bytes ( ) , [ ] byte { '\000' } )
2019-02-12 16:07:31 +03:00
if len ( fields ) % 3 != 1 {
return nil , fmt . Errorf ( "Wrong number of fields in return from check-attr" )
}
var name2attribute2info = make ( map [ string ] map [ string ] string )
for i := 0 ; i < ( len ( fields ) / 3 ) ; i ++ {
filename := string ( fields [ 3 * i ] )
attribute := string ( fields [ 3 * i + 1 ] )
info := string ( fields [ 3 * i + 2 ] )
attribute2info := name2attribute2info [ filename ]
if attribute2info == nil {
attribute2info = make ( map [ string ] string )
}
attribute2info [ attribute ] = info
name2attribute2info [ filename ] = attribute2info
}
return name2attribute2info , err
}
2019-04-17 19:06:35 +03:00
// GetBranchCommit Gets the commit object of the given branch
func ( t * TemporaryUploadRepository ) GetBranchCommit ( branch string ) ( * git . Commit , error ) {
if t . gitRepo == nil {
return nil , fmt . Errorf ( "repository has not been cloned" )
}
return t . gitRepo . GetBranchCommit ( branch )
}
// GetCommit Gets the commit object of the given commit ID
func ( t * TemporaryUploadRepository ) GetCommit ( commitID string ) ( * git . Commit , error ) {
if t . gitRepo == nil {
return nil , fmt . Errorf ( "repository has not been cloned" )
}
return t . gitRepo . GetCommit ( commitID )
}