@ -10,6 +10,7 @@ import (
"fmt"
"fmt"
"io"
"io"
"os"
"os"
"path"
"path/filepath"
"path/filepath"
"strconv"
"strconv"
"strings"
"strings"
@ -32,7 +33,7 @@ import (
"code.gitea.io/gitea/modules/uri"
"code.gitea.io/gitea/modules/uri"
"code.gitea.io/gitea/services/pull"
"code.gitea.io/gitea/services/pull"
gouuid "github.com/google/uuid"
"github.com/google/uuid"
)
)
var _ base . Uploader = & GiteaLocalUploader { }
var _ base . Uploader = & GiteaLocalUploader { }
@ -48,7 +49,7 @@ type GiteaLocalUploader struct {
milestones map [ string ] int64
milestones map [ string ] int64
issues map [ int64 ] * issues_model . Issue
issues map [ int64 ] * issues_model . Issue
gitRepo * git . Repository
gitRepo * git . Repository
prHeadCache map [ string ] struct { }
prHeadCache map [ string ] string
sameApp bool
sameApp bool
userMap map [ int64 ] int64 // external user id mapping to user id
userMap map [ int64 ] int64 // external user id mapping to user id
prCache map [ int64 ] * issues_model . PullRequest
prCache map [ int64 ] * issues_model . PullRequest
@ -65,7 +66,7 @@ func NewGiteaLocalUploader(ctx context.Context, doer *user_model.User, repoOwner
labels : make ( map [ string ] * issues_model . Label ) ,
labels : make ( map [ string ] * issues_model . Label ) ,
milestones : make ( map [ string ] int64 ) ,
milestones : make ( map [ string ] int64 ) ,
issues : make ( map [ int64 ] * issues_model . Issue ) ,
issues : make ( map [ int64 ] * issues_model . Issue ) ,
prHeadCache : make ( map [ string ] struct { } ) ,
prHeadCache : make ( map [ string ] string ) ,
userMap : make ( map [ int64 ] int64 ) ,
userMap : make ( map [ int64 ] int64 ) ,
prCache : make ( map [ int64 ] * issues_model . PullRequest ) ,
prCache : make ( map [ int64 ] * issues_model . PullRequest ) ,
}
}
@ -125,7 +126,7 @@ func (g *GiteaLocalUploader) CreateRepo(repo *base.Repository, opts base.Migrate
Mirror : repo . IsMirror ,
Mirror : repo . IsMirror ,
LFS : opts . LFS ,
LFS : opts . LFS ,
LFSEndpoint : opts . LFSEndpoint ,
LFSEndpoint : opts . LFSEndpoint ,
CloneAddr : repo . CloneURL ,
CloneAddr : repo . CloneURL , // SECURITY: we will assume that this has already been checked
Private : repo . IsPrivate ,
Private : repo . IsPrivate ,
Wiki : opts . Wiki ,
Wiki : opts . Wiki ,
Releases : opts . Releases , // if didn't get releases, then sync them from tags
Releases : opts . Releases , // if didn't get releases, then sync them from tags
@ -150,13 +151,15 @@ func (g *GiteaLocalUploader) Close() {
// CreateTopics creates topics
// CreateTopics creates topics
func ( g * GiteaLocalUploader ) CreateTopics ( topics ... string ) error {
func ( g * GiteaLocalUploader ) CreateTopics ( topics ... string ) error {
// ignore topics t o long for the db
// Ignore topics to o long for the db
c := 0
c := 0
for i := range topics {
for _ , topic := range topics {
if len ( topics [ i ] ) <= 50 {
if len ( topic ) > 50 {
topics [ c ] = topics [ i ]
continue
c ++
}
}
topics [ c ] = topic
c ++
}
}
topics = topics [ : c ]
topics = topics [ : c ]
return repo_model . SaveTopics ( g . repo . ID , topics ... )
return repo_model . SaveTopics ( g . repo . ID , topics ... )
@ -217,11 +220,17 @@ func (g *GiteaLocalUploader) CreateMilestones(milestones ...*base.Milestone) err
func ( g * GiteaLocalUploader ) CreateLabels ( labels ... * base . Label ) error {
func ( g * GiteaLocalUploader ) CreateLabels ( labels ... * base . Label ) error {
lbs := make ( [ ] * issues_model . Label , 0 , len ( labels ) )
lbs := make ( [ ] * issues_model . Label , 0 , len ( labels ) )
for _ , label := range labels {
for _ , label := range labels {
// We must validate color here:
if ! issues_model . LabelColorPattern . MatchString ( "#" + label . Color ) {
log . Warn ( "Invalid label color: #%s for label: %s in migration to %s/%s" , label . Color , label . Name , g . repoOwner , g . repoName )
label . Color = "ffffff"
}
lbs = append ( lbs , & issues_model . Label {
lbs = append ( lbs , & issues_model . Label {
RepoID : g . repo . ID ,
RepoID : g . repo . ID ,
Name : label . Name ,
Name : label . Name ,
Description : label . Description ,
Description : label . Description ,
Color : fmt . Sprintf ( "#%s" , label . Color ) ,
Color : "#" + label . Color ,
} )
} )
}
}
@ -247,6 +256,16 @@ func (g *GiteaLocalUploader) CreateReleases(releases ...*base.Release) error {
}
}
}
}
// SECURITY: The TagName must be a valid git ref
if release . TagName != "" && ! git . IsValidRefPattern ( release . TagName ) {
release . TagName = ""
}
// SECURITY: The TargetCommitish must be a valid git ref
if release . TargetCommitish != "" && ! git . IsValidRefPattern ( release . TargetCommitish ) {
release . TargetCommitish = ""
}
rel := models . Release {
rel := models . Release {
RepoID : g . repo . ID ,
RepoID : g . repo . ID ,
TagName : release . TagName ,
TagName : release . TagName ,
@ -288,14 +307,15 @@ func (g *GiteaLocalUploader) CreateReleases(releases ...*base.Release) error {
}
}
}
}
attach := repo_model . Attachment {
attach := repo_model . Attachment {
UUID : go uuid. New ( ) . String ( ) ,
UUID : uuid . New ( ) . String ( ) ,
Name : asset . Name ,
Name : asset . Name ,
DownloadCount : int64 ( * asset . DownloadCount ) ,
DownloadCount : int64 ( * asset . DownloadCount ) ,
Size : int64 ( * asset . Size ) ,
Size : int64 ( * asset . Size ) ,
CreatedUnix : timeutil . TimeStamp ( asset . Created . Unix ( ) ) ,
CreatedUnix : timeutil . TimeStamp ( asset . Created . Unix ( ) ) ,
}
}
// download attachment
// SECURITY: We cannot check the DownloadURL and DownloadFunc are safe here
// ... we must assume that they are safe and simply download the attachment
err := func ( ) error {
err := func ( ) error {
// asset.DownloadURL maybe a local file
// asset.DownloadURL maybe a local file
var rc io . ReadCloser
var rc io . ReadCloser
@ -365,6 +385,12 @@ func (g *GiteaLocalUploader) CreateIssues(issues ...*base.Issue) error {
}
}
}
}
// SECURITY: issue.Ref needs to be a valid reference
if ! git . IsValidRefPattern ( issue . Ref ) {
log . Warn ( "Invalid issue.Ref[%s] in issue #%d in %s/%s" , issue . Ref , issue . Number , g . repoOwner , g . repoName )
issue . Ref = ""
}
is := issues_model . Issue {
is := issues_model . Issue {
RepoID : g . repo . ID ,
RepoID : g . repo . ID ,
Repo : g . repo ,
Repo : g . repo ,
@ -496,102 +522,151 @@ func (g *GiteaLocalUploader) CreatePullRequests(prs ...*base.PullRequest) error
}
}
func ( g * GiteaLocalUploader ) updateGitForPullRequest ( pr * base . PullRequest ) ( head string , err error ) {
func ( g * GiteaLocalUploader ) updateGitForPullRequest ( pr * base . PullRequest ) ( head string , err error ) {
// download patch file
// SECURITY: this pr must have been must have been ensured safe
if ! pr . EnsuredSafe {
log . Error ( "PR #%d in %s/%s has not been checked for safety." , pr . Number , g . repoOwner , g . repoName )
return "" , fmt . Errorf ( "the PR[%d] was not checked for safety" , pr . Number )
}
// Anonymous function to download the patch file (allows us to use defer)
err = func ( ) error {
err = func ( ) error {
// if the patchURL is empty there is nothing to download
if pr . PatchURL == "" {
if pr . PatchURL == "" {
return nil
return nil
}
}
// pr.PatchURL maybe a local file
ret , err := uri . Open ( pr . PatchURL )
// SECURITY: We will assume that the pr.PatchURL has been checked
// pr.PatchURL maybe a local file - but note EnsureSafe should be asserting that this safe
ret , err := uri . Open ( pr . PatchURL ) // TODO: This probably needs to use the downloader as there may be rate limiting issues here
if err != nil {
if err != nil {
return err
return err
}
}
defer ret . Close ( )
defer ret . Close ( )
pullDir := filepath . Join ( g . repo . RepoPath ( ) , "pulls" )
pullDir := filepath . Join ( g . repo . RepoPath ( ) , "pulls" )
if err = os . MkdirAll ( pullDir , os . ModePerm ) ; err != nil {
if err = os . MkdirAll ( pullDir , os . ModePerm ) ; err != nil {
return err
return err
}
}
f , err := os . Create ( filepath . Join ( pullDir , fmt . Sprintf ( "%d.patch" , pr . Number ) ) )
f , err := os . Create ( filepath . Join ( pullDir , fmt . Sprintf ( "%d.patch" , pr . Number ) ) )
if err != nil {
if err != nil {
return err
return err
}
}
defer f . Close ( )
defer f . Close ( )
// TODO: Should there be limits on the size of this file?
_ , err = io . Copy ( f , ret )
_ , err = io . Copy ( f , ret )
return err
return err
} ( )
} ( )
if err != nil {
if err != nil {
return "" , err
return "" , err
}
}
// set head information
pullHead := filepath . Join ( g . repo . RepoPath ( ) , "refs" , "pull" , fmt . Sprintf ( "%d" , pr . Number ) )
if err := os . MkdirAll ( pullHead , os . ModePerm ) ; err != nil {
return "" , err
}
p , err := os . Create ( filepath . Join ( pullHead , "head" ) )
if err != nil {
return "" , err
}
_ , err = p . WriteString ( pr . Head . SHA )
p . Close ( )
if err != nil {
return "" , err
}
head = "unknown repository"
head = "unknown repository"
if pr . IsForkPullRequest ( ) && pr . State != "closed" {
if pr . IsForkPullRequest ( ) && pr . State != "closed" {
if pr . Head . OwnerName != "" {
// OK we want to fetch the current head as a branch from its CloneURL
remote := pr . Head . OwnerName
_ , ok := g . prHeadCache [ remote ]
// 1. Is there a head clone URL available?
// 2. Is there a head ref available?
if pr . Head . CloneURL == "" || pr . Head . Ref == "" {
return head , nil
}
// 3. We need to create a remote for this clone url
// ... maybe we already have a name for this remote
remote , ok := g . prHeadCache [ pr . Head . CloneURL + ":" ]
if ! ok {
if ! ok {
// git remote add
// ... let's try ownername as a reasonable name
remote = pr . Head . OwnerName
if ! git . IsValidRefPattern ( remote ) {
// ... let's try something less nice
remote = "head-pr-" + strconv . FormatInt ( pr . Number , 10 )
}
// ... now add the remote
err := g . gitRepo . AddRemote ( remote , pr . Head . CloneURL , true )
err := g . gitRepo . AddRemote ( remote , pr . Head . CloneURL , true )
if err != nil {
if err != nil {
log . Error ( "AddRemote failed: %s" , err )
log . Error ( "PR #%d in %s/%s AddRemote[%s] failed: %v" , pr . Number , g . repoOwner , g . repoName , remote , err )
} else {
} else {
g . prHeadCache [ remote ] = struct { } { }
g . prHeadCache [ pr . Head . CloneURL + ":" ] = remote
ok = true
ok = true
}
}
}
}
if ! ok {
return head , nil
}
if ok {
// 4. Check if we already have this ref?
_ , _ , err = git . NewCommand ( g . ctx , "fetch" , "--no-tags" , "--" , remote , pr . Head . Ref ) . RunStdString ( & git . RunOpts { Dir : g . repo . RepoPath ( ) } )
localRef , ok := g . prHeadCache [ pr . Head . CloneURL + ":" + pr . Head . Ref ]
if ! ok {
// ... We would normally name this migrated branch as <OwnerName>/<HeadRef> but we need to ensure that is safe
localRef = git . SanitizeRefPattern ( pr . Head . OwnerName + "/" + pr . Head . Ref )
// ... Now we must assert that this does not exist
if g . gitRepo . IsBranchExist ( localRef ) {
localRef = "head-pr-" + strconv . FormatInt ( pr . Number , 10 ) + "/" + localRef
i := 0
for g . gitRepo . IsBranchExist ( localRef ) {
if i > 5 {
// ... We tried, we really tried but this is just a seriously unfriendly repo
return head , nil
}
// OK just try some uuids!
localRef = git . SanitizeRefPattern ( "head-pr-" + strconv . FormatInt ( pr . Number , 10 ) + uuid . New ( ) . String ( ) )
i ++
}
}
fetchArg := pr . Head . Ref + ":" + git . BranchPrefix + localRef
if strings . HasPrefix ( fetchArg , "-" ) {
fetchArg = git . BranchPrefix + fetchArg
}
_ , _ , err = git . NewCommand ( g . ctx , "fetch" , "--no-tags" , "--" , remote , fetchArg ) . RunStdString ( & git . RunOpts { Dir : g . repo . RepoPath ( ) } )
if err != nil {
if err != nil {
log . Error ( "Fetch branch from %s failed: %v" , pr . Head . CloneURL , err )
log . Error ( "Fetch branch from %s failed: %v" , pr . Head . CloneURL , err )
} else {
return head , nil
headBranch := filepath . Join ( g . repo . RepoPath ( ) , "refs" , "heads" , pr . Head . OwnerName , pr . Head . Ref )
if err := os . MkdirAll ( filepath . Dir ( headBranch ) , os . ModePerm ) ; err != nil {
return "" , err
}
}
b , err := os . Create ( headBranch )
g . prHeadCache [ pr . Head . CloneURL + ":" + pr . Head . Ref ] = localRef
if err != nil {
head = localRef
return "" , err
}
}
_ , err = b . WriteString ( pr . Head . SHA )
b . Close ( )
// 5. Now if pr.Head.SHA == "" we should recover this to the head of this branch
if pr . Head . SHA == "" {
headSha , err := g . gitRepo . GetBranchCommitID ( localRef )
if err != nil {
if err != nil {
return "" , err
log . Error ( "unable to get head SHA of local head for PR #%d from %s in %s/%s. Error: %v" , pr . Number , pr . Head . Ref , g . repoOwner , g . repoName , err )
return head , nil
}
}
head = pr . Head . OwnerName + "/" + pr . Head . Ref
pr . Head . SHA = headSha
}
}
_ , _ , err = git . NewCommand ( g . ctx , "update-ref" , "--no-deref" , pr . GetGitRefName ( ) , pr . Head . SHA ) . RunStdString ( & git . RunOpts { Dir : g . repo . RepoPath ( ) } )
if err != nil {
return "" , err
}
}
return head , nil
}
}
} else {
if pr . Head . Ref != "" {
head = pr . Head . Ref
head = pr . Head . Ref
}
// Ensure the closed PR SHA still points to an existing ref
// Ensure the closed PR SHA still points to an existing ref
if pr . Head . SHA == "" {
// The SHA is empty
log . Warn ( "Empty reference, no pull head for PR #%d in %s/%s" , pr . Number , g . repoOwner , g . repoName )
} else {
_ , _ , err = git . NewCommand ( g . ctx , "rev-list" , "--quiet" , "-1" , pr . Head . SHA ) . RunStdString ( & git . RunOpts { Dir : g . repo . RepoPath ( ) } )
_ , _ , err = git . NewCommand ( g . ctx , "rev-list" , "--quiet" , "-1" , pr . Head . SHA ) . RunStdString ( & git . RunOpts { Dir : g . repo . RepoPath ( ) } )
if err != nil {
if err != nil {
if pr . Head . SHA != "" {
// Git update-ref remove bad references with a relative path
// Git update-ref remove bad references with a relative path
log . Warn ( "Deprecated local head, removing : %v" , pr . Head . SHA )
log . Warn ( "Deprecated local head %s for PR #%d in %s/%s, removing %s" , pr . Head . SHA , pr . Number , g . repoOwner , g . repoName , pr . GetGitRefName ( ) )
err = g . gitRepo . RemoveReference ( pr . GetGitRefName ( ) )
} else {
} else {
// The SHA is empty, remove the head file
// set head information
log . Warn ( "Empty reference, removing : %v" , pullHead )
_ , _ , err = git . NewCommand ( g . ctx , "update-ref" , "--no-deref" , pr . GetGitRefName ( ) , pr . Head . SHA ) . RunStdString ( & git . RunOpts { Dir : g . repo . RepoPath ( ) } )
err = os . Remove ( filepath . Join ( pullHead , "head" ) )
}
if err != nil {
if err != nil {
log . Error ( "Cannot remove local head ref, %v" , err )
log . Error ( "unable to set %s as the local head for PR #%d from %s in %s/%s. Error: %v" , pr . Head . SHA , pr . Number , pr . Head . Ref , g . repoOwner , g . repoName , err )
}
}
}
}
}
}
@ -615,6 +690,20 @@ func (g *GiteaLocalUploader) newPullRequest(pr *base.PullRequest) (*issues_model
return nil , fmt . Errorf ( "updateGitForPullRequest: %w" , err )
return nil , fmt . Errorf ( "updateGitForPullRequest: %w" , err )
}
}
// Now we may need to fix the mergebase
if pr . Base . SHA == "" {
if pr . Base . Ref != "" && pr . Head . SHA != "" {
// A PR against a tag base does not make sense - therefore pr.Base.Ref must be a branch
// TODO: should we be checking for the refs/heads/ prefix on the pr.Base.Ref? (i.e. are these actually branches or refs)
pr . Base . SHA , _ , err = g . gitRepo . GetMergeBase ( "" , git . BranchPrefix + pr . Base . Ref , pr . Head . SHA )
if err != nil {
log . Error ( "Cannot determine the merge base for PR #%d in %s/%s. Error: %v" , pr . Number , g . repoOwner , g . repoName , err )
}
} else {
log . Error ( "Cannot determine the merge base for PR #%d in %s/%s. Not enough information" , pr . Number , g . repoOwner , g . repoName )
}
}
if pr . Created . IsZero ( ) {
if pr . Created . IsZero ( ) {
if pr . Closed != nil {
if pr . Closed != nil {
pr . Created = * pr . Closed
pr . Created = * pr . Closed
@ -728,6 +817,8 @@ func (g *GiteaLocalUploader) CreateReviews(reviews ...*base.Review) error {
return err
return err
}
}
cms = append ( cms , & cm )
// get pr
// get pr
pr , ok := g . prCache [ issue . ID ]
pr , ok := g . prCache [ issue . ID ]
if ! ok {
if ! ok {
@ -738,6 +829,17 @@ func (g *GiteaLocalUploader) CreateReviews(reviews ...*base.Review) error {
}
}
g . prCache [ issue . ID ] = pr
g . prCache [ issue . ID ] = pr
}
}
if pr . MergeBase == "" {
// No mergebase -> no basis for any patches
log . Warn ( "PR #%d in %s/%s: does not have a merge base, all review comments will be ignored" , pr . Index , g . repoOwner , g . repoName )
continue
}
headCommitID , err := g . gitRepo . GetRefCommitID ( pr . GetGitRefName ( ) )
if err != nil {
log . Warn ( "PR #%d GetRefCommitID[%s] in %s/%s: %v, all review comments will be ignored" , pr . Index , pr . GetGitRefName ( ) , g . repoOwner , g . repoName , err )
continue
}
for _ , comment := range review . Comments {
for _ , comment := range review . Comments {
line := comment . Line
line := comment . Line
@ -746,11 +848,9 @@ func (g *GiteaLocalUploader) CreateReviews(reviews ...*base.Review) error {
} else {
} else {
_ , _ , line , _ = git . ParseDiffHunkString ( comment . DiffHunk )
_ , _ , line , _ = git . ParseDiffHunkString ( comment . DiffHunk )
}
}
headCommitID , err := g . gitRepo . GetRefCommitID ( pr . GetGitRefName ( ) )
if err != nil {
// SECURITY: The TreePath must be cleaned!
log . Warn ( "GetRefCommitID[%s]: %v, the review comment will be ignored" , pr . GetGitRefName ( ) , err )
comment . TreePath = path . Clean ( "/" + comment . TreePath ) [ 1 : ]
continue
}
var patch string
var patch string
reader , writer := io . Pipe ( )
reader , writer := io . Pipe ( )
@ -775,6 +875,11 @@ func (g *GiteaLocalUploader) CreateReviews(reviews ...*base.Review) error {
comment . UpdatedAt = comment . CreatedAt
comment . UpdatedAt = comment . CreatedAt
}
}
if ! git . IsValidSHAPattern ( comment . CommitID ) {
log . Warn ( "Invalid comment CommitID[%s] on comment[%d] in PR #%d of %s/%s replaced with %s" , comment . CommitID , pr . Index , g . repoOwner , g . repoName , headCommitID )
comment . CommitID = headCommitID
}
c := issues_model . Comment {
c := issues_model . Comment {
Type : issues_model . CommentTypeCode ,
Type : issues_model . CommentTypeCode ,
IssueID : issue . ID ,
IssueID : issue . ID ,
@ -793,8 +898,6 @@ func (g *GiteaLocalUploader) CreateReviews(reviews ...*base.Review) error {
cm . Comments = append ( cm . Comments , & c )
cm . Comments = append ( cm . Comments , & c )
}
}
cms = append ( cms , & cm )
}
}
return issues_model . InsertReviews ( cms )
return issues_model . InsertReviews ( cms )