git-lfs/commands/command_fetch.go

370 lines
10 KiB
Go
Raw Normal View History

package commands
import (
"fmt"
2015-07-28 13:50:19 +00:00
"time"
"github.com/git-lfs/git-lfs/filepathfilter"
2016-11-15 17:01:18 +00:00
"github.com/git-lfs/git-lfs/git"
"github.com/git-lfs/git-lfs/lfs"
"github.com/git-lfs/git-lfs/progress"
"github.com/git-lfs/git-lfs/tq"
"github.com/rubyist/tracerx"
"github.com/spf13/cobra"
)
// Flag values for the fetch command. Each variable is bound to a
// command-line flag when the command is registered in init.
var (
// fetchRecentArg is bound to --recent / -r ("Fetch recent refs & commits").
fetchRecentArg bool
// fetchAllArg is bound to --all / -a ("Fetch all LFS files ever referenced").
fetchAllArg bool
// fetchPruneArg is bound to --prune / -p ("After fetching, prune old data").
fetchPruneArg bool
)
// getIncludeExcludeArgs reports which of the "include" / "exclude" flags were
// explicitly set on cmd.
//
// For each flag whose Changed field is true, the corresponding result points
// at the package-level variable holding the flag value (includeArg or
// excludeArg). A flag that was not changed yields a nil pointer, which lets
// callers distinguish "not given" from "given as empty string".
func getIncludeExcludeArgs(cmd *cobra.Command) (include, exclude *string) {
	// Look both flags up before inspecting either, then fill in only the
	// results for flags that were actually supplied.
	incFlag, excFlag := cmd.Flag("include"), cmd.Flag("exclude")

	if incFlag.Changed {
		include = &includeArg
	}
	if excFlag.Changed {
		exclude = &excludeArg
	}

	return include, exclude
}
2015-05-29 15:28:10 +00:00
func fetchCommand(cmd *cobra.Command, args []string) {
requireInRepo()
var refs []*git.Ref
2015-07-29 15:34:15 +00:00
if len(args) > 0 {
// Remote is first arg
if err := git.ValidateRemote(args[0]); err != nil {
Exit("Invalid remote name %q", args[0])
}
2016-07-21 22:37:53 +00:00
cfg.CurrentRemote = args[0]
} else {
cfg.CurrentRemote = ""
}
if len(args) > 1 {
resolvedrefs, err := git.ResolveRefs(args[1:])
if err != nil {
Panic(err, "Invalid ref argument: %v", args[1:])
2015-08-21 14:19:16 +00:00
}
refs = resolvedrefs
} else if !fetchAllArg {
2015-07-29 15:34:15 +00:00
ref, err := git.CurrentRef()
if err != nil {
2015-05-29 15:28:10 +00:00
Panic(err, "Could not fetch")
}
2015-08-21 14:19:16 +00:00
refs = []*git.Ref{ref}
2015-07-29 15:34:15 +00:00
}
success := true
gitscanner := lfs.NewGitScanner(nil)
defer gitscanner.Close()
include, exclude := getIncludeExcludeArgs(cmd)
2015-09-03 11:29:00 +00:00
if fetchAllArg {
2015-09-03 16:36:27 +00:00
if fetchRecentArg || len(args) > 1 {
2015-09-03 11:29:00 +00:00
Exit("Cannot combine --all with ref arguments or --recent")
}
if include != nil || exclude != nil {
2015-09-03 11:29:00 +00:00
Exit("Cannot combine --all with --include or --exclude")
}
2016-07-21 22:37:53 +00:00
if len(cfg.FetchIncludePaths()) > 0 || len(cfg.FetchExcludePaths()) > 0 {
2015-09-03 11:29:00 +00:00
Print("Ignoring global include / exclude paths to fulfil --all")
}
success = fetchAll()
2015-09-03 11:29:00 +00:00
} else { // !all
filter := buildFilepathFilter(cfg, include, exclude)
2015-09-03 11:29:00 +00:00
// Fetch refs sequentially per arg order; duplicates in later refs will be ignored
for _, ref := range refs {
Print("Fetching %v", ref.Name)
s := fetchRef(ref.Sha, filter)
success = success && s
2015-09-03 11:29:00 +00:00
}
2016-07-21 22:37:53 +00:00
if fetchRecentArg || cfg.FetchPruneConfig().FetchRecentAlways {
s := fetchRecent(refs, filter)
success = success && s
2015-09-03 11:29:00 +00:00
}
}
2015-10-15 15:35:26 +00:00
if fetchPruneArg {
2016-08-05 23:23:56 +00:00
fetchconf := cfg.FetchPruneConfig()
verify := fetchconf.PruneVerifyRemoteAlways
2015-10-15 15:35:26 +00:00
// no dry-run or verbose options in fetch, assume false
2016-08-05 23:23:56 +00:00
prune(fetchconf, verify, false, false)
2015-10-15 15:35:26 +00:00
}
2015-11-09 17:46:29 +00:00
if !success {
Exit("Warning: errors occurred")
}
}
// pointersToFetchForRef scans the tree at ref and returns the LFS pointers the
// scanner reports, restricted by filter.
//
// If ScanTree itself fails, that error is returned with a nil slice. Errors
// delivered to the scanner callback are accumulated, newline-separated, into
// a single error that is returned alongside the pointers collected so far.
func pointersToFetchForRef(ref string, filter *filepathfilter.Filter) ([]*lfs.WrappedPointer, error) {
	var (
		found   []*lfs.WrappedPointer
		scanErr error
	)

	// collect records each reported pointer, or folds a reported error into
	// scanErr so that one bad entry does not hide the others.
	collect := func(p *lfs.WrappedPointer, err error) {
		switch {
		case err == nil:
			found = append(found, p)
		case scanErr == nil:
			scanErr = err
		default:
			scanErr = fmt.Errorf("%v\n%v", scanErr, err)
		}
	}

	scanner := lfs.NewGitScanner(collect)
	scanner.Filter = filter

	if err := scanner.ScanTree(ref); err != nil {
		return nil, err
	}
	scanner.Close()

	return found, scanErr
}
// fetchRef fetches all binaries for a given ref (that we don't have already).
//
// The tree at ref is scanned for LFS pointers matching filter; a scan failure
// is reported through Panic. The return value is the result of
// fetchAndReportToChan for the scanned pointers.
func fetchRef(ref string, filter *filepathfilter.Filter) bool {
	toFetch, scanErr := pointersToFetchForRef(ref, filter)
	if scanErr != nil {
		Panic(scanErr, "Could not scan for Git LFS files")
	}

	// No completion channel is needed here, so pass nil.
	return fetchAndReportToChan(toFetch, filter, nil)
}
2015-08-21 14:19:16 +00:00
// Fetch all previous versions of objects from since to ref (not including final state at ref)
// So this will fetch all the '-' sides of the diff from since to ref
func fetchPreviousVersions(ref string, since time.Time, filter *filepathfilter.Filter) bool {
var pointers []*lfs.WrappedPointer
tempgitscanner := lfs.NewGitScanner(func(p *lfs.WrappedPointer, err error) {
if err != nil {
Panic(err, "Could not scan for Git LFS previous versions")
return
}
pointers = append(pointers, p)
})
tempgitscanner.Filter = filter
if err := tempgitscanner.ScanPreviousVersions(ref, since, nil); err != nil {
ExitWithError(err)
}
tempgitscanner.Close()
return fetchAndReportToChan(pointers, filter, nil)
2015-08-21 14:19:16 +00:00
}
// Fetch recent objects based on config
func fetchRecent(alreadyFetchedRefs []*git.Ref, filter *filepathfilter.Filter) bool {
2016-07-21 22:37:53 +00:00
fetchconf := cfg.FetchPruneConfig()
2015-08-21 14:19:16 +00:00
if fetchconf.FetchRecentRefsDays == 0 && fetchconf.FetchRecentCommitsDays == 0 {
return true
2015-08-21 14:19:16 +00:00
}
ok := true
2015-08-21 14:19:16 +00:00
// Make a list of what unique commits we've already fetched for to avoid duplicating work
uniqueRefShas := make(map[string]string, len(alreadyFetchedRefs))
for _, ref := range alreadyFetchedRefs {
uniqueRefShas[ref.Sha] = ref.Name
}
// First find any other recent refs
if fetchconf.FetchRecentRefsDays > 0 {
2015-08-27 14:18:46 +00:00
Print("Fetching recent branches within %v days", fetchconf.FetchRecentRefsDays)
refsSince := time.Now().AddDate(0, 0, -fetchconf.FetchRecentRefsDays)
2016-07-21 22:37:53 +00:00
refs, err := git.RecentBranches(refsSince, fetchconf.FetchRecentRefsIncludeRemotes, cfg.CurrentRemote)
if err != nil {
Panic(err, "Could not scan for recent refs")
}
2015-08-21 14:19:16 +00:00
for _, ref := range refs {
// Don't fetch for the same SHA twice
if prevRefName, ok := uniqueRefShas[ref.Sha]; ok {
2015-08-27 14:18:46 +00:00
if ref.Name != prevRefName {
tracerx.Printf("Skipping fetch for %v, already fetched via %v", ref.Name, prevRefName)
}
} else {
uniqueRefShas[ref.Sha] = ref.Name
2015-08-27 14:18:46 +00:00
Print("Fetching %v", ref.Name)
k := fetchRef(ref.Sha, filter)
ok = ok && k
2015-08-21 14:19:16 +00:00
}
}
}
// For every unique commit we've fetched, check recent commits too
if fetchconf.FetchRecentCommitsDays > 0 {
for commit, refName := range uniqueRefShas {
// We measure from the last commit at the ref
summ, err := git.GetCommitSummary(commit)
if err != nil {
Error("Couldn't scan commits at %v: %v", refName, err)
continue
}
2015-08-27 14:18:46 +00:00
Print("Fetching changes within %v days of %v", fetchconf.FetchRecentCommitsDays, refName)
2015-08-21 14:19:16 +00:00
commitsSince := summ.CommitDate.AddDate(0, 0, -fetchconf.FetchRecentCommitsDays)
k := fetchPreviousVersions(commit, commitsSince, filter)
ok = ok && k
}
}
return ok
}
// fetchAll scans for every LFS pointer via scanAll and fetches the resulting
// set with no path filter and no completion channel. It returns the result
// of fetchAndReportToChan.
func fetchAll() bool {
	everything := scanAll()

	Print("Fetching objects...")

	return fetchAndReportToChan(everything, nil, nil)
}
func scanAll() []*lfs.WrappedPointer {
// This could be a long process so use the chan version & report progress
2015-09-03 16:38:26 +00:00
Print("Scanning for all objects ever referenced...")
spinner := progress.NewSpinner()
var numObjs int64
2016-11-16 19:56:07 +00:00
// use temp gitscanner to collect pointers
var pointers []*lfs.WrappedPointer
var multiErr error
tempgitscanner := lfs.NewGitScanner(func(p *lfs.WrappedPointer, err error) {
if err != nil {
if multiErr != nil {
multiErr = fmt.Errorf("%v\n%v", multiErr, err)
} else {
multiErr = err
}
return
}
numObjs++
spinner.Print(OutputWriter, fmt.Sprintf("%d objects found", numObjs))
pointers = append(pointers, p)
})
if err := tempgitscanner.ScanAll(nil); err != nil {
Panic(err, "Could not scan for Git LFS files")
}
tempgitscanner.Close()
if multiErr != nil {
Panic(multiErr, "Could not scan for Git LFS files")
}
spinner.Finish(OutputWriter, fmt.Sprintf("%d objects found", numObjs))
return pointers
2015-09-03 11:29:00 +00:00
}
// Fetch and report completion of each OID to a channel (optional, pass nil to skip)
// Returns true if all completed with no errors, false if errors were written to stderr/log
func fetchAndReportToChan(allpointers []*lfs.WrappedPointer, filter *filepathfilter.Filter, out chan<- *lfs.WrappedPointer) bool {
// Lazily initialize the current remote.
if len(cfg.CurrentRemote) == 0 {
// Actively find the default remote, don't just assume origin
defaultRemote, err := git.DefaultRemote()
if err != nil {
Exit("No default remote")
}
cfg.CurrentRemote = defaultRemote
}
ready, pointers, meter := readyAndMissingPointers(allpointers, filter)
q := newDownloadQueue(tq.WithProgress(meter))
if out != nil {
2016-08-17 20:14:05 +00:00
// If we already have it, or it won't be fetched
// report it to chan immediately to support pull/checkout
for _, p := range ready {
2016-08-17 20:14:05 +00:00
out <- p
}
dlwatch := q.Watch()
go func() {
// fetch only reports single OID, but OID *might* be referenced by multiple
// WrappedPointers if same content is at multiple paths, so map oid->slice
oidToPointers := make(map[string][]*lfs.WrappedPointer, len(pointers))
for _, pointer := range pointers {
plist := oidToPointers[pointer.Oid]
oidToPointers[pointer.Oid] = append(plist, pointer)
}
for oid := range dlwatch {
plist, ok := oidToPointers[oid]
if !ok {
continue
}
for _, p := range plist {
out <- p
}
}
close(out)
}()
}
for _, p := range pointers {
2016-08-17 20:14:05 +00:00
tracerx.Printf("fetch %v [%v]", p.Name, p.Oid)
q.Add(downloadTransfer(p))
}
processQueue := time.Now()
q.Wait()
tracerx.PerformanceSince("process queue", processQueue)
2015-08-17 21:45:43 +00:00
ok := true
2015-08-17 21:45:43 +00:00
for _, err := range q.Errors() {
ok = false
2016-08-16 18:03:37 +00:00
FullError(err)
2015-08-17 21:45:43 +00:00
}
return ok
}
func readyAndMissingPointers(allpointers []*lfs.WrappedPointer, filter *filepathfilter.Filter) ([]*lfs.WrappedPointer, []*lfs.WrappedPointer, *progress.ProgressMeter) {
2016-12-07 20:27:42 +00:00
meter := buildProgressMeter(false)
2016-08-17 20:14:05 +00:00
seen := make(map[string]bool, len(allpointers))
missing := make([]*lfs.WrappedPointer, 0, len(allpointers))
ready := make([]*lfs.WrappedPointer, 0, len(allpointers))
2016-08-17 20:14:05 +00:00
for _, p := range allpointers {
// no need to download the same object multiple times
if seen[p.Oid] {
continue
}
seen[p.Oid] = true
// no need to download objects that exist locally already
lfs.LinkOrCopyFromReference(p.Oid, p.Size)
if lfs.ObjectExistsOfSize(p.Oid, p.Size) {
ready = append(ready, p)
2016-08-17 20:14:05 +00:00
continue
}
missing = append(missing, p)
meter.Add(p.Size)
2016-08-17 20:14:05 +00:00
}
return ready, missing, meter
2016-08-17 20:14:05 +00:00
}
func init() {
RegisterCommand("fetch", fetchCommand, func(cmd *cobra.Command) {
cmd.Flags().StringVarP(&includeArg, "include", "I", "", "Include a list of paths")
cmd.Flags().StringVarP(&excludeArg, "exclude", "X", "", "Exclude a list of paths")
cmd.Flags().BoolVarP(&fetchRecentArg, "recent", "r", false, "Fetch recent refs & commits")
cmd.Flags().BoolVarP(&fetchAllArg, "all", "a", false, "Fetch all LFS files ever referenced")
cmd.Flags().BoolVarP(&fetchPruneArg, "prune", "p", false, "After fetching, prune old data")
})
}