git-lfs/lfs/gitscanner.go

239 lines
6.5 KiB
Go
Raw Normal View History

2016-11-16 19:56:07 +00:00
package lfs
2016-11-17 22:41:19 +00:00
import (
"errors"
2016-11-17 22:41:19 +00:00
"fmt"
"sync"
2016-11-17 22:41:19 +00:00
"time"
"github.com/git-lfs/git-lfs/filepathfilter"
"github.com/rubyist/tracerx"
2016-11-17 22:41:19 +00:00
)
var missingCallbackErr = errors.New("No callback given")
2016-11-30 21:00:42 +00:00
// IsCallbackMissing returns a boolean indicating whether the error is reporting
// that a GitScanner is missing a required GitScannerCallback.
2016-11-30 21:00:42 +00:00
func IsCallbackMissing(err error) bool {
return err == missingCallbackErr
}
// GitScanner scans objects in a Git repository for LFS pointers.
2016-11-16 19:56:07 +00:00
type GitScanner struct {
Filter *filepathfilter.Filter
FoundPointer GitScannerFoundPointer
FoundLockable GitScannerFoundLockable
PotentialLockables GitScannerSet
remote string
skippedRefs []string
closed bool
started time.Time
mu sync.Mutex
2016-11-16 19:56:07 +00:00
}
2017-02-15 23:48:47 +00:00
type GitScannerFoundPointer func(*WrappedPointer, error)
type GitScannerFoundLockable func(filename string)
type GitScannerSet interface {
Contains(string) bool
}
// NewGitScanner initializes a *GitScanner for a Git repository in the current
// working directory.
2017-02-15 23:48:47 +00:00
func NewGitScanner(cb GitScannerFoundPointer) *GitScanner {
return &GitScanner{started: time.Now(), FoundPointer: cb}
}
// Close stops exits once all processing has stopped, and all resources are
// tracked and cleaned up.
func (s *GitScanner) Close() {
s.mu.Lock()
defer s.mu.Unlock()
if s.closed {
return
}
s.closed = true
tracerx.PerformanceSince("scan", s.started)
2016-11-16 19:56:07 +00:00
}
// RemoteForPush sets up this *GitScanner to scan for objects to push to the
// given remote. Needed for ScanLeftToRemote().
func (s *GitScanner) RemoteForPush(r string) error {
s.mu.Lock()
defer s.mu.Unlock()
if len(s.remote) > 0 && s.remote != r {
return fmt.Errorf("Trying to set remote to %q, already set to %q", r, s.remote)
}
s.remote = r
2016-11-16 23:05:03 +00:00
s.skippedRefs = calcSkippedRefs(r)
return nil
}
// ScanLeftToRemote scans through all commits starting at the given ref that the
// given remote does not have. See RemoteForPush().
2017-02-15 23:48:47 +00:00
func (s *GitScanner) ScanLeftToRemote(left string, cb GitScannerFoundPointer) error {
callback, err := firstGitScannerCallback(cb, s.FoundPointer)
if err != nil {
return err
}
s.mu.Lock()
if len(s.remote) == 0 {
s.mu.Unlock()
return fmt.Errorf("Unable to scan starting at %q: no remote set.", left)
}
s.mu.Unlock()
return scanRefsToChan(s, callback, left, "", s.opts(ScanLeftToRemoteMode))
}
// ScanRefRange scans through all commits from the given left and right refs,
// including git objects that have been modified or deleted.
2017-02-15 23:48:47 +00:00
func (s *GitScanner) ScanRefRange(left, right string, cb GitScannerFoundPointer) error {
callback, err := firstGitScannerCallback(cb, s.FoundPointer)
if err != nil {
return err
}
opts := s.opts(ScanRefsMode)
opts.SkipDeletedBlobs = false
return scanRefsToChan(s, callback, left, right, opts)
}
// ScanRefWithDeleted scans through all objects in the given ref, including
// git objects that have been modified or deleted.
2017-02-15 23:48:47 +00:00
func (s *GitScanner) ScanRefWithDeleted(ref string, cb GitScannerFoundPointer) error {
return s.ScanRefRange(ref, "", cb)
}
// ScanRef scans through all objects in the current ref, excluding git objects
// that have been modified or deleted before the ref.
2017-02-15 23:48:47 +00:00
func (s *GitScanner) ScanRef(ref string, cb GitScannerFoundPointer) error {
callback, err := firstGitScannerCallback(cb, s.FoundPointer)
if err != nil {
return err
}
opts := s.opts(ScanRefsMode)
2016-11-16 20:02:45 +00:00
opts.SkipDeletedBlobs = true
return scanRefsToChan(s, callback, ref, "", opts)
2016-11-16 20:02:45 +00:00
}
// ScanAll scans through all objects in the git repository.
2017-02-15 23:48:47 +00:00
func (s *GitScanner) ScanAll(cb GitScannerFoundPointer) error {
callback, err := firstGitScannerCallback(cb, s.FoundPointer)
if err != nil {
return err
}
opts := s.opts(ScanAllMode)
2016-11-16 19:56:07 +00:00
opts.SkipDeletedBlobs = false
return scanRefsToChan(s, callback, "", "", opts)
2016-11-16 19:56:07 +00:00
}
2016-11-17 22:54:05 +00:00
// ScanTree takes a ref and returns WrappedPointer objects in the tree at that
// ref. Differs from ScanRefs in that multiple files in the tree with the same
// content are all reported.
func (s *GitScanner) ScanTree(ref string) error {
callback, err := firstGitScannerCallback(s.FoundPointer)
if err != nil {
return err
}
return runScanTree(callback, ref, s.Filter)
2016-11-17 22:54:05 +00:00
}
2016-11-17 16:53:01 +00:00
// ScanUnpushed scans history for all LFS pointers which have been added but not
// pushed to the named remote. remote can be left blank to mean 'any remote'.
2017-02-15 23:48:47 +00:00
func (s *GitScanner) ScanUnpushed(remote string, cb GitScannerFoundPointer) error {
callback, err := firstGitScannerCallback(cb, s.FoundPointer)
if err != nil {
return err
}
return scanUnpushed(callback, remote)
2016-11-17 16:53:01 +00:00
}
2016-11-17 22:41:19 +00:00
// ScanPreviousVersions scans changes reachable from ref (commit) back to since.
// Returns channel of pointers for *previous* versions that overlap that time.
// Does not include pointers which were still in use at ref (use ScanRefsToChan
// for that)
2017-02-15 23:48:47 +00:00
func (s *GitScanner) ScanPreviousVersions(ref string, since time.Time, cb GitScannerFoundPointer) error {
callback, err := firstGitScannerCallback(cb, s.FoundPointer)
if err != nil {
return err
}
return logPreviousSHAs(callback, ref, since)
2016-11-17 22:41:19 +00:00
}
2016-11-18 18:48:35 +00:00
// ScanIndex scans the git index for modified LFS objects.
2017-02-15 23:48:47 +00:00
func (s *GitScanner) ScanIndex(ref string, cb GitScannerFoundPointer) error {
callback, err := firstGitScannerCallback(cb, s.FoundPointer)
if err != nil {
return err
}
return scanIndex(callback, ref, s.Filter)
2016-11-18 18:48:35 +00:00
}
func (s *GitScanner) opts(mode ScanningMode) *ScanRefsOptions {
s.mu.Lock()
defer s.mu.Unlock()
2016-11-16 20:53:56 +00:00
opts := newScanRefsOptions()
opts.ScanMode = mode
2016-11-16 23:05:03 +00:00
opts.RemoteName = s.remote
opts.skippedRefs = s.skippedRefs
return opts
}
2016-11-18 18:51:15 +00:00
2017-02-15 23:48:47 +00:00
func firstGitScannerCallback(callbacks ...GitScannerFoundPointer) (GitScannerFoundPointer, error) {
for _, cb := range callbacks {
if cb == nil {
continue
}
return cb, nil
}
return nil, missingCallbackErr
}
2016-11-18 18:51:15 +00:00
type ScanningMode int
const (
ScanRefsMode = ScanningMode(iota) // 0 - or default scan mode
ScanAllMode = ScanningMode(iota)
ScanLeftToRemoteMode = ScanningMode(iota)
)
type ScanRefsOptions struct {
ScanMode ScanningMode
RemoteName string
SkipDeletedBlobs bool
skippedRefs []string
nameMap map[string]string
mutex *sync.Mutex
}
func (o *ScanRefsOptions) GetName(sha string) (string, bool) {
o.mutex.Lock()
name, ok := o.nameMap[sha]
o.mutex.Unlock()
return name, ok
}
func (o *ScanRefsOptions) SetName(sha, name string) {
o.mutex.Lock()
o.nameMap[sha] = name
o.mutex.Unlock()
}
func newScanRefsOptions() *ScanRefsOptions {
return &ScanRefsOptions{
nameMap: make(map[string]string, 0),
mutex: &sync.Mutex{},
}
}