| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196 | 
							- package plumbing
 
- import (
 
- 	"log"
 
- 	"gopkg.in/src-d/go-git.v4"
 
- 	"gopkg.in/src-d/go-git.v4/config"
 
- 	"gopkg.in/src-d/go-git.v4/plumbing"
 
- 	"gopkg.in/src-d/go-git.v4/plumbing/object"
 
- 	"gopkg.in/src-d/go-git.v4/utils/merkletrie"
 
- 	"gopkg.in/src-d/hercules.v4/internal"
 
- 	"gopkg.in/src-d/hercules.v4/internal/core"
 
- )
 
- // BlobCache loads the blobs which correspond to the changed files in a commit.
 
- // It is a PipelineItem.
 
- // It must provide the old and the new objects; "blobCache" rotates and allows to not load
 
- // the same blobs twice. Outdated objects are removed so "blobCache" never grows big.
 
- type BlobCache struct {
 
- 	// Specifies how to handle the situation when we encounter a git submodule - an object without
 
- 	// the blob. If false, we look inside .gitmodules and if don't find, raise an error.
 
- 	// If true, we do not look inside .gitmodules and always succeed.
 
- 	IgnoreMissingSubmodules bool
 
- 	repository *git.Repository
 
- 	cache      map[plumbing.Hash]*object.Blob
 
- }
 
- const (
 
- 	// ConfigBlobCacheIgnoreMissingSubmodules is the name of the configuration option for
 
- 	// BlobCache.Configure() to not check if the referenced submodules exist.
 
- 	ConfigBlobCacheIgnoreMissingSubmodules = "BlobCache.IgnoreMissingSubmodules"
 
- 	// DependencyBlobCache identifies the dependency provided by BlobCache.
 
- 	DependencyBlobCache = "blob_cache"
 
- )
 
- // Name of this PipelineItem. Uniquely identifies the type, used for mapping keys, etc.
 
- func (blobCache *BlobCache) Name() string {
 
- 	return "BlobCache"
 
- }
 
- // Provides returns the list of names of entities which are produced by this PipelineItem.
 
- // Each produced entity will be inserted into `deps` of dependent Consume()-s according
 
- // to this list. Also used by core.Registry to build the global map of providers.
 
- func (blobCache *BlobCache) Provides() []string {
 
- 	arr := [...]string{DependencyBlobCache}
 
- 	return arr[:]
 
- }
 
- // Requires returns the list of names of entities which are needed by this PipelineItem.
 
- // Each requested entity will be inserted into `deps` of Consume(). In turn, those
 
- // entities are Provides() upstream.
 
- func (blobCache *BlobCache) Requires() []string {
 
- 	arr := [...]string{DependencyTreeChanges}
 
- 	return arr[:]
 
- }
 
- // ListConfigurationOptions returns the list of changeable public properties of this PipelineItem.
 
- func (blobCache *BlobCache) ListConfigurationOptions() []core.ConfigurationOption {
 
- 	options := [...]core.ConfigurationOption{{
 
- 		Name: ConfigBlobCacheIgnoreMissingSubmodules,
 
- 		Description: "Specifies whether to panic if some referenced submodules do not exist and thus" +
 
- 			" the corresponding Git objects cannot be loaded. Override this if you know that the " +
 
- 			"history is dirty and you want to get things done.",
 
- 		Flag:    "ignore-missing-submodules",
 
- 		Type:    core.BoolConfigurationOption,
 
- 		Default: false}}
 
- 	return options[:]
 
- }
 
- // Configure sets the properties previously published by ListConfigurationOptions().
 
- func (blobCache *BlobCache) Configure(facts map[string]interface{}) {
 
- 	if val, exists := facts[ConfigBlobCacheIgnoreMissingSubmodules].(bool); exists {
 
- 		blobCache.IgnoreMissingSubmodules = val
 
- 	}
 
- }
 
- // Initialize resets the temporary caches and prepares this PipelineItem for a series of Consume()
 
- // calls. The repository which is going to be analysed is supplied as an argument.
 
- func (blobCache *BlobCache) Initialize(repository *git.Repository) {
 
- 	blobCache.repository = repository
 
- 	blobCache.cache = map[plumbing.Hash]*object.Blob{}
 
- }
 
- // Consume runs this PipelineItem on the next commit data.
 
- // `deps` contain all the results from upstream PipelineItem-s as requested by Requires().
 
- // Additionally, "commit" is always present there and represents the analysed *object.Commit.
 
- // This function returns the mapping with analysis results. The keys must be the same as
 
- // in Provides(). If there was an error, nil is returned.
 
- func (blobCache *BlobCache) Consume(deps map[string]interface{}) (map[string]interface{}, error) {
 
- 	commit := deps["commit"].(*object.Commit)
 
- 	changes := deps[DependencyTreeChanges].(object.Changes)
 
- 	cache := map[plumbing.Hash]*object.Blob{}
 
- 	newCache := map[plumbing.Hash]*object.Blob{}
 
- 	for _, change := range changes {
 
- 		action, err := change.Action()
 
- 		if err != nil {
 
- 			log.Printf("no action in %s\n", change.To.TreeEntry.Hash)
 
- 			return nil, err
 
- 		}
 
- 		var exists bool
 
- 		var blob *object.Blob
 
- 		switch action {
 
- 		case merkletrie.Insert:
 
- 			blob, err = blobCache.getBlob(&change.To, commit.File)
 
- 			if err != nil {
 
- 				log.Printf("file to %s %s\n", change.To.Name, change.To.TreeEntry.Hash)
 
- 			} else {
 
- 				cache[change.To.TreeEntry.Hash] = blob
 
- 				newCache[change.To.TreeEntry.Hash] = blob
 
- 			}
 
- 		case merkletrie.Delete:
 
- 			cache[change.From.TreeEntry.Hash], exists = blobCache.cache[change.From.TreeEntry.Hash]
 
- 			if !exists {
 
- 				cache[change.From.TreeEntry.Hash], err = blobCache.getBlob(&change.From, commit.File)
 
- 				if err != nil {
 
- 					if err.Error() != plumbing.ErrObjectNotFound.Error() {
 
- 						log.Printf("file from %s %s\n", change.From.Name,
 
- 							change.From.TreeEntry.Hash)
 
- 					} else {
 
- 						cache[change.From.TreeEntry.Hash], err = internal.CreateDummyBlob(
 
- 							change.From.TreeEntry.Hash)
 
- 					}
 
- 				}
 
- 			}
 
- 		case merkletrie.Modify:
 
- 			blob, err = blobCache.getBlob(&change.To, commit.File)
 
- 			if err != nil {
 
- 				log.Printf("file to %s\n", change.To.Name)
 
- 			} else {
 
- 				cache[change.To.TreeEntry.Hash] = blob
 
- 				newCache[change.To.TreeEntry.Hash] = blob
 
- 			}
 
- 			cache[change.From.TreeEntry.Hash], exists = blobCache.cache[change.From.TreeEntry.Hash]
 
- 			if !exists {
 
- 				cache[change.From.TreeEntry.Hash], err = blobCache.getBlob(&change.From, commit.File)
 
- 				if err != nil {
 
- 					log.Printf("file from %s\n", change.From.Name)
 
- 				}
 
- 			}
 
- 		}
 
- 		if err != nil {
 
- 			return nil, err
 
- 		}
 
- 	}
 
- 	blobCache.cache = newCache
 
- 	return map[string]interface{}{DependencyBlobCache: cache}, nil
 
- }
 
- // FileGetter defines a function which loads the Git file by the specified path.
 
- // The state can be arbitrary though here it always corresponds to the currently processed
 
- // commit.
 
- type FileGetter func(path string) (*object.File, error)
 
- // Returns the blob which corresponds to the specified ChangeEntry.
 
- func (blobCache *BlobCache) getBlob(entry *object.ChangeEntry, fileGetter FileGetter) (
 
- 	*object.Blob, error) {
 
- 	blob, err := blobCache.repository.BlobObject(entry.TreeEntry.Hash)
 
- 	if err != nil {
 
- 		if err.Error() != plumbing.ErrObjectNotFound.Error() {
 
- 			log.Printf("getBlob(%s)\n", entry.TreeEntry.Hash.String())
 
- 			return nil, err
 
- 		}
 
- 		if entry.TreeEntry.Mode != 0160000 {
 
- 			// this is not a submodule
 
- 			return nil, err
 
- 		} else if blobCache.IgnoreMissingSubmodules {
 
- 			return internal.CreateDummyBlob(entry.TreeEntry.Hash)
 
- 		}
 
- 		file, errModules := fileGetter(".gitmodules")
 
- 		if errModules != nil {
 
- 			return nil, errModules
 
- 		}
 
- 		contents, errModules := file.Contents()
 
- 		if errModules != nil {
 
- 			return nil, errModules
 
- 		}
 
- 		modules := config.NewModules()
 
- 		errModules = modules.Unmarshal([]byte(contents))
 
- 		if errModules != nil {
 
- 			return nil, errModules
 
- 		}
 
- 		_, exists := modules.Submodules[entry.Name]
 
- 		if exists {
 
- 			// we found that this is a submodule
 
- 			return internal.CreateDummyBlob(entry.TreeEntry.Hash)
 
- 		}
 
- 		return nil, err
 
- 	}
 
- 	return blob, nil
 
- }
 
- func init() {
 
- 	core.Registry.Register(&BlobCache{})
 
- }
 
 
  |