changes_xpather.go 2.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475
  1. package hercules
  2. import (
  3. "log"
  4. "github.com/minio/highwayhash"
  5. "gopkg.in/bblfsh/client-go.v2/tools"
  6. "gopkg.in/bblfsh/sdk.v1/uast"
  7. "gopkg.in/src-d/go-git.v4/plumbing"
  8. "io"
  9. "bytes"
  10. )
  // ChangesXPather picks, by means of an XPath query, the UAST nodes that are
  // new or changed in the files touched by the current commit.
  type ChangesXPather struct {
  	// XPath is the query applied to each UAST to select candidate nodes.
  	XPath string
  }
  // hashKey is the fixed 32-byte key handed to highwayhash.Sum64 when UAST
  // nodes are fingerprinted. Its bytes are simply 0x00 through 0x1f.
  var hashKey = []byte{
  	0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
  	0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f,
  	0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17,
  	0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f,
  }
  19. // Extract returns the list of new or changed UAST nodes filtered by XPath.
  20. func (xpather ChangesXPather) Extract(changes []UASTChange) []*uast.Node {
  21. result := []*uast.Node{}
  22. for _, change := range changes {
  23. if change.After == nil {
  24. continue
  25. }
  26. oldNodes := xpather.filter(change.Before, change.Change.From.TreeEntry.Hash)
  27. newNodes := xpather.filter(change.After, change.Change.To.TreeEntry.Hash)
  28. oldHashes := xpather.hash(oldNodes)
  29. newHashes := xpather.hash(newNodes)
  30. // remove any untouched nodes
  31. for hash := range oldHashes {
  32. delete(newHashes, hash)
  33. }
  34. // there can be hash collisions; we ignore them
  35. for _, node := range newHashes {
  36. result = append(result, node)
  37. }
  38. }
  39. return result
  40. }
  41. func (xpather ChangesXPather) filter(root *uast.Node, origin plumbing.Hash) []*uast.Node {
  42. if root != nil {
  43. nodes, err := tools.Filter(root, xpather.XPath)
  44. if err != nil {
  45. log.Printf("libuast filter error on object %s: %v", origin.String(), err)
  46. return []*uast.Node{}
  47. }
  48. return nodes
  49. }
  50. return []*uast.Node{}
  51. }
  52. func (xpather ChangesXPather) hash(nodes []*uast.Node) map[uint64]*uast.Node {
  53. result := map[uint64]*uast.Node{}
  54. for _, node := range nodes {
  55. buffer := &bytes.Buffer{}
  56. stringifyUASTNode(node, buffer)
  57. result[highwayhash.Sum64(buffer.Bytes(), hashKey)] = node
  58. }
  59. return result
  60. }
  61. func stringifyUASTNode(node *uast.Node, writer io.Writer) {
  62. writer.Write([]byte(node.Token + "|" + node.InternalType + ">"))
  63. for _, child := range node.Children {
  64. stringifyUASTNode(child, writer)
  65. }
  66. }