git.py 4.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147
  1. # -*- coding: utf-8 -*-
  2. import collections
  3. import datetime
  4. import logging
  5. import re
  6. import subprocess
  7. import tarfile
  8. import tempfile
  9. GitRef = collections.namedtuple(
  10. "VersionRef",
  11. ["name", "commit", "source", "is_remote", "refname", "creatordate",],
  12. )
  13. logger = logging.getLogger(__name__)
  14. def get_all_refs(gitroot):
  15. cmd = (
  16. "git",
  17. "for-each-ref",
  18. "--format",
  19. "%(objectname)\t%(refname)\t%(creatordate:iso)",
  20. "refs",
  21. )
  22. output = subprocess.check_output(cmd, cwd=gitroot).decode()
  23. for line in output.splitlines():
  24. is_remote = False
  25. fields = line.strip().split("\t")
  26. if len(fields) != 3:
  27. continue
  28. commit = fields[0]
  29. refname = fields[1]
  30. creatordate = datetime.datetime.strptime(
  31. fields[2], "%Y-%m-%d %H:%M:%S %z"
  32. )
  33. # Parse refname
  34. matchobj = re.match(
  35. r"^refs/(heads|tags|remotes/[^/]+)/(\S+)$", refname
  36. )
  37. if not matchobj:
  38. continue
  39. source = matchobj.group(1)
  40. name = matchobj.group(2)
  41. if source.startswith("remotes/"):
  42. is_remote = True
  43. yield GitRef(name, commit, source, is_remote, refname, creatordate)
  44. def get_refs(
  45. gitroot, tag_whitelist, branch_whitelist, remote_whitelist, files=()
  46. ):
  47. for ref in get_all_refs(gitroot):
  48. if ref.source == "tags":
  49. if tag_whitelist is None or not re.match(tag_whitelist, ref.name):
  50. logger.debug(
  51. "Skipping '%s' because tag '%s' doesn't match the "
  52. "whitelist pattern",
  53. ref.refname,
  54. ref.name,
  55. )
  56. continue
  57. elif ref.source == "heads":
  58. if branch_whitelist is None or not re.match(
  59. branch_whitelist, ref.name
  60. ):
  61. logger.debug(
  62. "Skipping '%s' because branch '%s' doesn't match the "
  63. "whitelist pattern",
  64. ref.refname,
  65. ref.name,
  66. )
  67. continue
  68. elif ref.is_remote and remote_whitelist is not None:
  69. remote_name = ref.source.partition("/")[2]
  70. if not re.match(remote_whitelist, remote_name):
  71. logger.debug(
  72. "Skipping '%s' because remote '%s' doesn't match the "
  73. "whitelist pattern",
  74. ref.refname,
  75. remote_name,
  76. )
  77. continue
  78. if branch_whitelist is None or not re.match(
  79. branch_whitelist, ref.name
  80. ):
  81. logger.debug(
  82. "Skipping '%s' because branch '%s' doesn't match the "
  83. "whitelist pattern",
  84. ref.refname,
  85. ref.name,
  86. )
  87. continue
  88. else:
  89. logger.debug(
  90. "Skipping '%s' because its not a branch or tag", ref.refname
  91. )
  92. continue
  93. missing_files = [
  94. filename
  95. for filename in files
  96. if not file_exists(gitroot, ref.refname, filename)
  97. ]
  98. if missing_files:
  99. logger.debug(
  100. "Skipping '%s' because it lacks required files: %r",
  101. ref.refname,
  102. missing_files,
  103. )
  104. continue
  105. yield ref
  106. def file_exists(gitroot, refname, filename):
  107. cmd = (
  108. "git",
  109. "cat-file",
  110. "-e",
  111. "{}:{}".format(refname, filename),
  112. )
  113. proc = subprocess.run(
  114. cmd, cwd=gitroot, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL
  115. )
  116. return proc.returncode == 0
  117. def copy_tree(src, dst, reference, sourcepath="."):
  118. with tempfile.SpooledTemporaryFile() as fp:
  119. cmd = (
  120. "git",
  121. "archive",
  122. "--format",
  123. "tar",
  124. reference.commit,
  125. "--",
  126. sourcepath,
  127. )
  128. subprocess.check_call(cmd, stdout=fp)
  129. fp.seek(0)
  130. with tarfile.TarFile(fileobj=fp) as tarfp:
  131. tarfp.extractall(dst)