git.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338
  1. # Copyright 2011 OpenStack Foundation
  2. # Copyright 2012-2013 Hewlett-Packard Development Company, L.P.
  3. # All Rights Reserved.
  4. #
  5. # Licensed under the Apache License, Version 2.0 (the "License"); you may
  6. # not use this file except in compliance with the License. You may obtain
  7. # a copy of the License at
  8. #
  9. # http://www.apache.org/licenses/LICENSE-2.0
  10. #
  11. # Unless required by applicable law or agreed to in writing, software
  12. # distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
  13. # WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
  14. # License for the specific language governing permissions and limitations
  15. # under the License.
  16. from __future__ import unicode_literals
  17. import distutils.errors
  18. from distutils import log
  19. import errno
  20. import io
  21. import os
  22. import re
  23. import subprocess
  24. import time
  25. import pkg_resources
  26. from pbr import options
  27. from pbr import version
  28. def _run_shell_command(cmd, throw_on_error=False, buffer=True, env=None):
  29. if buffer:
  30. out_location = subprocess.PIPE
  31. err_location = subprocess.PIPE
  32. else:
  33. out_location = None
  34. err_location = None
  35. newenv = os.environ.copy()
  36. if env:
  37. newenv.update(env)
  38. output = subprocess.Popen(cmd,
  39. stdout=out_location,
  40. stderr=err_location,
  41. env=newenv)
  42. out = output.communicate()
  43. if output.returncode and throw_on_error:
  44. raise distutils.errors.DistutilsError(
  45. "%s returned %d" % (cmd, output.returncode))
  46. if len(out) == 0 or not out[0] or not out[0].strip():
  47. return ''
  48. # Since we don't control the history, and forcing users to rebase arbitrary
  49. # history to fix utf8 issues is harsh, decode with replace.
  50. return out[0].strip().decode('utf-8', 'replace')
  51. def _run_git_command(cmd, git_dir, **kwargs):
  52. if not isinstance(cmd, (list, tuple)):
  53. cmd = [cmd]
  54. return _run_shell_command(
  55. ['git', '--git-dir=%s' % git_dir] + cmd, **kwargs)
  56. def _get_git_directory():
  57. try:
  58. return _run_shell_command(['git', 'rev-parse', '--git-dir'])
  59. except OSError as e:
  60. if e.errno == errno.ENOENT:
  61. # git not installed.
  62. return ''
  63. raise
  64. def _git_is_installed():
  65. try:
  66. # We cannot use 'which git' as it may not be available
  67. # in some distributions, So just try 'git --version'
  68. # to see if we run into trouble
  69. _run_shell_command(['git', '--version'])
  70. except OSError:
  71. return False
  72. return True
  73. def _get_highest_tag(tags):
  74. """Find the highest tag from a list.
  75. Pass in a list of tag strings and this will return the highest
  76. (latest) as sorted by the pkg_resources version parser.
  77. """
  78. return max(tags, key=pkg_resources.parse_version)
  79. def _find_git_files(dirname='', git_dir=None):
  80. """Behave like a file finder entrypoint plugin.
  81. We don't actually use the entrypoints system for this because it runs
  82. at absurd times. We only want to do this when we are building an sdist.
  83. """
  84. file_list = []
  85. if git_dir is None:
  86. git_dir = _run_git_functions()
  87. if git_dir:
  88. log.info("[pbr] In git context, generating filelist from git")
  89. file_list = _run_git_command(['ls-files', '-z'], git_dir)
  90. # Users can fix utf8 issues locally with a single commit, so we are
  91. # strict here.
  92. file_list = file_list.split(b'\x00'.decode('utf-8'))
  93. return [f for f in file_list if f]
  94. def _get_raw_tag_info(git_dir):
  95. describe = _run_git_command(['describe', '--always'], git_dir)
  96. if "-" in describe:
  97. return describe.rsplit("-", 2)[-2]
  98. if "." in describe:
  99. return 0
  100. return None
  101. def get_is_release(git_dir):
  102. return _get_raw_tag_info(git_dir) == 0
  103. def _run_git_functions():
  104. git_dir = None
  105. if _git_is_installed():
  106. git_dir = _get_git_directory()
  107. return git_dir or None
  108. def get_git_short_sha(git_dir=None):
  109. """Return the short sha for this repo, if it exists."""
  110. if not git_dir:
  111. git_dir = _run_git_functions()
  112. if git_dir:
  113. return _run_git_command(
  114. ['log', '-n1', '--pretty=format:%h'], git_dir)
  115. return None
  116. def _clean_changelog_message(msg):
  117. """Cleans any instances of invalid sphinx wording.
  118. This escapes/removes any instances of invalid characters
  119. that can be interpreted by sphinx as a warning or error
  120. when translating the Changelog into an HTML file for
  121. documentation building within projects.
  122. * Escapes '_' which is interpreted as a link
  123. * Escapes '*' which is interpreted as a new line
  124. * Escapes '`' which is interpreted as a literal
  125. """
  126. msg = msg.replace('*', r'\*')
  127. msg = msg.replace('_', r'\_')
  128. msg = msg.replace('`', r'\`')
  129. return msg
  130. def _iter_changelog(changelog):
  131. """Convert a oneline log iterator to formatted strings.
  132. :param changelog: An iterator of one line log entries like
  133. that given by _iter_log_oneline.
  134. :return: An iterator over (release, formatted changelog) tuples.
  135. """
  136. first_line = True
  137. current_release = None
  138. yield current_release, "CHANGES\n=======\n\n"
  139. for hash, tags, msg in changelog:
  140. if tags:
  141. current_release = _get_highest_tag(tags)
  142. underline = len(current_release) * '-'
  143. if not first_line:
  144. yield current_release, '\n'
  145. yield current_release, (
  146. "%(tag)s\n%(underline)s\n\n" %
  147. dict(tag=current_release, underline=underline))
  148. if not msg.startswith("Merge "):
  149. if msg.endswith("."):
  150. msg = msg[:-1]
  151. msg = _clean_changelog_message(msg)
  152. yield current_release, "* %(msg)s\n" % dict(msg=msg)
  153. first_line = False
  154. def _iter_log_oneline(git_dir=None):
  155. """Iterate over --oneline log entries if possible.
  156. This parses the output into a structured form but does not apply
  157. presentation logic to the output - making it suitable for different
  158. uses.
  159. :return: An iterator of (hash, tags_set, 1st_line) tuples, or None if
  160. changelog generation is disabled / not available.
  161. """
  162. if git_dir is None:
  163. git_dir = _get_git_directory()
  164. if not git_dir:
  165. return []
  166. return _iter_log_inner(git_dir)
  167. def _is_valid_version(candidate):
  168. try:
  169. version.SemanticVersion.from_pip_string(candidate)
  170. return True
  171. except ValueError:
  172. return False
  173. def _iter_log_inner(git_dir):
  174. """Iterate over --oneline log entries.
  175. This parses the output intro a structured form but does not apply
  176. presentation logic to the output - making it suitable for different
  177. uses.
  178. .. caution:: this function risk to return a tag that doesn't exist really
  179. inside the git objects list due to replacement made
  180. to tag name to also list pre-release suffix.
  181. Compliant with the SemVer specification (e.g 1.2.3-rc1)
  182. :return: An iterator of (hash, tags_set, 1st_line) tuples.
  183. """
  184. log.info('[pbr] Generating ChangeLog')
  185. log_cmd = ['log', '--decorate=full', '--format=%h%x00%s%x00%d']
  186. changelog = _run_git_command(log_cmd, git_dir)
  187. for line in changelog.split('\n'):
  188. line_parts = line.split('\x00')
  189. if len(line_parts) != 3:
  190. continue
  191. sha, msg, refname = line_parts
  192. tags = set()
  193. # refname can be:
  194. # <empty>
  195. # HEAD, tag: refs/tags/1.4.0, refs/remotes/origin/master, \
  196. # refs/heads/master
  197. # refs/tags/1.3.4
  198. if "refs/tags/" in refname:
  199. refname = refname.strip()[1:-1] # remove wrapping ()'s
  200. # If we start with "tag: refs/tags/1.2b1, tag: refs/tags/1.2"
  201. # The first split gives us "['', '1.2b1, tag:', '1.2']"
  202. # Which is why we do the second split below on the comma
  203. for tag_string in refname.split("refs/tags/")[1:]:
  204. # git tag does not allow : or " " in tag names, so we split
  205. # on ", " which is the separator between elements
  206. candidate = tag_string.split(", ")[0].replace("-", ".")
  207. if _is_valid_version(candidate):
  208. tags.add(candidate)
  209. yield sha, tags, msg
  210. def write_git_changelog(git_dir=None, dest_dir=os.path.curdir,
  211. option_dict=None, changelog=None):
  212. """Write a changelog based on the git changelog."""
  213. start = time.time()
  214. if not option_dict:
  215. option_dict = {}
  216. should_skip = options.get_boolean_option(option_dict, 'skip_changelog',
  217. 'SKIP_WRITE_GIT_CHANGELOG')
  218. if should_skip:
  219. return
  220. if not changelog:
  221. changelog = _iter_log_oneline(git_dir=git_dir)
  222. if changelog:
  223. changelog = _iter_changelog(changelog)
  224. if not changelog:
  225. return
  226. new_changelog = os.path.join(dest_dir, 'ChangeLog')
  227. if os.path.exists(new_changelog) and not os.access(new_changelog, os.W_OK):
  228. # If there's already a ChangeLog and it's not writable, just use it
  229. log.info('[pbr] ChangeLog not written (file already'
  230. ' exists and it is not writeable)')
  231. return
  232. log.info('[pbr] Writing ChangeLog')
  233. with io.open(new_changelog, "w", encoding="utf-8") as changelog_file:
  234. for release, content in changelog:
  235. changelog_file.write(content)
  236. stop = time.time()
  237. log.info('[pbr] ChangeLog complete (%0.1fs)' % (stop - start))
  238. def generate_authors(git_dir=None, dest_dir='.', option_dict=dict()):
  239. """Create AUTHORS file using git commits."""
  240. should_skip = options.get_boolean_option(option_dict, 'skip_authors',
  241. 'SKIP_GENERATE_AUTHORS')
  242. if should_skip:
  243. return
  244. start = time.time()
  245. old_authors = os.path.join(dest_dir, 'AUTHORS.in')
  246. new_authors = os.path.join(dest_dir, 'AUTHORS')
  247. if os.path.exists(new_authors) and not os.access(new_authors, os.W_OK):
  248. # If there's already an AUTHORS file and it's not writable, just use it
  249. return
  250. log.info('[pbr] Generating AUTHORS')
  251. ignore_emails = '((jenkins|zuul)@review|infra@lists|jenkins@openstack)'
  252. if git_dir is None:
  253. git_dir = _get_git_directory()
  254. if git_dir:
  255. authors = []
  256. # don't include jenkins email address in AUTHORS file
  257. git_log_cmd = ['log', '--format=%aN <%aE>']
  258. authors += _run_git_command(git_log_cmd, git_dir).split('\n')
  259. authors = [a for a in authors if not re.search(ignore_emails, a)]
  260. # get all co-authors from commit messages
  261. co_authors_out = _run_git_command('log', git_dir)
  262. co_authors = re.findall('Co-authored-by:.+', co_authors_out,
  263. re.MULTILINE)
  264. co_authors = [signed.split(":", 1)[1].strip()
  265. for signed in co_authors if signed]
  266. authors += co_authors
  267. authors = sorted(set(authors))
  268. with open(new_authors, 'wb') as new_authors_fh:
  269. if os.path.exists(old_authors):
  270. with open(old_authors, "rb") as old_authors_fh:
  271. new_authors_fh.write(old_authors_fh.read())
  272. new_authors_fh.write(('\n'.join(authors) + '\n')
  273. .encode('utf-8'))
  274. stop = time.time()
  275. log.info('[pbr] AUTHORS complete (%0.1fs)' % (stop - start))