git_footers.py 7.49 KB
Newer Older
1 2 3 4 5 6
#!/usr/bin/env python
# Copyright 2014 The Chromium Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.

import argparse
7
import json
8 9 10 11 12 13 14
import re
import sys

from collections import defaultdict

import git_common as git

15

16
# Matches one footer line: optional leading whitespace, a key made of word
# characters and dashes, a colon, optional spaces, then the value (the rest of
# the line). Group 1 is the key, group 2 is the value.
FOOTER_PATTERN = re.compile(r'^\s*([\w-]+): *(.*)$')
# Matches a commit position value of the form `<ref>@{#<number>}`, e.g.
# `refs/heads/master@{#292272}`. Group 1 is the ref, group 2 is the number
# (as a string of digits).
CHROME_COMMIT_POSITION_PATTERN = re.compile(r'^([\w/\-\.]+)@{#(\d+)}$')
18

19

20 21 22 23 24
def normalize_name(header):
  """Returns header in canonical footer-key form.

  Surrounding whitespace is stripped and every dash-separated word is
  title-cased, e.g. ' change-id ' becomes 'Change-Id'.
  """
  words = header.strip().split('-')
  return '-'.join(word.title() for word in words)


def parse_footer(line):
  """Returns footer's (key, value) if footer is valid, else None.

  A line is a valid footer when it matches FOOTER_PATTERN. The key is returned
  exactly as written in the line (it is not normalized here).
  """
  match = FOOTER_PATTERN.match(line)
  if match is None:
    return None
  return (match.group(1), match.group(2))


def parse_footers(message):
  """Parses a git commit message into a multimap of footers.

  Returns:
    A defaultdict(list) mapping each normalized footer key to the list of its
    stripped values, ordered from the bottom-most footer to the top-most one.
  """
  _, _, parsed_footers = split_footers(message)
  footer_map = defaultdict(list)
  # Read footers from bottom to top, because the latter takes precedence,
  # and we want it to be first in the multimap value.
  # list() makes reversed() work for any iterable of (key, value) pairs; an
  # empty result simply skips the loop.
  for key, value in reversed(list(parsed_footers)):
    footer_map[normalize_name(key)].append(value.strip())
  return footer_map


45 46 47 48 49 50 51
def matches_footer_key(line, key):
  """Returns whether line is a valid footer whose key matches a given one.

  Keys are compared in normalized form. A line that does not parse as a footer
  never matches.
  """
  parsed = parse_footer(line)
  if parsed is None:
    return False
  return normalize_name(parsed[0]) == normalize_name(key)


56 57 58 59 60 61
def split_footers(message):
  """Returns (non_footer_lines, footer_lines, parsed footers).

  Guarantees that:
    (non_footer_lines + footer_lines) == message.splitlines().
    parsed_footers is parse_footer applied on each line of footer_lines.
      There could be fewer parsed_footers than footer lines if some lines in
      last paragraph are malformed.

  If the last paragraph contains no valid footer at all, or the message is a
  single paragraph, footer_lines and parsed footers are both empty lists.
  """
  message_lines = message.splitlines()
  footer_lines = []
  # Collect the last paragraph: walk up from the bottom until a blank line.
  for line in reversed(message_lines):
    if line == '' or line.isspace():
      break
    footer_lines.append(line)
  else:
    # The whole description was consisting of footers,
    # which means those aren't footers.
    footer_lines = []

  footer_lines.reverse()
  # Materialize the result: on Python 3 filter() returns a lazy iterator that
  # is always truthy, which would defeat the emptiness check below and hand
  # callers a non-list.
  footers = list(filter(None, map(parse_footer, footer_lines)))
  if not footers:
    return message_lines, [], []
  return message_lines[:-len(footer_lines)], footer_lines, footers
81 82


83 84 85 86 87 88 89 90
def get_footer_change_id(message):
  """Returns the list of Change-Id footer values found in a commit message.

  The list is empty when the message carries no Change-Id footer.
  """
  footer_map = parse_footers(message)
  change_id_key = normalize_name('Change-Id')
  return footer_map.get(change_id_key, [])


def add_footer_change_id(message, change_id):
  """Returns message with Change-Id footer in it.

  Assumes that Change-Id is not yet in footers, which is then inserted at
  earliest footer line which is after all of these footers:
    Bug|Issue|Test|Feature.

  The precondition is checked with an assert, so an AssertionError is raised
  if the message already has a Change-Id footer.
  """
  assert 'Change-Id' not in parse_footers(message)
  return add_footer(message, 'Change-Id', change_id,
                    after_keys=['Bug', 'Issue', 'Test', 'Feature'])

99

100
def add_footer(message, key, value, after_keys=None, before_keys=None):
  """Returns a message with given footer appended.

  If after_keys and before_keys are both None (default), appends footer last.
  If after_keys is provided and matches footers already present, inserts footer
  as *early* as possible while still appearing after all provided keys, even
  if doing so conflicts with before_keys.
  If before_keys is provided, inserts footer as late as possible while still
  appearing before all provided keys.

  For example, given
      message='Header.\n\nAdded: 2016\nBug: 123\nVerified-By: CQ'
      after_keys=['Bug', 'Issue']
  the new footer will be inserted between Bug and Verified-By existing footers.

  If the message has no footers yet, the new footer starts a fresh last
  paragraph, separated from the text above by an empty line.

  The key must already be in normalized form; this is checked with an assert.
  """
  assert key == normalize_name(key), 'Use normalized key'
  new_footer = '%s: %s' % (key, value)

  top_lines, footer_lines, _ = split_footers(message)
  if not footer_lines:
    if not top_lines or top_lines[-1] != '':
      top_lines.append('')
    footer_lines = [new_footer]
  else:
    # Use enumerate() rather than footer_lines.index(line): index() returns
    # the first occurrence, so a footer line repeated verbatim would be
    # reported at the wrong position and the new footer could end up before
    # a later matching footer.
    after_keys = set(map(normalize_name, after_keys or []))
    after_indices = [
        idx for idx, line in enumerate(footer_lines)
        if any(matches_footer_key(line, k) for k in after_keys)]
    before_keys = set(map(normalize_name, before_keys or []))
    before_indices = [
        idx for idx, line in enumerate(footer_lines)
        if any(matches_footer_key(line, k) for k in before_keys)]
    if after_indices:
      # after_keys takes precedence, even if there's a conflict.
      insert_idx = max(after_indices) + 1
    elif before_indices:
      insert_idx = min(before_indices)
    else:
      insert_idx = len(footer_lines)
    footer_lines.insert(insert_idx, new_footer)
  return '\n'.join(top_lines + footer_lines)
141 142


143 144 145 146 147 148
def remove_footer(message, key):
  """Returns a message with all instances of given footer removed.

  The key is compared in normalized form. If the message has no footer lines
  it is returned unchanged.
  """
  key = normalize_name(key)
  top_lines, footer_lines, _ = split_footers(message)
  if not footer_lines:
    return message
  new_footer_lines = []
  for line in footer_lines:
    parsed = parse_footer(line)
    # If the footer doesn't parse (i.e. is malformed), just let it carry over.
    # An explicit None check is used instead of catching TypeError so that
    # unrelated TypeErrors are not silently swallowed.
    if parsed is None or normalize_name(parsed[0]) != key:
      new_footer_lines.append(line)
  return '\n'.join(top_lines + new_footer_lines)


161 162 163 164 165 166 167 168 169 170 171
def get_unique(footers, key):
  """Returns the single value stored under key in footers, or None.

  The key is normalized before footers is indexed with it. An assert checks
  that at most one value is present for the key.
  """
  normalized = normalize_name(key)
  found = footers[normalized]
  assert len(found) <= 1, 'Multiple %s footers' % normalized
  return found[0] if found else None


def get_position(footers):
  """Get the commit position from the footers multimap using a heuristic.

  Returns:
    A tuple of the branch and the position on that branch. For example,

    Cr-Commit-Position: refs/heads/master@{#292272}

    would give the return value ('refs/heads/master', '292272'). Both
    elements are strings, taken from the regex match groups.

  Raises:
    ValueError: if there is no Cr-Commit-Position footer (or its value is
      empty).
    AssertionError: if the footer value does not match
      CHROME_COMMIT_POSITION_PATTERN.
  """
  position = get_unique(footers, 'Cr-Commit-Position')
  if position:
    match = CHROME_COMMIT_POSITION_PATTERN.match(position)
    assert match, 'Invalid Cr-Commit-Position value: %s' % position
    return (match.group(1), match.group(2))

  raise ValueError('Unable to infer commit position from footers')


def main(args):
  """Command-line entry point: prints footers of a commit message.

  The message is read from the given git ref (via `git log -1 --format=%B`),
  or from stdin when no ref is given. Depending on the mutually exclusive
  options, prints the values of one footer key, the commit position (whole,
  ref only, or number only), dumps all footers as JSON to a file, or prints
  every footer as `Key: value`.

  Args:
    args: list of command-line arguments, without the program name.

  Returns:
    0 on success.
  """
  parser = argparse.ArgumentParser(
    formatter_class=argparse.ArgumentDefaultsHelpFormatter
  )
  parser.add_argument('ref', nargs='?', help='Git ref to retrieve footers from.'
                      ' Omit to parse stdin.')

  g = parser.add_mutually_exclusive_group()
  g.add_argument('--key', metavar='KEY',
                 help='Get all values for the given footer name, one per '
                 'line (case insensitive)')
  g.add_argument('--position', action='store_true')
  g.add_argument('--position-ref', action='store_true')
  g.add_argument('--position-num', action='store_true')
  g.add_argument('--json', help='filename to dump JSON serialized footers to.')

  opts = parser.parse_args(args)

  if opts.ref:
    message = git.run('log', '-1', '--format=%B', opts.ref)
  else:
    message = sys.stdin.read()

  footers = parse_footers(message)

  # Every print below passes exactly one argument in parentheses, which is
  # valid and prints the same text under both Python 2 and Python 3.
  if opts.key:
    for v in footers.get(normalize_name(opts.key), []):
      print(v)
  elif opts.position:
    pos = get_position(footers)
    print('%s@{#%s}' % (pos[0], pos[1] or '?'))
  elif opts.position_ref:
    print(get_position(footers)[0])
  elif opts.position_num:
    pos = get_position(footers)
    assert pos[1], 'No valid position for commit'
    print(pos[1])
  elif opts.json:
    with open(opts.json, 'w') as f:
      json.dump(footers, f)
  else:
    for k in footers:
      for v in footers[k]:
        print('%s: %s' % (k, v))
  return 0
236 237 238


if __name__ == '__main__':
  # Run as a script: exit with main()'s return code, or with 1 (after a short
  # note on stderr) when interrupted with Ctrl-C.
  try:
    sys.exit(main(sys.argv[1:]))
  except KeyboardInterrupt:
    sys.stderr.write('interrupted\n')
    sys.exit(1)