]> git.ipfire.org Git - people/ms/u-boot.git/blob - tools/patman/patchstream.py
patman: Explain how to make doc/git-mailrc work
[people/ms/u-boot.git] / tools / patman / patchstream.py
1 # Copyright (c) 2011 The Chromium OS Authors.
2 #
3 # SPDX-License-Identifier: GPL-2.0+
4 #
5
6 import os
7 import re
8 import shutil
9 import tempfile
10
11 import command
12 import commit
13 import gitutil
14 from series import Series
15
# All patterns below are raw strings so that regex escapes such as \w and \t
# reach the re module untouched, rather than being (mis)interpreted as Python
# string escapes. They are all used with .match(), so they are anchored at the
# start of the line whether or not they begin with '^'.

# Tags that we detect and remove
re_remove = re.compile(r'^BUG=|^TEST=|^BRANCH=|^Change-Id:|^Review URL:'
                       r'|Reviewed-on:|Commit-\w*:')

# Lines which are allowed after a TEST= line
re_allowed_after_test = re.compile(r'^Signed-off-by:')

# Signoffs
re_signoff = re.compile(r'^Signed-off-by: *(.*)')

# The start of the cover letter
re_cover = re.compile(r'^Cover-letter:')

# A cover letter Cc
re_cover_cc = re.compile(r'^Cover-letter-cc: *(.*)')

# Patch series tag
re_series_tag = re.compile(r'^Series-([a-z-]*): *(.*)')

# Commit series tag
re_commit_tag = re.compile(r'^Commit-([a-z-]*): *(.*)')

# Commit tags that we want to collect and keep
re_tag = re.compile(r'^(Tested-by|Acked-by|Reviewed-by|Patch-cc): (.*)')

# The start of a new commit in the git log
re_commit = re.compile(r'^commit ([0-9a-f]*)$')

# We detect these since checkpatch doesn't always do it
re_space_before_tab = re.compile(r'^[+].* \t')

# States we can be in - can we use range() and still have comments?
STATE_MSG_HEADER = 0        # Still in the message header
STATE_PATCH_SUBJECT = 1     # In patch subject (first line of log for a commit)
STATE_PATCH_HEADER = 2      # In patch header (after the subject)
STATE_DIFFS = 3             # In the diff part (past --- line)
52
class PatchStream:
    """Class for detecting/injecting tags in a patch or series of patches

    We support processing the output of 'git log' to read out the tags we
    are interested in. We can also process a patch file in order to remove
    unwanted tags or inject additional ones. These correspond to the two
    phases of processing.
    """
    def __init__(self, series, name=None, is_log=False):
        """Set up a new stream, starting in the message-header state

        Args:
            series: Series object which receives the tags, notes, cover
                letter and changes we find, and which supplies the change log
            name: Not used by this class; kept so existing callers still work
            is_log: True if the input is 'git log' output (most lines
                indented by 4 characters), False if it is a patch file
        """
        self.skip_blank = False         # True to skip a single blank line
        self.found_test = False         # Found a TEST= line
        self.lines_after_test = 0       # Number of lines found after TEST=
        self.warn = []                  # List of warnings we have collected
        self.linenum = 1                # Output line number we are up to
        self.in_section = None          # Name of start...END section we are in
        self.notes = []                 # Series notes
        self.section = []               # The current section...END section
        self.series = series            # Info about the patch series
        self.is_log = is_log            # True if indent like git log
        self.in_change = 0              # Non-zero if we are in a change list
        self.blank_count = 0            # Number of blank lines stored up
        self.state = STATE_MSG_HEADER   # What state are we in?
        self.signoff = []               # Contents of signoff line
        self.commit = None              # Current commit

    def AddToSeries(self, line, name, value):
        """Add a new Series-xxx tag.

        When a Series-xxx tag is detected, we come here to record it, if we
        are scanning a 'git log'.

        Args:
            line: Source line containing tag (useful for debug/error messages)
            name: Tag name (part after 'Series-')
            value: Tag value (part after 'Series-xxx: ')
        """
        if name == 'notes':
            # The notes text follows on later lines, up to an END line
            self.in_section = name
            self.skip_blank = False
        if self.is_log:
            self.series.AddTag(self.commit, line, name, value)

    def AddToCommit(self, line, name, value):
        """Add a new Commit-xxx tag.

        When a Commit-xxx tag is detected, we come here to record it.

        Args:
            line: Source line containing tag (useful for debug/error messages)
            name: Tag name (part after 'Commit-')
            value: Tag value (part after 'Commit-xxx: ')
        """
        if name == 'notes':
            # The notes text follows on later lines, up to an END line
            self.in_section = 'commit-' + name
            self.skip_blank = False

    def CloseCommit(self):
        """Save the current commit into our commit list, and reset our state"""
        if self.commit and self.is_log:
            self.series.AddCommit(self.commit)
            self.commit = None

    def ProcessLine(self, line):
        """Process a single line of a patch file or commit log

        This process a line and returns a list of lines to output. The list
        may be empty or may contain multiple output lines.

        This is where all the complicated logic is located. The class's
        state is used to move between different states and detect things
        properly.

        We can be in one of two modes:
            self.is_log == True: This is 'git log' mode, where most output is
                indented by 4 characters and we are scanning for tags

            self.is_log == False: This is 'patch' mode, where we already have
                all the tags, and are processing patches to remove junk we
                don't want, and add things we think are required.

        Args:
            line: text line to process

        Returns:
            list of output lines, or [] if nothing should be output

        Raises:
            ValueError: if a Series-changes tag does not carry an integer
                version number
        """
        # Initially we have no output. Prepare the input line string
        out = []
        line = line.rstrip('\n')

        # This must be checked before the indent is stripped, since the
        # 'commit <hash>' line is not indented in the log
        commit_match = re_commit.match(line) if self.is_log else None

        if self.is_log:
            # Drop the 4-character indent that git log puts on the message
            if line.startswith('    '):
                line = line[4:]

        # Handle state transition and skipping blank lines
        series_tag_match = re_series_tag.match(line)
        commit_tag_match = re_commit_tag.match(line)
        cover_cc_match = re_cover_cc.match(line)
        signoff_match = re_signoff.match(line)
        tag_match = None
        if self.state == STATE_PATCH_HEADER:
            tag_match = re_tag.match(line)
        is_blank = not line.strip()
        if is_blank:
            if self.state in (STATE_MSG_HEADER, STATE_PATCH_SUBJECT):
                self.state += 1

            # We don't have a subject in the text stream of patch files
            # It has its own line with a Subject: tag
            if not self.is_log and self.state == STATE_PATCH_SUBJECT:
                self.state += 1
        elif commit_match:
            self.state = STATE_MSG_HEADER

        # If we are in a section, keep collecting lines until we see END
        if self.in_section:
            if line == 'END':
                if self.in_section == 'cover':
                    self.series.cover = self.section
                elif self.in_section == 'notes':
                    if self.is_log:
                        self.series.notes += self.section
                elif self.in_section == 'commit-notes':
                    if self.is_log:
                        self.commit.notes += self.section
                else:
                    self.warn.append("Unknown section '%s'" % self.in_section)
                self.in_section = None
                self.skip_blank = True
                self.section = []
            else:
                self.section.append(line)

        # Detect the commit subject
        elif not is_blank and self.state == STATE_PATCH_SUBJECT:
            self.commit.subject = line

        # Detect the tags we want to remove, and skip blank lines
        elif re_remove.match(line) and not commit_tag_match:
            self.skip_blank = True

            # TEST= should be the last thing in the commit, so remove
            # everything after it
            if line.startswith('TEST='):
                self.found_test = True
        elif self.skip_blank and is_blank:
            self.skip_blank = False

        # Detect the start of a cover letter section
        elif re_cover.match(line):
            self.in_section = 'cover'
            self.skip_blank = False

        elif cover_cc_match:
            value = cover_cc_match.group(1)
            self.AddToSeries(line, 'cover-cc', value)

        # If we are in a change list, keep collecting lines until a blank one
        elif self.in_change:
            if is_blank:
                # Blank line ends this change list
                self.in_change = 0
            elif line == '---':
                # The diff separator also ends the list; now that we have
                # left the change list, handle the line in the normal way
                self.in_change = 0
                out = self.ProcessLine(line)
            else:
                if self.is_log:
                    self.series.AddChange(self.in_change, self.commit, line)
            self.skip_blank = False

        # Detect Series-xxx tags
        elif series_tag_match:
            name = series_tag_match.group(1)
            value = series_tag_match.group(2)
            if name == 'changes':
                # value is the version number: e.g. 1, or 2
                try:
                    self.in_change = int(value)
                except ValueError:
                    raise ValueError("%s: Cannot decode version info '%s'" %
                                     (self.commit.hash, line))
            else:
                self.AddToSeries(line, name, value)
                self.skip_blank = True

        # Detect Commit-xxx tags
        elif commit_tag_match:
            name = commit_tag_match.group(1)
            value = commit_tag_match.group(2)
            if name == 'notes':
                self.AddToCommit(line, name, value)
                self.skip_blank = True

        # Detect the start of a new commit
        elif commit_match:
            self.CloseCommit()
            self.commit = commit.Commit(commit_match.group(1))

        # Detect tags in the commit message
        elif tag_match:
            # Remove Tested-by self, since few will take much notice. If USER
            # is not set in the environment we cannot tell who 'self' is, so
            # the tag is simply kept.
            user = os.getenv('USER')
            if (tag_match.group(1) == 'Tested-by' and user and
                    tag_match.group(2).find(user + '@') != -1):
                self.warn.append("Ignoring %s" % line)
            elif tag_match.group(1) == 'Patch-cc':
                self.commit.AddCc(tag_match.group(2).split(','))
            else:
                out = [line]

        # Suppress duplicate signoffs
        elif signoff_match:
            if (self.is_log or not self.commit or
                    self.commit.CheckDuplicateSignoff(signoff_match.group(1))):
                out = [line]

        # Well that means this is an ordinary line
        else:
            # Look for ugly non-ASCII characters; 'pos' is a 1-based column
            # TODO: Would be nicer to report source filename and line
            for pos, ch in enumerate(line, 1):
                # Anything above 0x7f is outside the ASCII range
                if ord(ch) > 0x7f:
                    self.warn.append("Line %d/%d ('%s') has funny ascii char" %
                                     (self.linenum, pos, line))

            # Look for space before tab
            if re_space_before_tab.match(line):
                # Report the 1-based column of the first offending space. The
                # start of an anchored match is always 0, so it is no use here
                self.warn.append('Line %d/%d has space before tab' %
                                 (self.linenum, line.find(' \t') + 1))

            # OK, we have a valid non-blank line
            out = [line]
            self.linenum += 1
            self.skip_blank = False
            if self.state == STATE_DIFFS:
                pass

            # If this is the start of the diffs section, emit our tags and
            # change log
            elif line == '---':
                self.state = STATE_DIFFS

                # Output the '---' line, then commit notes, then change list
                log = self.series.MakeChangeLog(self.commit)
                out = [line]
                if self.commit:
                    out += self.commit.notes
                out += [''] + log
            elif self.found_test:
                if not re_allowed_after_test.match(line):
                    self.lines_after_test += 1

        return out

    def Finalize(self):
        """Close out processing of this patch stream"""
        self.CloseCommit()
        if self.lines_after_test:
            self.warn.append('Found %d lines after TEST=' %
                             self.lines_after_test)

    def ProcessStream(self, infd, outfd):
        """Copy a stream from infd to outfd, filtering out unwanted things.

        This is used to process patch files one at a time.

        Added blank lines ('+' on its own) are held back and counted, so that
        a warning can be issued if they turn out to be at the end of a file's
        diff. They are still written out before the next non-blank line.

        Args:
            infd: Input stream file object
            outfd: Output stream file object
        """
        # Extract the filename from each diff, for nice warnings
        fname = None
        re_fname = re.compile('diff --git a/(.*) b/.*')
        while True:
            line = infd.readline()
            if not line:
                break
            out = self.ProcessLine(line)

            # Try to detect blank lines at EOF
            for out_line in out:
                match = re_fname.match(out_line)

                # Any blank lines stored up belong to the file whose diff we
                # were in *before* this line, whether the diff is ended by a
                # new 'diff --git' header or by the '-- ' signature line
                ended_fname = fname
                if match:
                    fname = match.group(1)
                if out_line == '+':
                    self.blank_count += 1
                else:
                    if self.blank_count and (out_line == '-- ' or match):
                        self.warn.append("Found possible blank line(s) at "
                                         "end of file '%s'" % ended_fname)
                    outfd.write('+\n' * self.blank_count)
                    outfd.write(out_line + '\n')
                    self.blank_count = 0
        self.Finalize()
356
357
def GetMetaDataForList(commit_range, git_dir=None, count=None,
                       series=None, allow_overwrite=False):
    """Reads out patch series metadata from the commits

    This does a 'git log' on the relevant commits and pulls out the tags we
    are interested in.

    Args:
        commit_range: Range of commits to count (e.g. 'HEAD..base')
        git_dir: Path to git repository (None to use default)
        count: Number of commits to list, or None for no limit
        series: Series object to add information into. By default a new series
            is started.
        allow_overwrite: Allow tags to overwrite an existing tag
    Returns:
        A Series object containing information about the commits.
    """
    # Only start a new series when none was supplied. A truthiness test would
    # also throw away a caller's series that merely evaluates false
    # (NOTE(review): Series is used like a dict elsewhere in this file, so an
    # empty one would presumably be falsy - confirm against series.py).
    if series is None:
        series = Series()
    series.allow_overwrite = allow_overwrite
    params = gitutil.LogCmd(commit_range, reverse=True, count=count,
                            git_dir=git_dir)
    stdout = command.RunPipe([params], capture=True).stdout

    # Feed the log through a PatchStream in 'git log' mode; it records what
    # it finds in 'series' as a side effect, so the output lines are ignored
    ps = PatchStream(series, is_log=True)
    for line in stdout.splitlines():
        ps.ProcessLine(line)
    ps.Finalize()
    return series
386
def GetMetaData(start, count):
    """Collect patch series metadata for commits counted back from HEAD

    Convenience wrapper around GetMetaDataForList() which builds the commit
    range from an offset relative to HEAD and uses the default git directory.

    Args:
        start: Commit to start from: 0=HEAD, 1=next one, etc.
        count: Number of commits to list

    Returns:
        Whatever GetMetaDataForList() returns for that range
    """
    commit_range = 'HEAD~%d' % start
    return GetMetaDataForList(commit_range, None, count)
398
def FixPatch(backup_dir, fname, series, commit):
    """Fix up a patch file, by adding/removing as required.

    We remove our tags from the patch file, insert changes lists, etc.
    The patch file is processed in place, and overwritten.

    A backup file is put into backup_dir (if not None).

    Args:
        backup_dir: Directory to copy the original patch file into before it
            is overwritten, or None for no backup
        fname: Filename to patch file to process
        series: Series information about this patch set
        commit: Commit object for this patch file
    Return:
        A list of warnings collected while processing, or [] if all ok.
    """
    handle, tmpname = tempfile.mkstemp()
    try:
        # The 'with' blocks make sure both files are closed even if the
        # processing raises part-way through
        with os.fdopen(handle, 'w') as outfd:
            with open(fname, 'r') as infd:
                ps = PatchStream(series)
                ps.commit = commit
                ps.ProcessStream(infd, outfd)

        # Create a backup file if required
        if backup_dir:
            shutil.copy(fname,
                        os.path.join(backup_dir, os.path.basename(fname)))
        shutil.move(tmpname, fname)
    finally:
        # After a successful move the temporary file is gone; if anything
        # failed before that, don't leave it lying around
        if os.path.exists(tmpname):
            os.remove(tmpname)
    return ps.warn
428
def FixPatches(series, fnames):
    """Fix up a list of patches identified by filenames

    The patch files are processed in place, and overwritten. Any warnings
    found are printed, followed by a count of the patches processed.

    Args:
        series: The series object. Its 'commits' list is indexed in step with
            fnames, so the Nth file is paired with the Nth commit
        fnames: List of patch files to process

    Returns:
        The series object that was passed in
    """
    # Current workflow creates patches, so we shouldn't need a backup
    backup_dir = None  #tempfile.mkdtemp('clean-patch')
    count = 0
    for index, fname in enumerate(fnames):
        commit = series.commits[index]
        commit.patch = fname
        result = FixPatch(backup_dir, fname, series, commit)

        # Each print below takes one pre-formatted string, so the output is
        # the same whether print is a statement (Python 2) or a function
        if result:
            print('%d warnings for %s:' % (len(result), fname))
            for warn in result:
                print('\t%s' % warn)
            print('')
        count = index + 1
    print('Cleaned %d patches' % count)
    return series
453
def InsertCoverLetter(fname, series, count):
    """Inserts a cover letter with the required info into patch 0

    The 'Subject:' line is replaced with one built from the patch prefix, the
    patch count and the first line of the cover letter. The
    '*** BLURB HERE ***' line is replaced with the rest of the cover letter,
    the series notes (if any) and the change log. All other lines are kept.

    The new contents are built in full before the file is rewritten, so the
    file is left untouched if anything goes wrong (e.g. there is no cover
    letter text in the series).

    Args:
        fname: Input / output filename of the cover letter file
        series: Series object
        count: Number of patches in the series
    """
    with open(fname, 'r') as fd:
        lines = fd.readlines()

    text = series.cover
    prefix = series.GetPatchPrefix()

    # Pad the cover letter's number to the same width as the patch count, so
    # that with 10 or more patches we get 00/xx, with 100 or more 000/xxx
    zero = '0' * len(str(count))

    new_lines = []
    for line in lines:
        if line.startswith('Subject:'):
            line = 'Subject: [%s %s/%d] %s\n' % (prefix, zero, count, text[0])

        # Insert our cover letter
        elif line.startswith('*** BLURB HERE ***'):
            # First the blurb text
            line = '\n'.join(text[1:]) + '\n'
            if series.get('notes'):
                line += '\n'.join(series.notes) + '\n'

            # Now the change list
            out = series.MakeChangeLog(None)
            line += '\n' + '\n'.join(out)
        new_lines.append(line)

    with open(fname, 'w') as fd:
        fd.writelines(new_lines)