]> git.proxmox.com Git - mirror_edk2.git/blob - BaseTools/Scripts/PatchCheck.py
IntelFsp2WrapperPkg: Convert files to CRLF line ending
[mirror_edk2.git] / BaseTools / Scripts / PatchCheck.py
1 ## @file
2 # Check a patch for various format issues
3 #
4 # Copyright (c) 2015 - 2016, Intel Corporation. All rights reserved.<BR>
5 #
6 # This program and the accompanying materials are licensed and made
7 # available under the terms and conditions of the BSD License which
8 # accompanies this distribution. The full text of the license may be
9 # found at http://opensource.org/licenses/bsd-license.php
10 #
11 # THE PROGRAM IS DISTRIBUTED UNDER THE BSD LICENSE ON AN "AS IS"
12 # BASIS, WITHOUT WARRANTIES OR REPRESENTATIONS OF ANY KIND, EITHER
13 # EXPRESS OR IMPLIED.
14 #
15
16 from __future__ import print_function
17
18 VersionNumber = '0.1'
19 __copyright__ = "Copyright (c) 2015 - 2016, Intel Corporation All rights reserved."
20
21 import email
22 import argparse
23 import os
24 import re
25 import subprocess
26 import sys
27
class Verbose:
    """Output verbosity levels and the currently selected level."""

    # Levels are ordered so callers can compare them with < and >.
    SILENT = 0
    ONELINE = 1
    NORMAL = 2

    # Currently active level; starts at the most talkative setting.
    level = NORMAL
31
class CommitMessageCheck:
    """Checks the contents of a git commit message.

    Constructing an instance runs every check immediately.  Problems are
    printed (subject to ``Verbose.level``) and recorded by clearing
    ``self.ok``.
    """

    # Printed after a failed check so the user can look up the rules.
    url = 'https://github.com/tianocore/tianocore.github.io/wiki/Commit-Message-Format'

    def __init__(self, subject, message):
        """Run all commit message checks.

        subject -- subject line of the commit (without the message body)
        message -- body of the commit message

        When both are None the message is reported as missing and no
        further checks are run.
        """
        self.ok = True

        if subject is None and message is None:
            self.error('Commit message is missing!')
            return

        self.subject = subject
        self.msg = message

        self.check_contributed_under()
        self.check_signed_off_by()
        self.check_misc_signatures()
        self.check_overall_format()
        self.report_message_result()

    def report_message_result(self):
        """Print the overall verdict (only at NORMAL verbosity)."""
        if Verbose.level < Verbose.NORMAL:
            return
        if self.ok:
            # All checks passed
            print('The commit message format passed all checks.')
        else:
            print(self.url)

    def error(self, *err):
        """Record a failure and print its lines.

        The first line of ``err`` is printed with a bullet prefix and the
        remaining lines as continuations.  A heading is printed before the
        first error only.
        """
        if self.ok and Verbose.level > Verbose.ONELINE:
            print('The commit message format is not valid:')
        self.ok = False
        if Verbose.level < Verbose.NORMAL:
            return
        for count, line in enumerate(err):
            prefix = ' ' if count > 0 else ' *'
            print(prefix, line)

    def check_contributed_under(self):
        """Require the exact TianoCore Contributed-under line in the body."""
        cu_msg = 'Contributed-under: TianoCore Contribution Agreement 1.0'
        if cu_msg not in self.msg:
            self.error('Missing Contributed-under! (Note: this must be ' +
                       'added by the code contributor!)')

    @staticmethod
    def make_signature_re(sig, re_input=False):
        """Build a regex matching '<sig>: <value>' lines.

        sig      -- tag name such as 'Signed-off-by'
        re_input -- when True, ``sig`` is already a regex fragment and is
                    used verbatim; otherwise each '-' is loosened so that
                    mis-spelled separators are still found and reported

        The pattern is case-insensitive and captures, in order: the tag,
        the whitespace before ':', the whitespace after ':', the value.
        """
        if re_input:
            sub_re = sig
        else:
            sub_re = sig.replace('-', r'[-\s]+')
        re_str = (r'^(?P<tag>' + sub_re +
                  r')(\s*):(\s*)(?P<value>\S.*?)(?:\s*)$')
        try:
            return re.compile(re_str, re.MULTILINE | re.IGNORECASE)
        except Exception:
            # Show the offending pattern before propagating the failure.
            print("Tried to compile re:", re_str)
            raise

    # Matches one line of the trailing signature block: either
    # 'Tag: value' or a bracketed '[updater: note]' annotation.
    sig_block_re = \
        re.compile(r'''^
                        (?: (?P<tag>[^:]+) \s* : \s*
                            (?P<value>\S.*?) )
                            |
                        (?: \[ (?P<updater>[^:]+) \s* : \s*
                               (?P<note>.+?) \s* \] )
                    \s* $''',
                   re.VERBOSE | re.MULTILINE)

    def find_signatures(self, sig):
        """Find and validate every '<sig>-by:' line in the message.

        '-by' is appended to ``sig`` unless it already ends with it or is
        'Cc'.  Each hit is checked for exact tag spelling, spacing around
        the colon, and a well-formed 'Name <email>' value.

        Returns the list of (tag, pre-colon space, post-colon space,
        value) tuples that matched.
        """
        if not sig.endswith('-by') and sig != 'Cc':
            sig += '-by'
        regex = self.make_signature_re(sig)

        sigs = regex.findall(self.msg)

        # The search is case/separator tolerant; report inexact spellings.
        for s in sigs:
            if s[0] != sig:
                self.error("'" + s[0] + "' should be '" + sig + "'")

        for s in sigs:
            if s[1] != '':
                self.error('There should be no spaces between ' + sig +
                           " and the ':'")
            if s[2] != ' ':
                self.error("There should be a space after '" + sig + ":'")

            self.check_email_address(s[3])

        return sigs

    # Splits 'Name <address>' into name, separating whitespace, address.
    email_re1 = re.compile(r'(?:\s*)(.*?)(\s*)<(.+)>\s*$',
                           re.MULTILINE | re.IGNORECASE)

    def check_email_address(self, email):
        """Validate a 'Name <address>' signature value."""
        email = email.strip()
        mo = self.email_re1.match(email)
        if mo is None:
            self.error("Email format is invalid: " + email.strip())
            return

        name = mo.group(1).strip()
        if name == '':
            self.error("Name is not provided with email address: " +
                       email)
        else:
            quoted = len(name) > 2 and name[0] == '"' and name[-1] == '"'
            if name.find(',') >= 0 and not quoted:
                self.error('Add quotes (") around name with a comma: ' +
                           name)

        if mo.group(2) == '':
            self.error("There should be a space between the name and " +
                       "email address: " + email)

        if mo.group(3).find(' ') >= 0:
            self.error("The email address cannot contain a space: " +
                       mo.group(3))

    def check_signed_off_by(self):
        """Require at least one well-formed Signed-off-by line."""
        sob = 'Signed-off-by'
        if sob not in self.msg:
            self.error('Missing Signed-off-by! (Note: this must be ' +
                       'added by the code contributor!)')
            return

        sobs = self.find_signatures('Signed-off')

        if len(sobs) == 0:
            self.error('Invalid Signed-off-by format!')
            return

    # Optional signature tags; '-by' is appended by find_signatures
    # for all of them except 'Cc'.
    sig_types = (
        'Reviewed',
        'Reported',
        'Tested',
        'Suggested',
        'Acked',
        'Cc'
        )

    def check_misc_signatures(self):
        """Validate the format of every optional signature tag present."""
        for sig in self.sig_types:
            self.find_signatures(sig)

    def check_overall_format(self):
        """Check line lengths, the blank second line and the signature block.

        The subject and a blank separator are placed in front of the body
        lines so that reported line numbers refer to the full message.
        """
        # splitlines() strips line terminators, so body lines never carry
        # one.  The subject and separator do get '\n' appended, which means
        # the terminator counts toward the subject length limit below.
        lines = self.msg.splitlines()
        lines.insert(0, '\n')
        lines.insert(0, self.subject + '\n')

        count = len(lines)

        if len(lines[0]) >= 72:
            self.error('First line of commit message (subject line) ' +
                       'is too long.')

        if len(lines[0].strip()) == 0:
            self.error('First line of commit message (subject line) ' +
                       'is empty.')

        if lines[1].strip() != '':
            self.error('Second line of commit message should be ' +
                       'empty.')

        for i in range(2, count):
            # Single-token lines (e.g. long URLs) and git-svn-id lines are
            # allowed to exceed the limit.
            if (len(lines[i]) >= 76 and
                len(lines[i].split()) > 1 and
                not lines[i].startswith('git-svn-id:')):
                self.error('Line %d of commit message is too long.' % (i + 1))

        # Walk upward from the last line through the signature block; the
        # first non-signature line above it must be blank.
        last_sig_line = None
        for i in range(count - 1, 0, -1):
            line = lines[i]
            mo = self.sig_block_re.match(line)
            if mo is None:
                if line.strip() == '':
                    break
                elif last_sig_line is not None:
                    err2 = 'Add empty line before "%s"?' % last_sig_line
                    self.error('The line before the signature block ' +
                               'should be empty', err2)
                else:
                    self.error('The signature block was not found')
                break
            last_sig_line = line.strip()
233
# Parser states used by GitDiffCheck:
#   START     - expecting a 'diff --git' line
#   PRE_PATCH - inside the per-file header, before the first hunk
#   PATCH     - inside a hunk (or a binary patch body)
(START, PRE_PATCH, PATCH) = range(3)

class GitDiffCheck:
    """Checks the contents of a git diff.

    Constructing an instance parses the whole diff line by line.  Added
    lines are checked for CRLF line endings, tabs, trailing whitespace
    and old-style EFI_D_* debug levels.  Problems clear ``self.ok``;
    structural problems also clear ``self.format_ok`` and stop parsing.
    """

    def __init__(self, diff):
        """Parse and check ``diff`` (the text of one or more git diffs)."""
        self.ok = True
        self.format_ok = True
        self.lines = diff.splitlines(True)
        self.count = len(self.lines)
        self.line_num = 0
        self.state = START
        # Set for real when a hunk or binary patch begins; initialised
        # here so run() can always read it.
        self.binary = False
        while self.line_num < self.count and self.format_ok:
            line_num = self.line_num
            self.run()
            # Every step must consume at least one line.
            assert(self.line_num > line_num)
        self.report_message_result()

    def report_message_result(self):
        """Print the success message (only at NORMAL verbosity)."""
        if Verbose.level < Verbose.NORMAL:
            return
        if self.ok:
            print('The code passed all checks.')

    def run(self):
        """Process the line at ``self.line_num`` and advance past it."""
        line = self.lines[self.line_num]

        if self.state in (PRE_PATCH, PATCH):
            if line.startswith('diff --git'):
                self.state = START
        if self.state == PATCH:
            if line.startswith('@@ '):
                self.state = PRE_PATCH
            elif (not self.binary and
                  len(line) >= 1 and line[0] not in ' -+' and
                  not line.startswith(r'\ No newline ')):
                # A line that cannot belong to a text hunk ends the patch;
                # anything after it must not contain another diff.  Binary
                # patch bodies are exempt: their 'literal'/'delta' and
                # encoded data lines never start with ' ', '-' or '+'.
                for later in self.lines[self.line_num + 1:]:
                    if later.startswith('diff --git'):
                        self.format_error('diff found after end of patch')
                        break
                self.line_num = self.count
                return

        if self.state == START:
            if line.startswith('diff --git'):
                self.state = PRE_PATCH
                self.set_filename(None)
            elif len(line.rstrip()) != 0:
                self.format_error("didn't find diff command")
            self.line_num += 1
        elif self.state == PRE_PATCH:
            if line.startswith('+++ b/'):
                self.set_filename(line[6:].rstrip())
            if line.startswith('@@ '):
                self.state = PATCH
                self.binary = False
            elif line.startswith('GIT binary patch'):
                self.state = PATCH
                self.binary = True
            elif not line.startswith(self.pre_patch_prefixes):
                self.format_error("didn't find diff hunk marker (@@)")
            self.line_num += 1
        elif self.state == PATCH:
            if self.binary:
                # Binary payload is not source text; nothing to check.
                pass
            elif line.startswith('-'):
                pass
            elif line.startswith('+'):
                self.check_added_line(line[1:])
            elif line.startswith(r'\ No newline '):
                pass
            elif not line.startswith(' '):
                self.format_error("unexpected patch line")
            self.line_num += 1

    # Header lines that may legitimately appear between 'diff --git' and
    # the first hunk.
    pre_patch_prefixes = (
        '--- ',
        '+++ ',
        'index ',
        'new file ',
        'deleted file ',
        'old mode ',
        'new mode ',
        'similarity index ',
        'rename ',
        'Binary files ',
        )

    # Ordered longest first so two-character endings win over their
    # one-character suffixes.
    line_endings = ('\r\n', '\n\r', '\n', '\r')

    def set_filename(self, filename):
        """Record the file being patched and whether it must use CRLF.

        Every file except those ending in '.sh' is required to use CRLF;
        an unknown filename (None) also requires CRLF.
        """
        self.hunk_filename = filename
        if filename:
            self.force_crlf = not filename.endswith('.sh')
        else:
            self.force_crlf = True

    def added_line_error(self, msg, line):
        """Report ``msg`` together with the file name and offending line."""
        lines = [ msg ]
        if self.hunk_filename is not None:
            lines.append('File: ' + self.hunk_filename)
        lines.append('Line: ' + line)

        self.error(*lines)

    # Detects DEBUG ((... EFI_D_xxx ...)) so DEBUG_xxx can be suggested.
    old_debug_re = \
        re.compile(r'''
                        DEBUG \s* \( \s* \( \s*
                        (?: DEBUG_[A-Z_]+ \s* \| \s*)*
                        EFI_D_ ([A-Z_]+)
                   ''',
                   re.VERBOSE)

    def check_added_line(self, line):
        """Check one added line (without its leading '+') for style issues."""
        eol = ''
        for an_eol in self.line_endings:
            if line.endswith(an_eol):
                eol = an_eol
                line = line[:-len(eol)]
                # Stop at the first (longest) terminator so only one line
                # ending is ever stripped.
                break

        stripped = line.rstrip()

        if self.force_crlf and eol != '\r\n':
            self.added_line_error('Line ending (%s) is not CRLF' % repr(eol),
                                  line)
        if '\t' in line:
            self.added_line_error('Tab character used', line)
        if len(stripped) < len(line):
            self.added_line_error('Trailing whitespace found', line)

        mo = self.old_debug_re.search(line)
        if mo is not None:
            self.added_line_error('EFI_D_' + mo.group(1) + ' was used, '
                                  'but DEBUG_' + mo.group(1) +
                                  ' is now recommended', line)

    # Matches a 'diff --git' command line followed by its 'index' line.
    split_diff_re = re.compile(r'''
                                   (?P<cmd>
                                       ^ diff \s+ --git \s+ a/.+ \s+ b/.+ $
                                   )
                                   (?P<index>
                                       ^ index \s+ .+ $
                                   )
                               ''',
                               re.IGNORECASE | re.VERBOSE | re.MULTILINE)

    def format_error(self, err):
        """Report a structural diff problem and stop further parsing.

        The line reported is the one at ``self.line_num``.
        """
        self.format_ok = False
        err = 'Patch format error: ' + err
        err2 = 'Line: ' + self.lines[self.line_num].rstrip()
        self.error(err, err2)

    def error(self, *err):
        """Record a failure and print its lines.

        The first line of ``err`` is printed with a bullet prefix and the
        remaining lines as continuations.  A heading is printed before the
        first error only.
        """
        if self.ok and Verbose.level > Verbose.ONELINE:
            print('Code format is not valid:')
        self.ok = False
        if Verbose.level < Verbose.NORMAL:
            return
        for count, line in enumerate(err):
            prefix = ' ' if count > 0 else ' *'
            print(prefix, line)
401
class CheckOnePatch:
    """Checks the contents of a git email formatted patch.

    Various checks are performed on both the commit message and the
    patch content.
    """

    def __init__(self, name, patch):
        """Split ``patch`` into its pieces and check each of them.

        name  -- label printed in --oneline mode
        patch -- text of an email-formatted patch or of a bare git diff

        ``self.ok`` is True only when both the commit message and the
        diff (if any) passed.
        """
        self.patch = patch
        self.find_patch_pieces()

        msg_check = CommitMessageCheck(self.commit_subject, self.commit_msg)
        msg_ok = msg_check.ok

        diff_ok = True
        if self.diff is not None:
            diff_check = GitDiffCheck(self.diff)
            diff_ok = diff_check.ok

        self.ok = msg_ok and diff_ok

        if Verbose.level == Verbose.ONELINE:
            if self.ok:
                result = 'ok'
            else:
                result = list()
                if not msg_ok:
                    result.append('commit message')
                if not diff_ok:
                    result.append('diff content')
                result = 'bad ' + ' and '.join(result)
            print(name, result)


    # Locates the first 'diff --git a/... b/...' line.
    git_diff_re = re.compile(r'''
                                 ^ diff \s+ --git \s+ a/.+ \s+ b/.+ $
                             ''',
                             re.IGNORECASE | re.VERBOSE | re.MULTILINE)

    # Separates the commit message from the '---' diffstat section.
    stat_re = \
        re.compile(r'''
                       (?P<commit_message> [\s\S\r\n]* )
                       (?P<stat>
                           ^ --- $ [\r\n]+
                           (?: ^ \s+ .+ \s+ \| \s+ \d+ \s+ \+* \-*
                               $ [\r\n]+ )+
                           [\s\S\r\n]+
                       )
                   ''',
                   re.IGNORECASE | re.VERBOSE | re.MULTILINE)

    # Matches leading '[...]' tags (e.g. '[PATCH 1/2]') on a subject.
    subject_prefix_re = \
        re.compile(r'''^
                       \s* (\[
                        [^\[\]]* # Allow all non-brackets
                       \])* \s*
                   ''',
                   re.VERBOSE)

    def find_patch_pieces(self):
        """Split ``self.patch`` into subject, message, stat and diff.

        Sets ``commit_subject``, ``commit_msg``, ``stat`` and ``diff``
        (and ``commit_prefix``, which stays None).  Input that starts
        with 'diff --git' is treated as a bare diff with no commit
        message.
        """
        if sys.version_info < (3, 0):
            patch = self.patch.encode('ascii', 'ignore')
        else:
            patch = self.patch

        self.commit_msg = None
        self.stat = None
        self.commit_subject = None
        self.commit_prefix = None
        self.diff = None

        if patch.startswith('diff --git'):
            self.diff = patch
            return

        pmail = email.message_from_string(patch)
        parts = list(pmail.walk())
        assert(len(parts) == 1)
        assert(parts[0].get_content_type() == 'text/plain')
        content = parts[0].get_payload(decode=True).decode('utf-8', 'ignore')

        mo = self.git_diff_re.search(content)
        if mo is not None:
            self.diff = content[mo.start():]
            content = content[:mo.start()]

        mo = self.stat_re.search(content)
        if mo is None:
            self.commit_msg = content
        else:
            self.stat = mo.group('stat')
            self.commit_msg = mo.group('commit_message')

        # A mail without a Subject header yields None here; use an empty
        # subject so the message checker reports it instead of crashing.
        subject = pmail['subject']
        if subject is None:
            subject = ''
        # Undo header folding, then drop leading '[PATCH ...]' style tags.
        subject = subject.replace('\r\n', '')
        subject = subject.replace('\n', '')
        self.commit_subject = self.subject_prefix_re.sub('', subject, 1)
498
class CheckGitCommits:
    """Reads patches from git based on the specified git revision range.

    The patches are read from git, and then checked.
    """

    def __init__(self, rev_spec, max_count):
        """Check every commit selected by ``rev_spec``.

        rev_spec  -- revision or revision range handed to 'git rev-list'
        max_count -- optional limit on the number of commits (or None)

        ``self.ok`` ends up True only if every commit passed.
        """
        commits = self.read_commit_list_from_git(rev_spec, max_count)
        verbose = Verbose.level > Verbose.ONELINE
        if verbose and len(commits) == 1:
            # Show the name the user typed rather than the abbreviated hash.
            commits = [rev_spec]
        self.ok = True
        for index, commit in enumerate(commits):
            if verbose:
                # Separate consecutive commit reports with a blank line.
                if index > 0:
                    print()
                print('Checking git commit:', commit)
            patch = self.read_patch_from_git(commit)
            self.ok &= CheckOnePatch(commit, patch).ok

    def read_commit_list_from_git(self, rev_spec, max_count):
        """Return the abbreviated commit ids that ``rev_spec`` selects."""
        git_args = ['rev-list', '--abbrev-commit', '--no-walk']
        if max_count is not None:
            git_args.append('--max-count=' + str(max_count))
        git_args.append(rev_spec)
        listing = self.run_git(*git_args)
        return listing.split()

    def read_patch_from_git(self, commit):
        """Return ``commit`` rendered by 'git show' in email format."""
        return self.run_git('show', '--pretty=email', commit)

    def run_git(self, *args):
        """Run git with ``args`` and return its decoded output.

        stderr is merged into stdout; undecodable bytes are dropped.
        """
        command = ['git']
        command.extend(args)
        proc = subprocess.Popen(command,
                                stdout=subprocess.PIPE,
                                stderr=subprocess.STDOUT)
        raw_output = proc.communicate()[0]
        return raw_output.decode('utf-8', 'ignore')
541
class CheckOnePatchFile:
    """Performs a patch check for a single file.

    stdin is used when the filename is '-'.
    """

    def __init__(self, patch_filename):
        """Read the patch from ``patch_filename`` (or stdin) and check it.

        Files are read as bytes and decoded as UTF-8 with undecodable
        bytes dropped.  ``self.ok`` holds the check result.
        """
        if patch_filename == '-':
            patch = sys.stdin.read()
            patch_filename = 'stdin'
        else:
            # 'with' guarantees the handle is closed even if reading or
            # decoding raises.
            with open(patch_filename, 'rb') as f:
                patch = f.read().decode('utf-8', 'ignore')
        if Verbose.level > Verbose.ONELINE:
            print('Checking patch file:', patch_filename)
        self.ok = CheckOnePatch(patch_filename, patch).ok
559
class CheckOneArg:
    """Performs a patch check for a single command line argument.

    The argument will be handed off to a file or git-commit based
    checker.
    """

    def __init__(self, param, max_count=None):
        """Check ``param`` as a patch file if it names one, else via git.

        '-' (stdin) and existing paths go to the file checker; anything
        else is treated as a git revision spec limited by ``max_count``.
        """
        self.ok = True
        treat_as_file = param == '-' or os.path.exists(param)
        if not treat_as_file:
            checker = CheckGitCommits(param, max_count)
        else:
            checker = CheckOnePatchFile(param)
        self.ok = checker.ok
574
class PatchCheckApp:
    """Checks patches based on the command line arguments."""

    def __init__(self):
        """Parse the command line, check every argument, set ``retval``.

        With no arguments 'HEAD' is checked.  A trailing '-N' count with
        nothing after it is applied to 'HEAD'.  ``retval`` is 0 when all
        checks passed and -1 otherwise.
        """
        self.parse_options()
        patches = self.args.patches or ['HEAD']

        self.ok = True
        self.count = None
        for patch in patches:
            self.process_one_arg(patch)

        # A count that was never consumed applies to HEAD.
        if self.count is not None:
            self.process_one_arg('HEAD')

        self.retval = 0 if self.ok else -1

    def process_one_arg(self, arg):
        """Handle one positional argument.

        An argument of the form '-N' (N an integer) only stores N as the
        commit count for the next argument.  Anything else is checked,
        using and then clearing any stored count.
        """
        if len(arg) >= 2 and arg.startswith('-'):
            try:
                parsed = int(arg[1:])
            except ValueError:
                # Not a count; fall through and treat it as a patch spec.
                pass
            else:
                self.count = parsed
                return
        self.ok &= CheckOneArg(arg, self.count).ok
        self.count = None

    def parse_options(self):
        """Parse sys.argv into ``self.args`` and set the verbosity level."""
        arg_parser = argparse.ArgumentParser(description=__copyright__)
        arg_parser.add_argument('--version', action='version',
                                version='%(prog)s ' + VersionNumber)
        arg_parser.add_argument('patches', nargs='*',
                                help='[patch file | git rev list]')
        # --oneline and --silent cannot be combined.
        verbosity = arg_parser.add_mutually_exclusive_group()
        verbosity.add_argument("--oneline",
                               action="store_true",
                               help="Print one result per line")
        verbosity.add_argument("--silent",
                               action="store_true",
                               help="Print nothing")
        self.args = arg_parser.parse_args()
        if self.args.oneline:
            Verbose.level = Verbose.ONELINE
        if self.args.silent:
            Verbose.level = Verbose.SILENT
626
if __name__ == "__main__":
    # Run the checker and use its result as the process exit status.
    app = PatchCheckApp()
    sys.exit(app.retval)