# Copyright (c) 2011 The Chromium OS Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
import json
import os
import re
import sys
import subprocess
# General Helpers

# Regular expressions selecting the file paths that the source-file checks
# (line length, whitespace, tabs, license) are applied to.
# NOTE(review): the list header was missing from this copy of the file; the
# name COMMON_INCLUDED_PATHS is assumed -- confirm against history.
COMMON_INCLUDED_PATHS = [
  # C++ and friends
  r".*\.c$", r".*\.cc$", r".*\.cpp$", r".*\.h$", r".*\.m$", r".*\.mm$",
  r".*\.inl$", r".*\.asm$", r".*\.hxx$", r".*\.hpp$", r".*\.s$", r".*\.S$",
  # Scripts
  r".*\.js$", r".*\.py$", r".*\.sh$", r".*\.rb$", r".*\.pl$", r".*\.pm$",
  # NOTE(review): a comment here announced an entry for files with no
  # extension at all (with ALL CAPS file names black listed by the exclusion
  # list), but the pattern itself is missing -- restore it from history.
  # Other
  r".*\.java$", r".*\.mk$", r".*\.am$",
]

# Regular expressions selecting file paths that are exempt from the
# source-file checks even when they match COMMON_INCLUDED_PATHS.
# NOTE(review): only the comment below survived in this copy of the file; the
# list name is assumed and its entries must be restored from history.
COMMON_EXCLUDED_PATHS = [
  # avoid doing source file checks for kernel
]

# Lowest git version ([major, minor, patch]) accepted by _check_git_version.
MIN_GIT_VERSION = [1, 7, 2]
def _run_command(cmd):
  """Runs cmd as a child process and returns what it wrote to stdout.

  Only stdout is captured; the exit status of the command is not inspected.

  Args:
    cmd: The command to run, as an argument list accepted by subprocess.Popen.

  Returns:
    The raw, unmodified stdout output of the command.
  """
  proc = subprocess.Popen(cmd, stdout=subprocess.PIPE)
  stdout_data = proc.communicate()[0]
  return stdout_data
def _get_hooks_dir():
  """Returns the path of the repohooks checkout, as reported by 'repo'.

  The path is whatever 'pwd' prints when run by 'repo forall' inside the
  chromiumos/repohooks project, with surrounding whitespace removed.
  """
  pwd_output = _run_command(
      ['repo', 'forall', 'chromiumos/repohooks', '-c', 'pwd'])
  return pwd_output.strip()
def _match_regex_list(subject, expressions):
  """Try to match a list of regular expressions to a string.

  Args:
    subject: The string to match regexes on
    expressions: A list of regular expressions to check for matches with.

  Returns:
    Whether the passed in subject matches any of the passed in regexes.
  """
  # NOTE(review): the matching call was missing from this copy of the file.
  # re.search (match anywhere in the subject) is used because other patterns
  # in this file, e.g. the TEST=/BUG= ones, cannot match at position 0.
  return any(re.search(expr, subject) for expr in expressions)
def _filter_files(files, include_list, exclude_list=()):
  """Filter out files based on the conditions passed in.

  Args:
    files: list of filepaths to filter
    include_list: list of regex that when matched with a file path will cause
        it to be added to the output list unless the file is also matched
        with a regex in the exclude_list.
    exclude_list: list of regex that when matched with a file will prevent it
        from being added to the output list, even if it is also matched with
        a regex in the include_list. Defaults to no exclusions.

  Returns:
    A list of filepaths that contain files matched in the include_list and not
    in the exclude_list.
  """
  # The default for exclude_list is an immutable empty tuple so that no
  # mutable object is shared between calls.
  return [f for f in files
          if _match_regex_list(f, include_list)
          and not _match_regex_list(f, exclude_list)]
def _report_error(msg, items=None):
  """Raises an exception with the passed in error message.

  If extra error detail is passed in, it will be appended to the error message.

  Args:
    msg: Error message header.
    items: A list of lines that follow the header that give extra error
        detail. Each one is appended to msg on its own line.

  Raises:
    Exception: always, carrying the assembled message.
  """
  if items:
    msg += '\n' + '\n'.join(items)
  raise Exception(msg)
# Git Helpers
def _check_git_version():
  """Checks the git version installed, dies if it is insufficient.

  Raises:
    Exception: (via _report_error) if the output of 'git --version' cannot be
        parsed, or if the installed version is lower than MIN_GIT_VERSION.
  """
  output = _run_command(['git', '--version'])

  m = re.match(r'(git version )([0-9]+\.[0-9]+\.[0-9]+).*\n', output)
  # NOTE(review): the references to the captured version string were missing
  # from this copy of the file; group 2 is the only group holding it.
  if not m or not m.group(2):
    _report_error('Failed to get git version, git output=' + output)

  version = [int(part) for part in m.group(2).split('.')]
  # Lists compare element by element, so the first component that differs
  # from the minimum decides the outcome, like the former explicit loop.
  if version < MIN_GIT_VERSION:
    _report_error('Invalid version of git (' + m.group(2) + '), you need '
                  + 'at least version '
                  + '.'.join([str(num) for num in MIN_GIT_VERSION]))
def _get_upstream_branch():
  """Returns the upstream tracking branch of the current branch.

  Returns:
    The remote-tracking ref of the current branch, built from the
    branch.<name>.merge and branch.<name>.remote git config values (the first
    'heads' in the merge ref is replaced by 'remotes/<remote>').

  Raises:
    Error if there is no tracking branch
  """
  current_branch = _run_command(['git', 'symbolic-ref', 'HEAD']).strip()
  # Strip only the first occurrence so that a branch name that happens to
  # contain 'refs/heads/' itself is left intact.
  current_branch = current_branch.replace('refs/heads/', '', 1)
  if not current_branch:
    _report_error('Need to be on a tracking branch')

  cfg_option = 'branch.' + current_branch + '.%s'
  full_upstream = _run_command(['git', 'config', cfg_option % 'merge']).strip()
  remote = _run_command(['git', 'config', cfg_option % 'remote']).strip()
  if not remote or not full_upstream:
    _report_error('Need to be on a tracking branch')

  # Replace only the first 'heads'; an unbounded replace would also rewrite
  # branch names that contain the word (e.g. 'fix-heads').
  return full_upstream.replace('heads', 'remotes/' + remote, 1)
def _get_diff(commit):
  """Returns the raw output of 'git show' for the given commit."""
  show_cmd = ['git', 'show', commit]
  return _run_command(show_cmd)
def _get_file_diff(file, commit):
  """Returns a list of (linenum, lines) tuples that the commit touched.

  Args:
    file: Path of the file to inspect, handed to 'git show' as a path.
    commit: The commit whose changes are examined.

  Returns:
    A list of (line_num, text) tuples, one per line added by the commit.
    line_num is the number of the line in the new version of the file and
    text is the line without its leading '+' diff marker.
  """
  output = _run_command(['git', 'show', '-p', '--no-ext-diff', commit, file])
  # git omits the ',count' part of a hunk range when the count is 1, so it
  # has to be optional here.
  hunk_re = re.compile(r'^@@ [0-9\,\+\-]+ \+([0-9]+)(?:\,[0-9]+)? @@')

  new_lines = []
  line_num = 0
  in_hunk = False
  for line in output.splitlines():
    m = hunk_re.match(line)
    if m:
      # The header carries the number of the first line of the hunk; the
      # header itself must not be counted as a line of the file.
      line_num = int(m.group(1))
      in_hunk = True
      continue
    if line.startswith('diff --git'):
      # A new per-file header section starts; its '---'/'+++' lines are not
      # file content.
      in_hunk = False
      continue
    # Ignore everything outside hunks (commit message, file headers) and the
    # '\ No newline at end of file' markers, which are not lines of the file.
    if not in_hunk or line.startswith('\\'):
      continue
    if line.startswith('+'):
      new_lines.append((line_num, line[1:]))
    if not line.startswith('-'):
      # Added and context lines exist in the new file; removed ones do not.
      line_num += 1
  return new_lines
def _get_affected_files(commit):
  """Returns list of absolute filepaths that were modified/added.

  Args:
    commit: The commit to inspect.

  Returns:
    One path per file the commit touched without deleting it, formed by
    joining the current working directory with the path printed by git.
  """
  output = _run_command(['git', 'diff', '--name-status', commit + '^!'])
  pwd = os.getcwd()
  files = []
  for statusline in output.splitlines():
    # Each record is '<status>\t<path>'; rename/copy records carry two paths,
    # of which the last one is the path that exists after the commit.
    fields = statusline.rstrip().split('\t')
    if len(fields) < 2:
      continue  # Not a status record.
    status, path = fields[0], fields[-1]
    # Ignore deleted files, and return absolute paths of files
    if status.startswith('D'):
      continue
    # NOTE(review): the append was missing from this copy of the file; it is
    # reconstructed from the docstring and the os.getcwd() call.
    files.append(os.path.join(pwd, path))
  return files
def _get_commits():
  """Returns the hashes of the commits under review.

  These are the commits 'git log' lists for the range starting at the
  upstream tracking branch, one full hash per list entry.
  """
  rev_range = '%s..' % _get_upstream_branch()
  log_output = _run_command(['git', 'log', rev_range, '--format=%H'])
  return log_output.split()
def _get_commit_desc(commit):
  """Returns the commit message of a commit, as printed by 'git log'."""
  log_cmd = ['git', 'log', '--format=%B', commit + '^!']
  return _run_command(log_cmd)
# Common Hooks
def _check_no_long_lines(project, commit):
  """Checks that there aren't any lines longer than maxlen characters in any of
  the text files to be submitted.

  Only lines added by the commit are examined. Lines containing a URL and
  lines starting with a preprocessor directive are allowed to be longer.

  Args:
    project: Name of the project being checked (not used by this check).
    commit: The commit to check.

  Raises:
    Exception: (via _report_error) listing up to 5 offending lines.
  """
  MAX_LEN = 80
  MAX_ERRORS = 5
  EXEMPT_PREFIXES = ('#define', '#include', '#import', '#pragma', '#if',
                     '#endif')
  errors = []
  # NOTE(review): the include/exclude arguments of this call were missing
  # from this copy of the file; module-level lists named
  # COMMON_INCLUDED_PATHS / COMMON_EXCLUDED_PATHS are assumed -- confirm.
  files = _filter_files(_get_affected_files(commit),
                        COMMON_INCLUDED_PATHS,
                        COMMON_EXCLUDED_PATHS)

  for afile in files:
    for line_num, line in _get_file_diff(afile, commit):
      # Allow certain lines to exceed the maxlen rule.
      if len(line) <= MAX_LEN:
        continue
      if 'http://' in line or 'https://' in line:
        continue
      if line.startswith(EXEMPT_PREFIXES):
        continue
      errors.append('%s, line %s, %s chars' % (afile, line_num, len(line)))
      if len(errors) == MAX_ERRORS:  # Just show the first 5 errors.
        break
    if len(errors) == MAX_ERRORS:
      # Also stop scanning further files so the cap holds across files.
      break

  if errors:
    msg = 'Found lines longer than %s characters (first 5 shown):' % MAX_LEN
    _report_error(msg, errors)
def _check_no_stray_whitespace(project, commit):
  """Checks that there is no stray whitespace at source lines end.

  Only lines added by the commit are examined.

  Args:
    project: Name of the project being checked (not used by this check).
    commit: The commit to check.

  Raises:
    Exception: (via _report_error) listing every offending file and line.
  """
  # NOTE(review): the include/exclude arguments of this call were missing
  # from this copy of the file; module-level lists named
  # COMMON_INCLUDED_PATHS / COMMON_EXCLUDED_PATHS are assumed -- confirm.
  files = _filter_files(_get_affected_files(commit),
                        COMMON_INCLUDED_PATHS,
                        COMMON_EXCLUDED_PATHS)
  errors = ['%s, line %s' % (afile, line_num)
            for afile in files
            for line_num, line in _get_file_diff(afile, commit)
            if line.rstrip() != line]
  if errors:
    _report_error('Found line ending with white space in:', errors)
def _check_no_tabs(project, commit):
  """Checks there are no unexpanded tabs.

  Only lines added by the commit are examined.

  Args:
    project: Name of the project being checked (not used by this check).
    commit: The commit to check.

  Raises:
    Exception: (via _report_error) listing every offending file and line.
  """
  # NOTE(review): the include/exclude arguments of this call were missing
  # from this copy of the file; module-level lists named
  # COMMON_INCLUDED_PATHS / COMMON_EXCLUDED_PATHS are assumed, and any
  # tab-specific exclusions that may have existed are not restored -- confirm.
  files = _filter_files(_get_affected_files(commit),
                        COMMON_INCLUDED_PATHS,
                        COMMON_EXCLUDED_PATHS)
  errors = ['%s, line %s' % (afile, line_num)
            for afile in files
            for line_num, line in _get_file_diff(afile, commit)
            if '\t' in line]
  if errors:
    _report_error('Found a tab character in:', errors)
def _check_change_has_test_field(project, commit):
  """Check for a non-empty 'TEST=' field in the commit message.

  Args:
    project: Name of the project being checked (not used by this check).
    commit: The commit to check.

  Raises:
    Exception: (via _report_error) if no line after the first one holds a
        'TEST=' field followed by non-whitespace text.
  """
  TEST_RE = r'\n\s*TEST\s*=[^\n]*\S+'

  # The pattern starts with a newline, so it can only match after the first
  # line of the message; it therefore needs a search, not a match at 0.
  if not re.search(TEST_RE, _get_commit_desc(commit)):
    _report_error('Changelist description needs TEST field (after first line)')
def _check_change_has_bug_field(project, commit):
  """Check for a non-empty 'BUG=' field in the commit message.

  Args:
    project: Name of the project being checked (not used by this check).
    commit: The commit to check.

  Raises:
    Exception: (via _report_error) if no line after the first one holds a
        'BUG=' field followed by non-whitespace text.
  """
  BUG_RE = r'\n\s*BUG\s*=[^\n]*\S+'

  # The pattern starts with a newline, so it can only match after the first
  # line of the message; it therefore needs a search, not a match at 0.
  if not re.search(BUG_RE, _get_commit_desc(commit)):
    _report_error('Changelist description needs BUG field (after first line)')
def _check_change_has_proper_changeid(project, commit):
  """Verify that Change-ID is present in last paragraph of commit message.

  Args:
    project: Name of the project being checked (not used by this check).
    commit: The commit to check.

  Raises:
    Exception: (via _report_error) if the message has no 'Change-Id:' line,
        or if a blank line followed by more text comes after the last one.
  """
  desc = _get_commit_desc(commit)
  loc = desc.rfind('\nChange-Id:')
  # A blank line followed by non-blank text after the last Change-Id line
  # means another paragraph follows it.
  if loc == -1 or re.search(r'\n\s*\n\s*\S+', desc[loc:]):
    _report_error('Change-Id must be in last paragraph of description.')
def _check_license(project, commit):
  """Verifies the license header.

  Every non-empty source file touched by the commit must contain the
  Chromium OS BSD license notice.

  Args:
    project: Name of the project being checked (not used by this check).
    commit: The commit to check.

  Raises:
    Exception: (via _report_error) listing the files without a valid header.
  """
  # NOTE(review): the assignment and the end of the second line ("be\n") were
  # missing from this copy of the file; they are reconstructed from the
  # license notice at the top of this very file.
  LICENSE_HEADER = (
      r".*? Copyright \(c\) 20[-0-9]{2,7} The Chromium OS Authors\. All rights "
      r"reserved\." "\n"
      r".*? Use of this source code is governed by a BSD-style license that can "
      "be\n"
      r".*? found in the LICENSE file\."
  )

  license_re = re.compile(LICENSE_HEADER, re.MULTILINE)
  bad_files = []
  # NOTE(review): the include/exclude arguments of this call were missing
  # from this copy of the file; module-level lists named
  # COMMON_INCLUDED_PATHS / COMMON_EXCLUDED_PATHS are assumed -- confirm.
  files = _filter_files(_get_affected_files(commit),
                        COMMON_INCLUDED_PATHS,
                        COMMON_EXCLUDED_PATHS)

  for f in files:
    # Close the file promptly instead of relying on garbage collection.
    with open(f) as source_file:
      contents = source_file.read()
    if not contents:
      continue  # Ignore empty files
    if not license_re.search(contents):
      bad_files.append(f)
  if bad_files:
    _report_error('License must match:\n%s\n' % license_re.pattern +
                  'Found a bad license header in these files:',
                  bad_files)
# Project-specific hooks
def _run_checkpatch(project, commit):
  """Runs checkpatch.pl on the given project.

  The diff of the commit is piped to the script's standard input.

  Args:
    project: Name of the project being checked (not used by this check).
    commit: The commit to check.

  Raises:
    Exception: (via _report_error) carrying the script's output if it exits
        with a non-zero status.
  """
  hooks_dir = _get_hooks_dir()
  # NOTE(review): the script name was missing from this copy of the file
  # (the command pointed at the hooks directory itself, which cannot be
  # executed). 'checkpatch.pl' is assumed from the function name -- confirm.
  cmd = ['%s/checkpatch.pl' % hooks_dir, '-']
  p = subprocess.Popen(cmd, stdin=subprocess.PIPE, stdout=subprocess.PIPE)
  output = p.communicate(_get_diff(commit))[0]
  if p.returncode:
    _report_error('checkpatch.pl errors/warnings\n\n' + output)
def _run_json_check(project, commit):
  """Checks that all JSON files are syntactically valid.

  Args:
    project: Name of the project being checked (not used by this check).
    commit: The commit to check.

  Raises:
    Exception: (via _report_error) naming the first file that fails to parse.
  """
  # The pattern is anchored so that names merely containing '.json'
  # (e.g. 'foo.json.bak') are not parsed as JSON.
  for f in _filter_files(_get_affected_files(commit), [r'.*\.json$']):
    # NOTE(review): the 'try' and the parsing call were missing from this
    # copy of the file; json.load on the opened file is assumed.
    try:
      with open(f) as json_file:
        json.load(json_file)
    except Exception as e:
      _report_error('Invalid JSON in %s: %s' % (f, e))
# Base
# Hooks that are run for every project.
# NOTE(review): this list was truncated after its first entry in this copy of
# the file. The remaining entries are the other checks defined in the
# "Common Hooks" section; their original order is unknown -- confirm.
COMMON_HOOKS = [_check_change_has_bug_field,
                _check_change_has_test_field,
                _check_change_has_proper_changeid,
                _check_no_long_lines,
                _check_no_stray_whitespace,
                _check_no_tabs,
                _check_license]
def _setup_project_hooks():
  """Returns a dictionary of callbacks: dict[project] = [callback1, callback2]

  The keys are project names; each value lists the hooks that are run for
  that project only, in addition to the common ones.
  """
  return {
    "chromiumos/third_party/kernel": [_run_checkpatch],
    "chromiumos/third_party/kernel-next": [_run_checkpatch],
    "chromeos/autotest-tools": [_run_json_check],
  }
def _run_project_hooks(project, hooks):
  """For each project run its project specific hook from the hooks dictionary

  Every commit under review is passed to each common hook and then to each
  hook registered for the project.

  Args:
    project: Name of the project to check.
    hooks: Dictionary mapping project names to lists of hook callbacks.

  Raises:
    Whatever a failing hook raises; the failing commit and project are
    printed to stderr before the exception is re-raised.
  """
  proj_dir = _run_command(['repo', 'forall', project, '-c', 'pwd']).strip()
  pwd = os.getcwd()

  # hooks assume they are run from the root of the project
  # NOTE(review): the chdir calls and the try/except scaffolding were missing
  # from this copy of the file; they are reconstructed from this comment, the
  # saved 'pwd' and the error message below -- confirm.
  os.chdir(proj_dir)
  try:
    project_specific_hooks = hooks.get(project, [])

    for commit in _get_commits():
      try:
        for hook in COMMON_HOOKS + project_specific_hooks:
          hook(project, commit)
      except Exception:
        msg = 'ERROR: pre-upload failed: commit=%s, project=%s' % (commit[:8],
                                                                   project)
        sys.stderr.write(msg + '\n')
        raise
  finally:
    # Restore the caller's working directory even when a hook fails.
    os.chdir(pwd)
# Main
def main(project_list, **kwargs):
  """Runs the pre-upload hooks of every project in project_list.

  Args:
    project_list: The names of the projects to check.
    **kwargs: Accepted for the caller's benefit; not used here.
  """
  project_hooks = _setup_project_hooks()
  for project_name in project_list:
    _run_project_hooks(project_name, project_hooks)
if __name__ == '__main__':