2020-01-10 18:19:42 +00:00
|
|
|
#!/usr/bin/env python3
|
|
|
|
# Copyright 2020 Google LLC.
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
#
|
|
|
|
################################################################################
|
|
|
|
"""Check code for common issues before submitting."""
|
|
|
|
|
|
|
|
import argparse
|
|
|
|
import os
|
|
|
|
import subprocess
|
|
|
|
import sys
|
2020-02-21 16:47:13 +00:00
|
|
|
import unittest
|
2020-01-10 18:19:42 +00:00
|
|
|
import yaml
|
|
|
|
|
|
|
|
# Absolute path of the directory two levels above this file, i.e. the parent
# of the directory that contains this script. main() changes into it.
_SRC_ROOT = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
|
|
|
|
|
|
|
|
|
|
|
|
def _is_project_file(actual_path, expected_filename):
    """Returns True if |actual_path| is named |expected_filename|, sits in a
    directory whose parent directory is called "projects" (that is,
    projects/<project>/<expected_filename>), and exists on disk."""
    project_dir, filename = os.path.split(actual_path)
    container_name = os.path.basename(os.path.dirname(project_dir))
    return (filename == expected_filename and
            container_name == 'projects' and
            os.path.exists(actual_path))
|
|
|
|
|
|
|
|
|
|
|
|
# TODO: Check for -fsanitize=fuzzer in files as well.
|
|
|
|
|
|
|
|
|
|
|
|
def _check_one_lib_fuzzing_engine(build_sh_file):
    """Returns False if |build_sh_file| contains -lFuzzingEngine.

    This is deprecated behavior. $LIB_FUZZING_ENGINE should be used instead
    so that -fsanitize=fuzzer is used.

    Paths that are not an existing projects/<project>/build.sh are not
    inspected and yield True. Anything after a '#' on a line is treated as a
    comment and ignored. Only the first offending line is reported, using a
    1-based line number.
    """
    if not _is_project_file(build_sh_file, 'build.sh'):
        return True

    message = ('Error: build.sh contains deprecated "-lFuzzingEngine" on line: '
               '{0}. Please use "$LIB_FUZZING_ENGINE" instead.')
    with open(build_sh_file) as build_sh:
        # Count from 1 so the reported number matches what editors display.
        for line_num, line in enumerate(build_sh, start=1):
            uncommented_code = line.split('#')[0]
            if '-lFuzzingEngine' in uncommented_code:
                print(message.format(line_num))
                return False
    return True
|
|
|
|
|
|
|
|
|
|
|
|
def check_lib_fuzzing_engine(paths):
    """Run _check_one_lib_fuzzing_engine on every path in |paths|. Returns
    True only when each individual check returned True."""
    # Check every path before combining the results so that all errors are
    # reported in a single run instead of stopping at the first failure.
    results = []
    for path in paths:
        results.append(_check_one_lib_fuzzing_engine(path))
    return all(results)
|
|
|
|
|
|
|
|
|
|
|
|
class ProjectYamlChecker:
    """Checks for a project.yaml file.

    Construct with the path of a project.yaml and call do_checks(). Each
    failed check prints a message through error() and sets self.success to
    False; do_checks() returns the final value of self.success.
    """

    # Sections in a project.yaml and the constant values that they are allowed
    # to have.
    SECTIONS_AND_CONSTANTS = {
        'sanitizers': {'address', 'none', 'memory', 'undefined', 'dataflow'},
        'architectures': {'i386', 'x86_64'},
        'fuzzing_engines': {
            'afl', 'libfuzzer', 'honggfuzz', 'dataflow', 'none'
        },
    }

    # Note: this list must be updated when we allow new sections.
    VALID_SECTION_NAMES = [
        'architectures',
        'auto_ccs',
        'blackbox',
        'builds_per_day',
        'coverage_extra_args',
        'disabled',
        'fuzzing_engines',
        'help_url',
        'homepage',
        'language',
        'labels',  # For internal use only, hard to lint as it uses fuzzer names.
        'main_repo',
        'primary_contact',
        'run_tests',
        'sanitizers',
        'selective_unpack',
        'vendor_ccs',
        'view_restrictions',
    ]

    LANGUAGES_SUPPORTED = [
        'c',
        'c++',
        'go',
        'python',
        'rust',
    ]

    # Note that some projects like boost only have auto-ccs. However, forgetting
    # primary contact is probably a mistake.
    REQUIRED_SECTIONS = ['primary_contact', 'main_repo']

    def __init__(self, filename):
        """Load |filename| as YAML and start with a passing state."""
        self.filename = filename
        with open(filename) as file_handle:
            # safe_load returns None for an empty document. Fall back to an
            # empty mapping so the checks report the missing sections instead
            # of failing with AttributeError on None.
            self.data = yaml.safe_load(file_handle) or {}

        self.success = True

    def do_checks(self):
        """Do all project.yaml checks. Return True if they pass."""
        if self.is_disabled():
            return True

        checks = [
            self.check_project_yaml_constants,
            self.check_required_sections,
            self.check_valid_section_names,
            self.check_valid_emails,
            self.check_valid_language,
        ]
        # Run every check (no early exit) so all problems are printed at once.
        for check_function in checks:
            check_function()
        return self.success

    def is_disabled(self):
        """Is this project disabled."""
        return self.data.get('disabled', False)

    def error(self, message):
        """Print an error message and set self.success to False."""
        self.success = False
        print('Error in {filename}: {message}'.format(filename=self.filename,
                                                      message=message))

    def check_project_yaml_constants(self):
        """Check that certain sections only have certain constant values."""
        for section, allowed_constants in self.SECTIONS_AND_CONSTANTS.items():
            if section not in self.data:
                continue
            actual_constants = self.data[section]
            if not isinstance(actual_constants, (list, tuple, dict)):
                # A scalar or empty section cannot be iterated entry by entry
                # (a string would be split into characters, None would raise).
                self.error(
                    '{section} section must be a list of constants, not '
                    '{value!r}.'.format(section=section,
                                        value=actual_constants))
                continue
            for constant in actual_constants:
                if isinstance(constant, str):
                    if constant not in allowed_constants:
                        # Sort so the message is the same on every run.
                        allowed = ', '.join(sorted(allowed_constants))
                        self.error(
                            ('{constant} (in {section} section) is not a valid '
                             'constant ({allowed_constants}).').format(
                                 constant=constant,
                                 section=section,
                                 allowed_constants=allowed))
                elif isinstance(constant, dict):
                    # The only alternative value allowed is the experimental
                    # flag, i.e. `constant == {'memory': {'experimental':
                    # True}}`. Do not check the experimental flag, but assert
                    # that the sanitizer is a valid one. Requiring exactly one
                    # key also rejects an empty mapping.
                    if (len(constant) != 1 or
                            next(iter(constant)) not in allowed_constants):
                        self.error('Not allowed value in the project.yaml: ' +
                                   str(constant))
                else:
                    self.error('Not allowed value in the project.yaml: ' +
                               str(constant))

    def check_valid_section_names(self):
        """Check that only valid sections are included."""
        for name in self.data:
            if name not in self.VALID_SECTION_NAMES:
                self.error(
                    '{name} is not a valid section name ({valid_names})'.format(
                        name=name, valid_names=self.VALID_SECTION_NAMES))

    def check_required_sections(self):
        """Check that all required sections are present."""
        for section in self.REQUIRED_SECTIONS:
            if section not in self.data:
                self.error(section + ' section is missing.')

    def check_valid_emails(self):
        """Check that emails are valid looking."""
        # Get email addresses.
        email_addresses = []
        primary_contact = self.data.get('primary_contact')
        if primary_contact:
            email_addresses.append(primary_contact)
        auto_ccs = self.data.get('auto_ccs')
        if auto_ccs:
            if isinstance(auto_ccs, (list, tuple)):
                email_addresses.extend(auto_ccs)
            else:
                # A single value: extend() would split a string into
                # characters and flag each one as an invalid address.
                email_addresses.append(auto_ccs)

        # Sanity check them.
        for email_address in email_addresses:
            if (not isinstance(email_address, str) or
                    '@' not in email_address or '.' not in email_address):
                self.error(str(email_address) + ' is an invalid email address.')

    def check_valid_language(self):
        """Check that the language is specified and valid."""
        language = self.data.get('language')
        if not language:
            self.error('Missing "language" attribute in project.yaml.')
        elif language not in self.LANGUAGES_SUPPORTED:
            self.error(
                '"language: {language}" is not supported ({supported}).'.format(
                    language=language, supported=self.LANGUAGES_SUPPORTED))
|
2020-01-30 23:36:44 +00:00
|
|
|
|
2020-01-10 18:19:42 +00:00
|
|
|
|
|
|
|
def _check_one_project_yaml(project_yaml_filename):
    """Run the ProjectYamlChecker checks on |project_yaml_filename|. Paths
    that are not an existing projects/<project>/project.yaml are skipped and
    count as passing."""
    if _is_project_file(project_yaml_filename, 'project.yaml'):
        return ProjectYamlChecker(project_yaml_filename).do_checks()
    return True
|
|
|
|
|
|
|
|
|
|
|
|
def check_project_yaml(paths):
    """Run _check_one_project_yaml on every path in |paths|. Returns True
    only when each individual check returned True."""
    # Deliberately no early exit: every path is checked so that all errors
    # are printed in one run.
    passed = True
    for path in paths:
        if not _check_one_project_yaml(path):
            passed = False
    return passed
|
|
|
|
|
|
|
|
|
|
|
|
def do_checks(changed_files):
    """Run all presubmit checks, passing |changed_files| to each one. Returns
    False if any of them fails."""
    checks = (
        check_license,
        yapf,
        lint,
        check_project_yaml,
        check_lib_fuzzing_engine,
    )
    # Collect every result before combining them (here and wherever else
    # all() is used) so that a failure does not stop the remaining checks.
    # Reporting as many errors as possible at once means fewer check-fix-check
    # cycles for the user.
    results = []
    for check in checks:
        results.append(check(changed_files))
    return all(results)
|
|
|
|
|
|
|
|
|
|
|
|
# check_license() inspects a file when its base name is listed here...
_CHECK_LICENSE_FILENAMES = ['Dockerfile']
# ...or when its extension is listed here.
_CHECK_LICENSE_EXTENSIONS = [
    '.bash', '.c', '.cc', '.cpp', '.css', '.h',
    '.htm', '.html', '.js', '.proto', '.py', '.sh',
]

# Text that must appear somewhere in an inspected file for it to count as
# carrying the license header.
_LICENSE_STRING = 'http://www.apache.org/licenses/LICENSE-2.0'
|
|
|
|
|
|
|
|
|
|
|
|
def check_license(paths):
    """Validate license header.

    Only files whose base name is in _CHECK_LICENSE_FILENAMES or whose
    extension is in _CHECK_LICENSE_EXTENSIONS are read. Prints one message
    per file that lacks _LICENSE_STRING and returns False if there was any;
    returns True otherwise (including when |paths| is empty).
    """
    if not paths:
        return True

    all_licensed = True
    for path in paths:
        base_name = os.path.basename(path)
        _, suffix = os.path.splitext(path)
        needs_license = (base_name in _CHECK_LICENSE_FILENAMES or
                         suffix in _CHECK_LICENSE_EXTENSIONS)
        if not needs_license:
            continue

        with open(path) as file_handle:
            contents = file_handle.read()
        if _LICENSE_STRING in contents:
            continue

        print('Missing license header in file %s.' % str(path))
        all_licensed = False

    return all_licensed
|
|
|
|
|
|
|
|
|
|
|
|
def bool_to_returncode(success):
    """Translate |success| into a process exit code: prints 'Success.' and
    returns 0 when it is truthy, otherwise prints 'Failed.' and returns 1."""
    if not success:
        print('Failed.')
        return 1

    print('Success.')
    return 0
|
|
|
|
|
|
|
|
|
2020-11-19 15:40:10 +00:00
|
|
|
def is_nonfuzzer_python(path):
    """Returns True if |path| has a .py extension and does not contain
    '/projects/'."""
    extension = os.path.splitext(path)[1]
    if extension != '.py':
        return False
    return '/projects/' not in path
|
2020-01-10 18:19:42 +00:00
|
|
|
|
|
|
|
|
2021-01-20 20:34:29 +00:00
|
|
|
def lint(_=None):
    """Run pylint on the infra directory. Return False if it fails linting.

    The whole 'infra' directory (resolved against the current working
    directory) is linted regardless of which files changed. The optional
    positional argument is ignored; it is accepted only so that lint can be
    invoked with a list of paths in the same way as the other checks that
    do_checks() runs, which would otherwise raise TypeError.
    """
    command = ['python3', '-m', 'pylint', '-j', '0', 'infra']
    # check=False: a non-zero exit status is reported through the return
    # value rather than as an exception.
    returncode = subprocess.run(command, check=False).returncode
    return returncode == 0
|
|
|
|
|
|
|
|
|
|
|
|
def yapf(paths, validate=True):
    """Run yapf over the entries of |paths| accepted by is_nonfuzzer_python.

    When |validate| is true yapf only prints a diff (-d); otherwise it
    rewrites the files in place (-i). Returns True when there is nothing to
    process or yapf exits with status 0, and False otherwise.
    """
    python_files = []
    for path in paths:
        if is_nonfuzzer_python(path):
            python_files.append(path)
    if not python_files:
        return True

    mode_flag = '-i'
    if validate:
        mode_flag = '-d'
    command = ['yapf', mode_flag, '-p'] + python_files

    completed = subprocess.run(command, check=False)
    return completed.returncode == 0
|
|
|
|
|
|
|
|
|
|
|
|
def get_changed_files():
    """Return a list of absolute paths of files changed in this git branch.

    The list comes from `git diff --name-only FETCH_HEAD`; entries that are
    not existing files relative to the current directory are dropped.
    """
    # FIXME: This doesn't work if branch is behind master.
    raw_output = subprocess.check_output(
        ['git', 'diff', '--name-only', 'FETCH_HEAD'])
    changed_files = []
    for path in raw_output.decode().splitlines():
        if os.path.isfile(path):
            changed_files.append(os.path.abspath(path))
    return changed_files
|
|
|
|
|
|
|
|
|
2021-01-20 20:34:29 +00:00
|
|
|
def run_tests(relevant_files):
    """Discover and run the *_test.py unit tests found under every directory
    that contains one of |relevant_files|. Returns True if no test failed or
    errored."""
    changed_dirs = {os.path.dirname(file) for file in relevant_files}

    # TODO(metzman): This approach for running tests is flawed since tests can
    # fail even if their directory isn't changed. Figure out if it is needed (to
    # save time) and remove it if it isn't.
    # A fresh TestLoader is used for each directory.
    suites = [
        unittest.TestLoader().discover(changed_dir, pattern='*_test.py')
        for changed_dir in changed_dirs
    ]
    outcome = unittest.TextTestRunner().run(unittest.TestSuite(suites))
    return not (outcome.failures or outcome.errors)
|
2020-02-21 16:47:13 +00:00
|
|
|
|
|
|
|
|
2020-12-18 18:43:22 +00:00
|
|
|
def get_all_files():
    """Returns a list of absolute paths of the files reported by
    `git ls-files` that exist as regular files."""
    listing = subprocess.check_output(['git', 'ls-files']).decode()
    all_files = []
    for path in listing.splitlines():
        if os.path.isfile(path):
            all_files.append(os.path.abspath(path))
    return all_files
|
|
|
|
|
|
|
|
|
2020-01-10 18:19:42 +00:00
|
|
|
def main():
    """Check changes on a branch for common issues before submitting.

    With no command, every presubmit check (but no tests) is run. With one of
    the commands 'format', 'lint', 'license' or 'infra-tests', only that step
    is run. Returns the exit code produced by bool_to_returncode: 0 on
    success, 1 on failure.
    """
    # Get program arguments.
    parser = argparse.ArgumentParser(
        description='Presubmit script for oss-fuzz.')
    parser.add_argument('command',
                        choices=['format', 'lint', 'license', 'infra-tests'],
                        nargs='?')
    parser.add_argument('--all-files',
                        action='store_true',
                        help='Run presubmit check(s) on all files',
                        default=False)
    args = parser.parse_args()

    # Change directory BEFORE asking git for paths. `git diff --name-only`
    # prints paths relative to the top of the working tree, so the
    # os.path.isfile()/abspath() calls on them only resolve from there; run
    # from a subdirectory, changed files would be silently dropped. Likewise
    # `git ls-files` only lists files below the current directory.
    # NOTE(review): assumes _SRC_ROOT is the top of the git working tree; the
    # lint step's relative 'infra' path already depends on this chdir.
    os.chdir(_SRC_ROOT)

    if args.all_files:
        relevant_files = get_all_files()
    else:
        relevant_files = get_changed_files()

    # Do one specific check if the user asked for it.
    if args.command == 'format':
        success = yapf(relevant_files, False)
        return bool_to_returncode(success)

    if args.command == 'lint':
        success = lint()
        return bool_to_returncode(success)

    if args.command == 'license':
        success = check_license(relevant_files)
        return bool_to_returncode(success)

    if args.command == 'infra-tests':
        success = run_tests(relevant_files)
        return bool_to_returncode(success)

    # Do all the checks (but no tests).
    success = do_checks(relevant_files)

    return bool_to_returncode(success)
|
|
|
|
|
|
|
|
|
|
|
|
# Script entry point: main()'s return value becomes the process exit status.
if __name__ == '__main__':
    exit_code = main()
    sys.exit(exit_code)
|