support/mesos-style.py - mesos - Git at Google

 #!/usr/bin/env python

 ''' Runs checks for mesos style. '''

 import os
 import re
 import string
 import subprocess
 import sys


 class LinterBase(object):
     '''
     This is an abstract class that provides the base functionality for
     linting files in the mesos project. Its 'main()' function
     walks through the set of files passed to it and runs some
     standard linting over them. This includes checking for license headers
     and checking for non-supported characters. From there it calls a
     'run_lint()' function that can be overridden to provide
     customizable style checks for a specific class of files (e.g. C++,
     Python, etc.).

     Any class that extends from 'LinterBase' should override the
     following class variables / functions:

     linter_type
     source_dirs
     exclude_files
     source_files
     comment_prefix

     run_lint()

     Please see the comments below for details on how to override each
     variable.
     '''
     # The name of the linter to help with printing which linter files
     # are currently being processed by.
     linter_type = ''

     # Root source paths (will be traversed recursively).
     source_dirs = []

     # Add file paths and patterns which should not be checked
     # This should include 3rdparty libraries, includes and machine generated
     # source.
     exclude_files = ''

     # A regex of possible matches for your source files.
     source_files = ''

     # A prefix at the beginning of the line to demark comments (e.g. '//')
     comment_prefix = ''

     def find_candidates(self, root_dir):
         '''
         Search through the all files rooted at 'root_dir' and compare
         them against 'self.exclude_files' and 'self.source_files' to
         come up with a set of candidate files to lint.
         '''
         exclude_file_regex = re.compile(self.exclude_files)
         source_criteria_regex = re.compile(self.source_files)
         for root, dirs, files in os.walk(root_dir):
             for name in files:
                 path = os.path.join(root, name)
                 if exclude_file_regex.search(path) is not None:
                     continue

                 if source_criteria_regex.search(name) is not None:
                     yield path

     def run_lint(self, source_paths):
         '''
         A custom function to provide linting for 'linter_type'.
         It takes a list of source files to lint and returns the number
         of errors found during the linting process.

         It should print any errors as it encounters them to provide
         feedback to the caller.
         '''
         pass

     def check_license_header(self, source_paths):
         ''' Checks the license headers of the given files. '''
         error_count = 0
         for path in source_paths:
             with open(path) as source_file:
                 head = source_file.readline()

                 # Check that opening comment has correct style.
                 # TODO(bbannier) We allow `Copyright` for currently deviating files.
                 # This should be removed one we have a uniform license format.
                 regex = r'^{comment_prefix} [Licensed|Copyright]'.\
                             format(comment_prefix=self.comment_prefix)
                 if not re.match(regex, head):
                     sys.stderr.write(
                         "{path}:1:  A license header should appear on the file's "
                         "first line starting with '{comment_prefix} Licensed'.: {head}".\
                             format(path=path, head=head, comment_prefix=self.comment_prefix))
                     error_count += 1

         return error_count

     def check_encoding(self, source_paths):
         '''
         Checks for encoding errors in the given files. Source
         code files must contain only printable ascii characters.
         This excludes the extended ascii characters 128-255.
         http://www.asciitable.com/
         '''
         error_count = 0
         for path in source_paths:
             with open(path) as source_file:
                 for line_number, line in enumerate(source_file):
                     # If we find an error, add 1 to both the character and
                     # the line offset to give them 1-based indexing
                     # instead of 0 (as is common in most editors).
                     char_errors = [offset for offset, char in enumerate(line)
                                    if char not in string.printable]
                     if char_errors:
                         sys.stderr.write(
                             "{path}:{line_number}:  Non-printable characters"
                             " found at [{offsets}]: \"{line}\"\n".format(
                                 path=path,
                                 line_number=line_number + 1,
                                 offsets=', '.join([str(offset + 1) for offset
                                                    in char_errors]),
                                 line=line.rstrip()))
                         error_count += 1

         return error_count

     def main(self, file_list):
         '''
         This function takes a list of files and lints them for the
         class of files defined by 'linter_type'.
         '''

         # Verify that source roots are accessible from current working directory.
         # A common error could be to call the style checker from other
         # (possibly nested) paths.
         for source_dir in self.source_dirs:
             if not os.path.exists(source_dir):
                 print "Could not find '{dir}'".format(dir=source_dir)
                 print 'Please run from the root of the mesos source directory'
                 exit(1)

         # Add all source file candidates to candidates list.
         candidates = []
         for source_dir in self.source_dirs:
             for candidate in self.find_candidates(source_dir):
                 candidates.append(candidate)

         # If file paths are specified, check all file paths that are
         # candidates; else check all candidates.
         file_paths = file_list if len(file_list) > 0 else candidates

         # Compute the set intersect of the input file paths and candidates.
         # This represents the reduced set of candidates to run lint on.
         candidates_set = set(candidates)
         clean_file_paths_set = set(map(lambda x: x.rstrip(), file_paths))
         filtered_candidates_set = clean_file_paths_set.intersection(
             candidates_set)

         if filtered_candidates_set:
             plural = '' if len(filtered_candidates_set) == 1 else 's'
             print 'Checking {num_files} {linter} file{plural}'.\
                     format(num_files=len(filtered_candidates_set),
                            linter=self.linter_type,
                            plural=plural)

             license_errors = self.check_license_header(filtered_candidates_set)
             encoding_errors = self.check_encoding(list(filtered_candidates_set))
             lint_errors = self.run_lint(list(filtered_candidates_set))
             total_errors = license_errors + encoding_errors + lint_errors

             sys.stderr.write('Total errors found: {num_errors}\n'.\
                                 format(num_errors=total_errors))

             return total_errors
         else:
             print "No {linter} files to lint".format(linter=self.linter_type)
             return 0


 class CppLinter(LinterBase):
     linter_type = 'C++'

     source_dirs = ['src',
                    'include',
                    os.path.join('3rdparty', 'libprocess'),
                    os.path.join('3rdparty', 'stout')]

     exclude_files = '(protobuf\-2\.4\.1|gmock\-1\.6\.0|glog\-0\.3\.3|boost\-1\.53\.0|libev\-4\.15|java/jni|\.pb\.cc|\.pb\.h|\.md|\.virtualenv)'

     source_files = '\.(cpp|hpp|cc|h)$'

     comment_prefix = '\/\/'

     def run_lint(self, source_paths):
         '''
         Runs cpplint over given files.

         http://google-styleguide.googlecode.com/svn/trunk/cpplint/cpplint.py
         '''

         # See cpplint.py for full list of rules.
         active_rules = [
             'build/class',
             'build/deprecated',
             'build/endif_comment',
             'build/nullptr',
             'readability/todo',
             'readability/namespace',
             'runtime/vlog',
             'whitespace/blank_line',
             'whitespace/comma',
             'whitespace/end_of_line',
             'whitespace/ending_newline',
             'whitespace/forcolon',
             'whitespace/indent',
             'whitespace/line_length',
             'whitespace/operators',
             'whitespace/semicolon',
             'whitespace/tab',
             'whitespace/comments',
             'whitespace/todo']

         rules_filter = '--filter=-,+' + ',+'.join(active_rules)
         p = subprocess.Popen(
             ['python', 'support/cpplint.py', rules_filter] + source_paths,
             stderr=subprocess.PIPE,
             close_fds=True)

         # Lines are stored and filtered, only showing found errors instead
         # of e.g., 'Done processing XXX.' which tends to be dominant output.
         for line in p.stderr:
             if re.match('^(Done processing |Total errors found: )', line):
                 continue
             sys.stderr.write(line)

         p.wait()
         return p.returncode


 class PyLinter(LinterBase):
     linter_type = 'Python'

     source_dirs = ['src/cli_new']

     exclude_files = '(protobuf\-2\.4\.1|gmock\-1\.6\.0|glog\-0\.3\.3|boost\-1\.53\.0|libev\-4\.15|java/jni|\.virtualenv)'

     source_files = '\.(py)$'

     comment_prefix = '#'

     def __check_virtualenv(self):
         cli_dir = os.path.abspath(self.source_dirs[0])

         if not os.path.isdir(os.path.join(cli_dir, '.virtualenv')):
             print 'Virtualenv not detected... Building'

             p = subprocess.Popen(
                 [os.path.join(cli_dir, 'bootstrap')],
                 stdout=subprocess.PIPE)

             output = ''
             for line in p.stdout:
                 output += line

             p.wait()

             if p.returncode != 0:
                 sys.stderr.write(output)
                 sys.exit(1);

     def run_lint(self, source_paths):
         '''
         Runs pylint over given files.

         https://google.github.io/styleguide/pyguide.html
         '''

         cli_dir = os.path.abspath(self.source_dirs[0])
         source_files = ' '.join(source_paths)

         self.__check_virtualenv()

         p = subprocess.Popen(
             ['. {virtualenv_dir}/bin/activate; \
              PYTHONPATH={lib_dir}:{bin_dir} pylint --rcfile={config} --ignore={ignore} {files}'.\
              format(virtualenv_dir=os.path.join(cli_dir, '.virtualenv'),
                     lib_dir=os.path.join(cli_dir,'lib'),
                     bin_dir=os.path.join(cli_dir,'bin'),
                     config=os.path.join(cli_dir, 'pylint.config'),
                     ignore=os.path.join(cli_dir, 'bin', 'mesos'),
                     files=source_files)],
             shell=True, stdout=subprocess.PIPE)

         num_errors = 0
         for line in p.stdout:
             if not line.startswith('*'):
                 num_errors += 1
             sys.stderr.write(line)

         return num_errors


 if __name__ == '__main__':
     cpp_linter = CppLinter()
     cpp_errors = cpp_linter.main(sys.argv[1:])
     py_linter = PyLinter()
     py_errors = py_linter.main(sys.argv[1:])
     sys.exit(cpp_errors + py_errors)
	#!/usr/bin/env python

	''' Runs checks for mesos style. '''

	import os
	import re
	import string
	import subprocess
	import sys


	class LinterBase(object):
	'''
	This is an abstract class that provides the base functionality for
	linting files in the mesos project. Its 'main()' function
	walks through the set of files passed to it and runs some
	standard linting over them. This includes checking for license headers
	and checking for non-supported characters. From there it calls a
	'run_lint()' function that can be overridden to provide
	customizable style checks for a specific class of files (e.g. C++,
	Python, etc.).

	Any class that extends from 'LinterBase' should override the
	following class variables / functions:

	linter_type
	source_dirs
	exclude_files
	source_files
	comment_prefix

	run_lint()

	Please see the comments below for details on how to override each
	variable.
	'''
	# The name of the linter to help with printing which linter files
	# are currently being processed by.
	linter_type = ''

	# Root source paths (will be traversed recursively).
	source_dirs = []

	# Add file paths and patterns which should not be checked
	# This should include 3rdparty libraries, includes and machine generated
	# source.
	exclude_files = ''

	# A regex of possible matches for your source files.
	source_files = ''

	# A prefix at the beginning of the line to demark comments (e.g. '//')
	comment_prefix = ''

	def find_candidates(self, root_dir):
	'''
	Search through the all files rooted at 'root_dir' and compare
	them against 'self.exclude_files' and 'self.source_files' to
	come up with a set of candidate files to lint.
	'''
	exclude_file_regex = re.compile(self.exclude_files)
	source_criteria_regex = re.compile(self.source_files)
	for root, dirs, files in os.walk(root_dir):
	for name in files:
	path = os.path.join(root, name)
	if exclude_file_regex.search(path) is not None:
	continue

	if source_criteria_regex.search(name) is not None:
	yield path

	def run_lint(self, source_paths):
	'''
	A custom function to provide linting for 'linter_type'.
	It takes a list of source files to lint and returns the number
	of errors found during the linting process.

	It should print any errors as it encounters them to provide
	feedback to the caller.
	'''
	pass

	def check_license_header(self, source_paths):
	''' Checks the license headers of the given files. '''
	error_count = 0
	for path in source_paths:
	with open(path) as source_file:
	head = source_file.readline()

	# Check that opening comment has correct style.
	# TODO(bbannier) We allow `Copyright` for currently deviating files.
	# This should be removed one we have a uniform license format.
	regex = r'^{comment_prefix} [Licensed\|Copyright]'.\
	format(comment_prefix=self.comment_prefix)
	if not re.match(regex, head):
	sys.stderr.write(
	"{path}:1: A license header should appear on the file's "
	"first line starting with '{comment_prefix} Licensed'.: {head}".\
	format(path=path, head=head, comment_prefix=self.comment_prefix))
	error_count += 1

	return error_count

	def check_encoding(self, source_paths):
	'''
	Checks for encoding errors in the given files. Source
	code files must contain only printable ascii characters.
	This excludes the extended ascii characters 128-255.
	http://www.asciitable.com/
	'''
	error_count = 0
	for path in source_paths:
	with open(path) as source_file:
	for line_number, line in enumerate(source_file):
	# If we find an error, add 1 to both the character and
	# the line offset to give them 1-based indexing
	# instead of 0 (as is common in most editors).
	char_errors = [offset for offset, char in enumerate(line)
	if char not in string.printable]
	if char_errors:
	sys.stderr.write(
	"{path}:{line_number}: Non-printable characters"
	" found at [{offsets}]: \"{line}\"\n".format(
	path=path,
	line_number=line_number + 1,
	offsets=', '.join([str(offset + 1) for offset
	in char_errors]),
	line=line.rstrip()))
	error_count += 1

	return error_count

	def main(self, file_list):
	'''
	This function takes a list of files and lints them for the
	class of files defined by 'linter_type'.
	'''

	# Verify that source roots are accessible from current working directory.
	# A common error could be to call the style checker from other
	# (possibly nested) paths.
	for source_dir in self.source_dirs:
	if not os.path.exists(source_dir):
	print "Could not find '{dir}'".format(dir=source_dir)
	print 'Please run from the root of the mesos source directory'
	exit(1)

	# Add all source file candidates to candidates list.
	candidates = []
	for source_dir in self.source_dirs:
	for candidate in self.find_candidates(source_dir):
	candidates.append(candidate)

	# If file paths are specified, check all file paths that are
	# candidates; else check all candidates.
	file_paths = file_list if len(file_list) > 0 else candidates

	# Compute the set intersect of the input file paths and candidates.
	# This represents the reduced set of candidates to run lint on.
	candidates_set = set(candidates)
	clean_file_paths_set = set(map(lambda x: x.rstrip(), file_paths))
	filtered_candidates_set = clean_file_paths_set.intersection(
	candidates_set)

	if filtered_candidates_set:
	plural = '' if len(filtered_candidates_set) == 1 else 's'
	print 'Checking {num_files} {linter} file{plural}'.\
	format(num_files=len(filtered_candidates_set),
	linter=self.linter_type,
	plural=plural)

	license_errors = self.check_license_header(filtered_candidates_set)
	encoding_errors = self.check_encoding(list(filtered_candidates_set))
	lint_errors = self.run_lint(list(filtered_candidates_set))
	total_errors = license_errors + encoding_errors + lint_errors

	sys.stderr.write('Total errors found: {num_errors}\n'.\
	format(num_errors=total_errors))

	return total_errors
	else:
	print "No {linter} files to lint".format(linter=self.linter_type)
	return 0


	class CppLinter(LinterBase):
	linter_type = 'C++'

	source_dirs = ['src',
	'include',
	os.path.join('3rdparty', 'libprocess'),
	os.path.join('3rdparty', 'stout')]

	exclude_files = '(protobuf\-2\.4\.1\|gmock\-1\.6\.0\|glog\-0\.3\.3\|boost\-1\.53\.0\|libev\-4\.15\|java/jni\|\.pb\.cc\|\.pb\.h\|\.md\|\.virtualenv)'

	source_files = '\.(cpp\|hpp\|cc\|h)$'

	comment_prefix = '\/\/'

	def run_lint(self, source_paths):
	'''
	Runs cpplint over given files.

	http://google-styleguide.googlecode.com/svn/trunk/cpplint/cpplint.py
	'''

	# See cpplint.py for full list of rules.
	active_rules = [
	'build/class',
	'build/deprecated',
	'build/endif_comment',
	'build/nullptr',
	'readability/todo',
	'readability/namespace',
	'runtime/vlog',
	'whitespace/blank_line',
	'whitespace/comma',
	'whitespace/end_of_line',
	'whitespace/ending_newline',
	'whitespace/forcolon',
	'whitespace/indent',
	'whitespace/line_length',
	'whitespace/operators',
	'whitespace/semicolon',
	'whitespace/tab',
	'whitespace/comments',
	'whitespace/todo']

	rules_filter = '--filter=-,+' + ',+'.join(active_rules)
	p = subprocess.Popen(
	['python', 'support/cpplint.py', rules_filter] + source_paths,
	stderr=subprocess.PIPE,
	close_fds=True)

	# Lines are stored and filtered, only showing found errors instead
	# of e.g., 'Done processing XXX.' which tends to be dominant output.
	for line in p.stderr:
	if re.match('^(Done processing \|Total errors found: )', line):
	continue
	sys.stderr.write(line)

	p.wait()
	return p.returncode


	class PyLinter(LinterBase):
	linter_type = 'Python'

	source_dirs = ['src/cli_new']

	exclude_files = '(protobuf\-2\.4\.1\|gmock\-1\.6\.0\|glog\-0\.3\.3\|boost\-1\.53\.0\|libev\-4\.15\|java/jni\|\.virtualenv)'

	source_files = '\.(py)$'

	comment_prefix = '#'

	def __check_virtualenv(self):
	cli_dir = os.path.abspath(self.source_dirs[0])

	if not os.path.isdir(os.path.join(cli_dir, '.virtualenv')):
	print 'Virtualenv not detected... Building'

	p = subprocess.Popen(
	[os.path.join(cli_dir, 'bootstrap')],
	stdout=subprocess.PIPE)

	output = ''
	for line in p.stdout:
	output += line

	p.wait()

	if p.returncode != 0:
	sys.stderr.write(output)
	sys.exit(1);

	def run_lint(self, source_paths):
	'''
	Runs pylint over given files.

	https://google.github.io/styleguide/pyguide.html
	'''

	cli_dir = os.path.abspath(self.source_dirs[0])
	source_files = ' '.join(source_paths)

	self.__check_virtualenv()

	p = subprocess.Popen(
	['. {virtualenv_dir}/bin/activate; \
	PYTHONPATH={lib_dir}:{bin_dir} pylint --rcfile={config} --ignore={ignore} {files}'.\
	format(virtualenv_dir=os.path.join(cli_dir, '.virtualenv'),
	lib_dir=os.path.join(cli_dir,'lib'),
	bin_dir=os.path.join(cli_dir,'bin'),
	config=os.path.join(cli_dir, 'pylint.config'),
	ignore=os.path.join(cli_dir, 'bin', 'mesos'),
	files=source_files)],
	shell=True, stdout=subprocess.PIPE)

	num_errors = 0
	for line in p.stdout:
	if not line.startswith('*'):
	num_errors += 1
	sys.stderr.write(line)

	return num_errors


	if __name__ == '__main__':
	cpp_linter = CppLinter()
	cpp_errors = cpp_linter.main(sys.argv[1:])
	py_linter = PyLinter()
	py_errors = py_linter.main(sys.argv[1:])
	sys.exit(cpp_errors + py_errors)