tools/run_tests/filter_pull_request_tests.py - platform/external/grpc-grpc - Gitiles

 #!/usr/bin/env python2.7
 # Copyright 2015, Google Inc.
 # All rights reserved.
 #
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions are
 # met:
 #
 #     * Redistributions of source code must retain the above copyright
 # notice, this list of conditions and the following disclaimer.
 #     * Redistributions in binary form must reproduce the above
 # copyright notice, this list of conditions and the following disclaimer
 # in the documentation and/or other materials provided with the
 # distribution.
 #     * Neither the name of Google Inc. nor the names of its
 # contributors may be used to endorse or promote products derived from
 # this software without specific prior written permission.
 #
 # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 # A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 # OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 # LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 # DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 # THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 # OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 """Filter out tests based on file differences compared to merge target branch"""

 import re
 from subprocess import call, check_output


 class TestSuite:
   """
   Contains tag to identify job as belonging to this test suite and
   triggers to identify if changed files are relevant
   """
   def __init__(self, tags):
     """
     Build TestSuite to group tests by their tags
     :param tag: string used to identify if a job belongs to this TestSuite
     todo(mattkwong): Change the use of tag because do not want to depend on
     job.shortname to identify what suite a test belongs to
     """
     self.triggers = []
     self.tags = tags

   def add_trigger(self, trigger):
     """
     Add a regex to list of triggers that determine if a changed file should run tests
     :param trigger: regex matching file relevant to tests
     """
     self.triggers.append(trigger)

 # Create test suites
 _core_test_suite = TestSuite(['_c_'])
 _cpp_test_suite = TestSuite(['_c++_'])
 _csharp_test_suite = TestSuite(['_csharp_'])
 _node_test_suite = TestSuite(['_node_'])
 _objc_test_suite = TestSuite(['_objc_'])
 _php_test_suite = TestSuite(['_php_', '_php7_'])
 _python_test_suite = TestSuite(['_python_'])
 _ruby_test_suite = TestSuite(['_ruby'])
 _all_test_suites = [_core_test_suite, _cpp_test_suite, _csharp_test_suite,
                     _node_test_suite, _objc_test_suite, _php_test_suite,
                     _python_test_suite, _ruby_test_suite]

 # Dictionary of whitelistable files where the key is a regex matching changed files
 # and the value is a list of tests that should be run. An empty list means that
 # the changed files should not trigger any tests. Any changed file that does not
 # match any of these regexes will trigger all tests
 _WHITELIST_DICT = {
   '^templates/.*': [],
   '^doc/.*': [],
   '^examples/.*': [],
   '^summerofcode/.*': [],
   '.*README.md$': [],
   '.*LICENSE$': [],
   '^src/cpp.*': [_cpp_test_suite],
   '^src/csharp.*': [_csharp_test_suite],
   '^src/node.*': [_node_test_suite],
   '^src/objective-c.*': [_objc_test_suite],
   '^src/php.*': [_php_test_suite],
   '^src/python.*': [_python_test_suite],
   '^src/ruby.*': [_ruby_test_suite],
   '^test/core.*': [_core_test_suite],
   '^test/cpp.*': [_cpp_test_suite],
   '^test/distrib/cpp.*': [_cpp_test_suite],
   '^test/distrib/csharp.*': [_csharp_test_suite],
   '^test/distrib/node.*': [_node_test_suite],
   '^test/distrib/php.*': [_php_test_suite],
   '^test/distrib/python.*': [_python_test_suite],
   '^test/distrib/ruby.*': [_ruby_test_suite]
 }
 # Add all triggers to their respective test suites
 for trigger, test_suites in _WHITELIST_DICT.iteritems():
   for test_suite in test_suites:
     test_suite.add_trigger(trigger)


 def _get_changed_files(base_branch):
   """
   Get list of changed files between current branch and base of target merge branch
   """
   # git fetch might need to be called on Jenkins slave
   # todo(mattkwong): remove or uncomment below after seeing if Jenkins needs this
   # call(['git', 'fetch'])

   # Get file changes between branch and merge-base of specified branch
   # Not combined to be Windows friendly
   base_commit = check_output(["git", "merge-base", base_branch, "HEAD"]).rstrip()
   return check_output(["git", "diff", base_commit, "--name-only"]).splitlines()


 def _can_skip_tests(file_names, triggers):
   """
   Determines if tests are skippable based on if all files do not match list of regexes
   :param file_names: list of changed files generated by _get_changed_files()
   :param triggers: list of regexes matching file name that indicates tests should be run
   :return: safe to skip tests
   """
   for file_name in file_names:
     if any(re.match(trigger, file_name) for trigger in triggers):
       return False
   return True


 def _remove_irrelevant_tests(tests, tag):
   """
   Filters out tests by config or language - will not remove sanitizer tests
   :param tests: list of all tests generated by run_tests_matrix.py
   :param tag: string representing language or config to filter - "_(language)_" or "_(config)"
   :return: list of relevant tests
   """
   # todo(mattkwong): find a more reliable way to filter tests - don't use shortname
   return [test for test in tests if tag not in test.shortname or
           any(san_tag in test.shortname for san_tag in ['_asan', '_tsan', '_msan'])]


 def _remove_sanitizer_tests(tests):
   """
   Filters out sanitizer tests
   :param tests: list of all tests generated by run_tests_matrix.py
   :return: list of relevant tests
   """
   # todo(mattkwong): find a more reliable way to filter tests - don't use shortname
   return [test for test in tests if
           all(san_tag not in test.shortname for san_tag in ['_asan', '_tsan', '_msan'])]


 def filter_tests(tests, base_branch):
   """
   Filters out tests that are safe to ignore
   :param tests: list of all tests generated by run_tests_matrix.py
   :return: list of relevant tests
   """
   print("Finding file differences between %s repo and current branch...\n" % base_branch)
   changed_files = _get_changed_files(base_branch)
   for changed_file in changed_files:
     print(changed_file)
   print

   # Regex that combines all keys in _WHITELIST_DICT
   all_triggers = "(" + ")|(".join(_WHITELIST_DICT.keys()) + ")"
   # Check if all tests have to be run
   for changed_file in changed_files:
     if not re.match(all_triggers, changed_file):
       return(tests)
   # Filter out tests by language
   for test_suite in _all_test_suites:
     if _can_skip_tests(changed_files, test_suite.triggers):
       for tag in test_suite.tags:
         print("  Filtering %s tests" % tag)
         tests = _remove_irrelevant_tests(tests, tag)
   # Sanitizer tests skipped if core and c++ are skipped
   if _can_skip_tests(changed_files, _cpp_test_suite.triggers + _core_test_suite.triggers):
     print("  Filtering Sanitizer tests")
     tests = _remove_sanitizer_tests(tests)

   return tests
	#!/usr/bin/env python2.7
	# Copyright 2015, Google Inc.
	# All rights reserved.
	#
	# Redistribution and use in source and binary forms, with or without
	# modification, are permitted provided that the following conditions are
	# met:
	#
	# * Redistributions of source code must retain the above copyright
	# notice, this list of conditions and the following disclaimer.
	# * Redistributions in binary form must reproduce the above
	# copyright notice, this list of conditions and the following disclaimer
	# in the documentation and/or other materials provided with the
	# distribution.
	# * Neither the name of Google Inc. nor the names of its
	# contributors may be used to endorse or promote products derived from
	# this software without specific prior written permission.
	#
	# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
	# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
	# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
	# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
	# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
	# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
	# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
	# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
	# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
	# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
	# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

	"""Filter out tests based on file differences compared to merge target branch"""

	import re
	from subprocess import call, check_output


	class TestSuite:
	"""
	Contains tag to identify job as belonging to this test suite and
	triggers to identify if changed files are relevant
	"""
	def __init__(self, tags):
	"""
	Build TestSuite to group tests by their tags
	:param tag: string used to identify if a job belongs to this TestSuite
	todo(mattkwong): Change the use of tag because do not want to depend on
	job.shortname to identify what suite a test belongs to
	"""
	self.triggers = []
	self.tags = tags

	def add_trigger(self, trigger):
	"""
	Add a regex to list of triggers that determine if a changed file should run tests
	:param trigger: regex matching file relevant to tests
	"""
	self.triggers.append(trigger)

	# Create test suites
	_core_test_suite = TestSuite(['_c_'])
	_cpp_test_suite = TestSuite(['_c++_'])
	_csharp_test_suite = TestSuite(['_csharp_'])
	_node_test_suite = TestSuite(['_node_'])
	_objc_test_suite = TestSuite(['_objc_'])
	_php_test_suite = TestSuite(['_php_', '_php7_'])
	_python_test_suite = TestSuite(['_python_'])
	_ruby_test_suite = TestSuite(['_ruby'])
	_all_test_suites = [_core_test_suite, _cpp_test_suite, _csharp_test_suite,
	_node_test_suite, _objc_test_suite, _php_test_suite,
	_python_test_suite, _ruby_test_suite]

	# Dictionary of whitelistable files where the key is a regex matching changed files
	# and the value is a list of tests that should be run. An empty list means that
	# the changed files should not trigger any tests. Any changed file that does not
	# match any of these regexes will trigger all tests
	_WHITELIST_DICT = {
	'^templates/.*': [],
	'^doc/.*': [],
	'^examples/.*': [],
	'^summerofcode/.*': [],
	'.*README.md$': [],
	'.*LICENSE$': [],
	'^src/cpp.*': [_cpp_test_suite],
	'^src/csharp.*': [_csharp_test_suite],
	'^src/node.*': [_node_test_suite],
	'^src/objective-c.*': [_objc_test_suite],
	'^src/php.*': [_php_test_suite],
	'^src/python.*': [_python_test_suite],
	'^src/ruby.*': [_ruby_test_suite],
	'^test/core.*': [_core_test_suite],
	'^test/cpp.*': [_cpp_test_suite],
	'^test/distrib/cpp.*': [_cpp_test_suite],
	'^test/distrib/csharp.*': [_csharp_test_suite],
	'^test/distrib/node.*': [_node_test_suite],
	'^test/distrib/php.*': [_php_test_suite],
	'^test/distrib/python.*': [_python_test_suite],
	'^test/distrib/ruby.*': [_ruby_test_suite]
	}
	# Add all triggers to their respective test suites
	for trigger, test_suites in _WHITELIST_DICT.iteritems():
	for test_suite in test_suites:
	test_suite.add_trigger(trigger)


	def _get_changed_files(base_branch):
	"""
	Get list of changed files between current branch and base of target merge branch
	"""
	# git fetch might need to be called on Jenkins slave
	# todo(mattkwong): remove or uncomment below after seeing if Jenkins needs this
	# call(['git', 'fetch'])

	# Get file changes between branch and merge-base of specified branch
	# Not combined to be Windows friendly
	base_commit = check_output(["git", "merge-base", base_branch, "HEAD"]).rstrip()
	return check_output(["git", "diff", base_commit, "--name-only"]).splitlines()


	def _can_skip_tests(file_names, triggers):
	"""
	Determines if tests are skippable based on if all files do not match list of regexes
	:param file_names: list of changed files generated by _get_changed_files()
	:param triggers: list of regexes matching file name that indicates tests should be run
	:return: safe to skip tests
	"""
	for file_name in file_names:
	if any(re.match(trigger, file_name) for trigger in triggers):
	return False
	return True


	def _remove_irrelevant_tests(tests, tag):
	"""
	Filters out tests by config or language - will not remove sanitizer tests
	:param tests: list of all tests generated by run_tests_matrix.py
	:param tag: string representing language or config to filter - "_(language)_" or "_(config)"
	:return: list of relevant tests
	"""
	# todo(mattkwong): find a more reliable way to filter tests - don't use shortname
	return [test for test in tests if tag not in test.shortname or
	any(san_tag in test.shortname for san_tag in ['_asan', '_tsan', '_msan'])]


	def _remove_sanitizer_tests(tests):
	"""
	Filters out sanitizer tests
	:param tests: list of all tests generated by run_tests_matrix.py
	:return: list of relevant tests
	"""
	# todo(mattkwong): find a more reliable way to filter tests - don't use shortname
	return [test for test in tests if
	all(san_tag not in test.shortname for san_tag in ['_asan', '_tsan', '_msan'])]


	def filter_tests(tests, base_branch):
	"""
	Filters out tests that are safe to ignore
	:param tests: list of all tests generated by run_tests_matrix.py
	:return: list of relevant tests
	"""
	print("Finding file differences between %s repo and current branch...\n" % base_branch)
	changed_files = _get_changed_files(base_branch)
	for changed_file in changed_files:
	print(changed_file)
	print

	# Regex that combines all keys in _WHITELIST_DICT
	all_triggers = "(" + ")\|(".join(_WHITELIST_DICT.keys()) + ")"
	# Check if all tests have to be run
	for changed_file in changed_files:
	if not re.match(all_triggers, changed_file):
	return(tests)
	# Filter out tests by language
	for test_suite in _all_test_suites:
	if _can_skip_tests(changed_files, test_suite.triggers):
	for tag in test_suite.tags:
	print(" Filtering %s tests" % tag)
	tests = _remove_irrelevant_tests(tests, tag)
	# Sanitizer tests skipped if core and c++ are skipped
	if _can_skip_tests(changed_files, _cpp_test_suite.triggers + _core_test_suite.triggers):
	print(" Filtering Sanitizer tests")
	tests = _remove_sanitizer_tests(tests)

	return tests