Blame - tools/cpplint.py - platform/art

blob: 0b5fb935361dc7e42c914de8908982ebabbe541e [file] [log] [blame]

Elliott Hughes	08b82a9	2012-04-05 12:13:56 -0700	[diff] [blame]	1	#!/usr/bin/python
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2	#
				3	# Copyright (c) 2009 Google Inc. All rights reserved.
				4	#
				5	# Redistribution and use in source and binary forms, with or without
				6	# modification, are permitted provided that the following conditions are
				7	# met:
				8	#
				9	# * Redistributions of source code must retain the above copyright
				10	# notice, this list of conditions and the following disclaimer.
				11	# * Redistributions in binary form must reproduce the above
				12	# copyright notice, this list of conditions and the following disclaimer
				13	# in the documentation and/or other materials provided with the
				14	# distribution.
				15	# * Neither the name of Google Inc. nor the names of its
				16	# contributors may be used to endorse or promote products derived from
				17	# this software without specific prior written permission.
				18	#
				19	# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
				20	# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
				21	# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
				22	# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
				23	# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
				24	# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
				25	# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
				26	# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
				27	# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
				28	# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
				29	# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
				30
				31	# Here are some issues that I've had people identify in my code during reviews,
				32	# that I think are possible to flag automatically in a lint tool. If these were
				33	# caught by lint, it would save time both for myself and that of my reviewers.
				34	# Most likely, some of these are beyond the scope of the current lint framework,
				35	# but I think it is valuable to retain these wish-list items even if they cannot
				36	# be immediately implemented.
				37	#
				38	# Suggestions
				39	# -----------
				40	# - Check for no 'explicit' for multi-arg ctor
				41	# - Check for boolean assign RHS in parens
				42	# - Check for ctor initializer-list colon position and spacing
				43	# - Check that if there's a ctor, there should be a dtor
				44	# - Check accessors that return non-pointer member variables are
				45	# declared const
				46	# - Check accessors that return non-const pointer member vars are
				47	# not declared const
				48	# - Check for using public includes for testing
				49	# - Check for spaces between brackets in one-line inline method
				50	# - Check for no assert()
				51	# - Check for spaces surrounding operators
				52	# - Check for 0 in pointer context (should be NULL)
				53	# - Check for 0 in char context (should be '\0')
				54	# - Check for camel-case method name conventions for methods
				55	# that are not simple inline getters and setters
				56	# - Check that base classes have virtual destructors
				57	# put " // namespace" after } that closes a namespace, with
				58	# namespace's name after 'namespace' if it is named.
				59	# - Do not indent namespace contents
				60	# - Avoid inlining non-trivial constructors in header files
				61	# include base/basictypes.h if DISALLOW_EVIL_CONSTRUCTORS is used
				62	# - Check for old-school (void) cast for call-sites of functions
				63	# ignored return value
				64	# - Check gUnit usage of anonymous namespace
				65	# - Check for class declaration order (typedefs, consts, enums,
				66	# ctor(s?), dtor, friend declarations, methods, member vars)
				67	#
				68
				69	"""Does google-lint on c++ files.
				70
				71	The goal of this script is to identify places in the code that may
				72	be in non-compliance with google style. It does not attempt to fix
				73	up these problems -- the point is to educate. It does also not
				74	attempt to find all problems, or to ensure that everything it does
				75	find is legitimately a problem.
				76
				77	In particular, we can get very confused by /* and // inside strings!
				78	We do a small hack, which is to ignore //'s with "'s after them on the
				79	same line, but it is far from perfect (in either direction).
				80	"""
				81
				82	import codecs
				83	import getopt
				84	import math # for log
				85	import os
				86	import re
				87	import sre_compile
				88	import string
				89	import sys
				90	import unicodedata
				91
				92
				93	_USAGE = """
				94	Syntax: cpplint.py [--verbose=#] [--output=vs7] [--filter=-x,+y,...]
				95	[--counting=total\|toplevel\|detailed]
				96	<file> [file] ...
				97
				98	The style guidelines this tries to follow are those in
				99	http://google-styleguide.googlecode.com/svn/trunk/cppguide.xml
				100
				101	Every problem is given a confidence score from 1-5, with 5 meaning we are
				102	certain of the problem, and 1 meaning it could be a legitimate construct.
				103	This will miss some errors, and is not a substitute for a code review.
				104
				105	To suppress false-positive errors of a certain category, add a
				106	'NOLINT(category)' comment to the line. NOLINT or NOLINT(*)
				107	suppresses errors of all categories on that line.
				108
				109	The files passed in will be linted; at least one file must be provided.
				110	Linted extensions are .cc, .cpp, and .h. Other file types will be ignored.
				111
				112	Flags:
				113
				114	output=vs7
				115	By default, the output is formatted to ease emacs parsing. Visual Studio
				116	compatible output (vs7) may also be used. Other formats are unsupported.
				117
				118	verbose=#
				119	Specify a number 0-5 to restrict errors to certain verbosity levels.
				120
				121	filter=-x,+y,...
				122	Specify a comma-separated list of category-filters to apply: only
				123	error messages whose category names pass the filters will be printed.
				124	(Category names are printed with the message and look like
				125	"[whitespace/indent]".) Filters are evaluated left to right.
				126	"-FOO" and "FOO" means "do not print categories that start with FOO".
				127	"+FOO" means "do print categories that start with FOO".
				128
				129	Examples: --filter=-whitespace,+whitespace/braces
				130	--filter=whitespace,runtime/printf,+runtime/printf_format
				131	--filter=-,+build/include_what_you_use
				132
				133	To see a list of all the categories used in cpplint, pass no arg:
				134	--filter=
				135
				136	counting=total\|toplevel\|detailed
				137	The total number of errors found is always printed. If
				138	'toplevel' is provided, then the count of errors in each of
				139	the top-level categories like 'build' and 'whitespace' will
				140	also be printed. If 'detailed' is provided, then a count
				141	is provided for each category like 'build/class'.
				142	"""
				143
# We categorize each error message we print. Here are the categories.
# We want an explicit list so we can list them all in cpplint --filter=.
# If you add a new error message with a new category, add it to the list
# here! cpplint_unittest.py should tell you if you forget to do this.
# Each entry has the form '<top-level group>/<specific check>'.
# \ used for clearer layout -- pylint: disable-msg=C6013
_ERROR_CATEGORIES = [
  'build/class',
  'build/deprecated',
  'build/endif_comment',
  'build/explicit_make_pair',
  'build/forward_decl',
  'build/header_guard',
  'build/include',
  'build/include_alpha',
  'build/include_order',
  'build/include_what_you_use',
  'build/namespaces',
  'build/printf_format',
  'build/storage_class',
  'legal/copyright',
  'readability/braces',
  'readability/casting',
  'readability/check',
  'readability/constructors',
  'readability/fn_size',
  'readability/function',
  'readability/multiline_comment',
  'readability/multiline_string',
  'readability/nolint',
  'readability/streams',
  'readability/todo',
  'readability/utf8',
  'runtime/arrays',
  'runtime/casting',
  'runtime/explicit',
  'runtime/int',
  'runtime/init',
  'runtime/invalid_increment',
  'runtime/member_string_references',
  'runtime/memset',
  'runtime/operator',
  'runtime/printf',
  'runtime/printf_format',
  'runtime/references',
  'runtime/rtti',
  'runtime/sizeof',
  'runtime/string',
  'runtime/threadsafe_fn',
  'runtime/virtual',
  'whitespace/blank_line',
  'whitespace/braces',
  'whitespace/comma',
  'whitespace/comments',
  'whitespace/end_of_line',
  'whitespace/ending_newline',
  'whitespace/indent',
  'whitespace/labels',
  'whitespace/line_length',
  'whitespace/newline',
  'whitespace/operators',
  'whitespace/parens',
  'whitespace/semicolon',
  'whitespace/tab',
  'whitespace/todo'
  ]
				209
# The default state of the category filter. This is overridden by the
# --filter= flag. By default all errors are on, so only add here categories
# that should be off by default (i.e., categories that must be enabled by the
# --filter= flag). All entries here should start with a '-' or '+', as in the
# --filter= flag.
_DEFAULT_FILTERS = ['-build/include_alpha']
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	215
				216	# We used to check for high-bit characters, but after much discussion we
				217	# decided those were OK, as long as they were in UTF-8 and didn't represent
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	218	# hard-coded international strings, which belong in a separate i18n file.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	219
# Headers that we consider STL headers. Entries are bare header names as
# they would appear inside the angle brackets of an #include.
_STL_HEADERS = frozenset([
    'algobase.h', 'algorithm', 'alloc.h', 'bitset', 'deque', 'exception',
    'function.h', 'functional', 'hash_map', 'hash_map.h', 'hash_set',
    'hash_set.h', 'iterator', 'list', 'list.h', 'map', 'memory', 'new',
    'pair.h', 'pthread_alloc', 'queue', 'set', 'set.h', 'sstream', 'stack',
    'stl_alloc.h', 'stl_relops.h', 'type_traits.h',
    'utility', 'vector', 'vector.h',
    ])
				229
				230
# Non-STL C++ system headers.
# NOTE(review): 'exception' is listed both here and in _STL_HEADERS.
_CPP_HEADERS = frozenset([
    'algo.h', 'builtinbuf.h', 'bvector.h', 'cassert', 'cctype',
    'cerrno', 'cfloat', 'ciso646', 'climits', 'clocale', 'cmath',
    'complex', 'complex.h', 'csetjmp', 'csignal', 'cstdarg', 'cstddef',
    'cstdio', 'cstdlib', 'cstring', 'ctime', 'cwchar', 'cwctype',
    'defalloc.h', 'deque.h', 'editbuf.h', 'exception', 'fstream',
    'fstream.h', 'hashtable.h', 'heap.h', 'indstream.h', 'iomanip',
    'iomanip.h', 'ios', 'iosfwd', 'iostream', 'iostream.h', 'istream',
    'istream.h', 'iterator.h', 'limits', 'map.h', 'multimap.h', 'multiset.h',
    'numeric', 'ostream', 'ostream.h', 'parsestream.h', 'pfstream.h',
    'PlotFile.h', 'procbuf.h', 'pthread_alloc.h', 'rope', 'rope.h',
    'ropeimpl.h', 'SFile.h', 'slist', 'slist.h', 'stack.h', 'stdexcept',
    'stdiostream.h', 'streambuf.h', 'stream.h', 'strfile.h', 'string',
    'strstream', 'strstream.h', 'tempbuf.h', 'tree.h', 'typeinfo', 'valarray',
    ])
				247
				248
				249	# Assertion macros. These are defined in base/logging.h and
				250	# testing/base/gunit.h. Note that the _M versions need to come first
				251	# for substring matching to work.
				252	_CHECK_MACROS = [
				253	'DCHECK', 'CHECK',
				254	'EXPECT_TRUE_M', 'EXPECT_TRUE',
				255	'ASSERT_TRUE_M', 'ASSERT_TRUE',
				256	'EXPECT_FALSE_M', 'EXPECT_FALSE',
				257	'ASSERT_FALSE_M', 'ASSERT_FALSE',
				258	]
				259
				260	# Replacement macros for CHECK/DCHECK/EXPECT_TRUE/EXPECT_FALSE
				261	_CHECK_REPLACEMENT = dict([(m, {}) for m in _CHECK_MACROS])
				262
				263	for op, replacement in [('==', 'EQ'), ('!=', 'NE'),
				264	('>=', 'GE'), ('>', 'GT'),
				265	('<=', 'LE'), ('<', 'LT')]:
				266	_CHECK_REPLACEMENT['DCHECK'][op] = 'DCHECK_%s' % replacement
				267	_CHECK_REPLACEMENT['CHECK'][op] = 'CHECK_%s' % replacement
				268	_CHECK_REPLACEMENT['EXPECT_TRUE'][op] = 'EXPECT_%s' % replacement
				269	_CHECK_REPLACEMENT['ASSERT_TRUE'][op] = 'ASSERT_%s' % replacement
				270	_CHECK_REPLACEMENT['EXPECT_TRUE_M'][op] = 'EXPECT_%s_M' % replacement
				271	_CHECK_REPLACEMENT['ASSERT_TRUE_M'][op] = 'ASSERT_%s_M' % replacement
				272
				273	for op, inv_replacement in [('==', 'NE'), ('!=', 'EQ'),
				274	('>=', 'LT'), ('>', 'LE'),
				275	('<=', 'GT'), ('<', 'GE')]:
				276	_CHECK_REPLACEMENT['EXPECT_FALSE'][op] = 'EXPECT_%s' % inv_replacement
				277	_CHECK_REPLACEMENT['ASSERT_FALSE'][op] = 'ASSERT_%s' % inv_replacement
				278	_CHECK_REPLACEMENT['EXPECT_FALSE_M'][op] = 'EXPECT_%s_M' % inv_replacement
				279	_CHECK_REPLACEMENT['ASSERT_FALSE_M'][op] = 'ASSERT_%s_M' % inv_replacement
				280
				281
# These constants define types of headers for use with
# _IncludeState.CheckNextIncludeOrder().
_C_SYS_HEADER = 1  # C system header
_CPP_SYS_HEADER = 2  # C++ system header
_LIKELY_MY_HEADER = 3  # header this file implements
_POSSIBLE_MY_HEADER = 4  # header this file may implement
_OTHER_HEADER = 5  # any other header
				289
				290
				291	_regexp_compile_cache = {}
				292
				293	# Finds occurrences of NOLINT or NOLINT(...).
				294	_RE_SUPPRESSION = re.compile(r'\bNOLINT\b($[^)]*$)?')
				295
				296	# {str, set(int)}: a map from error categories to sets of linenumbers
				297	# on which those errors are expected and should be suppressed.
				298	_error_suppressions = {}
				299
				300	def ParseNolintSuppressions(filename, raw_line, linenum, error):
				301	"""Updates the global list of error-suppressions.
				302
				303	Parses any NOLINT comments on the current line, updating the global
				304	error_suppressions store. Reports an error if the NOLINT comment
				305	was malformed.
				306
				307	Args:
				308	filename: str, the name of the input file.
				309	raw_line: str, the line of input text, with comments.
				310	linenum: int, the number of the current line.
				311	error: function, an error handler.
				312	"""
				313	# FIXME(adonovan): "NOLINT(" is misparsed as NOLINT(*).
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	314	matched = _RE_SUPPRESSION.search(raw_line)
				315	if matched:
				316	category = matched.group(1)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	317	if category in (None, '(*)'): # => "suppress all"
				318	_error_suppressions.setdefault(None, set()).add(linenum)
				319	else:
				320	if category.startswith('(') and category.endswith(')'):
				321	category = category[1:-1]
				322	if category in _ERROR_CATEGORIES:
				323	_error_suppressions.setdefault(category, set()).add(linenum)
				324	else:
				325	error(filename, linenum, 'readability/nolint', 5,
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	326	'Unknown NOLINT error category: %s' % category)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	327
				328
def ResetNolintSuppressions():
  """Resets the set of NOLINT suppressions to empty.

  Clears the global _error_suppressions map in place, so existing references
  to that dict observe the reset.
  """
  _error_suppressions.clear()
				332
				333
				334	def IsErrorSuppressedByNolint(category, linenum):
				335	"""Returns true if the specified error category is suppressed on this line.
				336
				337	Consults the global error_suppressions map populated by
				338	ParseNolintSuppressions/ResetNolintSuppressions.
				339
				340	Args:
				341	category: str, the category of the error.
				342	linenum: int, the current line number.
				343	Returns:
				344	bool, True iff the error should be suppressed due to a NOLINT comment.
				345	"""
				346	return (linenum in _error_suppressions.get(category, set()) or
				347	linenum in _error_suppressions.get(None, set()))
				348
				349	def Match(pattern, s):
				350	"""Matches the string with the pattern, caching the compiled regexp."""
				351	# The regexp compilation caching is inlined in both Match and Search for
				352	# performance reasons; factoring it out into a separate function turns out
				353	# to be noticeably expensive.
				354	if not pattern in _regexp_compile_cache:
				355	_regexp_compile_cache[pattern] = sre_compile.compile(pattern)
				356	return _regexp_compile_cache[pattern].match(s)
				357
				358
				359	def Search(pattern, s):
				360	"""Searches the string for the pattern, caching the compiled regexp."""
				361	if not pattern in _regexp_compile_cache:
				362	_regexp_compile_cache[pattern] = sre_compile.compile(pattern)
				363	return _regexp_compile_cache[pattern].search(s)
				364
				365
				366	class _IncludeState(dict):
				367	"""Tracks line numbers for includes, and the order in which includes appear.
				368
				369	As a dict, an _IncludeState object serves as a mapping between include
				370	filename and line number on which that file was included.
				371
				372	Call CheckNextIncludeOrder() once for each header in the file, passing
				373	in the type constants defined above. Calls in an illegal order will
				374	raise an _IncludeError with an appropriate error message.
				375
				376	"""
				377	# self._section will move monotonically through this set. If it ever
				378	# needs to move backwards, CheckNextIncludeOrder will raise an error.
				379	_INITIAL_SECTION = 0
				380	_MY_H_SECTION = 1
				381	_C_SECTION = 2
				382	_CPP_SECTION = 3
				383	_OTHER_H_SECTION = 4
				384
				385	_TYPE_NAMES = {
				386	_C_SYS_HEADER: 'C system header',
				387	_CPP_SYS_HEADER: 'C++ system header',
				388	_LIKELY_MY_HEADER: 'header this file implements',
				389	_POSSIBLE_MY_HEADER: 'header this file may implement',
				390	_OTHER_HEADER: 'other header',
				391	}
				392	_SECTION_NAMES = {
				393	_INITIAL_SECTION: "... nothing. (This can't be an error.)",
				394	_MY_H_SECTION: 'a header this file implements',
				395	_C_SECTION: 'C system header',
				396	_CPP_SECTION: 'C++ system header',
				397	_OTHER_H_SECTION: 'other header',
				398	}
				399
				400	def __init__(self):
				401	dict.__init__(self)
				402	# The name of the current section.
				403	self._section = self._INITIAL_SECTION
				404	# The path of last found header.
				405	self._last_header = ''
				406
				407	def CanonicalizeAlphabeticalOrder(self, header_path):
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	408	"""Returns a path canonicalized for alphabetical comparison.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	409
				410	- replaces "-" with "_" so they both cmp the same.
				411	- removes '-inl' since we don't require them to be after the main header.
				412	- lowercase everything, just in case.
				413
				414	Args:
				415	header_path: Path to be canonicalized.
				416
				417	Returns:
				418	Canonicalized path.
				419	"""
				420	return header_path.replace('-inl.h', '.h').replace('-', '_').lower()
				421
				422	def IsInAlphabeticalOrder(self, header_path):
				423	"""Check if a header is in alphabetical order with the previous header.
				424
				425	Args:
				426	header_path: Header to be checked.
				427
				428	Returns:
				429	Returns true if the header is in alphabetical order.
				430	"""
				431	canonical_header = self.CanonicalizeAlphabeticalOrder(header_path)
				432	if self._last_header > canonical_header:
				433	return False
				434	self._last_header = canonical_header
				435	return True
				436
				437	def CheckNextIncludeOrder(self, header_type):
				438	"""Returns a non-empty error message if the next header is out of order.
				439
				440	This function also updates the internal state to be ready to check
				441	the next include.
				442
				443	Args:
				444	header_type: One of the _XXX_HEADER constants defined above.
				445
				446	Returns:
				447	The empty string if the header is in the right order, or an
				448	error message describing what's wrong.
				449
				450	"""
				451	error_message = ('Found %s after %s' %
				452	(self._TYPE_NAMES[header_type],
				453	self._SECTION_NAMES[self._section]))
				454
				455	last_section = self._section
				456
				457	if header_type == _C_SYS_HEADER:
				458	if self._section <= self._C_SECTION:
				459	self._section = self._C_SECTION
				460	else:
				461	self._last_header = ''
				462	return error_message
				463	elif header_type == _CPP_SYS_HEADER:
				464	if self._section <= self._CPP_SECTION:
				465	self._section = self._CPP_SECTION
				466	else:
				467	self._last_header = ''
				468	return error_message
				469	elif header_type == _LIKELY_MY_HEADER:
				470	if self._section <= self._MY_H_SECTION:
				471	self._section = self._MY_H_SECTION
				472	else:
				473	self._section = self._OTHER_H_SECTION
				474	elif header_type == _POSSIBLE_MY_HEADER:
				475	if self._section <= self._MY_H_SECTION:
				476	self._section = self._MY_H_SECTION
				477	else:
				478	# This will always be the fallback because we're not sure
				479	# enough that the header is associated with this file.
				480	self._section = self._OTHER_H_SECTION
				481	else:
				482	assert header_type == _OTHER_HEADER
				483	self._section = self._OTHER_H_SECTION
				484
				485	if last_section != self._section:
				486	self._last_header = ''
				487
				488	return ''
				489
				490
				491	class _CppLintState(object):
				492	"""Maintains module-wide state.."""
				493
				494	def __init__(self):
				495	self.verbose_level = 1 # global setting.
				496	self.error_count = 0 # global count of reported errors
				497	# filters to apply when emitting error messages
				498	self.filters = _DEFAULT_FILTERS[:]
				499	self.counting = 'total' # In what way are we counting errors?
				500	self.errors_by_category = {} # string to int dict storing error counts
				501
				502	# output format:
				503	# "emacs" - format that emacs can parse (default)
				504	# "vs7" - format that Microsoft Visual Studio 7 can parse
				505	self.output_format = 'emacs'
				506
				507	def SetOutputFormat(self, output_format):
				508	"""Sets the output format for errors."""
				509	self.output_format = output_format
				510
				511	def SetVerboseLevel(self, level):
				512	"""Sets the module's verbosity, and returns the previous setting."""
				513	last_verbose_level = self.verbose_level
				514	self.verbose_level = level
				515	return last_verbose_level
				516
				517	def SetCountingStyle(self, counting_style):
				518	"""Sets the module's counting options."""
				519	self.counting = counting_style
				520
				521	def SetFilters(self, filters):
				522	"""Sets the error-message filters.
				523
				524	These filters are applied when deciding whether to emit a given
				525	error message.
				526
				527	Args:
				528	filters: A string of comma-separated filters (eg "+whitespace/indent").
				529	Each filter should start with + or -; else we die.
				530
				531	Raises:
				532	ValueError: The comma-separated filters did not all start with '+' or '-'.
				533	E.g. "-,+whitespace,-whitespace/indent,whitespace/badfilter"
				534	"""
				535	# Default filters always have less priority than the flag ones.
				536	self.filters = _DEFAULT_FILTERS[:]
				537	for filt in filters.split(','):
				538	clean_filt = filt.strip()
				539	if clean_filt:
				540	self.filters.append(clean_filt)
				541	for filt in self.filters:
				542	if not (filt.startswith('+') or filt.startswith('-')):
				543	raise ValueError('Every filter in --filters must start with + or -'
				544	' (%s does not)' % filt)
				545
				546	def ResetErrorCounts(self):
				547	"""Sets the module's error statistic back to zero."""
				548	self.error_count = 0
				549	self.errors_by_category = {}
				550
				551	def IncrementErrorCount(self, category):
				552	"""Bumps the module's error statistic."""
				553	self.error_count += 1
				554	if self.counting in ('toplevel', 'detailed'):
				555	if self.counting != 'detailed':
				556	category = category.split('/')[0]
				557	if category not in self.errors_by_category:
				558	self.errors_by_category[category] = 0
				559	self.errors_by_category[category] += 1
				560
				561	def PrintErrorCounts(self):
				562	"""Print a summary of errors by category, and the total."""
				563	for category, count in self.errors_by_category.iteritems():
				564	sys.stderr.write('Category \'%s\' errors found: %d\n' %
				565	(category, count))
				566	sys.stderr.write('Total errors found: %d\n' % self.error_count)
				567
# The single module-wide _CppLintState instance; the module-level helper
# functions read and update this object.
_cpplint_state = _CppLintState()
				569
				570
def _OutputFormat():
  """Gets the module's output format.

  Returns:
    The output_format attribute of the global _cpplint_state.
  """
  return _cpplint_state.output_format
				574
				575
def _SetOutputFormat(output_format):
  """Sets the module's output format.

  Args:
    output_format: The new format, forwarded unchanged to
        _cpplint_state.SetOutputFormat().
  """
  _cpplint_state.SetOutputFormat(output_format)
				579
				580
def _VerboseLevel():
  """Returns the module's verbosity setting.

  Returns:
    The verbose_level attribute of the global _cpplint_state.
  """
  return _cpplint_state.verbose_level
				584
				585
def _SetVerboseLevel(level):
  """Sets the module's verbosity, and returns the previous setting.

  Args:
    level: The new verbosity level, forwarded to
        _cpplint_state.SetVerboseLevel().

  Returns:
    Whatever _cpplint_state.SetVerboseLevel() returns (the previous level).
  """
  return _cpplint_state.SetVerboseLevel(level)
				589
				590
def _SetCountingStyle(level):
  """Sets the module's counting options.

  Args:
    level: The counting style, forwarded unchanged to
        _cpplint_state.SetCountingStyle().
  """
  _cpplint_state.SetCountingStyle(level)
				594
				595
def _Filters():
  """Returns the module's list of output filters, as a list.

  The list returned is the global state's own filters attribute, not a copy.
  """
  return _cpplint_state.filters
				599
				600
def _SetFilters(filters):
  """Sets the module's error-message filters.

  These filters are applied when deciding whether to emit a given
  error message.

  Args:
    filters: A string of comma-separated filters (eg "+whitespace/indent").
             Each filter should start with + or -; else we die.
  """
  # Validation is delegated to the global state object's SetFilters().
  _cpplint_state.SetFilters(filters)
				612
				613
				614	class _FunctionState(object):
				615	"""Tracks current function name and the number of lines in its body."""
				616
				617	_NORMAL_TRIGGER = 250 # for --v=0, 500 for --v=1, etc.
				618	_TEST_TRIGGER = 400 # about 50% more than _NORMAL_TRIGGER.
				619
				620	def __init__(self):
				621	self.in_a_function = False
				622	self.lines_in_function = 0
				623	self.current_function = ''
				624
				625	def Begin(self, function_name):
				626	"""Start analyzing function body.
				627
				628	Args:
				629	function_name: The name of the function being tracked.
				630	"""
				631	self.in_a_function = True
				632	self.lines_in_function = 0
				633	self.current_function = function_name
				634
				635	def Count(self):
				636	"""Count line in current function body."""
				637	if self.in_a_function:
				638	self.lines_in_function += 1
				639
				640	def Check(self, error, filename, linenum):
				641	"""Report if too many lines in function body.
				642
				643	Args:
				644	error: The function to call with any errors found.
				645	filename: The name of the current file.
				646	linenum: The number of the line to check.
				647	"""
Brian Carlstrom	1895ea3	2013-07-18 13:28:37 -0700	[diff] [blame]	648	# BEGIN android-added
				649	if not self.in_a_function:
				650	return
				651	# END android-added
				652
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	653	if Match(r'T(EST\|est)', self.current_function):
				654	base_trigger = self._TEST_TRIGGER
				655	else:
				656	base_trigger = self._NORMAL_TRIGGER
				657	trigger = base_trigger * 2**_VerboseLevel()
				658
				659	if self.lines_in_function > trigger:
				660	error_level = int(math.log(self.lines_in_function / base_trigger, 2))
				661	# 50 => 0, 100 => 1, 200 => 2, 400 => 3, 800 => 4, 1600 => 5, ...
				662	if error_level > 5:
				663	error_level = 5
				664	error(filename, linenum, 'readability/fn_size', error_level,
				665	'Small and focused functions are preferred:'
				666	' %s has %d non-comment lines'
				667	' (error triggered by exceeding %d lines).' % (
				668	self.current_function, self.lines_in_function, trigger))
				669
				670	def End(self):
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	671	"""Stop analyzing function body."""
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	672	self.in_a_function = False
				673
				674
class _IncludeError(Exception):
  """Indicates a problem with the include order in a file."""
  # Carries no extra state; it exists only as a distinct exception type.
  pass
				678
				679
				680	class FileInfo:
				681	"""Provides utility functions for filenames.
				682
				683	FileInfo provides easy access to the components of a file's path
				684	relative to the project root.
				685	"""
				686
				687	def __init__(self, filename):
				688	self._filename = filename
				689
				690	def FullName(self):
				691	"""Make Windows paths like Unix."""
				692	return os.path.abspath(self._filename).replace('\\', '/')
				693
				694	def RepositoryName(self):
				695	"""FullName after removing the local path to the repository.
				696
				697	If we have a real absolute path name here we can try to do something smart:
				698	detecting the root of the checkout and truncating /path/to/checkout from
				699	the name so that we get header guards that don't include things like
				700	"C:\Documents and Settings\..." or "/home/username/..." in them and thus
				701	people on different computers who have checked the source out to different
				702	locations won't see bogus errors.
				703	"""
				704	fullname = self.FullName()
				705
				706	if os.path.exists(fullname):
				707	project_dir = os.path.dirname(fullname)
				708
				709	if os.path.exists(os.path.join(project_dir, ".svn")):
				710	# If there's a .svn file in the current directory, we recursively look
				711	# up the directory tree for the top of the SVN checkout
				712	root_dir = project_dir
				713	one_up_dir = os.path.dirname(root_dir)
				714	while os.path.exists(os.path.join(one_up_dir, ".svn")):
				715	root_dir = os.path.dirname(root_dir)
				716	one_up_dir = os.path.dirname(one_up_dir)
				717
				718	prefix = os.path.commonprefix([root_dir, project_dir])
				719	return fullname[len(prefix) + 1:]
				720
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	721	# Not SVN <= 1.6? Try to find a git, hg, or svn top level directory by
				722	# searching up from the current path.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	723	root_dir = os.path.dirname(fullname)
				724	while (root_dir != os.path.dirname(root_dir) and
				725	not os.path.exists(os.path.join(root_dir, ".git")) and
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	726	not os.path.exists(os.path.join(root_dir, ".hg")) and
				727	not os.path.exists(os.path.join(root_dir, ".svn"))):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	728	root_dir = os.path.dirname(root_dir)
				729
				730	if (os.path.exists(os.path.join(root_dir, ".git")) or
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	731	os.path.exists(os.path.join(root_dir, ".hg")) or
				732	os.path.exists(os.path.join(root_dir, ".svn"))):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	733	prefix = os.path.commonprefix([root_dir, project_dir])
Brian Carlstrom	fc0e321	2013-07-17 14:40:12 -0700	[diff] [blame]	734	# BEGIN android-changed
				735	# return fullname[len(prefix) + 1:]
				736	return "art/" + fullname[len(prefix) + 1:]
				737	# END android-changed
				738
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	739
				740	# Don't know what to do; header guard warnings may be wrong...
				741	return fullname
				742
				743	def Split(self):
				744	"""Splits the file into the directory, basename, and extension.
				745
				746	For 'chrome/browser/browser.cc', Split() would
				747	return ('chrome/browser', 'browser', '.cc')
				748
				749	Returns:
				750	A tuple of (directory, basename, extension).
				751	"""
				752
				753	googlename = self.RepositoryName()
				754	project, rest = os.path.split(googlename)
				755	return (project,) + os.path.splitext(rest)
				756
				757	def BaseName(self):
				758	"""File base name - text after the final slash, before the final period."""
				759	return self.Split()[1]
				760
				761	def Extension(self):
				762	"""File extension - text following the final period."""
				763	return self.Split()[2]
				764
				765	def NoExtension(self):
				766	"""File has no source file extension."""
				767	return '/'.join(self.Split()[0:2])
				768
				769	def IsSource(self):
				770	"""File has a source file extension."""
				771	return self.Extension()[1:] in ('c', 'cc', 'cpp', 'cxx')
				772
				773
				774	def _ShouldPrintError(category, confidence, linenum):
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	775	"""If confidence >= verbose, category passes filter and is not suppressed."""
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	776
				777	# There are three ways we might decide not to print an error message:
				778	# a "NOLINT(category)" comment appears in the source,
				779	# the verbosity level isn't high enough, or the filters filter it out.
				780	if IsErrorSuppressedByNolint(category, linenum):
				781	return False
				782	if confidence < _cpplint_state.verbose_level:
				783	return False
				784
				785	is_filtered = False
				786	for one_filter in _Filters():
				787	if one_filter.startswith('-'):
				788	if category.startswith(one_filter[1:]):
				789	is_filtered = True
				790	elif one_filter.startswith('+'):
				791	if category.startswith(one_filter[1:]):
				792	is_filtered = False
				793	else:
				794	assert False # should have been checked for in SetFilter.
				795	if is_filtered:
				796	return False
				797
				798	return True
				799
				800
				801	def Error(filename, linenum, category, confidence, message):
				802	"""Logs the fact we've found a lint error.
				803
				804	We log where the error was found, and also our confidence in the error,
				805	that is, how certain we are this is a legitimate style regression, and
				806	not a misidentification or a use that's sometimes justified.
				807
				808	False positives can be suppressed by the use of
				809	"cpplint(category)" comments on the offending line. These are
				810	parsed into _error_suppressions.
				811
				812	Args:
				813	filename: The name of the file containing the error.
				814	linenum: The number of the line containing the error.
				815	category: A string used to describe the "category" this bug
				816	falls under: "whitespace", say, or "runtime". Categories
				817	may have a hierarchy separated by slashes: "whitespace/indent".
				818	confidence: A number from 1-5 representing a confidence score for
				819	the error, with 5 meaning that we are certain of the problem,
				820	and 1 meaning that it could be a legitimate construct.
				821	message: The error message.
				822	"""
				823	if _ShouldPrintError(category, confidence, linenum):
				824	_cpplint_state.IncrementErrorCount(category)
				825	if _cpplint_state.output_format == 'vs7':
				826	sys.stderr.write('%s(%s): %s [%s] [%d]\n' % (
				827	filename, linenum, message, category, confidence))
				828	else:
				829	sys.stderr.write('%s:%s: %s [%s] [%d]\n' % (
				830	filename, linenum, message, category, confidence))
				831
				832
				833	# Matches standard C++ escape esequences per 2.13.2.3 of the C++ standard.
				834	_RE_PATTERN_CLEANSE_LINE_ESCAPES = re.compile(
				835	r'\\([abfnrtv?"\\\']\|\d+\|x[0-9a-fA-F]+)')
				836	# Matches strings. Escape codes should already be removed by ESCAPES.
				837	_RE_PATTERN_CLEANSE_LINE_DOUBLE_QUOTES = re.compile(r'"[^"]*"')
				838	# Matches characters. Escape codes should already be removed by ESCAPES.
				839	_RE_PATTERN_CLEANSE_LINE_SINGLE_QUOTES = re.compile(r"'.'")
				840	# Matches multi-line C++ comments.
				841	# This RE is a little bit more complicated than one might expect, because we
				842	# have to take care of space removals tools so we can handle comments inside
				843	# statements better.
				844	# The current rule is: We only clear spaces from both sides when we're at the
				845	# end of the line. Otherwise, we try to remove spaces from the right side,
				846	# if this doesn't work we try on left side but only if there's a non-character
				847	# on the right.
				848	_RE_PATTERN_CLEANSE_LINE_C_COMMENTS = re.compile(
				849	r"""(\s/\.\/\s*$\|
				850	/\.\*/\s+\|
				851	\s+/\.\*/(?=\W)\|
				852	/\.\*/)""", re.VERBOSE)
				853
				854
				855	def IsCppString(line):
				856	"""Does line terminate so, that the next symbol is in string constant.
				857
				858	This function does not consider single-line nor multi-line comments.
				859
				860	Args:
				861	line: is a partial line of code starting from the 0..n.
				862
				863	Returns:
				864	True, if next character appended to 'line' is inside a
				865	string constant.
				866	"""
				867
				868	line = line.replace(r'\\', 'XX') # after this, \\" does not match to \"
				869	return ((line.count('"') - line.count(r'\"') - line.count("'\"'")) & 1) == 1
				870
				871
				872	def FindNextMultiLineCommentStart(lines, lineix):
				873	"""Find the beginning marker for a multiline comment."""
				874	while lineix < len(lines):
				875	if lines[lineix].strip().startswith('/*'):
				876	# Only return this marker if the comment goes beyond this line
				877	if lines[lineix].strip().find('*/', 2) < 0:
				878	return lineix
				879	lineix += 1
				880	return len(lines)
				881
				882
				883	def FindNextMultiLineCommentEnd(lines, lineix):
				884	"""We are inside a comment, find the end marker."""
				885	while lineix < len(lines):
				886	if lines[lineix].strip().endswith('*/'):
				887	return lineix
				888	lineix += 1
				889	return len(lines)
				890
				891
				892	def RemoveMultiLineCommentsFromRange(lines, begin, end):
				893	"""Clears a range of lines for multi-line comments."""
				894	# Having // dummy comments makes the lines non-empty, so we will not get
				895	# unnecessary blank line warnings later in the code.
				896	for i in range(begin, end):
				897	lines[i] = '// dummy'
				898
				899
				900	def RemoveMultiLineComments(filename, lines, error):
				901	"""Removes multiline (c-style) comments from lines."""
				902	lineix = 0
				903	while lineix < len(lines):
				904	lineix_begin = FindNextMultiLineCommentStart(lines, lineix)
				905	if lineix_begin >= len(lines):
				906	return
				907	lineix_end = FindNextMultiLineCommentEnd(lines, lineix_begin)
				908	if lineix_end >= len(lines):
				909	error(filename, lineix_begin + 1, 'readability/multiline_comment', 5,
				910	'Could not find end of multi-line comment')
				911	return
				912	RemoveMultiLineCommentsFromRange(lines, lineix_begin, lineix_end + 1)
				913	lineix = lineix_end + 1
				914
				915
				916	def CleanseComments(line):
				917	"""Removes //-comments and single-line C-style /* */ comments.
				918
				919	Args:
				920	line: A line of C++ source.
				921
				922	Returns:
				923	The line with single-line comments removed.
				924	"""
				925	commentpos = line.find('//')
				926	if commentpos != -1 and not IsCppString(line[:commentpos]):
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	927	line = line[:commentpos].rstrip()
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	928	# get rid of /* ... */
				929	return _RE_PATTERN_CLEANSE_LINE_C_COMMENTS.sub('', line)
				930
				931
				932	class CleansedLines(object):
				933	"""Holds 3 copies of all lines with different preprocessing applied to them.
				934
				935	1) elided member contains lines without strings and comments,
				936	2) lines member contains lines without comments, and
				937	3) raw member contains all the lines without processing.
				938	All these three members are of <type 'list'>, and of the same length.
				939	"""
				940
				941	def __init__(self, lines):
				942	self.elided = []
				943	self.lines = []
				944	self.raw_lines = lines
				945	self.num_lines = len(lines)
				946	for linenum in range(len(lines)):
				947	self.lines.append(CleanseComments(lines[linenum]))
				948	elided = self._CollapseStrings(lines[linenum])
				949	self.elided.append(CleanseComments(elided))
				950
				951	def NumLines(self):
				952	"""Returns the number of lines represented."""
				953	return self.num_lines
				954
				955	@staticmethod
				956	def _CollapseStrings(elided):
				957	"""Collapses strings and chars on a line to simple "" or '' blocks.
				958
				959	We nix strings first so we're not fooled by text like '"http://"'
				960
				961	Args:
				962	elided: The line being processed.
				963
				964	Returns:
				965	The line with collapsed strings.
				966	"""
				967	if not _RE_PATTERN_INCLUDE.match(elided):
				968	# Remove escaped characters first to make quote/single quote collapsing
				969	# basic. Things that look like escaped characters shouldn't occur
				970	# outside of strings and chars.
				971	elided = _RE_PATTERN_CLEANSE_LINE_ESCAPES.sub('', elided)
				972	elided = _RE_PATTERN_CLEANSE_LINE_SINGLE_QUOTES.sub("''", elided)
				973	elided = _RE_PATTERN_CLEANSE_LINE_DOUBLE_QUOTES.sub('""', elided)
				974	return elided
				975
				976
				977	def CloseExpression(clean_lines, linenum, pos):
				978	"""If input points to ( or { or [, finds the position that closes it.
				979
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	980	If lines[linenum][pos] points to a '(' or '{' or '[', finds the
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	981	linenum/pos that correspond to the closing of the expression.
				982
				983	Args:
				984	clean_lines: A CleansedLines instance containing the file.
				985	linenum: The number of the line to check.
				986	pos: A position on the line.
				987
				988	Returns:
				989	A tuple (line, linenum, pos) pointer past the closing brace, or
				990	(line, len(lines), -1) if we never find a close. Note we ignore
				991	strings and comments when matching; and the line we return is the
				992	'cleansed' line at linenum.
				993	"""
				994
				995	line = clean_lines.elided[linenum]
				996	startchar = line[pos]
				997	if startchar not in '({[':
				998	return (line, clean_lines.NumLines(), -1)
				999	if startchar == '(': endchar = ')'
				1000	if startchar == '[': endchar = ']'
				1001	if startchar == '{': endchar = '}'
				1002
				1003	num_open = line.count(startchar) - line.count(endchar)
				1004	while linenum < clean_lines.NumLines() and num_open > 0:
				1005	linenum += 1
				1006	line = clean_lines.elided[linenum]
				1007	num_open += line.count(startchar) - line.count(endchar)
				1008	# OK, now find the endchar that actually got us back to even
				1009	endpos = len(line)
				1010	while num_open >= 0:
				1011	endpos = line.rfind(')', 0, endpos)
				1012	num_open -= 1 # chopped off another )
				1013	return (line, linenum, endpos + 1)
				1014
				1015
				1016	def CheckForCopyright(filename, lines, error):
				1017	"""Logs an error if no Copyright message appears at the top of the file."""
				1018
				1019	# We'll say it should occur by line 10. Don't forget there's a
				1020	# dummy line at the front.
				1021	for line in xrange(1, min(len(lines), 11)):
				1022	if re.search(r'Copyright', lines[line], re.I): break
				1023	else: # means no copyright line was found
				1024	error(filename, 0, 'legal/copyright', 5,
				1025	'No copyright message found. '
				1026	'You should have a line: "Copyright [year] <Copyright Owner>"')
				1027
				1028
				1029	def GetHeaderGuardCPPVariable(filename):
				1030	"""Returns the CPP variable that should be used as a header guard.
				1031
				1032	Args:
				1033	filename: The name of a C++ header file.
				1034
				1035	Returns:
				1036	The CPP variable that should be used as a header guard in the
				1037	named file.
				1038
				1039	"""
				1040
				1041	# Restores original filename in case that cpplint is invoked from Emacs's
				1042	# flymake.
				1043	filename = re.sub(r'_flymake\.h$', '.h', filename)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1044	fileinfo = FileInfo(filename)
				1045	return re.sub(r'[-./\s]', '_', fileinfo.RepositoryName()).upper() + '_'
				1046
				1047
				1048	def CheckForHeaderGuard(filename, lines, error):
				1049	"""Checks that the file contains a header guard.
				1050
				1051	Logs an error if no #ifndef header guard is present. For other
				1052	headers, checks that the full pathname is used.
				1053
				1054	Args:
				1055	filename: The name of the C++ header file.
				1056	lines: An array of strings, each representing a line of the file.
				1057	error: The function to call with any errors found.
				1058	"""
				1059
				1060	cppvar = GetHeaderGuardCPPVariable(filename)
				1061
				1062	ifndef = None
				1063	ifndef_linenum = 0
				1064	define = None
				1065	endif = None
				1066	endif_linenum = 0
				1067	for linenum, line in enumerate(lines):
				1068	linesplit = line.split()
				1069	if len(linesplit) >= 2:
				1070	# find the first occurrence of #ifndef and #define, save arg
				1071	if not ifndef and linesplit[0] == '#ifndef':
				1072	# set ifndef to the header guard presented on the #ifndef line.
				1073	ifndef = linesplit[1]
				1074	ifndef_linenum = linenum
				1075	if not define and linesplit[0] == '#define':
				1076	define = linesplit[1]
				1077	# find the last occurrence of #endif, save entire line
				1078	if line.startswith('#endif'):
				1079	endif = line
				1080	endif_linenum = linenum
				1081
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1082	if not ifndef:
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1083	error(filename, 0, 'build/header_guard', 5,
				1084	'No #ifndef header guard found, suggested CPP variable is: %s' %
				1085	cppvar)
				1086	return
				1087
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1088	if not define:
				1089	error(filename, 0, 'build/header_guard', 5,
				1090	'No #define header guard found, suggested CPP variable is: %s' %
				1091	cppvar)
				1092	return
				1093
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1094	# The guard should be PATH_FILE_H_, but we also allow PATH_FILE_H__
				1095	# for backward compatibility.
				1096	if ifndef != cppvar:
				1097	error_level = 0
				1098	if ifndef != cppvar + '_':
				1099	error_level = 5
				1100
				1101	ParseNolintSuppressions(filename, lines[ifndef_linenum], ifndef_linenum,
				1102	error)
				1103	error(filename, ifndef_linenum, 'build/header_guard', error_level,
				1104	'#ifndef header guard has wrong style, please use: %s' % cppvar)
				1105
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1106	if define != ifndef:
				1107	error(filename, 0, 'build/header_guard', 5,
				1108	'#ifndef and #define don\'t match, suggested CPP variable is: %s' %
				1109	cppvar)
				1110	return
				1111
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1112	if endif != ('#endif // %s' % cppvar):
				1113	error_level = 0
				1114	if endif != ('#endif // %s' % (cppvar + '_')):
				1115	error_level = 5
				1116
				1117	ParseNolintSuppressions(filename, lines[endif_linenum], endif_linenum,
				1118	error)
				1119	error(filename, endif_linenum, 'build/header_guard', error_level,
				1120	'#endif line should be "#endif // %s"' % cppvar)
				1121
				1122
				1123	def CheckForUnicodeReplacementCharacters(filename, lines, error):
				1124	"""Logs an error for each line containing Unicode replacement characters.
				1125
				1126	These indicate that either the file contained invalid UTF-8 (likely)
				1127	or Unicode replacement characters (which it shouldn't). Note that
				1128	it's possible for this to throw off line numbering if the invalid
				1129	UTF-8 occurred adjacent to a newline.
				1130
				1131	Args:
				1132	filename: The name of the current file.
				1133	lines: An array of strings, each representing a line of the file.
				1134	error: The function to call with any errors found.
				1135	"""
				1136	for linenum, line in enumerate(lines):
				1137	if u'\ufffd' in line:
				1138	error(filename, linenum, 'readability/utf8', 5,
				1139	'Line contains invalid UTF-8 (or Unicode replacement character).')
				1140
				1141
				1142	def CheckForNewlineAtEOF(filename, lines, error):
				1143	"""Logs an error if there is no newline char at the end of the file.
				1144
				1145	Args:
				1146	filename: The name of the current file.
				1147	lines: An array of strings, each representing a line of the file.
				1148	error: The function to call with any errors found.
				1149	"""
				1150
				1151	# The array lines() was created by adding two newlines to the
				1152	# original file (go figure), then splitting on \n.
				1153	# To verify that the file ends in \n, we just have to make sure the
				1154	# last-but-two element of lines() exists and is empty.
				1155	if len(lines) < 3 or lines[-2]:
				1156	error(filename, len(lines) - 2, 'whitespace/ending_newline', 5,
				1157	'Could not find a newline character at the end of the file.')
				1158
				1159
				1160	def CheckForMultilineCommentsAndStrings(filename, clean_lines, linenum, error):
				1161	"""Logs an error if we see /* ... */ or "..." that extend past one line.
				1162
				1163	/* ... */ comments are legit inside macros, for one line.
				1164	Otherwise, we prefer // comments, so it's ok to warn about the
				1165	other. Likewise, it's ok for strings to extend across multiple
				1166	lines, as long as a line continuation character (backslash)
				1167	terminates each line. Although not currently prohibited by the C++
				1168	style guide, it's ugly and unnecessary. We don't do well with either
				1169	in this lint program, so we warn about both.
				1170
				1171	Args:
				1172	filename: The name of the current file.
				1173	clean_lines: A CleansedLines instance containing the file.
				1174	linenum: The number of the line to check.
				1175	error: The function to call with any errors found.
				1176	"""
				1177	line = clean_lines.elided[linenum]
				1178
				1179	# Remove all \\ (escaped backslashes) from the line. They are OK, and the
				1180	# second (escaped) slash may trigger later \" detection erroneously.
				1181	line = line.replace('\\\\', '')
				1182
				1183	if line.count('/') > line.count('/'):
				1184	error(filename, linenum, 'readability/multiline_comment', 5,
				1185	'Complex multi-line /.../-style comment found. '
				1186	'Lint may give bogus warnings. '
				1187	'Consider replacing these with //-style comments, '
				1188	'with #if 0...#endif, '
				1189	'or with more clearly structured multi-line comments.')
				1190
				1191	if (line.count('"') - line.count('\\"')) % 2:
				1192	error(filename, linenum, 'readability/multiline_string', 5,
				1193	'Multi-line string ("...") found. This lint script doesn\'t '
				1194	'do well with such strings, and may give bogus warnings. They\'re '
				1195	'ugly and unnecessary, and you should use concatenation instead".')
				1196
				1197
				1198	threading_list = (
				1199	('asctime(', 'asctime_r('),
				1200	('ctime(', 'ctime_r('),
				1201	('getgrgid(', 'getgrgid_r('),
				1202	('getgrnam(', 'getgrnam_r('),
				1203	('getlogin(', 'getlogin_r('),
				1204	('getpwnam(', 'getpwnam_r('),
				1205	('getpwuid(', 'getpwuid_r('),
				1206	('gmtime(', 'gmtime_r('),
				1207	('localtime(', 'localtime_r('),
				1208	('rand(', 'rand_r('),
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1209	('strtok(', 'strtok_r('),
				1210	('ttyname(', 'ttyname_r('),
				1211	)
				1212
				1213
				1214	def CheckPosixThreading(filename, clean_lines, linenum, error):
				1215	"""Checks for calls to thread-unsafe functions.
				1216
				1217	Much code has been originally written without consideration of
				1218	multi-threading. Also, engineers are relying on their old experience;
				1219	they have learned posix before threading extensions were added. These
				1220	tests guide the engineers to use thread-safe functions (when using
				1221	posix directly).
				1222
				1223	Args:
				1224	filename: The name of the current file.
				1225	clean_lines: A CleansedLines instance containing the file.
				1226	linenum: The number of the line to check.
				1227	error: The function to call with any errors found.
				1228	"""
				1229	line = clean_lines.elided[linenum]
				1230	for single_thread_function, multithread_safe_function in threading_list:
				1231	ix = line.find(single_thread_function)
				1232	# Comparisons made explicit for clarity -- pylint: disable-msg=C6403
				1233	if ix >= 0 and (ix == 0 or (not line[ix - 1].isalnum() and
				1234	line[ix - 1] not in ('_', '.', '>'))):
				1235	error(filename, linenum, 'runtime/threadsafe_fn', 2,
				1236	'Consider using ' + multithread_safe_function +
				1237	'...) instead of ' + single_thread_function +
				1238	'...) for improved thread safety.')
				1239
				1240
				1241	# Matches invalid increment: *count++, which moves pointer instead of
				1242	# incrementing a value.
				1243	_RE_PATTERN_INVALID_INCREMENT = re.compile(
				1244	r'^\s\\w+(\+\+\|--);')
				1245
				1246
				1247	def CheckInvalidIncrement(filename, clean_lines, linenum, error):
				1248	"""Checks for invalid increment *count++.
				1249
				1250	For example following function:
				1251	void increment_counter(int* count) {
				1252	*count++;
				1253	}
				1254	is invalid, because it effectively does count++, moving pointer, and should
				1255	be replaced with ++count, (count)++ or *count += 1.
				1256
				1257	Args:
				1258	filename: The name of the current file.
				1259	clean_lines: A CleansedLines instance containing the file.
				1260	linenum: The number of the line to check.
				1261	error: The function to call with any errors found.
				1262	"""
				1263	line = clean_lines.elided[linenum]
				1264	if _RE_PATTERN_INVALID_INCREMENT.match(line):
				1265	error(filename, linenum, 'runtime/invalid_increment', 5,
				1266	'Changing pointer instead of value (or unused value of operator*).')
				1267
				1268
				1269	class _ClassInfo(object):
				1270	"""Stores information about a class."""
				1271
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1272	def __init__(self, name, clean_lines, linenum):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1273	self.name = name
				1274	self.linenum = linenum
				1275	self.seen_open_brace = False
				1276	self.is_derived = False
				1277	self.virtual_method_linenumber = None
				1278	self.has_virtual_destructor = False
				1279	self.brace_depth = 0
				1280
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1281	# Try to find the end of the class. This will be confused by things like:
				1282	# class A {
				1283	# } *x = { ...
				1284	#
				1285	# But it's still good enough for CheckSectionSpacing.
				1286	self.last_line = 0
				1287	depth = 0
				1288	for i in range(linenum, clean_lines.NumLines()):
				1289	line = clean_lines.lines[i]
				1290	depth += line.count('{') - line.count('}')
				1291	if not depth:
				1292	self.last_line = i
				1293	break
				1294
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1295
				1296	class _ClassState(object):
				1297	"""Holds the current state of the parse relating to class declarations.
				1298
				1299	It maintains a stack of _ClassInfos representing the parser's guess
				1300	as to the current nesting of class declarations. The innermost class
				1301	is at the top (back) of the stack. Typically, the stack will either
				1302	be empty or have exactly one entry.
				1303	"""
				1304
				1305	def __init__(self):
				1306	self.classinfo_stack = []
				1307
				1308	def CheckFinished(self, filename, error):
				1309	"""Checks that all classes have been completely parsed.
				1310
				1311	Call this when all lines in a file have been processed.
				1312	Args:
				1313	filename: The name of the current file.
				1314	error: The function to call with any errors found.
				1315	"""
				1316	if self.classinfo_stack:
				1317	# Note: This test can result in false positives if #ifdef constructs
				1318	# get in the way of brace matching. See the testBuildClass test in
				1319	# cpplint_unittest.py for an example of this.
				1320	error(filename, self.classinfo_stack[0].linenum, 'build/class', 5,
				1321	'Failed to find complete declaration of class %s' %
				1322	self.classinfo_stack[0].name)
				1323
				1324
				1325	def CheckForNonStandardConstructs(filename, clean_lines, linenum,
				1326	class_state, error):
				1327	"""Logs an error if we see certain non-ANSI constructs ignored by gcc-2.
				1328
				1329	Complain about several constructs which gcc-2 accepts, but which are
				1330	not standard C++. Warning about these in lint is one way to ease the
				1331	transition to new compilers.
				1332	- put storage class first (e.g. "static const" instead of "const static").
				1333	- "%lld" instead of %qd" in printf-type functions.
				1334	- "%1$d" is non-standard in printf-type functions.
				1335	- "\%" is an undefined character escape sequence.
				1336	- text after #endif is not allowed.
				1337	- invalid inner-style forward declaration.
				1338	- >? and <? operators, and their >?= and <?= cousins.
				1339	- classes with virtual methods need virtual destructors (compiler warning
				1340	available, but not turned on yet.)
				1341
				1342	Additionally, check for constructor/destructor style violations and reference
				1343	members, as it is very convenient to do so while checking for
				1344	gcc-2 compliance.
				1345
				1346	Args:
				1347	filename: The name of the current file.
				1348	clean_lines: A CleansedLines instance containing the file.
				1349	linenum: The number of the line to check.
				1350	class_state: A _ClassState instance which maintains information about
				1351	the current stack of nested class declarations being parsed.
				1352	error: A callable to which errors are reported, which takes 4 arguments:
				1353	filename, line number, error level, and message
				1354	"""
				1355
				1356	# Remove comments from the line, but leave in strings for now.
				1357	line = clean_lines.lines[linenum]
				1358
				1359	if Search(r'printf\s\(.".%[-+ ]?\dq', line):
				1360	error(filename, linenum, 'runtime/printf_format', 3,
				1361	'%q in format strings is deprecated. Use %ll instead.')
				1362
				1363	if Search(r'printf\s\(.".*%\d+\$', line):
				1364	error(filename, linenum, 'runtime/printf_format', 2,
				1365	'%N$ formats are unconventional. Try rewriting to avoid them.')
				1366
				1367	# Remove escaped backslashes before looking for undefined escapes.
				1368	line = line.replace('\\\\', '')
				1369
				1370	if Search(r'("\|\').*\\(%\|\[\|\(\|{)', line):
				1371	error(filename, linenum, 'build/printf_format', 3,
				1372	'%, [, (, and { are undefined character escapes. Unescape them.')
				1373
				1374	# For the rest, work with both comments and strings removed.
				1375	line = clean_lines.elided[linenum]
				1376
				1377	if Search(r'\b(const\|volatile\|void\|char\|short\|int\|long'
				1378	r'\|float\|double\|signed\|unsigned'
				1379	r'\|schar\|u?int8\|u?int16\|u?int32\|u?int64)'
				1380	r'\s+(auto\|register\|static\|extern\|typedef)\b',
				1381	line):
				1382	error(filename, linenum, 'build/storage_class', 5,
				1383	'Storage class (static, extern, typedef, etc) should be first.')
				1384
				1385	if Match(r'\s#\sendif\s*[^/\s]+', line):
				1386	error(filename, linenum, 'build/endif_comment', 5,
				1387	'Uncommented text after #endif is non-standard. Use a comment.')
				1388
				1389	if Match(r'\sclass\s+(\w+\s::\s)+\w+\s;', line):
				1390	error(filename, linenum, 'build/forward_decl', 5,
				1391	'Inner-style forward declarations are invalid. Remove this line.')
				1392
				1393	if Search(r'(\w+\|[+-]?\d+(\.\d)?)\s(<\|>)\?=?\s(\w+\|[+-]?\d+)(\.\d)?',
				1394	line):
				1395	error(filename, linenum, 'build/deprecated', 3,
				1396	'>? and <? (max and min) operators are non-standard and deprecated.')
				1397
				1398	if Search(r'^\sconst\sstring\s&\s\w+\s*;', line):
				1399	# TODO(unknown): Could it be expanded safely to arbitrary references,
				1400	# without triggering too many false positives? The first
				1401	# attempt triggered 5 warnings for mostly benign code in the regtest, hence
				1402	# the restriction.
				1403	# Here's the original regexp, for the reference:
				1404	# type_name = r'\w+((\s::\s\w+)\|(\s<\s\w+?\s*>))?'
				1405	# r'\sconst\s' + type_name + '\s&\s\w+\s*;'
				1406	error(filename, linenum, 'runtime/member_string_references', 2,
				1407	'const string& members are dangerous. It is much better to use '
				1408	'alternatives, such as pointers or simple constants.')
				1409
				1410	# Track class entry and exit, and attempt to find cases within the
				1411	# class declaration that don't meet the C++ style
				1412	# guidelines. Tracking is very dependent on the code matching Google
				1413	# style guidelines, but it seems to perform well enough in testing
				1414	# to be a worthwhile addition to the checks.
				1415	classinfo_stack = class_state.classinfo_stack
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1416	# Look for a class declaration. The regexp accounts for decorated classes
				1417	# such as in:
				1418	# class LOCKABLE API Object {
				1419	# };
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1420	class_decl_match = Match(
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1421	r'\s(template\s<[\w\s<>,:]>\s)?'
				1422	'(class\|struct)\s+([A-Z_]+\s+)(\w+(::\w+))', line)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1423	if class_decl_match:
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1424	classinfo_stack.append(_ClassInfo(
				1425	class_decl_match.group(4), clean_lines, linenum))
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1426
				1427	# Everything else in this function uses the top of the stack if it's
				1428	# not empty.
				1429	if not classinfo_stack:
				1430	return
				1431
				1432	classinfo = classinfo_stack[-1]
				1433
				1434	# If the opening brace hasn't been seen look for it and also
				1435	# parent class declarations.
				1436	if not classinfo.seen_open_brace:
				1437	# If the line has a ';' in it, assume it's a forward declaration or
				1438	# a single-line class declaration, which we won't process.
				1439	if line.find(';') != -1:
				1440	classinfo_stack.pop()
				1441	return
				1442	classinfo.seen_open_brace = (line.find('{') != -1)
				1443	# Look for a bare ':'
				1444	if Search('(^\|[^:]):($\|[^:])', line):
				1445	classinfo.is_derived = True
				1446	if not classinfo.seen_open_brace:
				1447	return # Everything else in this function is for after open brace
				1448
				1449	# The class may have been declared with namespace or classname qualifiers.
				1450	# The constructor and destructor will not have those qualifiers.
				1451	base_classname = classinfo.name.split('::')[-1]
				1452
				1453	# Look for single-argument constructors that aren't marked explicit.
				1454	# Technically a valid construct, but against style.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1455	args = Match(r'\s+(?:inline\s+)?%s\s*$([^,()]+)$'
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1456	% re.escape(base_classname),
				1457	line)
				1458	if (args and
				1459	args.group(1) != 'void' and
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1460	not Match(r'(const\s+)?%s\s(?:<\w+>\s)?&' % re.escape(base_classname),
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1461	args.group(1).strip())):
				1462	error(filename, linenum, 'runtime/explicit', 5,
				1463	'Single-argument constructors should be marked explicit.')
				1464
				1465	# Look for methods declared virtual.
				1466	if Search(r'\bvirtual\b', line):
				1467	classinfo.virtual_method_linenumber = linenum
				1468	# Only look for a destructor declaration on the same line. It would
				1469	# be extremely unlikely for the destructor declaration to occupy
				1470	# more than one line.
				1471	if Search(r'~%s\s*\(' % base_classname, line):
				1472	classinfo.has_virtual_destructor = True
				1473
				1474	# Look for class end.
				1475	brace_depth = classinfo.brace_depth
				1476	brace_depth = brace_depth + line.count('{') - line.count('}')
				1477	if brace_depth <= 0:
				1478	classinfo = classinfo_stack.pop()
				1479	# Try to detect missing virtual destructor declarations.
				1480	# For now, only warn if a non-derived class with virtual methods lacks
				1481	# a virtual destructor. This is to make it less likely that people will
				1482	# declare derived virtual destructors without declaring the base
				1483	# destructor virtual.
				1484	if ((classinfo.virtual_method_linenumber is not None) and
				1485	(not classinfo.has_virtual_destructor) and
				1486	(not classinfo.is_derived)): # Only warn for base classes
				1487	error(filename, classinfo.linenum, 'runtime/virtual', 4,
				1488	'The class %s probably needs a virtual destructor due to '
				1489	'having virtual method(s), one declared at line %d.'
				1490	% (classinfo.name, classinfo.virtual_method_linenumber))
				1491	else:
				1492	classinfo.brace_depth = brace_depth
				1493
				1494
				1495	def CheckSpacingForFunctionCall(filename, line, linenum, error):
				1496	"""Checks for the correctness of various spacing around function calls.
				1497
				1498	Args:
				1499	filename: The name of the current file.
				1500	line: The text of the line to check.
				1501	linenum: The number of the line to check.
				1502	error: The function to call with any errors found.
				1503	"""
				1504
				1505	# Since function calls often occur inside if/for/while/switch
				1506	# expressions - which have their own, more liberal conventions - we
				1507	# first see if we should be looking inside such an expression for a
				1508	# function call, to which we can apply more strict standards.
				1509	fncall = line # if there's no control flow construct, look at whole line
				1510	for pattern in (r'\bif\s$(.)$\s*{',
				1511	r'\bfor\s$(.)$\s*{',
				1512	r'\bwhile\s$(.)$\s*[{;]',
				1513	r'\bswitch\s$(.)$\s*{'):
				1514	match = Search(pattern, line)
				1515	if match:
				1516	fncall = match.group(1) # look inside the parens for function calls
				1517	break
				1518
				1519	# Except in if/for/while/switch, there should never be space
				1520	# immediately inside parens (eg "f( 3, 4 )"). We make an exception
				1521	# for nested parens ( (a+b) + c ). Likewise, there should never be
				1522	# a space before a ( when it's a function argument. I assume it's a
				1523	# function argument when the char before the whitespace is legal in
				1524	# a function name (alnum + _) and we're not starting a macro. Also ignore
				1525	# pointers and references to arrays and functions coz they're too tricky:
				1526	# we use a very simple way to recognize these:
				1527	# " (something)(maybe-something)" or
				1528	# " (something)(maybe-something," or
				1529	# " (something)[something]"
				1530	# Note that we assume the contents of [] to be short enough that
				1531	# they'll never need to wrap.
				1532	if ( # Ignore control structures.
Brian Carlstrom	df62950	2013-07-17 22:39:56 -0700	[diff] [blame]	1533	# BEGIN android-changed
				1534	# not Search(r'\b(if\|for\|while\|switch\|return\|delete)\b', fncall) and
				1535	not Search(r'\b(if\|for\|while\|switch\|return\|delete\|new)\b', fncall) and
				1536	# END android-changed
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1537	# Ignore pointers/references to functions.
				1538	not Search(r' $[^)]+$$[^)]*($\|,$)', fncall) and
				1539	# Ignore pointers/references to arrays.
				1540	not Search(r' $[^)]+$\[[^\]]+\]', fncall)):
				1541	if Search(r'\w\s\(\s(?!\s\\$)', fncall): # a ( used for a fn call
				1542	error(filename, linenum, 'whitespace/parens', 4,
				1543	'Extra space after ( in function call')
				1544	elif Search(r'$\s+(?!(\s*\$\|\()', fncall):
				1545	error(filename, linenum, 'whitespace/parens', 2,
				1546	'Extra space after (')
				1547	if (Search(r'\w\s+\(', fncall) and
				1548	not Search(r'#\s*define\|typedef', fncall)):
				1549	error(filename, linenum, 'whitespace/parens', 4,
				1550	'Extra space before ( in function call')
				1551	# If the ) is followed only by a newline or a { + newline, assume it's
				1552	# part of a control statement (if/while/etc), and don't complain
				1553	if Search(r'[^)]\s+\)\s*[^{\s]', fncall):
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1554	# If the closing parenthesis is preceded by only whitespaces,
				1555	# try to give a more descriptive error message.
				1556	if Search(r'^\s+\)', fncall):
				1557	error(filename, linenum, 'whitespace/parens', 2,
				1558	'Closing ) should be moved to the previous line')
				1559	else:
				1560	error(filename, linenum, 'whitespace/parens', 2,
				1561	'Extra space before )')
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1562
				1563
				1564	def IsBlankLine(line):
				1565	"""Returns true if the given line is blank.
				1566
				1567	We consider a line to be blank if the line is empty or consists of
				1568	only white spaces.
				1569
				1570	Args:
				1571	line: A line of a string.
				1572
				1573	Returns:
				1574	True, if the given line is blank.
				1575	"""
				1576	return not line or line.isspace()
				1577
				1578
				1579	def CheckForFunctionLengths(filename, clean_lines, linenum,
				1580	function_state, error):
				1581	"""Reports for long function bodies.
				1582
				1583	For an overview why this is done, see:
				1584	http://google-styleguide.googlecode.com/svn/trunk/cppguide.xml#Write_Short_Functions
				1585
				1586	Uses a simplistic algorithm assuming other style guidelines
				1587	(especially spacing) are followed.
				1588	Only checks unindented functions, so class members are unchecked.
				1589	Trivial bodies are unchecked, so constructors with huge initializer lists
				1590	may be missed.
				1591	Blank/comment lines are not counted so as to avoid encouraging the removal
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1592	of vertical space and comments just to get through a lint check.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1593	NOLINT on the last line of a function disables this check.
				1594
				1595	Args:
				1596	filename: The name of the current file.
				1597	clean_lines: A CleansedLines instance containing the file.
				1598	linenum: The number of the line to check.
				1599	function_state: Current function name and lines in body so far.
				1600	error: The function to call with any errors found.
				1601	"""
				1602	lines = clean_lines.lines
				1603	line = lines[linenum]
				1604	raw = clean_lines.raw_lines
				1605	raw_line = raw[linenum]
				1606	joined_line = ''
				1607
				1608	starting_func = False
				1609	regexp = r'(\w(\w\|::\|\\|\&\|\s))\(' # decls * & space::name( ...
				1610	match_result = Match(regexp, line)
				1611	if match_result:
				1612	# If the name is all caps and underscores, figure it's a macro and
				1613	# ignore it, unless it's TEST or TEST_F.
				1614	function_name = match_result.group(1).split()[-1]
				1615	if function_name == 'TEST' or function_name == 'TEST_F' or (
				1616	not Match(r'[A-Z_]+$', function_name)):
				1617	starting_func = True
				1618
				1619	if starting_func:
				1620	body_found = False
				1621	for start_linenum in xrange(linenum, clean_lines.NumLines()):
				1622	start_line = lines[start_linenum]
				1623	joined_line += ' ' + start_line.lstrip()
				1624	if Search(r'(;\|})', start_line): # Declarations and trivial functions
				1625	body_found = True
				1626	break # ... ignore
				1627	elif Search(r'{', start_line):
				1628	body_found = True
				1629	function = Search(r'((\w\|:)*)\(', line).group(1)
				1630	if Match(r'TEST', function): # Handle TEST... macros
				1631	parameter_regexp = Search(r'($.*$)', joined_line)
				1632	if parameter_regexp: # Ignore bad syntax
				1633	function += parameter_regexp.group(1)
				1634	else:
				1635	function += '()'
				1636	function_state.Begin(function)
				1637	break
				1638	if not body_found:
				1639	# No body for the function (or evidence of a non-function) was found.
				1640	error(filename, linenum, 'readability/fn_size', 5,
				1641	'Lint failed to find start of function body.')
				1642	elif Match(r'^\}\s*$', line): # function end
				1643	function_state.Check(error, filename, linenum)
				1644	function_state.End()
				1645	elif not Match(r'^\s*$', line):
				1646	function_state.Count() # Count non-blank/non-comment lines.
				1647
				1648
				1649	_RE_PATTERN_TODO = re.compile(r'^//(\s*)TODO($.+?$)?:?(\s\|$)?')
				1650
				1651
				1652	def CheckComment(comment, filename, linenum, error):
				1653	"""Checks for common mistakes in TODO comments.
				1654
				1655	Args:
				1656	comment: The text of the comment from the line in question.
				1657	filename: The name of the current file.
				1658	linenum: The number of the line to check.
				1659	error: The function to call with any errors found.
				1660	"""
				1661	match = _RE_PATTERN_TODO.match(comment)
				1662	if match:
				1663	# One whitespace is correct; zero whitespace is handled elsewhere.
				1664	leading_whitespace = match.group(1)
				1665	if len(leading_whitespace) > 1:
				1666	error(filename, linenum, 'whitespace/todo', 2,
				1667	'Too many spaces before TODO')
				1668
				1669	username = match.group(2)
				1670	if not username:
				1671	error(filename, linenum, 'readability/todo', 2,
				1672	'Missing username in TODO; it should look like '
				1673	'"// TODO(my_username): Stuff."')
				1674
				1675	middle_whitespace = match.group(3)
				1676	# Comparisons made explicit for correctness -- pylint: disable-msg=C6403
				1677	if middle_whitespace != ' ' and middle_whitespace != '':
				1678	error(filename, linenum, 'whitespace/todo', 2,
				1679	'TODO(my_username) should be followed by a space')
				1680
				1681
				1682	def CheckSpacing(filename, clean_lines, linenum, error):
				1683	"""Checks for the correctness of various spacing issues in the code.
				1684
				1685	Things we check for: spaces around operators, spaces after
				1686	if/for/while/switch, no spaces around parens in function calls, two
				1687	spaces between code and comment, don't start a block with a blank
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1688	line, don't end a function with a blank line, don't add a blank line
				1689	after public/protected/private, don't have too many blank lines in a row.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1690
				1691	Args:
				1692	filename: The name of the current file.
				1693	clean_lines: A CleansedLines instance containing the file.
				1694	linenum: The number of the line to check.
				1695	error: The function to call with any errors found.
				1696	"""
				1697
				1698	raw = clean_lines.raw_lines
				1699	line = raw[linenum]
				1700
				1701	# Before nixing comments, check if the line is blank for no good
				1702	# reason. This includes the first line after a block is opened, and
				1703	# blank lines at the end of a function (ie, right before a line like '}'
				1704	if IsBlankLine(line):
				1705	elided = clean_lines.elided
				1706	prev_line = elided[linenum - 1]
				1707	prevbrace = prev_line.rfind('{')
				1708	# TODO(unknown): Don't complain if line before blank line, and line after,
				1709	# both start with alnums and are indented the same amount.
				1710	# This ignores whitespace at the start of a namespace block
				1711	# because those are not usually indented.
				1712	if (prevbrace != -1 and prev_line[prevbrace:].find('}') == -1
				1713	and prev_line[:prevbrace].find('namespace') == -1):
				1714	# OK, we have a blank line at the start of a code block. Before we
				1715	# complain, we check if it is an exception to the rule: The previous
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1716	# non-empty line has the parameters of a function header that are indented
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1717	# 4 spaces (because they did not fit in a 80 column line when placed on
				1718	# the same line as the function name). We also check for the case where
				1719	# the previous line is indented 6 spaces, which may happen when the
				1720	# initializers of a constructor do not fit into a 80 column line.
				1721	exception = False
				1722	if Match(r' {6}\w', prev_line): # Initializer list?
				1723	# We are looking for the opening column of initializer list, which
				1724	# should be indented 4 spaces to cause 6 space indentation afterwards.
				1725	search_position = linenum-2
				1726	while (search_position >= 0
				1727	and Match(r' {6}\w', elided[search_position])):
				1728	search_position -= 1
				1729	exception = (search_position >= 0
				1730	and elided[search_position][:5] == ' :')
				1731	else:
				1732	# Search for the function arguments or an initializer list. We use a
				1733	# simple heuristic here: If the line is indented 4 spaces; and we have a
				1734	# closing paren, without the opening paren, followed by an opening brace
				1735	# or colon (for initializer lists) we assume that it is the last line of
				1736	# a function header. If we have a colon indented 4 spaces, it is an
				1737	# initializer list.
				1738	exception = (Match(r' {4}\w[^$]$\s(const\s)?(\{\s$\|:)',
				1739	prev_line)
				1740	or Match(r' {4}:', prev_line))
				1741
				1742	if not exception:
				1743	error(filename, linenum, 'whitespace/blank_line', 2,
				1744	'Blank line at the start of a code block. Is this needed?')
				1745	# This doesn't ignore whitespace at the end of a namespace block
				1746	# because that is too hard without pairing open/close braces;
				1747	# however, a special exception is made for namespace closing
				1748	# brackets which have a comment containing "namespace".
				1749	#
				1750	# Also, ignore blank lines at the end of a block in a long if-else
				1751	# chain, like this:
				1752	# if (condition1) {
				1753	# // Something followed by a blank line
				1754	#
				1755	# } else if (condition2) {
				1756	# // Something else
				1757	# }
				1758	if linenum + 1 < clean_lines.NumLines():
				1759	next_line = raw[linenum + 1]
				1760	if (next_line
				1761	and Match(r'\s*}', next_line)
				1762	and next_line.find('namespace') == -1
				1763	and next_line.find('} else ') == -1):
				1764	error(filename, linenum, 'whitespace/blank_line', 3,
				1765	'Blank line at the end of a code block. Is this needed?')
				1766
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1767	matched = Match(r'\s*(public\|protected\|private):', prev_line)
				1768	if matched:
				1769	error(filename, linenum, 'whitespace/blank_line', 3,
				1770	'Do not leave a blank line after "%s:"' % matched.group(1))
				1771
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1772	# Next, we complain if there's a comment too near the text
				1773	commentpos = line.find('//')
				1774	if commentpos != -1:
				1775	# Check if the // may be in quotes. If so, ignore it
				1776	# Comparisons made explicit for clarity -- pylint: disable-msg=C6403
				1777	if (line.count('"', 0, commentpos) -
				1778	line.count('\\"', 0, commentpos)) % 2 == 0: # not in quotes
				1779	# Allow one space for new scopes, two spaces otherwise:
				1780	if (not Match(r'^\s*{ //', line) and
				1781	((commentpos >= 1 and
				1782	line[commentpos-1] not in string.whitespace) or
				1783	(commentpos >= 2 and
				1784	line[commentpos-2] not in string.whitespace))):
				1785	error(filename, linenum, 'whitespace/comments', 2,
				1786	'At least two spaces is best between code and comments')
				1787	# There should always be a space between the // and the comment
				1788	commentend = commentpos + 2
				1789	if commentend < len(line) and not line[commentend] == ' ':
				1790	# but some lines are exceptions -- e.g. if they're big
				1791	# comment delimiters like:
				1792	# //----------------------------------------------------------
				1793	# or are an empty C++ style Doxygen comment, like:
				1794	# ///
				1795	# or they begin with multiple slashes followed by a space:
				1796	# //////// Header comment
				1797	match = (Search(r'[=/-]{4,}\s*$', line[commentend:]) or
				1798	Search(r'^/$', line[commentend:]) or
				1799	Search(r'^/+ ', line[commentend:]))
				1800	if not match:
				1801	error(filename, linenum, 'whitespace/comments', 4,
				1802	'Should have a space between // and comment')
				1803	CheckComment(line[commentpos:], filename, linenum, error)
				1804
				1805	line = clean_lines.elided[linenum] # get rid of comments and strings
				1806
				1807	# Don't try to do spacing checks for operator methods
				1808	line = re.sub(r'operator(==\|!=\|<\|<<\|<=\|>=\|>>\|>)\(', 'operator\(', line)
				1809
				1810	# We allow no-spaces around = within an if: "if ( (a=Foo()) == 0 )".
				1811	# Otherwise not. Note we only check for non-spaces on both sides;
				1812	# sometimes people put non-spaces on one side when aligning ='s among
				1813	# many lines (not that this is behavior that I approve of...)
				1814	if Search(r'[\w.]=[\w.]', line) and not Search(r'\b(if\|while) ', line):
				1815	error(filename, linenum, 'whitespace/operators', 4,
				1816	'Missing spaces around =')
				1817
				1818	# It's ok not to have spaces around binary operators like + - * /, but if
				1819	# there's too little whitespace, we get concerned. It's hard to tell,
				1820	# though, so we punt on this one for now. TODO.
				1821
				1822	# You should always have whitespace around binary operators.
				1823	# Alas, we can't test < or > because they're legitimately used sans spaces
				1824	# (a->b, vector<int> a). The only time we can tell is a < with no >, and
				1825	# only if it's not template params list spilling into the next line.
				1826	match = Search(r'[^<>=!\s](==\|!=\|<=\|>=)[^<>=!\s]', line)
				1827	if not match:
				1828	# Note that while it seems that the '<[^<]*' term in the following
				1829	# regexp could be simplified to '<.*', which would indeed match
				1830	# the same class of strings, the [^<] means that searching for the
				1831	# regexp takes linear rather than quadratic time.
				1832	if not Search(r'<[^<],\s$', line): # template params spill
				1833	match = Search(r'[^<>=!\s](<)[^<>=!\s]([^>]\|->)*$', line)
				1834	if match:
				1835	error(filename, linenum, 'whitespace/operators', 3,
				1836	'Missing spaces around %s' % match.group(1))
				1837	# We allow no-spaces around << and >> when used like this: 10<<20, but
				1838	# not otherwise (particularly, not when used as streams)
				1839	match = Search(r'[^0-9\s](<<\|>>)[^0-9\s]', line)
				1840	if match:
				1841	error(filename, linenum, 'whitespace/operators', 3,
				1842	'Missing spaces around %s' % match.group(1))
				1843
				1844	# There shouldn't be space around unary operators
				1845	match = Search(r'(!\s\|~\s\|[\s]--[\s;]\|[\s]\+\+[\s;])', line)
				1846	if match:
				1847	error(filename, linenum, 'whitespace/operators', 4,
				1848	'Extra space for operator %s' % match.group(1))
				1849
				1850	# A pet peeve of mine: no spaces after an if, while, switch, or for
				1851	match = Search(r' (if\(\|for\(\|while\(\|switch\()', line)
				1852	if match:
				1853	error(filename, linenum, 'whitespace/parens', 5,
				1854	'Missing space before ( in %s' % match.group(1))
				1855
				1856	# For if/for/while/switch, the left and right parens should be
				1857	# consistent about how many spaces are inside the parens, and
				1858	# there should either be zero or one spaces inside the parens.
				1859	# We don't want: "if ( foo)" or "if ( foo )".
				1860	# Exception: "for ( ; foo; bar)" and "for (foo; bar; )" are allowed.
				1861	match = Search(r'\b(if\|for\|while\|switch)\s*'
				1862	r'$([ ])(.).[^ ]+([ ])$\s{\s*$',
				1863	line)
				1864	if match:
				1865	if len(match.group(2)) != len(match.group(4)):
				1866	if not (match.group(3) == ';' and
				1867	len(match.group(2)) == 1 + len(match.group(4)) or
				1868	not match.group(2) and Search(r'\bfor\s$.; $', line)):
				1869	error(filename, linenum, 'whitespace/parens', 5,
				1870	'Mismatching spaces inside () in %s' % match.group(1))
				1871	if not len(match.group(2)) in [0, 1]:
				1872	error(filename, linenum, 'whitespace/parens', 5,
				1873	'Should have zero or one spaces inside ( and ) in %s' %
				1874	match.group(1))
				1875
				1876	# You should always have a space after a comma (either as fn arg or operator)
				1877	if Search(r',[^\s]', line):
				1878	error(filename, linenum, 'whitespace/comma', 3,
				1879	'Missing space after ,')
				1880
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1881	# You should always have a space after a semicolon
				1882	# except for few corner cases
				1883	# TODO(unknown): clarify if 'if (1) { return 1;}' is requires one more
				1884	# space after ;
				1885	if Search(r';[^\s};\\)/]', line):
				1886	error(filename, linenum, 'whitespace/semicolon', 3,
				1887	'Missing space after ;')
				1888
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1889	# Next we will look for issues with function calls.
				1890	CheckSpacingForFunctionCall(filename, line, linenum, error)
				1891
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1892	# Except after an opening paren, or after another opening brace (in case of
				1893	# an initializer list, for instance), you should have spaces before your
				1894	# braces. And since you should never have braces at the beginning of a line,
				1895	# this is an easy test.
				1896	if Search(r'[^ ({]{', line):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1897	error(filename, linenum, 'whitespace/braces', 5,
				1898	'Missing space before {')
				1899
				1900	# Make sure '} else {' has spaces.
				1901	if Search(r'}else', line):
				1902	error(filename, linenum, 'whitespace/braces', 5,
				1903	'Missing space before else')
				1904
				1905	# You shouldn't have spaces before your brackets, except maybe after
				1906	# 'delete []' or 'new char * []'.
				1907	if Search(r'\w\s+\[', line) and not Search(r'delete\s+\[', line):
				1908	error(filename, linenum, 'whitespace/braces', 5,
				1909	'Extra space before [')
				1910
				1911	# You shouldn't have a space before a semicolon at the end of the line.
				1912	# There's a special case for "for" since the style guide allows space before
				1913	# the semicolon there.
				1914	if Search(r':\s;\s$', line):
				1915	error(filename, linenum, 'whitespace/semicolon', 5,
				1916	'Semicolon defining empty statement. Use { } instead.')
				1917	elif Search(r'^\s;\s$', line):
				1918	error(filename, linenum, 'whitespace/semicolon', 5,
				1919	'Line contains only semicolon. If this should be an empty statement, '
				1920	'use { } instead.')
				1921	elif (Search(r'\s+;\s*$', line) and
				1922	not Search(r'\bfor\b', line)):
				1923	error(filename, linenum, 'whitespace/semicolon', 5,
				1924	'Extra space before last semicolon. If this should be an empty '
				1925	'statement, use { } instead.')
				1926
				1927
def CheckSectionSpacing(filename, clean_lines, class_info, linenum, error):
  """Checks for additional blank line issues related to sections.

  Currently the only thing checked here is blank line before protected/private.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    class_info: A _ClassInfo objects.
    linenum: The number of the line to check.
    error: The function to call with any errors found.
  """
  # Skip checks if the class is small, where small means 25 lines or less.
  # 25 lines seems like a good cutoff since that's the usual height of
  # terminals, and any class that can't fit in one screen can't really
  # be considered "small".
  #
  # Also skip checks if we are on the first line.  This accounts for
  # classes that look like
  #   class Foo { public: ... };
  #
  # If we didn't find the end of the class, last_line would be zero,
  # and the check will be skipped by the first condition.
  if (class_info.last_line - class_info.linenum <= 24 or
      linenum <= class_info.linenum):
    return

  matched = Match(r'\s*(public|protected|private):', clean_lines.lines[linenum])
  if matched:
    # Issue warning if the line before public/protected/private was
    # not a blank line, but don't do this if the previous line contains
    # "class" or "struct".  This can happen two ways:
    #  - We are at the beginning of the class.
    #  - We are forward-declaring an inner class that is semantically
    #    private, but needed to be public for implementation reasons.
    prev_line = clean_lines.lines[linenum - 1]
    if (not IsBlankLine(prev_line) and
        not Search(r'\b(class|struct)\b', prev_line)):
      # Try a bit harder to find the beginning of the class.  This is to
      # account for multi-line base-specifier lists, e.g.:
      #   class Derived
      #       : public Base {
      end_class_head = class_info.linenum
      for i in range(class_info.linenum, linenum):
        if Search(r'\{\s*$', clean_lines.lines[i]):
          end_class_head = i
          break
      # Only complain when the section label does not directly follow the
      # line that opens the class body.
      if end_class_head < linenum - 1:
        error(filename, linenum, 'whitespace/blank_line', 3,
              '"%s:" should be preceded by a blank line' % matched.group(1))
				1978
				1979
def GetPreviousNonBlankLine(clean_lines, linenum):
  """Finds the closest non-blank line above the given line.

  The search walks upward through clean_lines.elided, starting at the line
  just before linenum.

  Args:
    clean_lines: A CleansedLines instance containing the file contents.
    linenum: The number of the line to check.

  Returns:
    A tuple with two elements.  The first element is the contents of the last
    non-blank line before the current line, or the empty string if this is the
    first non-blank line.  The second is the line number of that line, or -1
    if this is the first non-blank line.
  """
  candidate = linenum
  while candidate > 0:
    candidate -= 1
    text = clean_lines.elided[candidate]
    if not IsBlankLine(text):
      return (text, candidate)
  # Ran off the top of the file without finding any content.
  return ('', -1)
				2001
				2002
				2003	def CheckBraces(filename, clean_lines, linenum, error):
				2004	"""Looks for misplaced braces (e.g. at the end of line).
				2005
				2006	Args:
				2007	filename: The name of the current file.
				2008	clean_lines: A CleansedLines instance containing the file.
				2009	linenum: The number of the line to check.
				2010	error: The function to call with any errors found.
				2011	"""
				2012
				2013	line = clean_lines.elided[linenum] # get rid of comments and strings
				2014
				2015	if Match(r'\s{\s$', line):
				2016	# We allow an open brace to start a line in the case where someone
				2017	# is using braces in a block to explicitly create a new scope,
				2018	# which is commonly used to control the lifetime of
				2019	# stack-allocated variables. We don't detect this perfectly: we
				2020	# just don't complain if the last non-whitespace character on the
				2021	# previous non-blank line is ';', ':', '{', or '}'.
				2022	prevline = GetPreviousNonBlankLine(clean_lines, linenum)[0]
				2023	if not Search(r'[;:}{]\s*$', prevline):
				2024	error(filename, linenum, 'whitespace/braces', 4,
				2025	'{ should almost always be at the end of the previous line')
				2026
				2027	# An else clause should be on the same line as the preceding closing brace.
				2028	if Match(r'\selse\s', line):
				2029	prevline = GetPreviousNonBlankLine(clean_lines, linenum)[0]
				2030	if Match(r'\s}\s$', prevline):
				2031	error(filename, linenum, 'whitespace/newline', 4,
				2032	'An else should appear on the same line as the preceding }')
				2033
				2034	# If braces come on one side of an else, they should be on both.
				2035	# However, we have to worry about "else if" that spans multiple lines!
				2036	if Search(r'}\selse[^{]$', line) or Match(r'[^}]else\s{', line):
				2037	if Search(r'}\selse if([^{])$', line): # could be multi-line if
				2038	# find the ( after the if
				2039	pos = line.find('else if')
				2040	pos = line.find('(', pos)
				2041	if pos > 0:
				2042	(endline, _, endpos) = CloseExpression(clean_lines, linenum, pos)
				2043	if endline[endpos:].find('{') == -1: # must be brace after if
				2044	error(filename, linenum, 'readability/braces', 5,
				2045	'If an else has a brace on one side, it should have it on both')
				2046	else: # common case: else not followed by a multi-line if
				2047	error(filename, linenum, 'readability/braces', 5,
				2048	'If an else has a brace on one side, it should have it on both')
				2049
				2050	# Likewise, an else should never have the else clause on the same line
				2051	if Search(r'\belse [^\s{]', line) and not Search(r'\belse if\b', line):
				2052	error(filename, linenum, 'whitespace/newline', 4,
				2053	'Else clause should never be on same line as else (use 2 lines)')
				2054
				2055	# In the same way, a do/while should never be on one line
				2056	if Match(r'\s*do [^\s{]', line):
				2057	error(filename, linenum, 'whitespace/newline', 4,
				2058	'do/while clauses should not be on a single line')
				2059
				2060	# Braces shouldn't be followed by a ; unless they're defining a struct
				2061	# or initializing an array.
				2062	# We can't tell in general, but we can for some common cases.
				2063	prevlinenum = linenum
				2064	while True:
				2065	(prevline, prevlinenum) = GetPreviousNonBlankLine(clean_lines, prevlinenum)
				2066	if Match(r'\s+{.}\s;', line) and not prevline.count(';'):
				2067	line = prevline + line
				2068	else:
				2069	break
				2070	if (Search(r'{.}\s;', line) and
				2071	line.count('{') == line.count('}') and
				2072	not Search(r'struct\|class\|enum\|\s=\s{', line)):
				2073	error(filename, linenum, 'readability/braces', 4,
				2074	"You don't need a ; after a }")
				2075
				2076
				2077	def ReplaceableCheck(operator, macro, line):
				2078	"""Determine whether a basic CHECK can be replaced with a more specific one.
				2079
				2080	For example suggest using CHECK_EQ instead of CHECK(a == b) and
				2081	similarly for CHECK_GE, CHECK_GT, CHECK_LE, CHECK_LT, CHECK_NE.
				2082
				2083	Args:
				2084	operator: The C++ operator used in the CHECK.
				2085	macro: The CHECK or EXPECT macro being called.
				2086	line: The current source line.
				2087
				2088	Returns:
				2089	True if the CHECK can be replaced with a more specific one.
				2090	"""
				2091
				2092	# This matches decimal and hex integers, strings, and chars (in that order).
				2093	match_constant = r'([-+]?(\d+\|0[xX][0-9a-fA-F]+)[lLuU]{0,3}\|"."\|\'.\')'
				2094
				2095	# Expression to match two sides of the operator with something that
				2096	# looks like a literal, since CHECK(x == iterator) won't compile.
				2097	# This means we can't catch all the cases where a more specific
				2098	# CHECK is possible, but it's less annoying than dealing with
				2099	# extraneous warnings.
				2100	match_this = (r'\s' + macro + r'\((\s' +
				2101	match_constant + r'\s' + operator + r'[^<>].\|'
				2102	r'.[^<>]' + operator + r'\s' + match_constant +
				2103	r'\s*\))')
				2104
				2105	# Don't complain about CHECK(x == NULL) or similar because
				2106	# CHECK_EQ(x, NULL) won't compile (requires a cast).
				2107	# Also, don't complain about more complex boolean expressions
				2108	# involving && or \|\| such as CHECK(a == b \|\| c == d).
				2109	return Match(match_this, line) and not Search(r'NULL\|&&\|\\|\\|', line)
				2110
				2111
				2112	def CheckCheck(filename, clean_lines, linenum, error):
				2113	"""Checks the use of CHECK and EXPECT macros.
				2114
				2115	Args:
				2116	filename: The name of the current file.
				2117	clean_lines: A CleansedLines instance containing the file.
				2118	linenum: The number of the line to check.
				2119	error: The function to call with any errors found.
				2120	"""
				2121
				2122	# Decide the set of replacement macros that should be suggested
				2123	raw_lines = clean_lines.raw_lines
				2124	current_macro = ''
				2125	for macro in _CHECK_MACROS:
				2126	if raw_lines[linenum].find(macro) >= 0:
				2127	current_macro = macro
				2128	break
				2129	if not current_macro:
				2130	# Don't waste time here if line doesn't contain 'CHECK' or 'EXPECT'
				2131	return
				2132
				2133	line = clean_lines.elided[linenum] # get rid of comments and strings
				2134
				2135	# Encourage replacing plain CHECKs with CHECK_EQ/CHECK_NE/etc.
				2136	for operator in ['==', '!=', '>=', '>', '<=', '<']:
				2137	if ReplaceableCheck(operator, current_macro, line):
				2138	error(filename, linenum, 'readability/check', 2,
				2139	'Consider using %s instead of %s(a %s b)' % (
				2140	_CHECK_REPLACEMENT[current_macro][operator],
				2141	current_macro, operator))
				2142	break
				2143
				2144
				2145	def GetLineWidth(line):
				2146	"""Determines the width of the line in column positions.
				2147
				2148	Args:
				2149	line: A string, which may be a Unicode string.
				2150
				2151	Returns:
				2152	The width of the line in column positions, accounting for Unicode
				2153	combining characters and wide characters.
				2154	"""
				2155	if isinstance(line, unicode):
				2156	width = 0
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2157	for uc in unicodedata.normalize('NFC', line):
				2158	if unicodedata.east_asian_width(uc) in ('W', 'F'):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2159	width += 2
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2160	elif not unicodedata.combining(uc):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2161	width += 1
				2162	return width
				2163	else:
				2164	return len(line)
				2165
				2166
def CheckStyle(filename, clean_lines, linenum, file_extension, class_state,
               error):
  """Checks rules from the 'C++ style rules' section of cppguide.html.

  Most of these rules are hard to test (naming, comment style), but we
  do what we can. In particular we check for 2-space indents, line lengths,
  tab usage, spaces inside code, etc.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    file_extension: The extension (without the dot) of the filename.
    class_state: Object exposing a classinfo_stack sequence. When it is
      falsy or the stack is empty, the section-spacing check is skipped;
      otherwise the last stack entry is passed to CheckSectionSpacing.
    error: The function to call with any errors found.
  """

  raw_lines = clean_lines.raw_lines
  line = raw_lines[linenum]

  if line.find('\t') != -1:
    error(filename, linenum, 'whitespace/tab', 1,
          'Tab found; better to use spaces')

  # One or three blank spaces at the beginning of the line is weird; it's
  # hard to reconcile that with 2-space indents.
  # NOTE: here are the conditions rob pike used for his tests. Mine aren't
  # as sophisticated, but it may be worth becoming so: RLENGTH==initial_spaces
  # if(RLENGTH > 20) complain = 0;
  # if(match($0, " +(error|private|public|protected):")) complain = 0;
  # if(match(prev, "&& *$")) complain = 0;
  # if(match(prev, "\\|\\| *$")) complain = 0;
  # if(match(prev, "[\",=><] *$")) complain = 0;
  # if(match($0, " <<")) complain = 0;
  # if(match(prev, " +for \\(")) complain = 0;
  # if(prevodd && match(prevprev, " +for \\(")) complain = 0;
  initial_spaces = 0
  cleansed_line = clean_lines.elided[linenum]
  while initial_spaces < len(line) and line[initial_spaces] == ' ':
    initial_spaces += 1
  if line and line[-1].isspace():
    error(filename, linenum, 'whitespace/end_of_line', 4,
          'Line ends in whitespace. Consider deleting these extra spaces.')
  # There are certain situations we allow one space, notably for labels
  elif ((initial_spaces == 1 or initial_spaces == 3) and
        not Match(r'\s*\w+\s*:\s*$', cleansed_line)):
    error(filename, linenum, 'whitespace/indent', 3,
          'Weird number of spaces at line-start. '
          'Are you using a 2-space indent?')
  # Labels should always be indented at least one space.
  elif not initial_spaces and line[:2] != '//' and Search(r'[^:]:\s*$',
                                                          line):
    error(filename, linenum, 'whitespace/labels', 4,
          'Labels should always be indented at least one space. '
          'If this is a member-initializer list in a constructor or '
          'the base class list in a class definition, the colon should '
          'be on the following line.')

  # Check if the line is a header guard.
  is_header_guard = False
  if file_extension == 'h':
    cppvar = GetHeaderGuardCPPVariable(filename)
    # The closing guard is written with two spaces before the comment, as
    # the style guide requires for trailing comments.
    if (line.startswith('#ifndef %s' % cppvar) or
        line.startswith('#define %s' % cppvar) or
        line.startswith('#endif  // %s' % cppvar)):
      is_header_guard = True
  # #include lines and header guards can be long, since there's no clean way to
  # split them.
  #
  # URLs can be long too. It's possible to split these, but it makes them
  # harder to cut&paste.
  #
  # The "$Id:...$" comment may also get very long without it being the
  # developers fault.
  if (not line.startswith('#include') and not is_header_guard and
      not Match(r'^\s*//.*http(s?)://\S*$', line) and
      not Match(r'^// \$Id:.*#[0-9]+ \$$', line)):
    line_width = GetLineWidth(line)
    if line_width > 100:
      error(filename, linenum, 'whitespace/line_length', 4,
            'Lines should very rarely be longer than 100 characters')
    elif line_width > 80:
      error(filename, linenum, 'whitespace/line_length', 2,
            'Lines should be <= 80 characters long')

  if (cleansed_line.count(';') > 1 and
      # for loops are allowed two ;'s (and may run over two lines).
      cleansed_line.find('for') == -1 and
      (GetPreviousNonBlankLine(clean_lines, linenum)[0].find('for') == -1 or
       GetPreviousNonBlankLine(clean_lines, linenum)[0].find(';') != -1) and
      # It's ok to have many commands in a switch case that fits in 1 line
      not ((cleansed_line.find('case ') != -1 or
            cleansed_line.find('default:') != -1) and
           cleansed_line.find('break;') != -1)):
    error(filename, linenum, 'whitespace/newline', 4,
          'More than one command on the same line')

  # Some more style checks
  CheckBraces(filename, clean_lines, linenum, error)
  CheckSpacing(filename, clean_lines, linenum, error)
  CheckCheck(filename, clean_lines, linenum, error)
  if class_state and class_state.classinfo_stack:
    CheckSectionSpacing(filename, clean_lines,
                        class_state.classinfo_stack[-1], linenum, error)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2271
				2272
				2273	_RE_PATTERN_INCLUDE_NEW_STYLE = re.compile(r'#include +"[^/]+\.h"')
				2274	_RE_PATTERN_INCLUDE = re.compile(r'^\s#\sinclude\s([<"])([^>"])[>"].*$')
				2275	# Matches the first component of a filename delimited by -s and _s. That is:
				2276	# _RE_FIRST_COMPONENT.match('foo').group(0) == 'foo'
				2277	# _RE_FIRST_COMPONENT.match('foo.cc').group(0) == 'foo'
				2278	# _RE_FIRST_COMPONENT.match('foo-bar_baz.cc').group(0) == 'foo'
				2279	# _RE_FIRST_COMPONENT.match('foo_bar-baz.cc').group(0) == 'foo'
				2280	_RE_FIRST_COMPONENT = re.compile(r'^[^-_.]+')
				2281
				2282
				2283	def _DropCommonSuffixes(filename):
				2284	"""Drops common suffixes like _test.cc or -inl.h from filename.
				2285
				2286	For example:
				2287	>>> _DropCommonSuffixes('foo/foo-inl.h')
				2288	'foo/foo'
				2289	>>> _DropCommonSuffixes('foo/bar/foo.cc')
				2290	'foo/bar/foo'
				2291	>>> _DropCommonSuffixes('foo/foo_internal.h')
				2292	'foo/foo'
				2293	>>> _DropCommonSuffixes('foo/foo_unusualinternal.h')
				2294	'foo/foo_unusualinternal'
				2295
				2296	Args:
				2297	filename: The input filename.
				2298
				2299	Returns:
				2300	The filename with the common suffix removed.
				2301	"""
				2302	for suffix in ('test.cc', 'regtest.cc', 'unittest.cc',
				2303	'inl.h', 'impl.h', 'internal.h'):
				2304	if (filename.endswith(suffix) and len(filename) > len(suffix) and
				2305	filename[-len(suffix) - 1] in ('-', '_')):
				2306	return filename[:-len(suffix) - 1]
				2307	return os.path.splitext(filename)[0]
				2308
				2309
				2310	def _IsTestFilename(filename):
				2311	"""Determines if the given filename has a suffix that identifies it as a test.
				2312
				2313	Args:
				2314	filename: The input filename.
				2315
				2316	Returns:
				2317	True if 'filename' looks like a test, False otherwise.
				2318	"""
				2319	if (filename.endswith('_test.cc') or
				2320	filename.endswith('_unittest.cc') or
				2321	filename.endswith('_regtest.cc')):
				2322	return True
				2323	else:
				2324	return False
				2325
				2326
				2327	def _ClassifyInclude(fileinfo, include, is_system):
				2328	"""Figures out what kind of header 'include' is.
				2329
				2330	Args:
				2331	fileinfo: The current file cpplint is running over. A FileInfo instance.
				2332	include: The path to a #included file.
				2333	is_system: True if the #include used <> rather than "".
				2334
				2335	Returns:
				2336	One of the _XXX_HEADER constants.
				2337
				2338	For example:
				2339	>>> _ClassifyInclude(FileInfo('foo/foo.cc'), 'stdio.h', True)
				2340	_C_SYS_HEADER
				2341	>>> _ClassifyInclude(FileInfo('foo/foo.cc'), 'string', True)
				2342	_CPP_SYS_HEADER
				2343	>>> _ClassifyInclude(FileInfo('foo/foo.cc'), 'foo/foo.h', False)
				2344	_LIKELY_MY_HEADER
				2345	>>> _ClassifyInclude(FileInfo('foo/foo_unknown_extension.cc'),
				2346	... 'bar/foo_other_ext.h', False)
				2347	_POSSIBLE_MY_HEADER
				2348	>>> _ClassifyInclude(FileInfo('foo/foo.cc'), 'foo/bar.h', False)
				2349	_OTHER_HEADER
				2350	"""
				2351	# This is a list of all standard c++ header files, except
				2352	# those already checked for above.
				2353	is_stl_h = include in _STL_HEADERS
				2354	is_cpp_h = is_stl_h or include in _CPP_HEADERS
				2355
				2356	if is_system:
				2357	if is_cpp_h:
				2358	return _CPP_SYS_HEADER
				2359	else:
				2360	return _C_SYS_HEADER
				2361
				2362	# If the target file and the include we're checking share a
				2363	# basename when we drop common extensions, and the include
				2364	# lives in . , then it's likely to be owned by the target file.
				2365	target_dir, target_base = (
				2366	os.path.split(_DropCommonSuffixes(fileinfo.RepositoryName())))
				2367	include_dir, include_base = os.path.split(_DropCommonSuffixes(include))
				2368	if target_base == include_base and (
				2369	include_dir == target_dir or
				2370	include_dir == os.path.normpath(target_dir + '/../public')):
				2371	return _LIKELY_MY_HEADER
				2372
				2373	# If the target and include share some initial basename
				2374	# component, it's possible the target is implementing the
				2375	# include, so it's allowed to be first, but we'll never
				2376	# complain if it's not there.
				2377	target_first_component = _RE_FIRST_COMPONENT.match(target_base)
				2378	include_first_component = _RE_FIRST_COMPONENT.match(include_base)
				2379	if (target_first_component and include_first_component and
				2380	target_first_component.group(0) ==
				2381	include_first_component.group(0)):
				2382	return _POSSIBLE_MY_HEADER
				2383
				2384	return _OTHER_HEADER
				2385
				2386
				2387
				2388	def CheckIncludeLine(filename, clean_lines, linenum, include_state, error):
				2389	"""Check rules that are applicable to #include lines.
				2390
				2391	Strings on #include lines are NOT removed from elided line, to make
				2392	certain tasks easier. However, to prevent false positives, checks
				2393	applicable to #include lines in CheckLanguage must be put here.
				2394
				2395	Args:
				2396	filename: The name of the current file.
				2397	clean_lines: A CleansedLines instance containing the file.
				2398	linenum: The number of the line to check.
				2399	include_state: An _IncludeState instance in which the headers are inserted.
				2400	error: The function to call with any errors found.
				2401	"""
				2402	fileinfo = FileInfo(filename)
				2403
				2404	line = clean_lines.lines[linenum]
				2405
				2406	# "include" should use the new style "foo/bar.h" instead of just "bar.h"
				2407	if _RE_PATTERN_INCLUDE_NEW_STYLE.search(line):
				2408	error(filename, linenum, 'build/include', 4,
				2409	'Include the directory when naming .h files')
				2410
				2411	# we shouldn't include a file more than once. actually, there are a
				2412	# handful of instances where doing so is okay, but in general it's
				2413	# not.
				2414	match = _RE_PATTERN_INCLUDE.search(line)
				2415	if match:
				2416	include = match.group(2)
				2417	is_system = (match.group(1) == '<')
				2418	if include in include_state:
				2419	error(filename, linenum, 'build/include', 4,
				2420	'"%s" already included at %s:%s' %
				2421	(include, filename, include_state[include]))
				2422	else:
				2423	include_state[include] = linenum
				2424
				2425	# We want to ensure that headers appear in the right order:
				2426	# 1) for foo.cc, foo.h (preferred location)
				2427	# 2) c system files
				2428	# 3) cpp system files
				2429	# 4) for foo.cc, foo.h (deprecated location)
				2430	# 5) other google headers
				2431	#
				2432	# We classify each include statement as one of those 5 types
				2433	# using a number of techniques. The include_state object keeps
				2434	# track of the highest type seen, and complains if we see a
				2435	# lower type after that.
				2436	error_message = include_state.CheckNextIncludeOrder(
				2437	_ClassifyInclude(fileinfo, include, is_system))
				2438	if error_message:
				2439	error(filename, linenum, 'build/include_order', 4,
				2440	'%s. Should be: %s.h, c system, c++ system, other.' %
				2441	(error_message, fileinfo.BaseName()))
				2442	if not include_state.IsInAlphabeticalOrder(include):
				2443	error(filename, linenum, 'build/include_alpha', 4,
				2444	'Include "%s" not in alphabetical order' % include)
				2445
				2446	# Look for any of the stream classes that are part of standard C++.
				2447	match = _RE_PATTERN_INCLUDE.match(line)
				2448	if match:
				2449	include = match.group(2)
				2450	if Match(r'(f\|ind\|io\|i\|o\|parse\|pf\|stdio\|str\|)?stream$', include):
				2451	# Many unit tests use cout, so we exempt them.
				2452	if not _IsTestFilename(filename):
				2453	error(filename, linenum, 'readability/streams', 3,
				2454	'Streams are highly discouraged.')
				2455
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2456
				2457	def _GetTextInside(text, start_pattern):
				2458	"""Retrieves all the text between matching open and close parentheses.
				2459
				2460	Given a string of lines and a regular expression string, retrieve all the text
				2461	following the expression and between opening punctuation symbols like
				2462	(, [, or {, and the matching close-punctuation symbol. This properly nested
				2463	occurrences of the punctuations, so for the text like
				2464	printf(a(), b(c()));
				2465	a call to _GetTextInside(text, r'printf\(') will return 'a(), b(c())'.
				2466	start_pattern must match string having an open punctuation symbol at the end.
				2467
				2468	Args:
				2469	text: The lines to extract text. Its comments and strings must be elided.
				2470	It can be single line and can span multiple lines.
				2471	start_pattern: The regexp string indicating where to start extracting
				2472	the text.
				2473	Returns:
				2474	The extracted text.
				2475	None if either the opening string or ending punctuation could not be found.
				2476	"""
				2477	# TODO(sugawarayu): Audit cpplint.py to see what places could be profitably
				2478	# rewritten to use _GetTextInside (and use inferior regexp matching today).
				2479
				2480	# Give opening punctuations to get the matching close-punctuations.
				2481	matching_punctuation = {'(': ')', '{': '}', '[': ']'}
				2482	closing_punctuation = set(matching_punctuation.itervalues())
				2483
				2484	# Find the position to start extracting text.
				2485	match = re.search(start_pattern, text, re.M)
				2486	if not match: # start_pattern not found in text.
				2487	return None
				2488	start_position = match.end(0)
				2489
				2490	assert start_position > 0, (
				2491	'start_pattern must ends with an opening punctuation.')
				2492	assert text[start_position - 1] in matching_punctuation, (
				2493	'start_pattern must ends with an opening punctuation.')
				2494	# Stack of closing punctuations we expect to have in text after position.
				2495	punctuation_stack = [matching_punctuation[text[start_position - 1]]]
				2496	position = start_position
				2497	while punctuation_stack and position < len(text):
				2498	if text[position] == punctuation_stack[-1]:
				2499	punctuation_stack.pop()
				2500	elif text[position] in closing_punctuation:
				2501	# A closing punctuation without matching opening punctuations.
				2502	return None
				2503	elif text[position] in matching_punctuation:
				2504	punctuation_stack.append(matching_punctuation[text[position]])
				2505	position += 1
				2506	if punctuation_stack:
				2507	# Opening punctuations left without matching close-punctuations.
				2508	return None
				2509	# punctuations match.
				2510	return text[start_position:position - 1]
				2511
				2512
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2513	def CheckLanguage(filename, clean_lines, linenum, file_extension, include_state,
				2514	error):
				2515	"""Checks rules from the 'C++ language rules' section of cppguide.html.
				2516
				2517	Some of these rules are hard to test (function overloading, using
				2518	uint32 inappropriately), but we do the best we can.
				2519
				2520	Args:
				2521	filename: The name of the current file.
				2522	clean_lines: A CleansedLines instance containing the file.
				2523	linenum: The number of the line to check.
				2524	file_extension: The extension (without the dot) of the filename.
				2525	include_state: An _IncludeState instance in which the headers are inserted.
				2526	error: The function to call with any errors found.
				2527	"""
				2528	# If the line is empty or consists of entirely a comment, no need to
				2529	# check it.
				2530	line = clean_lines.elided[linenum]
				2531	if not line:
				2532	return
				2533
				2534	match = _RE_PATTERN_INCLUDE.search(line)
				2535	if match:
				2536	CheckIncludeLine(filename, clean_lines, linenum, include_state, error)
				2537	return
				2538
				2539	# Create an extended_line, which is the concatenation of the current and
				2540	# next lines, for more effective checking of code that may span more than one
				2541	# line.
				2542	if linenum + 1 < clean_lines.NumLines():
				2543	extended_line = line + clean_lines.elided[linenum + 1]
				2544	else:
				2545	extended_line = line
				2546
				2547	# Make Windows paths like Unix.
				2548	fullname = os.path.abspath(filename).replace('\\', '/')
				2549
				2550	# TODO(unknown): figure out if they're using default arguments in fn proto.
				2551
				2552	# Check for non-const references in functions. This is tricky because &
				2553	# is also used to take the address of something. We allow <> for templates,
				2554	# (ignoring whatever is between the braces) and : for classes.
				2555	# These are complicated re's. They try to capture the following:
				2556	# paren (for fn-prototype start), typename, &, varname. For the const
				2557	# version, we're willing for const to be before typename or after
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2558	# Don't check the implementation on same line.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2559	fnline = line.split('{', 1)[0]
				2560	if (len(re.findall(r'\([^()]\b(?:[\w:]\|<[^()]>)+(\s?&\|&\s?)\w+', fnline)) >
				2561	len(re.findall(r'\([^()]*\bconst\s+(?:typename\s+)?(?:struct\s+)?'
				2562	r'(?:[\w:]\|<[^()]*>)+(\s?&\|&\s?)\w+', fnline)) +
				2563	len(re.findall(r'\([^()]\b(?:[\w:]\|<[^()]>)+\s+const(\s?&\|&\s?)[\w]+',
				2564	fnline))):
				2565
				2566	# We allow non-const references in a few standard places, like functions
				2567	# called "swap()" or iostream operators like "<<" or ">>".
				2568	if not Search(
				2569	r'(swap\|Swap\|operator[<>][<>])\s\(\s(?:[\w:]\|<.>)+\s&',
				2570	fnline):
				2571	error(filename, linenum, 'runtime/references', 2,
				2572	'Is this a non-const reference? '
				2573	'If so, make const or use a pointer.')
				2574
				2575	# Check to see if they're using an conversion function cast.
				2576	# I just try to capture the most common basic types, though there are more.
				2577	# Parameterless conversion functions, such as bool(), are allowed as they are
				2578	# probably a member operator declaration or default constructor.
				2579	match = Search(
				2580	r'(\bnew\s+)?\b' # Grab 'new' operator, if it's there
Elliott Hughes	08fc03a	2012-06-26 17:34:00 -0700	[diff] [blame]	2581	r'(int\|float\|double\|bool\|char\|u?int(8\|16\|32\|64)_t)\([^)]', line) # TODO(enh): upstream change to handle all stdint types.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2582	if match:
				2583	# gMock methods are defined using some variant of MOCK_METHODx(name, type)
				2584	# where type may be float(), int(string), etc. Without context they are
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2585	# virtually indistinguishable from int(x) casts. Likewise, gMock's
				2586	# MockCallback takes a template parameter of the form return_type(arg_type),
				2587	# which looks much like the cast we're trying to detect.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2588	if (match.group(1) is None and # If new operator, then this isn't a cast
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2589	not (Match(r'^\s*MOCK_(CONST_)?METHOD\d+(_T)?\(', line) or
				2590	Match(r'^\sMockCallback<.>', line))):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2591	error(filename, linenum, 'readability/casting', 4,
				2592	'Using deprecated casting style. '
				2593	'Use static_cast<%s>(...) instead' %
				2594	match.group(2))
				2595
				2596	CheckCStyleCast(filename, linenum, line, clean_lines.raw_lines[linenum],
				2597	'static_cast',
Elliott Hughes	08fc03a	2012-06-26 17:34:00 -0700	[diff] [blame]	2598	r'$(int\|float\|double\|bool\|char\|u?int(8\|16\|32\|64))$', error) # TODO(enh): upstream change to handle all stdint types.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2599
				2600	# This doesn't catch all cases. Consider (const char * const)"hello".
				2601	#
				2602	# (char *) "foo" should always be a const_cast (reinterpret_cast won't
				2603	# compile).
				2604	if CheckCStyleCast(filename, linenum, line, clean_lines.raw_lines[linenum],
				2605	'const_cast', r'$(char\s?\+\s?)$\s"', error):
				2606	pass
				2607	else:
				2608	# Check pointer casts for other than string constants
				2609	CheckCStyleCast(filename, linenum, line, clean_lines.raw_lines[linenum],
				2610	'reinterpret_cast', r'$(\w+\s?\*+\s?)$', error)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2611
				2612	# In addition, we look for people taking the address of a cast. This
				2613	# is dangerous -- casts can assign to temporaries, so the pointer doesn't
				2614	# point where you think.
				2615	if Search(
				2616	r'(&$[^)]+$[\w(])\|(&(static\|dynamic\|reinterpret)_cast\b)', line):
				2617	error(filename, linenum, 'runtime/casting', 4,
				2618	('Are you taking an address of a cast? '
				2619	'This is dangerous: could be a temp var. '
				2620	'Take the address before doing the cast, rather than after'))
				2621
				2622	# Check for people declaring static/global STL strings at the top level.
				2623	# This is dangerous because the C++ language does not guarantee that
				2624	# globals with constructors are initialized before the first access.
				2625	match = Match(
				2626	r'((?:\|static +)(?:\|const +))string +([a-zA-Z0-9_:]+)\b(.*)',
				2627	line)
				2628	# Make sure it's not a function.
				2629	# Function template specialization looks like: "string foo<Type>(...".
				2630	# Class template definitions look like: "string Foo<Type>::Method(...".
				2631	if match and not Match(r'\s(<.>)?(::[a-zA-Z0-9_]+)?\s*\(([^"]\|$)',
				2632	match.group(3)):
				2633	error(filename, linenum, 'runtime/string', 4,
				2634	'For a static/global string constant, use a C style string instead: '
				2635	'"%schar %s[]".' %
				2636	(match.group(1), match.group(2)))
				2637
				2638	# Check that we're not using RTTI outside of testing code.
				2639	if Search(r'\bdynamic_cast<', line) and not _IsTestFilename(filename):
				2640	error(filename, linenum, 'runtime/rtti', 5,
				2641	'Do not use dynamic_cast<>. If you need to cast within a class '
				2642	"hierarchy, use static_cast<> to upcast. Google doesn't support "
				2643	'RTTI.')
				2644
				2645	if Search(r'\b([A-Za-z0-9_]*_)$\1$', line):
				2646	error(filename, linenum, 'runtime/init', 4,
				2647	'You seem to be initializing a member variable with itself.')
				2648
				2649	if file_extension == 'h':
				2650	# TODO(unknown): check that 1-arg constructors are explicit.
				2651	# How to tell it's a constructor?
				2652	# (handled in CheckForNonStandardConstructs for now)
				2653	# TODO(unknown): check that classes have DISALLOW_EVIL_CONSTRUCTORS
				2654	# (level 1 error)
				2655	pass
				2656
				2657	# Check if people are using the verboten C basic types. The only exception
				2658	# we regularly allow is "unsigned short port" for port.
				2659	if Search(r'\bshort port\b', line):
				2660	if not Search(r'\bunsigned short port\b', line):
				2661	error(filename, linenum, 'runtime/int', 4,
				2662	'Use "unsigned short" for ports, not "short"')
				2663	else:
				2664	match = Search(r'\b(short\|long(?! +double)\|long long)\b', line)
				2665	if match:
				2666	error(filename, linenum, 'runtime/int', 4,
				2667	'Use int16/int64/etc, rather than the C type %s' % match.group(1))
				2668
				2669	# When snprintf is used, the second argument shouldn't be a literal.
				2670	match = Search(r'snprintf\s\(([^,]),\s([0-9])\s*,', line)
				2671	if match and match.group(2) != '0':
				2672	# If 2nd arg is zero, snprintf is used to calculate size.
				2673	error(filename, linenum, 'runtime/printf', 3,
				2674	'If you can, use sizeof(%s) instead of %s as the 2nd arg '
				2675	'to snprintf.' % (match.group(1), match.group(2)))
				2676
				2677	# Check if some verboten C functions are being used.
				2678	if Search(r'\bsprintf\b', line):
				2679	error(filename, linenum, 'runtime/printf', 5,
				2680	'Never use sprintf. Use snprintf instead.')
				2681	match = Search(r'\b(strcpy\|strcat)\b', line)
				2682	if match:
				2683	error(filename, linenum, 'runtime/printf', 4,
				2684	'Almost always, snprintf is better than %s' % match.group(1))
				2685
				2686	if Search(r'\bsscanf\b', line):
				2687	error(filename, linenum, 'runtime/printf', 1,
				2688	'sscanf can be ok, but is slow and can overflow buffers.')
				2689
				2690	# Check if some verboten operator overloading is going on
				2691	# TODO(unknown): catch out-of-line unary operator&:
				2692	# class X {};
				2693	# int operator&(const X& x) { return 42; } // unary operator&
				2694	# The trick is it's hard to tell apart from binary operator&:
				2695	# class Y { int operator&(const Y& x) { return 23; } }; // binary operator&
				2696	if Search(r'\boperator\s&\s$\s*$', line):
				2697	error(filename, linenum, 'runtime/operator', 4,
				2698	'Unary operator& is dangerous. Do not use it.')
				2699
				2700	# Check for suspicious usage of "if" like
				2701	# } if (a == b) {
				2702	if Search(r'\}\sif\s\(', line):
				2703	error(filename, linenum, 'readability/braces', 4,
				2704	'Did you mean "else if"? If not, start a new line for "if".')
				2705
				2706	# Check for potential format string bugs like printf(foo).
				2707	# We constrain the pattern not to pick things like DocidForPrintf(foo).
				2708	# Not perfect but it can catch printf(foo.c_str()) and printf(foo->c_str())
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2709	# TODO(sugawarayu): Catch the following case. Need to change the calling
				2710	# convention of the whole function to process multiple line to handle it.
				2711	# printf(
				2712	# boy_this_is_a_really_long_variable_that_cannot_fit_on_the_prev_line);
				2713	printf_args = _GetTextInside(line, r'(?i)\b(string)?printf\s*\(')
				2714	if printf_args:
				2715	match = Match(r'([\w.\->()]+)$', printf_args)
				2716	if match:
				2717	function_name = re.search(r'\b((?:string)?printf)\s*\(',
				2718	line, re.I).group(1)
				2719	error(filename, linenum, 'runtime/printf', 4,
				2720	'Potential format string bug. Do %s("%%s", %s) instead.'
				2721	% (function_name, match.group(1)))
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2722
				2723	# Check for potential memset bugs like memset(buf, sizeof(buf), 0).
				2724	match = Search(r'memset\s$([^,]),\s([^,]),\s0\s$', line)
				2725	if match and not Match(r"^''\|-?[0-9]+\|0x[0-9A-Fa-f]$", match.group(2)):
				2726	error(filename, linenum, 'runtime/memset', 4,
				2727	'Did you mean "memset(%s, 0, %s)"?'
				2728	% (match.group(1), match.group(2)))
				2729
				2730	if Search(r'\busing namespace\b', line):
				2731	error(filename, linenum, 'build/namespaces', 5,
				2732	'Do not use namespace using-directives. '
				2733	'Use using-declarations instead.')
				2734
				2735	# Detect variable-length arrays.
				2736	match = Match(r'\s(.+::)?(\w+) [a-z]\w\[(.+)];', line)
				2737	if (match and match.group(2) != 'return' and match.group(2) != 'delete' and
				2738	match.group(3).find(']') == -1):
				2739	# Split the size using space and arithmetic operators as delimiters.
				2740	# If any of the resulting tokens are not compile time constants then
				2741	# report the error.
				2742	tokens = re.split(r'\s\|\+\|\-\|\*\|\/\|<<\|>>]', match.group(3))
				2743	is_const = True
				2744	skip_next = False
				2745	for tok in tokens:
				2746	if skip_next:
				2747	skip_next = False
				2748	continue
				2749
				2750	if Search(r'sizeof$.+$', tok): continue
				2751	if Search(r'arraysize$\w+$', tok): continue
				2752
				2753	tok = tok.lstrip('(')
				2754	tok = tok.rstrip(')')
				2755	if not tok: continue
				2756	if Match(r'\d+', tok): continue
				2757	if Match(r'0[xX][0-9a-fA-F]+', tok): continue
				2758	if Match(r'k[A-Z0-9]\w*', tok): continue
				2759	if Match(r'(.+::)?k[A-Z0-9]\w*', tok): continue
				2760	if Match(r'(.+::)?[A-Z][A-Z0-9_]*', tok): continue
				2761	# A catch all for tricky sizeof cases, including 'sizeof expression',
				2762	# 'sizeof(*type)', 'sizeof(const type)', 'sizeof(struct StructName)'
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2763	# requires skipping the next token because we split on ' ' and '*'.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2764	if tok.startswith('sizeof'):
				2765	skip_next = True
				2766	continue
				2767	is_const = False
				2768	break
				2769	if not is_const:
				2770	error(filename, linenum, 'runtime/arrays', 1,
				2771	'Do not use variable-length arrays. Use an appropriately named '
				2772	"('k' followed by CamelCase) compile-time constant for the size.")
				2773
				2774	# If DISALLOW_EVIL_CONSTRUCTORS, DISALLOW_COPY_AND_ASSIGN, or
				2775	# DISALLOW_IMPLICIT_CONSTRUCTORS is present, then it should be the last thing
				2776	# in the class declaration.
				2777	match = Match(
				2778	(r'\s*'
				2779	r'(DISALLOW_(EVIL_CONSTRUCTORS\|COPY_AND_ASSIGN\|IMPLICIT_CONSTRUCTORS))'
				2780	r'$.*$;$'),
				2781	line)
				2782	if match and linenum + 1 < clean_lines.NumLines():
				2783	next_line = clean_lines.elided[linenum + 1]
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2784	# We allow some, but not all, declarations of variables to be present
				2785	# in the statement that defines the class. The [\w\,\s] fragment of
				2786	# the regular expression below allows users to declare instances of
				2787	# the class or pointers to instances, but not less common types such
				2788	# as function pointers or arrays. It's a tradeoff between allowing
				2789	# reasonable code and avoiding trying to parse more C++ using regexps.
				2790	if not Search(r'^\s}[\w\,\s]*;', next_line):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2791	error(filename, linenum, 'readability/constructors', 3,
				2792	match.group(1) + ' should be the last thing in the class')
				2793
				2794	# Check for use of unnamed namespaces in header files. Registration
				2795	# macros are typically OK, so we allow use of "namespace {" on lines
				2796	# that end with backslashes.
				2797	if (file_extension == 'h'
				2798	and Search(r'\bnamespace\s*{', line)
				2799	and line[-1] != '\\'):
				2800	error(filename, linenum, 'build/namespaces', 4,
				2801	'Do not use unnamed namespaces in header files. See '
				2802	'http://google-styleguide.googlecode.com/svn/trunk/cppguide.xml#Namespaces'
				2803	' for more information.')
				2804
				2805
				2806	def CheckCStyleCast(filename, linenum, line, raw_line, cast_type, pattern,
				2807	error):
				2808	"""Checks for a C-style cast by looking for the pattern.
				2809
				2810	This also handles sizeof(type) warnings, due to similarity of content.
				2811
				2812	Args:
				2813	filename: The name of the current file.
				2814	linenum: The number of the line to check.
				2815	line: The line of code to check.
				2816	raw_line: The raw line of code to check, with comments.
				2817	cast_type: The string for the C++ cast to recommend. This is either
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2818	reinterpret_cast, static_cast, or const_cast, depending.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2819	pattern: The regular expression used to find C-style casts.
				2820	error: The function to call with any errors found.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2821
				2822	Returns:
				2823	True if an error was emitted.
				2824	False otherwise.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2825	"""
				2826	match = Search(pattern, line)
				2827	if not match:
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2828	return False
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2829
				2830	# e.g., sizeof(int)
				2831	sizeof_match = Match(r'.sizeof\s$', line[0:match.start(1) - 1])
				2832	if sizeof_match:
				2833	error(filename, linenum, 'runtime/sizeof', 1,
				2834	'Using sizeof(type). Use sizeof(varname) instead if possible')
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2835	return True
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2836
				2837	remainder = line[match.end(0):]
				2838
				2839	# The close paren is for function pointers as arguments to a function.
				2840	# eg, void foo(void (*bar)(int));
				2841	# The semicolon check is a more basic function check; also possibly a
				2842	# function pointer typedef.
				2843	# eg, void foo(int); or void foo(int) const;
				2844	# The equals check is for function pointer assignment.
				2845	# eg, void (foo)(int) = ...
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2846	# The > is for MockCallback<...> ...
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2847	#
				2848	# Right now, this will only catch cases where there's a single argument, and
				2849	# it's unnamed. It should probably be expanded to check for multiple
				2850	# arguments with some unnamed.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2851	function_match = Match(r'\s(\)\|=\|(const)?\s(;\|\{\|throw\|>))', remainder)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2852	if function_match:
				2853	if (not function_match.group(3) or
				2854	function_match.group(3) == ';' or
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2855	('MockCallback<' not in raw_line and
				2856	'/*' not in raw_line)):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2857	error(filename, linenum, 'readability/function', 3,
				2858	'All parameters should be named in a function')
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2859	return True
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2860
				2861	# At this point, all that should be left is actual casts.
				2862	error(filename, linenum, 'readability/casting', 4,
				2863	'Using C-style cast. Use %s<%s>(...) instead' %
				2864	(cast_type, match.group(1)))
				2865
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2866	return True
				2867
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2868
				2869	_HEADERS_CONTAINING_TEMPLATES = (
				2870	('<deque>', ('deque',)),
				2871	('<functional>', ('unary_function', 'binary_function',
				2872	'plus', 'minus', 'multiplies', 'divides', 'modulus',
				2873	'negate',
				2874	'equal_to', 'not_equal_to', 'greater', 'less',
				2875	'greater_equal', 'less_equal',
				2876	'logical_and', 'logical_or', 'logical_not',
				2877	'unary_negate', 'not1', 'binary_negate', 'not2',
				2878	'bind1st', 'bind2nd',
				2879	'pointer_to_unary_function',
				2880	'pointer_to_binary_function',
				2881	'ptr_fun',
				2882	'mem_fun_t', 'mem_fun', 'mem_fun1_t', 'mem_fun1_ref_t',
				2883	'mem_fun_ref_t',
				2884	'const_mem_fun_t', 'const_mem_fun1_t',
				2885	'const_mem_fun_ref_t', 'const_mem_fun1_ref_t',
				2886	'mem_fun_ref',
				2887	)),
				2888	('<limits>', ('numeric_limits',)),
				2889	('<list>', ('list',)),
				2890	('<map>', ('map', 'multimap',)),
				2891	('<memory>', ('allocator',)),
				2892	('<queue>', ('queue', 'priority_queue',)),
				2893	('<set>', ('set', 'multiset',)),
				2894	('<stack>', ('stack',)),
				2895	('<string>', ('char_traits', 'basic_string',)),
				2896	('<utility>', ('pair',)),
				2897	('<vector>', ('vector',)),
				2898
				2899	# gcc extensions.
				2900	# Note: std::hash is their hash, ::hash is our hash
				2901	('<hash_map>', ('hash_map', 'hash_multimap',)),
				2902	('<hash_set>', ('hash_set', 'hash_multiset',)),
				2903	('<slist>', ('slist',)),
				2904	)
				2905
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2906	_RE_PATTERN_STRING = re.compile(r'\bstring\b')
				2907
				2908	_re_pattern_algorithm_header = []
				2909	for _template in ('copy', 'max', 'min', 'min_element', 'sort', 'swap',
				2910	'transform'):
				2911	# Match max<type>(..., ...), max(..., ...), but not foo->max, foo.max or
				2912	# type::max().
				2913	_re_pattern_algorithm_header.append(
				2914	(re.compile(r'[^>.]\b' + _template + r'(<.*?>)?$[^$]'),
				2915	_template,
				2916	'<algorithm>'))
				2917
				2918	_re_pattern_templates = []
				2919	for _header, _templates in _HEADERS_CONTAINING_TEMPLATES:
				2920	for _template in _templates:
				2921	_re_pattern_templates.append(
				2922	(re.compile(r'(\<\|\b)' + _template + r'\s*\<'),
				2923	_template + '<>',
				2924	_header))
				2925
				2926
				2927	def FilesBelongToSameModule(filename_cc, filename_h):
				2928	"""Check if these two filenames belong to the same module.
				2929
				2930	The concept of a 'module' here is a as follows:
				2931	foo.h, foo-inl.h, foo.cc, foo_test.cc and foo_unittest.cc belong to the
				2932	same 'module' if they are in the same directory.
				2933	some/path/public/xyzzy and some/path/internal/xyzzy are also considered
				2934	to belong to the same module here.
				2935
				2936	If the filename_cc contains a longer path than the filename_h, for example,
				2937	'/absolute/path/to/base/sysinfo.cc', and this file would include
				2938	'base/sysinfo.h', this function also produces the prefix needed to open the
				2939	header. This is used by the caller of this function to more robustly open the
				2940	header file. We don't have access to the real include paths in this context,
				2941	so we need this guesswork here.
				2942
				2943	Known bugs: tools/base/bar.cc and base/bar.h belong to the same module
				2944	according to this implementation. Because of this, this function gives
				2945	some false positives. This should be sufficiently rare in practice.
				2946
				2947	Args:
				2948	filename_cc: is the path for the .cc file
				2949	filename_h: is the path for the header path
				2950
				2951	Returns:
				2952	Tuple with a bool and a string:
				2953	bool: True if filename_cc and filename_h belong to the same module.
				2954	string: the additional prefix needed to open the header file.
				2955	"""
				2956
				2957	if not filename_cc.endswith('.cc'):
				2958	return (False, '')
				2959	filename_cc = filename_cc[:-len('.cc')]
				2960	if filename_cc.endswith('_unittest'):
				2961	filename_cc = filename_cc[:-len('_unittest')]
				2962	elif filename_cc.endswith('_test'):
				2963	filename_cc = filename_cc[:-len('_test')]
				2964	filename_cc = filename_cc.replace('/public/', '/')
				2965	filename_cc = filename_cc.replace('/internal/', '/')
				2966
				2967	if not filename_h.endswith('.h'):
				2968	return (False, '')
				2969	filename_h = filename_h[:-len('.h')]
				2970	if filename_h.endswith('-inl'):
				2971	filename_h = filename_h[:-len('-inl')]
				2972	filename_h = filename_h.replace('/public/', '/')
				2973	filename_h = filename_h.replace('/internal/', '/')
				2974
				2975	files_belong_to_same_module = filename_cc.endswith(filename_h)
				2976	common_path = ''
				2977	if files_belong_to_same_module:
				2978	common_path = filename_cc[:-len(filename_h)]
				2979	return files_belong_to_same_module, common_path
				2980
				2981
				2982	def UpdateIncludeState(filename, include_state, io=codecs):
				2983	"""Fill up the include_state with new includes found from the file.
				2984
				2985	Args:
				2986	filename: the name of the header to read.
				2987	include_state: an _IncludeState instance in which the headers are inserted.
				2988	io: The io factory to use to read the file. Provided for testability.
				2989
				2990	Returns:
				2991	True if a header was succesfully added. False otherwise.
				2992	"""
				2993	headerfile = None
				2994	try:
				2995	headerfile = io.open(filename, 'r', 'utf8', 'replace')
				2996	except IOError:
				2997	return False
				2998	linenum = 0
				2999	for line in headerfile:
				3000	linenum += 1
				3001	clean_line = CleanseComments(line)
				3002	match = _RE_PATTERN_INCLUDE.search(clean_line)
				3003	if match:
				3004	include = match.group(2)
				3005	# The value formatting is cute, but not really used right now.
				3006	# What matters here is that the key is in include_state.
				3007	include_state.setdefault(include, '%s:%d' % (filename, linenum))
				3008	return True
				3009
				3010
				3011	def CheckForIncludeWhatYouUse(filename, clean_lines, include_state, error,
				3012	io=codecs):
				3013	"""Reports for missing stl includes.
				3014
				3015	This function will output warnings to make sure you are including the headers
				3016	necessary for the stl containers and functions that you use. We only give one
				3017	reason to include a header. For example, if you use both equal_to<> and
				3018	less<> in a .h file, only one (the latter in the file) of these will be
				3019	reported as a reason to include the <functional>.
				3020
				3021	Args:
				3022	filename: The name of the current file.
				3023	clean_lines: A CleansedLines instance containing the file.
				3024	include_state: An _IncludeState instance.
				3025	error: The function to call with any errors found.
				3026	io: The IO factory to use to read the header file. Provided for unittest
				3027	injection.
				3028	"""
				3029	required = {} # A map of header name to linenumber and the template entity.
				3030	# Example of required: { '<functional>': (1219, 'less<>') }
				3031
				3032	for linenum in xrange(clean_lines.NumLines()):
				3033	line = clean_lines.elided[linenum]
				3034	if not line or line[0] == '#':
				3035	continue
				3036
				3037	# String is special -- it is a non-templatized type in STL.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	3038	matched = _RE_PATTERN_STRING.search(line)
				3039	if matched:
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3040	# Don't warn about strings in non-STL namespaces:
				3041	# (We check only the first match per line; good enough.)
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	3042	prefix = line[:matched.start()]
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3043	if prefix.endswith('std::') or not prefix.endswith('::'):
				3044	required['<string>'] = (linenum, 'string')
				3045
				3046	for pattern, template, header in _re_pattern_algorithm_header:
				3047	if pattern.search(line):
				3048	required[header] = (linenum, template)
				3049
				3050	# The following function is just a speed up, no semantics are changed.
				3051	if not '<' in line: # Reduces the cpu time usage by skipping lines.
				3052	continue
				3053
				3054	for pattern, template, header in _re_pattern_templates:
				3055	if pattern.search(line):
				3056	required[header] = (linenum, template)
				3057
				3058	# The policy is that if you #include something in foo.h you don't need to
				3059	# include it again in foo.cc. Here, we will look at possible includes.
				3060	# Let's copy the include_state so it is only messed up within this function.
				3061	include_state = include_state.copy()
				3062
				3063	# Did we find the header for this file (if any) and succesfully load it?
				3064	header_found = False
				3065
				3066	# Use the absolute path so that matching works properly.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	3067	abs_filename = FileInfo(filename).FullName()
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3068
				3069	# For Emacs's flymake.
				3070	# If cpplint is invoked from Emacs's flymake, a temporary file is generated
				3071	# by flymake and that file name might end with '_flymake.cc'. In that case,
				3072	# restore original file name here so that the corresponding header file can be
				3073	# found.
				3074	# e.g. If the file name is 'foo_flymake.cc', we should search for 'foo.h'
				3075	# instead of 'foo_flymake.h'
				3076	abs_filename = re.sub(r'_flymake\.cc$', '.cc', abs_filename)
				3077
				3078	# include_state is modified during iteration, so we iterate over a copy of
				3079	# the keys.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	3080	header_keys = include_state.keys()
				3081	for header in header_keys:
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3082	(same_module, common_path) = FilesBelongToSameModule(abs_filename, header)
				3083	fullpath = common_path + header
				3084	if same_module and UpdateIncludeState(fullpath, include_state, io):
				3085	header_found = True
				3086
				3087	# If we can't find the header file for a .cc, assume it's because we don't
				3088	# know where to look. In that case we'll give up as we're not sure they
				3089	# didn't include it in the .h file.
				3090	# TODO(unknown): Do a better job of finding .h files so we are confident that
				3091	# not having the .h file means there isn't one.
				3092	if filename.endswith('.cc') and not header_found:
				3093	return
				3094
				3095	# All the lines have been processed, report the errors found.
				3096	for required_header_unstripped in required:
				3097	template = required[required_header_unstripped][1]
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3098	if required_header_unstripped.strip('<>"') not in include_state:
				3099	error(filename, required[required_header_unstripped][0],
				3100	'build/include_what_you_use', 4,
				3101	'Add #include ' + required_header_unstripped + ' for ' + template)
				3102
				3103
# make_pair followed (after optional whitespace) by explicit template args.
_RE_PATTERN_EXPLICIT_MAKEPAIR = re.compile(r'\bmake_pair\s*<')


def CheckMakePairUsesDeduction(filename, clean_lines, linenum, error):
  """Warn when make_pair is given explicit template arguments.

  G++ 4.6 in C++0x mode fails badly if make_pair's template arguments are
  specified explicitly, and such use isn't intended in any case. The check
  runs on the raw (uncleansed) text of the line.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    error: The function to call with any errors found.
  """
  raw_text = clean_lines.raw_lines[linenum]
  if _RE_PATTERN_EXPLICIT_MAKEPAIR.search(raw_text) is None:
    return
  error(filename, linenum, 'build/explicit_make_pair',
        4,  # 4 = high confidence
        'Omit template arguments from make_pair OR use pair directly OR'
        ' if appropriate, construct a pair directly')
				3127
				3128
def ProcessLine(filename, file_extension,
                clean_lines, line, include_state, function_state,
                class_state, error, extra_check_functions=[]):
  """Runs every per-line check on one line of the file.

  Args:
    filename: Filename of the file that is being processed.
    file_extension: The extension (dot not included) of the file.
    clean_lines: The cleansed lines of the file; its raw_lines attribute is
                 used for NOLINT parsing.
    line: Number of line being processed.
    include_state: An _IncludeState instance in which the headers are inserted.
    function_state: A _FunctionState instance which counts function lines, etc.
    class_state: A _ClassState instance which maintains information about
                 the current stack of nested class declarations being parsed.
    error: A callable to which errors are reported; the checks call it as
           error(filename, line number, category, confidence, message).
    extra_check_functions: An array of additional check functions that will be
                           run on each source line. Each function takes 4
                           arguments: filename, clean_lines, line, error.
                           The argument is only iterated, never modified.
  """
  # NOLINT markers live in comments, so they are parsed from the raw line.
  ParseNolintSuppressions(filename, clean_lines.raw_lines[line], line, error)

  # Checks that need extra state or the file extension.
  CheckForFunctionLengths(filename, clean_lines, line, function_state, error)
  CheckForMultilineCommentsAndStrings(filename, clean_lines, line, error)
  CheckStyle(filename, clean_lines, line, file_extension, class_state, error)
  CheckLanguage(filename, clean_lines, line, file_extension, include_state,
                error)
  CheckForNonStandardConstructs(filename, clean_lines, line,
                                class_state, error)

  # Built-in checks sharing the (filename, clean_lines, line, error) signature.
  for builtin_check in (CheckPosixThreading,
                        CheckInvalidIncrement,
                        CheckMakePairUsesDeduction):
    builtin_check(filename, clean_lines, line, error)

  # Caller-supplied checks run last, in the order given.
  for extra_check in extra_check_functions:
    extra_check(filename, clean_lines, line, error)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3164
def ProcessFileData(filename, file_extension, lines, error,
                    extra_check_functions=[]):
  """Lints the given file contents, reporting problems through error.

  Args:
    filename: Filename of the file that is being processed.
    file_extension: The extension (dot not included) of the file.
    lines: An array of strings, each representing a line of the file, with the
           last element being empty if the file is terminated with a newline.
           The caller's list is not modified; a padded copy is used instead.
    error: A callable to which errors are reported; the checks call it as
           error(filename, line number, category, confidence, message).
    extra_check_functions: An array of additional check functions that will be
                           run on each source line. Each function takes 4
                           arguments: filename, clean_lines, line, error
  """
  # Pad both ends with marker comments so that real content starts at index 1
  # and the end of the file is recognisable.
  leading_marker = ['// marker so line numbers and indices both start at 1']
  trailing_marker = ['// marker so line numbers end in a known way']
  lines = leading_marker + lines + trailing_marker

  include_state = _IncludeState()
  function_state = _FunctionState()
  class_state = _ClassState()

  ResetNolintSuppressions()

  # Whole-file checks that work on the original text.
  CheckForCopyright(filename, lines, error)
  if file_extension == 'h':
    CheckForHeaderGuard(filename, lines, error)

  # Per-line checks work on the cleansed text.
  RemoveMultiLineComments(filename, lines, error)
  clean_lines = CleansedLines(lines)
  for linenum in xrange(clean_lines.NumLines()):
    ProcessLine(filename, file_extension, clean_lines, linenum,
                include_state, function_state, class_state, error,
                extra_check_functions)
  class_state.CheckFinished(filename, error)

  CheckForIncludeWhatYouUse(filename, clean_lines, include_state, error)

  # We check here rather than inside ProcessLine so that we see raw
  # lines rather than "cleaned" lines.
  CheckForUnicodeReplacementCharacters(filename, lines, error)

  CheckForNewlineAtEOF(filename, lines, error)
				3209
def ProcessFile(filename, vlevel, extra_check_functions=[]):
  """Does google-lint on a single file.

  The file (or stdin when filename is '-') is read as UTF-8 with undecodable
  bytes replaced, split into lines, and linted if its extension is cc, h or
  cpp. Files that cannot be opened are reported on stderr and skipped.

  Args:
    filename: The name of the file to parse.

    vlevel: The level of errors to report. Every error of confidence
    >= verbose_level will be reported. 0 is a good default.

    extra_check_functions: An array of additional check functions that will be
                           run on each source line. Each function takes 4
                           arguments: filename, clean_lines, line, error
  """

  _SetVerboseLevel(vlevel)

  try:
    # Support the UNIX convention of using "-" for stdin. Note that
    # we are not opening the file with universal newline support
    # (which codecs doesn't support anyway), so the resulting lines do
    # contain trailing '\r' characters if we are reading a file that
    # has CRLF endings.
    # If after the split a trailing '\r' is present, it is removed
    # below. If it is not expected to be present (i.e. os.linesep !=
    # '\r\n' as in Windows), a warning is issued below if this file
    # is processed.

    if filename == '-':
      lines = codecs.StreamReaderWriter(sys.stdin,
                                        codecs.getreader('utf8'),
                                        codecs.getwriter('utf8'),
                                        'replace').read().split('\n')
    else:
      source = codecs.open(filename, 'r', 'utf8', 'replace')
      try:
        lines = source.read().split('\n')
      finally:
        # Do not leak one open handle per linted file.
        source.close()

    carriage_return_found = False
    # Remove trailing '\r'.
    for index, text in enumerate(lines):
      if text.endswith('\r'):
        lines[index] = text.rstrip('\r')
        carriage_return_found = True

  except IOError:
    sys.stderr.write(
        "Skipping input '%s': Can't open for reading\n" % filename)
    return

  # Note, if no dot is found, this will give the entire filename as the ext.
  file_extension = filename[filename.rfind('.') + 1:]

  # When reading from stdin, the extension is unknown, so no cpplint tests
  # should rely on the extension.
  if (filename != '-' and file_extension != 'cc' and file_extension != 'h'
      and file_extension != 'cpp'):
    sys.stderr.write('Ignoring %s; not a .cc or .h file\n' % filename)
  else:
    ProcessFileData(filename, file_extension, lines, Error,
                    extra_check_functions)
    if carriage_return_found and os.linesep != '\r\n':
      # Use 0 for linenum since outputting only one error for potentially
      # several lines.
      Error(filename, 0, 'whitespace/newline', 1,
            'One or more unexpected \\r (^M) found;'
            'better to use only a \\n')

  sys.stderr.write('Done processing %s\n' % filename)
				3276
				3277
				3278	def PrintUsage(message):
				3279	"""Prints a brief usage string and exits, optionally with an error message.
				3280
				3281	Args:
				3282	message: The optional error message.
				3283	"""
				3284	sys.stderr.write(_USAGE)
				3285	if message:
				3286	sys.exit('\nFATAL ERROR: ' + message)
				3287	else:
				3288	sys.exit(1)
				3289
				3290
				3291	def PrintCategories():
				3292	"""Prints a list of all the error-categories used by error messages.
				3293
				3294	These are the categories used to filter messages via --filter.
				3295	"""
				3296	sys.stderr.write(''.join(' %s\n' % cat for cat in _ERROR_CATEGORIES))
				3297	sys.exit(0)
				3298
				3299
				3300	def ParseArguments(args):
				3301	"""Parses the command line arguments.
				3302
				3303	This may set the output format and verbosity level as side-effects.
				3304
				3305	Args:
				3306	args: The command line arguments:
				3307
				3308	Returns:
				3309	The list of filenames to lint.
				3310	"""
				3311	try:
				3312	(opts, filenames) = getopt.getopt(args, '', ['help', 'output=', 'verbose=',
Elliott Hughes	08fc03a	2012-06-26 17:34:00 -0700	[diff] [blame]	3313	'stdout', # TODO(enh): added --stdout
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3314	'counting=',
				3315	'filter='])
				3316	except getopt.GetoptError:
				3317	PrintUsage('Invalid arguments.')
				3318
				3319	verbosity = _VerboseLevel()
				3320	output_format = _OutputFormat()
Elliott Hughes	08fc03a	2012-06-26 17:34:00 -0700	[diff] [blame]	3321	output_stream = sys.stderr # TODO(enh): added --stdout
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3322	filters = ''
				3323	counting_style = ''
				3324
				3325	for (opt, val) in opts:
				3326	if opt == '--help':
				3327	PrintUsage(None)
Elliott Hughes	08fc03a	2012-06-26 17:34:00 -0700	[diff] [blame]	3328	elif opt == '--stdout': # TODO(enh): added --stdout
				3329	output_stream = sys.stdout # TODO(enh): added --stdout
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3330	elif opt == '--output':
				3331	if not val in ('emacs', 'vs7'):
				3332	PrintUsage('The only allowed output formats are emacs and vs7.')
				3333	output_format = val
				3334	elif opt == '--verbose':
				3335	verbosity = int(val)
				3336	elif opt == '--filter':
				3337	filters = val
				3338	if not filters:
				3339	PrintCategories()
				3340	elif opt == '--counting':
				3341	if val not in ('total', 'toplevel', 'detailed'):
				3342	PrintUsage('Valid counting options are total, toplevel, and detailed')
				3343	counting_style = val
				3344
				3345	if not filenames:
				3346	PrintUsage('No files were specified.')
				3347
				3348	_SetOutputFormat(output_format)
				3349	_SetVerboseLevel(verbosity)
				3350	_SetFilters(filters)
				3351	_SetCountingStyle(counting_style)
				3352
Elliott Hughes	08fc03a	2012-06-26 17:34:00 -0700	[diff] [blame]	3353	sys.stderr = output_stream # TODO(enh): added --stdout
				3354
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3355	return filenames
				3356
				3357
				3358	def main():
				3359	filenames = ParseArguments(sys.argv[1:])
				3360
				3361	# Change stderr to write with replacement characters so we don't die
				3362	# if we try to print something containing non-ASCII characters.
				3363	sys.stderr = codecs.StreamReaderWriter(sys.stderr,
				3364	codecs.getreader('utf8'),
				3365	codecs.getwriter('utf8'),
				3366	'replace')
				3367
				3368	_cpplint_state.ResetErrorCounts()
				3369	for filename in filenames:
				3370	ProcessFile(filename, _cpplint_state.verbose_level)
				3371	_cpplint_state.PrintErrorCounts()
				3372
				3373	sys.exit(_cpplint_state.error_count > 0)
				3374
				3375
				3376	if __name__ == '__main__':
				3377	main()