Blame - tools/cpplint.py - platform/art

blob: 30c712856e942c208efe18a44c6386c5fc3ae27a [file] [log] [blame]

Elliott Hughes	08b82a9	2012-04-05 12:13:56 -0700	[diff] [blame]	1	#!/usr/bin/python
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2	#
				3	# Copyright (c) 2009 Google Inc. All rights reserved.
				4	#
				5	# Redistribution and use in source and binary forms, with or without
				6	# modification, are permitted provided that the following conditions are
				7	# met:
				8	#
				9	# * Redistributions of source code must retain the above copyright
				10	# notice, this list of conditions and the following disclaimer.
				11	# * Redistributions in binary form must reproduce the above
				12	# copyright notice, this list of conditions and the following disclaimer
				13	# in the documentation and/or other materials provided with the
				14	# distribution.
				15	# * Neither the name of Google Inc. nor the names of its
				16	# contributors may be used to endorse or promote products derived from
				17	# this software without specific prior written permission.
				18	#
				19	# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
				20	# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
				21	# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
				22	# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
				23	# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
				24	# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
				25	# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
				26	# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
				27	# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
				28	# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
				29	# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
				30
				31	# Here are some issues that I've had people identify in my code during reviews,
				32	# that I think are possible to flag automatically in a lint tool. If these were
				33	# caught by lint, it would save time both for myself and that of my reviewers.
				34	# Most likely, some of these are beyond the scope of the current lint framework,
				35	# but I think it is valuable to retain these wish-list items even if they cannot
				36	# be immediately implemented.
				37	#
				38	# Suggestions
				39	# -----------
				40	# - Check for no 'explicit' for multi-arg ctor
				41	# - Check for boolean assign RHS in parens
				42	# - Check for ctor initializer-list colon position and spacing
				43	# - Check that if there's a ctor, there should be a dtor
				44	# - Check accessors that return non-pointer member variables are
				45	# declared const
				46	# - Check accessors that return non-const pointer member vars are
				47	# not declared const
				48	# - Check for using public includes for testing
				49	# - Check for spaces between brackets in one-line inline method
				50	# - Check for no assert()
				51	# - Check for spaces surrounding operators
				52	# - Check for 0 in pointer context (should be NULL)
				53	# - Check for 0 in char context (should be '\0')
				54	# - Check for camel-case method name conventions for methods
				55	# that are not simple inline getters and setters
				56	# - Check that base classes have virtual destructors
				57	# put " // namespace" after } that closes a namespace, with
				58	# namespace's name after 'namespace' if it is named.
				59	# - Do not indent namespace contents
				60	# - Avoid inlining non-trivial constructors in header files
				61	# include base/basictypes.h if DISALLOW_EVIL_CONSTRUCTORS is used
				62	# - Check for old-school (void) cast for call-sites of functions
				63	# ignored return value
				64	# - Check gUnit usage of anonymous namespace
				65	# - Check for class declaration order (typedefs, consts, enums,
				66	# ctor(s?), dtor, friend declarations, methods, member vars)
				67	#
				68
				69	"""Does google-lint on c++ files.
				70
				71	The goal of this script is to identify places in the code that may
				72	be in non-compliance with google style. It does not attempt to fix
				73	up these problems -- the point is to educate. It does also not
				74	attempt to find all problems, or to ensure that everything it does
				75	find is legitimately a problem.
				76
				77	In particular, we can get very confused by /* and // inside strings!
				78	We do a small hack, which is to ignore //'s with "'s after them on the
				79	same line, but it is far from perfect (in either direction).
				80	"""
				81
				82	import codecs
				83	import getopt
				84	import math # for log
				85	import os
				86	import re
				87	import sre_compile
				88	import string
				89	import sys
				90	import unicodedata
				91
				92
				93	_USAGE = """
				94	Syntax: cpplint.py [--verbose=#] [--output=vs7] [--filter=-x,+y,...]
				95	[--counting=total\|toplevel\|detailed]
				96	<file> [file] ...
				97
				98	The style guidelines this tries to follow are those in
				99	http://google-styleguide.googlecode.com/svn/trunk/cppguide.xml
				100
				101	Every problem is given a confidence score from 1-5, with 5 meaning we are
				102	certain of the problem, and 1 meaning it could be a legitimate construct.
				103	This will miss some errors, and is not a substitute for a code review.
				104
				105	To suppress false-positive errors of a certain category, add a
				106	'NOLINT(category)' comment to the line. NOLINT or NOLINT(*)
				107	suppresses errors of all categories on that line.
				108
				109	The files passed in will be linted; at least one file must be provided.
				110	Linted extensions are .cc, .cpp, and .h. Other file types will be ignored.
				111
				112	Flags:
				113
				114	output=vs7
				115	By default, the output is formatted to ease emacs parsing. Visual Studio
				116	compatible output (vs7) may also be used. Other formats are unsupported.
				117
				118	verbose=#
				119	Specify a number 0-5 to restrict errors to certain verbosity levels.
				120
				121	filter=-x,+y,...
				122	Specify a comma-separated list of category-filters to apply: only
				123	error messages whose category names pass the filters will be printed.
				124	(Category names are printed with the message and look like
				125	"[whitespace/indent]".) Filters are evaluated left to right.
				126	"-FOO" and "FOO" means "do not print categories that start with FOO".
				127	"+FOO" means "do print categories that start with FOO".
				128
				129	Examples: --filter=-whitespace,+whitespace/braces
				130	--filter=whitespace,runtime/printf,+runtime/printf_format
				131	--filter=-,+build/include_what_you_use
				132
				133	To see a list of all the categories used in cpplint, pass no arg:
				134	--filter=
				135
				136	counting=total\|toplevel\|detailed
				137	The total number of errors found is always printed. If
				138	'toplevel' is provided, then the count of errors in each of
				139	the top-level categories like 'build' and 'whitespace' will
				140	also be printed. If 'detailed' is provided, then a count
				141	is provided for each category like 'build/class'.
				142	"""
				143
				144	# We categorize each error message we print. Here are the categories.
				145	# We want an explicit list so we can list them all in cpplint --filter=.
				146	# If you add a new error message with a new category, add it to the list
				147	# here! cpplint_unittest.py should tell you if you forget to do this.
				148	# \ used for clearer layout -- pylint: disable-msg=C6013
				149	_ERROR_CATEGORIES = [
				150	'build/class',
				151	'build/deprecated',
				152	'build/endif_comment',
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	153	'build/explicit_make_pair',
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	154	'build/forward_decl',
				155	'build/header_guard',
				156	'build/include',
				157	'build/include_alpha',
				158	'build/include_order',
				159	'build/include_what_you_use',
				160	'build/namespaces',
				161	'build/printf_format',
				162	'build/storage_class',
				163	'legal/copyright',
				164	'readability/braces',
				165	'readability/casting',
				166	'readability/check',
				167	'readability/constructors',
				168	'readability/fn_size',
				169	'readability/function',
				170	'readability/multiline_comment',
				171	'readability/multiline_string',
				172	'readability/nolint',
				173	'readability/streams',
				174	'readability/todo',
				175	'readability/utf8',
				176	'runtime/arrays',
				177	'runtime/casting',
				178	'runtime/explicit',
				179	'runtime/int',
				180	'runtime/init',
				181	'runtime/invalid_increment',
				182	'runtime/member_string_references',
				183	'runtime/memset',
				184	'runtime/operator',
				185	'runtime/printf',
				186	'runtime/printf_format',
				187	'runtime/references',
				188	'runtime/rtti',
				189	'runtime/sizeof',
				190	'runtime/string',
				191	'runtime/threadsafe_fn',
				192	'runtime/virtual',
				193	'whitespace/blank_line',
				194	'whitespace/braces',
				195	'whitespace/comma',
				196	'whitespace/comments',
				197	'whitespace/end_of_line',
				198	'whitespace/ending_newline',
				199	'whitespace/indent',
				200	'whitespace/labels',
				201	'whitespace/line_length',
				202	'whitespace/newline',
				203	'whitespace/operators',
				204	'whitespace/parens',
				205	'whitespace/semicolon',
				206	'whitespace/tab',
				207	'whitespace/todo'
				208	]
				209
# The default state of the category filter. This is overridden by the
# --filter= flag. By default all errors are on, so only add here categories
# that should be off by default (i.e., categories that must be enabled by the
# --filter= flags). All entries here should start with a '-' or '+', as in the
# --filter= flag.
_DEFAULT_FILTERS = ['-build/include_alpha']
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	215
				216	# We used to check for high-bit characters, but after much discussion we
				217	# decided those were OK, as long as they were in UTF-8 and didn't represent
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	218	# hard-coded international strings, which belong in a separate i18n file.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	219
				220	# Headers that we consider STL headers.
				221	_STL_HEADERS = frozenset([
				222	'algobase.h', 'algorithm', 'alloc.h', 'bitset', 'deque', 'exception',
				223	'function.h', 'functional', 'hash_map', 'hash_map.h', 'hash_set',
				224	'hash_set.h', 'iterator', 'list', 'list.h', 'map', 'memory', 'new',
				225	'pair.h', 'pthread_alloc', 'queue', 'set', 'set.h', 'sstream', 'stack',
				226	'stl_alloc.h', 'stl_relops.h', 'type_traits.h',
				227	'utility', 'vector', 'vector.h',
				228	])
				229
				230
				231	# Non-STL C++ system headers.
				232	_CPP_HEADERS = frozenset([
				233	'algo.h', 'builtinbuf.h', 'bvector.h', 'cassert', 'cctype',
				234	'cerrno', 'cfloat', 'ciso646', 'climits', 'clocale', 'cmath',
				235	'complex', 'complex.h', 'csetjmp', 'csignal', 'cstdarg', 'cstddef',
				236	'cstdio', 'cstdlib', 'cstring', 'ctime', 'cwchar', 'cwctype',
				237	'defalloc.h', 'deque.h', 'editbuf.h', 'exception', 'fstream',
				238	'fstream.h', 'hashtable.h', 'heap.h', 'indstream.h', 'iomanip',
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	239	'iomanip.h', 'ios', 'iosfwd', 'iostream', 'iostream.h', 'istream',
				240	'istream.h', 'iterator.h', 'limits', 'map.h', 'multimap.h', 'multiset.h',
				241	'numeric', 'ostream', 'ostream.h', 'parsestream.h', 'pfstream.h',
				242	'PlotFile.h', 'procbuf.h', 'pthread_alloc.h', 'rope', 'rope.h',
				243	'ropeimpl.h', 'SFile.h', 'slist', 'slist.h', 'stack.h', 'stdexcept',
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	244	'stdiostream.h', 'streambuf.h', 'stream.h', 'strfile.h', 'string',
				245	'strstream', 'strstream.h', 'tempbuf.h', 'tree.h', 'typeinfo', 'valarray',
				246	])
				247
				248
				249	# Assertion macros. These are defined in base/logging.h and
				250	# testing/base/gunit.h. Note that the _M versions need to come first
				251	# for substring matching to work.
				252	_CHECK_MACROS = [
				253	'DCHECK', 'CHECK',
				254	'EXPECT_TRUE_M', 'EXPECT_TRUE',
				255	'ASSERT_TRUE_M', 'ASSERT_TRUE',
				256	'EXPECT_FALSE_M', 'EXPECT_FALSE',
				257	'ASSERT_FALSE_M', 'ASSERT_FALSE',
				258	]
				259
				260	# Replacement macros for CHECK/DCHECK/EXPECT_TRUE/EXPECT_FALSE
				261	_CHECK_REPLACEMENT = dict([(m, {}) for m in _CHECK_MACROS])
				262
				263	for op, replacement in [('==', 'EQ'), ('!=', 'NE'),
				264	('>=', 'GE'), ('>', 'GT'),
				265	('<=', 'LE'), ('<', 'LT')]:
				266	_CHECK_REPLACEMENT['DCHECK'][op] = 'DCHECK_%s' % replacement
				267	_CHECK_REPLACEMENT['CHECK'][op] = 'CHECK_%s' % replacement
				268	_CHECK_REPLACEMENT['EXPECT_TRUE'][op] = 'EXPECT_%s' % replacement
				269	_CHECK_REPLACEMENT['ASSERT_TRUE'][op] = 'ASSERT_%s' % replacement
				270	_CHECK_REPLACEMENT['EXPECT_TRUE_M'][op] = 'EXPECT_%s_M' % replacement
				271	_CHECK_REPLACEMENT['ASSERT_TRUE_M'][op] = 'ASSERT_%s_M' % replacement
				272
				273	for op, inv_replacement in [('==', 'NE'), ('!=', 'EQ'),
				274	('>=', 'LT'), ('>', 'LE'),
				275	('<=', 'GT'), ('<', 'GE')]:
				276	_CHECK_REPLACEMENT['EXPECT_FALSE'][op] = 'EXPECT_%s' % inv_replacement
				277	_CHECK_REPLACEMENT['ASSERT_FALSE'][op] = 'ASSERT_%s' % inv_replacement
				278	_CHECK_REPLACEMENT['EXPECT_FALSE_M'][op] = 'EXPECT_%s_M' % inv_replacement
				279	_CHECK_REPLACEMENT['ASSERT_FALSE_M'][op] = 'ASSERT_%s_M' % inv_replacement
				280
				281
				282	# These constants define types of headers for use with
				283	# _IncludeState.CheckNextIncludeOrder().
				284	_C_SYS_HEADER = 1
				285	_CPP_SYS_HEADER = 2
				286	_LIKELY_MY_HEADER = 3
				287	_POSSIBLE_MY_HEADER = 4
				288	_OTHER_HEADER = 5
				289
				290
				291	_regexp_compile_cache = {}
				292
				293	# Finds occurrences of NOLINT or NOLINT(...).
				294	_RE_SUPPRESSION = re.compile(r'\bNOLINT\b($[^)]*$)?')
				295
				296	# {str, set(int)}: a map from error categories to sets of linenumbers
				297	# on which those errors are expected and should be suppressed.
				298	_error_suppressions = {}
				299
				300	def ParseNolintSuppressions(filename, raw_line, linenum, error):
				301	"""Updates the global list of error-suppressions.
				302
				303	Parses any NOLINT comments on the current line, updating the global
				304	error_suppressions store. Reports an error if the NOLINT comment
				305	was malformed.
				306
				307	Args:
				308	filename: str, the name of the input file.
				309	raw_line: str, the line of input text, with comments.
				310	linenum: int, the number of the current line.
				311	error: function, an error handler.
				312	"""
				313	# FIXME(adonovan): "NOLINT(" is misparsed as NOLINT(*).
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	314	matched = _RE_SUPPRESSION.search(raw_line)
				315	if matched:
				316	category = matched.group(1)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	317	if category in (None, '(*)'): # => "suppress all"
				318	_error_suppressions.setdefault(None, set()).add(linenum)
				319	else:
				320	if category.startswith('(') and category.endswith(')'):
				321	category = category[1:-1]
				322	if category in _ERROR_CATEGORIES:
				323	_error_suppressions.setdefault(category, set()).add(linenum)
				324	else:
				325	error(filename, linenum, 'readability/nolint', 5,
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	326	'Unknown NOLINT error category: %s' % category)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	327
				328
def ResetNolintSuppressions():
  """Resets the set of NOLINT suppressions to empty.

  Clears the global _error_suppressions map in place, so existing references
  to the dict see the emptied state.
  """
  _error_suppressions.clear()
				332
				333
				334	def IsErrorSuppressedByNolint(category, linenum):
				335	"""Returns true if the specified error category is suppressed on this line.
				336
				337	Consults the global error_suppressions map populated by
				338	ParseNolintSuppressions/ResetNolintSuppressions.
				339
				340	Args:
				341	category: str, the category of the error.
				342	linenum: int, the current line number.
				343	Returns:
				344	bool, True iff the error should be suppressed due to a NOLINT comment.
				345	"""
				346	return (linenum in _error_suppressions.get(category, set()) or
				347	linenum in _error_suppressions.get(None, set()))
				348
				349	def Match(pattern, s):
				350	"""Matches the string with the pattern, caching the compiled regexp."""
				351	# The regexp compilation caching is inlined in both Match and Search for
				352	# performance reasons; factoring it out into a separate function turns out
				353	# to be noticeably expensive.
				354	if not pattern in _regexp_compile_cache:
				355	_regexp_compile_cache[pattern] = sre_compile.compile(pattern)
				356	return _regexp_compile_cache[pattern].match(s)
				357
				358
				359	def Search(pattern, s):
				360	"""Searches the string for the pattern, caching the compiled regexp."""
				361	if not pattern in _regexp_compile_cache:
				362	_regexp_compile_cache[pattern] = sre_compile.compile(pattern)
				363	return _regexp_compile_cache[pattern].search(s)
				364
				365
				366	class _IncludeState(dict):
				367	"""Tracks line numbers for includes, and the order in which includes appear.
				368
				369	As a dict, an _IncludeState object serves as a mapping between include
				370	filename and line number on which that file was included.
				371
				372	Call CheckNextIncludeOrder() once for each header in the file, passing
				373	in the type constants defined above. Calls in an illegal order will
				374	raise an _IncludeError with an appropriate error message.
				375
				376	"""
				377	# self._section will move monotonically through this set. If it ever
				378	# needs to move backwards, CheckNextIncludeOrder will raise an error.
				379	_INITIAL_SECTION = 0
				380	_MY_H_SECTION = 1
				381	_C_SECTION = 2
				382	_CPP_SECTION = 3
				383	_OTHER_H_SECTION = 4
				384
				385	_TYPE_NAMES = {
				386	_C_SYS_HEADER: 'C system header',
				387	_CPP_SYS_HEADER: 'C++ system header',
				388	_LIKELY_MY_HEADER: 'header this file implements',
				389	_POSSIBLE_MY_HEADER: 'header this file may implement',
				390	_OTHER_HEADER: 'other header',
				391	}
				392	_SECTION_NAMES = {
				393	_INITIAL_SECTION: "... nothing. (This can't be an error.)",
				394	_MY_H_SECTION: 'a header this file implements',
				395	_C_SECTION: 'C system header',
				396	_CPP_SECTION: 'C++ system header',
				397	_OTHER_H_SECTION: 'other header',
				398	}
				399
				400	def __init__(self):
				401	dict.__init__(self)
				402	# The name of the current section.
				403	self._section = self._INITIAL_SECTION
				404	# The path of last found header.
				405	self._last_header = ''
				406
				407	def CanonicalizeAlphabeticalOrder(self, header_path):
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	408	"""Returns a path canonicalized for alphabetical comparison.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	409
				410	- replaces "-" with "_" so they both cmp the same.
				411	- removes '-inl' since we don't require them to be after the main header.
				412	- lowercase everything, just in case.
				413
				414	Args:
				415	header_path: Path to be canonicalized.
				416
				417	Returns:
				418	Canonicalized path.
				419	"""
				420	return header_path.replace('-inl.h', '.h').replace('-', '_').lower()
				421
				422	def IsInAlphabeticalOrder(self, header_path):
				423	"""Check if a header is in alphabetical order with the previous header.
				424
				425	Args:
				426	header_path: Header to be checked.
				427
				428	Returns:
				429	Returns true if the header is in alphabetical order.
				430	"""
				431	canonical_header = self.CanonicalizeAlphabeticalOrder(header_path)
				432	if self._last_header > canonical_header:
				433	return False
				434	self._last_header = canonical_header
				435	return True
				436
				437	def CheckNextIncludeOrder(self, header_type):
				438	"""Returns a non-empty error message if the next header is out of order.
				439
				440	This function also updates the internal state to be ready to check
				441	the next include.
				442
				443	Args:
				444	header_type: One of the _XXX_HEADER constants defined above.
				445
				446	Returns:
				447	The empty string if the header is in the right order, or an
				448	error message describing what's wrong.
				449
				450	"""
				451	error_message = ('Found %s after %s' %
				452	(self._TYPE_NAMES[header_type],
				453	self._SECTION_NAMES[self._section]))
				454
				455	last_section = self._section
				456
				457	if header_type == _C_SYS_HEADER:
				458	if self._section <= self._C_SECTION:
				459	self._section = self._C_SECTION
				460	else:
				461	self._last_header = ''
				462	return error_message
				463	elif header_type == _CPP_SYS_HEADER:
				464	if self._section <= self._CPP_SECTION:
				465	self._section = self._CPP_SECTION
				466	else:
				467	self._last_header = ''
				468	return error_message
				469	elif header_type == _LIKELY_MY_HEADER:
				470	if self._section <= self._MY_H_SECTION:
				471	self._section = self._MY_H_SECTION
				472	else:
				473	self._section = self._OTHER_H_SECTION
				474	elif header_type == _POSSIBLE_MY_HEADER:
				475	if self._section <= self._MY_H_SECTION:
				476	self._section = self._MY_H_SECTION
				477	else:
				478	# This will always be the fallback because we're not sure
				479	# enough that the header is associated with this file.
				480	self._section = self._OTHER_H_SECTION
				481	else:
				482	assert header_type == _OTHER_HEADER
				483	self._section = self._OTHER_H_SECTION
				484
				485	if last_section != self._section:
				486	self._last_header = ''
				487
				488	return ''
				489
				490
				491	class _CppLintState(object):
				492	"""Maintains module-wide state.."""
				493
				494	def __init__(self):
				495	self.verbose_level = 1 # global setting.
				496	self.error_count = 0 # global count of reported errors
				497	# filters to apply when emitting error messages
				498	self.filters = _DEFAULT_FILTERS[:]
				499	self.counting = 'total' # In what way are we counting errors?
				500	self.errors_by_category = {} # string to int dict storing error counts
				501
				502	# output format:
				503	# "emacs" - format that emacs can parse (default)
				504	# "vs7" - format that Microsoft Visual Studio 7 can parse
				505	self.output_format = 'emacs'
				506
				507	def SetOutputFormat(self, output_format):
				508	"""Sets the output format for errors."""
				509	self.output_format = output_format
				510
				511	def SetVerboseLevel(self, level):
				512	"""Sets the module's verbosity, and returns the previous setting."""
				513	last_verbose_level = self.verbose_level
				514	self.verbose_level = level
				515	return last_verbose_level
				516
				517	def SetCountingStyle(self, counting_style):
				518	"""Sets the module's counting options."""
				519	self.counting = counting_style
				520
				521	def SetFilters(self, filters):
				522	"""Sets the error-message filters.
				523
				524	These filters are applied when deciding whether to emit a given
				525	error message.
				526
				527	Args:
				528	filters: A string of comma-separated filters (eg "+whitespace/indent").
				529	Each filter should start with + or -; else we die.
				530
				531	Raises:
				532	ValueError: The comma-separated filters did not all start with '+' or '-'.
				533	E.g. "-,+whitespace,-whitespace/indent,whitespace/badfilter"
				534	"""
				535	# Default filters always have less priority than the flag ones.
				536	self.filters = _DEFAULT_FILTERS[:]
				537	for filt in filters.split(','):
				538	clean_filt = filt.strip()
				539	if clean_filt:
				540	self.filters.append(clean_filt)
				541	for filt in self.filters:
				542	if not (filt.startswith('+') or filt.startswith('-')):
				543	raise ValueError('Every filter in --filters must start with + or -'
				544	' (%s does not)' % filt)
				545
				546	def ResetErrorCounts(self):
				547	"""Sets the module's error statistic back to zero."""
				548	self.error_count = 0
				549	self.errors_by_category = {}
				550
				551	def IncrementErrorCount(self, category):
				552	"""Bumps the module's error statistic."""
				553	self.error_count += 1
				554	if self.counting in ('toplevel', 'detailed'):
				555	if self.counting != 'detailed':
				556	category = category.split('/')[0]
				557	if category not in self.errors_by_category:
				558	self.errors_by_category[category] = 0
				559	self.errors_by_category[category] += 1
				560
				561	def PrintErrorCounts(self):
				562	"""Print a summary of errors by category, and the total."""
				563	for category, count in self.errors_by_category.iteritems():
				564	sys.stderr.write('Category \'%s\' errors found: %d\n' %
				565	(category, count))
				566	sys.stderr.write('Total errors found: %d\n' % self.error_count)
				567
# Module-wide _CppLintState instance; the module-level accessor functions
# (_OutputFormat, _SetVerboseLevel, _Filters, ...) read and update it.
_cpplint_state = _CppLintState()
				569
				570
def _OutputFormat():
  """Gets the module's output format.

  Returns:
    The output_format attribute of the shared _cpplint_state object.
  """
  return _cpplint_state.output_format
				574
				575
def _SetOutputFormat(output_format):
  """Sets the module's output format.

  Args:
    output_format: The new format, forwarded unchanged to
      _cpplint_state.SetOutputFormat().
  """
  _cpplint_state.SetOutputFormat(output_format)
				579
				580
def _VerboseLevel():
  """Returns the module's verbosity setting.

  Returns:
    The verbose_level attribute of the shared _cpplint_state object.
  """
  return _cpplint_state.verbose_level
				584
				585
def _SetVerboseLevel(level):
  """Sets the module's verbosity, and returns the previous setting.

  Args:
    level: The new verbosity level, forwarded to
      _cpplint_state.SetVerboseLevel().

  Returns:
    The verbosity level that was in effect before this call.
  """
  return _cpplint_state.SetVerboseLevel(level)
				589
				590
def _SetCountingStyle(level):
  """Sets the module's counting options.

  Args:
    level: The counting style, forwarded unchanged to
      _cpplint_state.SetCountingStyle().
  """
  _cpplint_state.SetCountingStyle(level)
				594
				595
def _Filters():
  """Returns the module's list of output filters, as a list.

  The list returned is the filters attribute of the shared _cpplint_state
  object itself, not a copy.
  """
  return _cpplint_state.filters
				599
				600
def _SetFilters(filters):
  """Sets the module's error-message filters.

  These filters are applied when deciding whether to emit a given
  error message.  The call is forwarded to _cpplint_state.SetFilters().

  Args:
    filters: A string of comma-separated filters (eg "+whitespace/indent").
             Each filter should start with + or -; else we die.
  """
  _cpplint_state.SetFilters(filters)
				612
				613
				614	class _FunctionState(object):
				615	"""Tracks current function name and the number of lines in its body."""
				616
				617	_NORMAL_TRIGGER = 250 # for --v=0, 500 for --v=1, etc.
				618	_TEST_TRIGGER = 400 # about 50% more than _NORMAL_TRIGGER.
				619
				620	def __init__(self):
				621	self.in_a_function = False
				622	self.lines_in_function = 0
				623	self.current_function = ''
				624
				625	def Begin(self, function_name):
				626	"""Start analyzing function body.
				627
				628	Args:
				629	function_name: The name of the function being tracked.
				630	"""
				631	self.in_a_function = True
				632	self.lines_in_function = 0
				633	self.current_function = function_name
				634
				635	def Count(self):
				636	"""Count line in current function body."""
				637	if self.in_a_function:
				638	self.lines_in_function += 1
				639
				640	def Check(self, error, filename, linenum):
				641	"""Report if too many lines in function body.
				642
				643	Args:
				644	error: The function to call with any errors found.
				645	filename: The name of the current file.
				646	linenum: The number of the line to check.
				647	"""
				648	if Match(r'T(EST\|est)', self.current_function):
				649	base_trigger = self._TEST_TRIGGER
				650	else:
				651	base_trigger = self._NORMAL_TRIGGER
				652	trigger = base_trigger * 2**_VerboseLevel()
				653
				654	if self.lines_in_function > trigger:
				655	error_level = int(math.log(self.lines_in_function / base_trigger, 2))
				656	# 50 => 0, 100 => 1, 200 => 2, 400 => 3, 800 => 4, 1600 => 5, ...
				657	if error_level > 5:
				658	error_level = 5
				659	error(filename, linenum, 'readability/fn_size', error_level,
				660	'Small and focused functions are preferred:'
				661	' %s has %d non-comment lines'
				662	' (error triggered by exceeding %d lines).' % (
				663	self.current_function, self.lines_in_function, trigger))
				664
				665	def End(self):
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	666	"""Stop analyzing function body."""
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	667	self.in_a_function = False
				668
				669
				670	class _IncludeError(Exception):
				671	"""Indicates a problem with the include order in a file."""
				672	pass
				673
				674
				675	class FileInfo:
				676	"""Provides utility functions for filenames.
				677
				678	FileInfo provides easy access to the components of a file's path
				679	relative to the project root.
				680	"""
				681
				682	def __init__(self, filename):
				683	self._filename = filename
				684
				685	def FullName(self):
				686	"""Make Windows paths like Unix."""
				687	return os.path.abspath(self._filename).replace('\\', '/')
				688
				689	def RepositoryName(self):
				690	"""FullName after removing the local path to the repository.
				691
				692	If we have a real absolute path name here we can try to do something smart:
				693	detecting the root of the checkout and truncating /path/to/checkout from
				694	the name so that we get header guards that don't include things like
				695	"C:\Documents and Settings\..." or "/home/username/..." in them and thus
				696	people on different computers who have checked the source out to different
				697	locations won't see bogus errors.
				698	"""
				699	fullname = self.FullName()
				700
				701	if os.path.exists(fullname):
				702	project_dir = os.path.dirname(fullname)
				703
				704	if os.path.exists(os.path.join(project_dir, ".svn")):
				705	# If there's a .svn file in the current directory, we recursively look
				706	# up the directory tree for the top of the SVN checkout
				707	root_dir = project_dir
				708	one_up_dir = os.path.dirname(root_dir)
				709	while os.path.exists(os.path.join(one_up_dir, ".svn")):
				710	root_dir = os.path.dirname(root_dir)
				711	one_up_dir = os.path.dirname(one_up_dir)
				712
				713	prefix = os.path.commonprefix([root_dir, project_dir])
				714	return fullname[len(prefix) + 1:]
				715
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	716	# Not SVN <= 1.6? Try to find a git, hg, or svn top level directory by
				717	# searching up from the current path.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	718	root_dir = os.path.dirname(fullname)
				719	while (root_dir != os.path.dirname(root_dir) and
				720	not os.path.exists(os.path.join(root_dir, ".git")) and
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	721	not os.path.exists(os.path.join(root_dir, ".hg")) and
				722	not os.path.exists(os.path.join(root_dir, ".svn"))):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	723	root_dir = os.path.dirname(root_dir)
				724
				725	if (os.path.exists(os.path.join(root_dir, ".git")) or
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	726	os.path.exists(os.path.join(root_dir, ".hg")) or
				727	os.path.exists(os.path.join(root_dir, ".svn"))):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	728	prefix = os.path.commonprefix([root_dir, project_dir])
Brian Carlstrom	fc0e321	2013-07-17 14:40:12 -0700	[diff] [blame^]	729	# BEGIN android-changed
				730	# return fullname[len(prefix) + 1:]
				731	return "art/" + fullname[len(prefix) + 1:]
				732	# END android-changed
				733
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	734
				735	# Don't know what to do; header guard warnings may be wrong...
				736	return fullname
				737
				738	def Split(self):
				739	"""Splits the file into the directory, basename, and extension.
				740
				741	For 'chrome/browser/browser.cc', Split() would
				742	return ('chrome/browser', 'browser', '.cc')
				743
				744	Returns:
				745	A tuple of (directory, basename, extension).
				746	"""
				747
				748	googlename = self.RepositoryName()
				749	project, rest = os.path.split(googlename)
				750	return (project,) + os.path.splitext(rest)
				751
				752	def BaseName(self):
				753	"""File base name - text after the final slash, before the final period."""
				754	return self.Split()[1]
				755
				756	def Extension(self):
				757	"""File extension - text following the final period."""
				758	return self.Split()[2]
				759
				760	def NoExtension(self):
				761	"""File has no source file extension."""
				762	return '/'.join(self.Split()[0:2])
				763
				764	def IsSource(self):
				765	"""File has a source file extension."""
				766	return self.Extension()[1:] in ('c', 'cc', 'cpp', 'cxx')
				767
				768
				769	def _ShouldPrintError(category, confidence, linenum):
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	770	"""If confidence >= verbose, category passes filter and is not suppressed."""
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	771
				772	# There are three ways we might decide not to print an error message:
				773	# a "NOLINT(category)" comment appears in the source,
				774	# the verbosity level isn't high enough, or the filters filter it out.
				775	if IsErrorSuppressedByNolint(category, linenum):
				776	return False
				777	if confidence < _cpplint_state.verbose_level:
				778	return False
				779
				780	is_filtered = False
				781	for one_filter in _Filters():
				782	if one_filter.startswith('-'):
				783	if category.startswith(one_filter[1:]):
				784	is_filtered = True
				785	elif one_filter.startswith('+'):
				786	if category.startswith(one_filter[1:]):
				787	is_filtered = False
				788	else:
				789	assert False # should have been checked for in SetFilter.
				790	if is_filtered:
				791	return False
				792
				793	return True
				794
				795
				796	def Error(filename, linenum, category, confidence, message):
				797	"""Logs the fact we've found a lint error.
				798
				799	We log where the error was found, and also our confidence in the error,
				800	that is, how certain we are this is a legitimate style regression, and
				801	not a misidentification or a use that's sometimes justified.
				802
				803	False positives can be suppressed by the use of
				804	"cpplint(category)" comments on the offending line. These are
				805	parsed into _error_suppressions.
				806
				807	Args:
				808	filename: The name of the file containing the error.
				809	linenum: The number of the line containing the error.
				810	category: A string used to describe the "category" this bug
				811	falls under: "whitespace", say, or "runtime". Categories
				812	may have a hierarchy separated by slashes: "whitespace/indent".
				813	confidence: A number from 1-5 representing a confidence score for
				814	the error, with 5 meaning that we are certain of the problem,
				815	and 1 meaning that it could be a legitimate construct.
				816	message: The error message.
				817	"""
				818	if _ShouldPrintError(category, confidence, linenum):
				819	_cpplint_state.IncrementErrorCount(category)
				820	if _cpplint_state.output_format == 'vs7':
				821	sys.stderr.write('%s(%s): %s [%s] [%d]\n' % (
				822	filename, linenum, message, category, confidence))
				823	else:
				824	sys.stderr.write('%s:%s: %s [%s] [%d]\n' % (
				825	filename, linenum, message, category, confidence))
				826
				827
				828	# Matches standard C++ escape esequences per 2.13.2.3 of the C++ standard.
				829	_RE_PATTERN_CLEANSE_LINE_ESCAPES = re.compile(
				830	r'\\([abfnrtv?"\\\']\|\d+\|x[0-9a-fA-F]+)')
				831	# Matches strings. Escape codes should already be removed by ESCAPES.
				832	_RE_PATTERN_CLEANSE_LINE_DOUBLE_QUOTES = re.compile(r'"[^"]*"')
				833	# Matches characters. Escape codes should already be removed by ESCAPES.
				834	_RE_PATTERN_CLEANSE_LINE_SINGLE_QUOTES = re.compile(r"'.'")
				835	# Matches multi-line C++ comments.
				836	# This RE is a little bit more complicated than one might expect, because we
				837	# have to take care of space removals tools so we can handle comments inside
				838	# statements better.
				839	# The current rule is: We only clear spaces from both sides when we're at the
				840	# end of the line. Otherwise, we try to remove spaces from the right side,
				841	# if this doesn't work we try on left side but only if there's a non-character
				842	# on the right.
				843	_RE_PATTERN_CLEANSE_LINE_C_COMMENTS = re.compile(
				844	r"""(\s/\.\/\s*$\|
				845	/\.\*/\s+\|
				846	\s+/\.\*/(?=\W)\|
				847	/\.\*/)""", re.VERBOSE)
				848
				849
				850	def IsCppString(line):
				851	"""Does line terminate so, that the next symbol is in string constant.
				852
				853	This function does not consider single-line nor multi-line comments.
				854
				855	Args:
				856	line: is a partial line of code starting from the 0..n.
				857
				858	Returns:
				859	True, if next character appended to 'line' is inside a
				860	string constant.
				861	"""
				862
				863	line = line.replace(r'\\', 'XX') # after this, \\" does not match to \"
				864	return ((line.count('"') - line.count(r'\"') - line.count("'\"'")) & 1) == 1
				865
				866
				867	def FindNextMultiLineCommentStart(lines, lineix):
				868	"""Find the beginning marker for a multiline comment."""
				869	while lineix < len(lines):
				870	if lines[lineix].strip().startswith('/*'):
				871	# Only return this marker if the comment goes beyond this line
				872	if lines[lineix].strip().find('*/', 2) < 0:
				873	return lineix
				874	lineix += 1
				875	return len(lines)
				876
				877
				878	def FindNextMultiLineCommentEnd(lines, lineix):
				879	"""We are inside a comment, find the end marker."""
				880	while lineix < len(lines):
				881	if lines[lineix].strip().endswith('*/'):
				882	return lineix
				883	lineix += 1
				884	return len(lines)
				885
				886
				887	def RemoveMultiLineCommentsFromRange(lines, begin, end):
				888	"""Clears a range of lines for multi-line comments."""
				889	# Having // dummy comments makes the lines non-empty, so we will not get
				890	# unnecessary blank line warnings later in the code.
				891	for i in range(begin, end):
				892	lines[i] = '// dummy'
				893
				894
				895	def RemoveMultiLineComments(filename, lines, error):
				896	"""Removes multiline (c-style) comments from lines."""
				897	lineix = 0
				898	while lineix < len(lines):
				899	lineix_begin = FindNextMultiLineCommentStart(lines, lineix)
				900	if lineix_begin >= len(lines):
				901	return
				902	lineix_end = FindNextMultiLineCommentEnd(lines, lineix_begin)
				903	if lineix_end >= len(lines):
				904	error(filename, lineix_begin + 1, 'readability/multiline_comment', 5,
				905	'Could not find end of multi-line comment')
				906	return
				907	RemoveMultiLineCommentsFromRange(lines, lineix_begin, lineix_end + 1)
				908	lineix = lineix_end + 1
				909
				910
				911	def CleanseComments(line):
				912	"""Removes //-comments and single-line C-style /* */ comments.
				913
				914	Args:
				915	line: A line of C++ source.
				916
				917	Returns:
				918	The line with single-line comments removed.
				919	"""
				920	commentpos = line.find('//')
				921	if commentpos != -1 and not IsCppString(line[:commentpos]):
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	922	line = line[:commentpos].rstrip()
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	923	# get rid of /* ... */
				924	return _RE_PATTERN_CLEANSE_LINE_C_COMMENTS.sub('', line)
				925
				926
				927	class CleansedLines(object):
				928	"""Holds 3 copies of all lines with different preprocessing applied to them.
				929
				930	1) elided member contains lines without strings and comments,
				931	2) lines member contains lines without comments, and
				932	3) raw member contains all the lines without processing.
				933	All these three members are of <type 'list'>, and of the same length.
				934	"""
				935
				936	def __init__(self, lines):
				937	self.elided = []
				938	self.lines = []
				939	self.raw_lines = lines
				940	self.num_lines = len(lines)
				941	for linenum in range(len(lines)):
				942	self.lines.append(CleanseComments(lines[linenum]))
				943	elided = self._CollapseStrings(lines[linenum])
				944	self.elided.append(CleanseComments(elided))
				945
				946	def NumLines(self):
				947	"""Returns the number of lines represented."""
				948	return self.num_lines
				949
				950	@staticmethod
				951	def _CollapseStrings(elided):
				952	"""Collapses strings and chars on a line to simple "" or '' blocks.
				953
				954	We nix strings first so we're not fooled by text like '"http://"'
				955
				956	Args:
				957	elided: The line being processed.
				958
				959	Returns:
				960	The line with collapsed strings.
				961	"""
				962	if not _RE_PATTERN_INCLUDE.match(elided):
				963	# Remove escaped characters first to make quote/single quote collapsing
				964	# basic. Things that look like escaped characters shouldn't occur
				965	# outside of strings and chars.
				966	elided = _RE_PATTERN_CLEANSE_LINE_ESCAPES.sub('', elided)
				967	elided = _RE_PATTERN_CLEANSE_LINE_SINGLE_QUOTES.sub("''", elided)
				968	elided = _RE_PATTERN_CLEANSE_LINE_DOUBLE_QUOTES.sub('""', elided)
				969	return elided
				970
				971
				972	def CloseExpression(clean_lines, linenum, pos):
				973	"""If input points to ( or { or [, finds the position that closes it.
				974
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	975	If lines[linenum][pos] points to a '(' or '{' or '[', finds the
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	976	linenum/pos that correspond to the closing of the expression.
				977
				978	Args:
				979	clean_lines: A CleansedLines instance containing the file.
				980	linenum: The number of the line to check.
				981	pos: A position on the line.
				982
				983	Returns:
				984	A tuple (line, linenum, pos) pointer past the closing brace, or
				985	(line, len(lines), -1) if we never find a close. Note we ignore
				986	strings and comments when matching; and the line we return is the
				987	'cleansed' line at linenum.
				988	"""
				989
				990	line = clean_lines.elided[linenum]
				991	startchar = line[pos]
				992	if startchar not in '({[':
				993	return (line, clean_lines.NumLines(), -1)
				994	if startchar == '(': endchar = ')'
				995	if startchar == '[': endchar = ']'
				996	if startchar == '{': endchar = '}'
				997
				998	num_open = line.count(startchar) - line.count(endchar)
				999	while linenum < clean_lines.NumLines() and num_open > 0:
				1000	linenum += 1
				1001	line = clean_lines.elided[linenum]
				1002	num_open += line.count(startchar) - line.count(endchar)
				1003	# OK, now find the endchar that actually got us back to even
				1004	endpos = len(line)
				1005	while num_open >= 0:
				1006	endpos = line.rfind(')', 0, endpos)
				1007	num_open -= 1 # chopped off another )
				1008	return (line, linenum, endpos + 1)
				1009
				1010
				1011	def CheckForCopyright(filename, lines, error):
				1012	"""Logs an error if no Copyright message appears at the top of the file."""
				1013
				1014	# We'll say it should occur by line 10. Don't forget there's a
				1015	# dummy line at the front.
				1016	for line in xrange(1, min(len(lines), 11)):
				1017	if re.search(r'Copyright', lines[line], re.I): break
				1018	else: # means no copyright line was found
				1019	error(filename, 0, 'legal/copyright', 5,
				1020	'No copyright message found. '
				1021	'You should have a line: "Copyright [year] <Copyright Owner>"')
				1022
				1023
				1024	def GetHeaderGuardCPPVariable(filename):
				1025	"""Returns the CPP variable that should be used as a header guard.
				1026
				1027	Args:
				1028	filename: The name of a C++ header file.
				1029
				1030	Returns:
				1031	The CPP variable that should be used as a header guard in the
				1032	named file.
				1033
				1034	"""
				1035
				1036	# Restores original filename in case that cpplint is invoked from Emacs's
				1037	# flymake.
				1038	filename = re.sub(r'_flymake\.h$', '.h', filename)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1039	fileinfo = FileInfo(filename)
				1040	return re.sub(r'[-./\s]', '_', fileinfo.RepositoryName()).upper() + '_'
				1041
				1042
				1043	def CheckForHeaderGuard(filename, lines, error):
				1044	"""Checks that the file contains a header guard.
				1045
				1046	Logs an error if no #ifndef header guard is present. For other
				1047	headers, checks that the full pathname is used.
				1048
				1049	Args:
				1050	filename: The name of the C++ header file.
				1051	lines: An array of strings, each representing a line of the file.
				1052	error: The function to call with any errors found.
				1053	"""
				1054
				1055	cppvar = GetHeaderGuardCPPVariable(filename)
				1056
				1057	ifndef = None
				1058	ifndef_linenum = 0
				1059	define = None
				1060	endif = None
				1061	endif_linenum = 0
				1062	for linenum, line in enumerate(lines):
				1063	linesplit = line.split()
				1064	if len(linesplit) >= 2:
				1065	# find the first occurrence of #ifndef and #define, save arg
				1066	if not ifndef and linesplit[0] == '#ifndef':
				1067	# set ifndef to the header guard presented on the #ifndef line.
				1068	ifndef = linesplit[1]
				1069	ifndef_linenum = linenum
				1070	if not define and linesplit[0] == '#define':
				1071	define = linesplit[1]
				1072	# find the last occurrence of #endif, save entire line
				1073	if line.startswith('#endif'):
				1074	endif = line
				1075	endif_linenum = linenum
				1076
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1077	if not ifndef:
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1078	error(filename, 0, 'build/header_guard', 5,
				1079	'No #ifndef header guard found, suggested CPP variable is: %s' %
				1080	cppvar)
				1081	return
				1082
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1083	if not define:
				1084	error(filename, 0, 'build/header_guard', 5,
				1085	'No #define header guard found, suggested CPP variable is: %s' %
				1086	cppvar)
				1087	return
				1088
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1089	# The guard should be PATH_FILE_H_, but we also allow PATH_FILE_H__
				1090	# for backward compatibility.
				1091	if ifndef != cppvar:
				1092	error_level = 0
				1093	if ifndef != cppvar + '_':
				1094	error_level = 5
				1095
				1096	ParseNolintSuppressions(filename, lines[ifndef_linenum], ifndef_linenum,
				1097	error)
				1098	error(filename, ifndef_linenum, 'build/header_guard', error_level,
				1099	'#ifndef header guard has wrong style, please use: %s' % cppvar)
				1100
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1101	if define != ifndef:
				1102	error(filename, 0, 'build/header_guard', 5,
				1103	'#ifndef and #define don\'t match, suggested CPP variable is: %s' %
				1104	cppvar)
				1105	return
				1106
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1107	if endif != ('#endif // %s' % cppvar):
				1108	error_level = 0
				1109	if endif != ('#endif // %s' % (cppvar + '_')):
				1110	error_level = 5
				1111
				1112	ParseNolintSuppressions(filename, lines[endif_linenum], endif_linenum,
				1113	error)
				1114	error(filename, endif_linenum, 'build/header_guard', error_level,
				1115	'#endif line should be "#endif // %s"' % cppvar)
				1116
				1117
				1118	def CheckForUnicodeReplacementCharacters(filename, lines, error):
				1119	"""Logs an error for each line containing Unicode replacement characters.
				1120
				1121	These indicate that either the file contained invalid UTF-8 (likely)
				1122	or Unicode replacement characters (which it shouldn't). Note that
				1123	it's possible for this to throw off line numbering if the invalid
				1124	UTF-8 occurred adjacent to a newline.
				1125
				1126	Args:
				1127	filename: The name of the current file.
				1128	lines: An array of strings, each representing a line of the file.
				1129	error: The function to call with any errors found.
				1130	"""
				1131	for linenum, line in enumerate(lines):
				1132	if u'\ufffd' in line:
				1133	error(filename, linenum, 'readability/utf8', 5,
				1134	'Line contains invalid UTF-8 (or Unicode replacement character).')
				1135
				1136
				1137	def CheckForNewlineAtEOF(filename, lines, error):
				1138	"""Logs an error if there is no newline char at the end of the file.
				1139
				1140	Args:
				1141	filename: The name of the current file.
				1142	lines: An array of strings, each representing a line of the file.
				1143	error: The function to call with any errors found.
				1144	"""
				1145
				1146	# The array lines() was created by adding two newlines to the
				1147	# original file (go figure), then splitting on \n.
				1148	# To verify that the file ends in \n, we just have to make sure the
				1149	# last-but-two element of lines() exists and is empty.
				1150	if len(lines) < 3 or lines[-2]:
				1151	error(filename, len(lines) - 2, 'whitespace/ending_newline', 5,
				1152	'Could not find a newline character at the end of the file.')
				1153
				1154
				1155	def CheckForMultilineCommentsAndStrings(filename, clean_lines, linenum, error):
				1156	"""Logs an error if we see /* ... */ or "..." that extend past one line.
				1157
				1158	/* ... */ comments are legit inside macros, for one line.
				1159	Otherwise, we prefer // comments, so it's ok to warn about the
				1160	other. Likewise, it's ok for strings to extend across multiple
				1161	lines, as long as a line continuation character (backslash)
				1162	terminates each line. Although not currently prohibited by the C++
				1163	style guide, it's ugly and unnecessary. We don't do well with either
				1164	in this lint program, so we warn about both.
				1165
				1166	Args:
				1167	filename: The name of the current file.
				1168	clean_lines: A CleansedLines instance containing the file.
				1169	linenum: The number of the line to check.
				1170	error: The function to call with any errors found.
				1171	"""
				1172	line = clean_lines.elided[linenum]
				1173
				1174	# Remove all \\ (escaped backslashes) from the line. They are OK, and the
				1175	# second (escaped) slash may trigger later \" detection erroneously.
				1176	line = line.replace('\\\\', '')
				1177
				1178	if line.count('/') > line.count('/'):
				1179	error(filename, linenum, 'readability/multiline_comment', 5,
				1180	'Complex multi-line /.../-style comment found. '
				1181	'Lint may give bogus warnings. '
				1182	'Consider replacing these with //-style comments, '
				1183	'with #if 0...#endif, '
				1184	'or with more clearly structured multi-line comments.')
				1185
				1186	if (line.count('"') - line.count('\\"')) % 2:
				1187	error(filename, linenum, 'readability/multiline_string', 5,
				1188	'Multi-line string ("...") found. This lint script doesn\'t '
				1189	'do well with such strings, and may give bogus warnings. They\'re '
				1190	'ugly and unnecessary, and you should use concatenation instead".')
				1191
				1192
				1193	threading_list = (
				1194	('asctime(', 'asctime_r('),
				1195	('ctime(', 'ctime_r('),
				1196	('getgrgid(', 'getgrgid_r('),
				1197	('getgrnam(', 'getgrnam_r('),
				1198	('getlogin(', 'getlogin_r('),
				1199	('getpwnam(', 'getpwnam_r('),
				1200	('getpwuid(', 'getpwuid_r('),
				1201	('gmtime(', 'gmtime_r('),
				1202	('localtime(', 'localtime_r('),
				1203	('rand(', 'rand_r('),
				1204	('readdir(', 'readdir_r('),
				1205	('strtok(', 'strtok_r('),
				1206	('ttyname(', 'ttyname_r('),
				1207	)
				1208
				1209
				1210	def CheckPosixThreading(filename, clean_lines, linenum, error):
				1211	"""Checks for calls to thread-unsafe functions.
				1212
				1213	Much code has been originally written without consideration of
				1214	multi-threading. Also, engineers are relying on their old experience;
				1215	they have learned posix before threading extensions were added. These
				1216	tests guide the engineers to use thread-safe functions (when using
				1217	posix directly).
				1218
				1219	Args:
				1220	filename: The name of the current file.
				1221	clean_lines: A CleansedLines instance containing the file.
				1222	linenum: The number of the line to check.
				1223	error: The function to call with any errors found.
				1224	"""
				1225	line = clean_lines.elided[linenum]
				1226	for single_thread_function, multithread_safe_function in threading_list:
				1227	ix = line.find(single_thread_function)
				1228	# Comparisons made explicit for clarity -- pylint: disable-msg=C6403
				1229	if ix >= 0 and (ix == 0 or (not line[ix - 1].isalnum() and
				1230	line[ix - 1] not in ('_', '.', '>'))):
				1231	error(filename, linenum, 'runtime/threadsafe_fn', 2,
				1232	'Consider using ' + multithread_safe_function +
				1233	'...) instead of ' + single_thread_function +
				1234	'...) for improved thread safety.')
				1235
				1236
				1237	# Matches invalid increment: *count++, which moves pointer instead of
				1238	# incrementing a value.
				1239	_RE_PATTERN_INVALID_INCREMENT = re.compile(
				1240	r'^\s\\w+(\+\+\|--);')
				1241
				1242
				1243	def CheckInvalidIncrement(filename, clean_lines, linenum, error):
				1244	"""Checks for invalid increment *count++.
				1245
				1246	For example following function:
				1247	void increment_counter(int* count) {
				1248	*count++;
				1249	}
				1250	is invalid, because it effectively does count++, moving pointer, and should
				1251	be replaced with ++count, (count)++ or *count += 1.
				1252
				1253	Args:
				1254	filename: The name of the current file.
				1255	clean_lines: A CleansedLines instance containing the file.
				1256	linenum: The number of the line to check.
				1257	error: The function to call with any errors found.
				1258	"""
				1259	line = clean_lines.elided[linenum]
				1260	if _RE_PATTERN_INVALID_INCREMENT.match(line):
				1261	error(filename, linenum, 'runtime/invalid_increment', 5,
				1262	'Changing pointer instead of value (or unused value of operator*).')
				1263
				1264
				1265	class _ClassInfo(object):
				1266	"""Stores information about a class."""
				1267
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1268	def __init__(self, name, clean_lines, linenum):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1269	self.name = name
				1270	self.linenum = linenum
				1271	self.seen_open_brace = False
				1272	self.is_derived = False
				1273	self.virtual_method_linenumber = None
				1274	self.has_virtual_destructor = False
				1275	self.brace_depth = 0
				1276
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1277	# Try to find the end of the class. This will be confused by things like:
				1278	# class A {
				1279	# } *x = { ...
				1280	#
				1281	# But it's still good enough for CheckSectionSpacing.
				1282	self.last_line = 0
				1283	depth = 0
				1284	for i in range(linenum, clean_lines.NumLines()):
				1285	line = clean_lines.lines[i]
				1286	depth += line.count('{') - line.count('}')
				1287	if not depth:
				1288	self.last_line = i
				1289	break
				1290
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1291
				1292	class _ClassState(object):
				1293	"""Holds the current state of the parse relating to class declarations.
				1294
				1295	It maintains a stack of _ClassInfos representing the parser's guess
				1296	as to the current nesting of class declarations. The innermost class
				1297	is at the top (back) of the stack. Typically, the stack will either
				1298	be empty or have exactly one entry.
				1299	"""
				1300
				1301	def __init__(self):
				1302	self.classinfo_stack = []
				1303
				1304	def CheckFinished(self, filename, error):
				1305	"""Checks that all classes have been completely parsed.
				1306
				1307	Call this when all lines in a file have been processed.
				1308	Args:
				1309	filename: The name of the current file.
				1310	error: The function to call with any errors found.
				1311	"""
				1312	if self.classinfo_stack:
				1313	# Note: This test can result in false positives if #ifdef constructs
				1314	# get in the way of brace matching. See the testBuildClass test in
				1315	# cpplint_unittest.py for an example of this.
				1316	error(filename, self.classinfo_stack[0].linenum, 'build/class', 5,
				1317	'Failed to find complete declaration of class %s' %
				1318	self.classinfo_stack[0].name)
				1319
				1320
				1321	def CheckForNonStandardConstructs(filename, clean_lines, linenum,
				1322	class_state, error):
				1323	"""Logs an error if we see certain non-ANSI constructs ignored by gcc-2.
				1324
				1325	Complain about several constructs which gcc-2 accepts, but which are
				1326	not standard C++. Warning about these in lint is one way to ease the
				1327	transition to new compilers.
				1328	- put storage class first (e.g. "static const" instead of "const static").
				1329	- "%lld" instead of %qd" in printf-type functions.
				1330	- "%1$d" is non-standard in printf-type functions.
				1331	- "\%" is an undefined character escape sequence.
				1332	- text after #endif is not allowed.
				1333	- invalid inner-style forward declaration.
				1334	- >? and <? operators, and their >?= and <?= cousins.
				1335	- classes with virtual methods need virtual destructors (compiler warning
				1336	available, but not turned on yet.)
				1337
				1338	Additionally, check for constructor/destructor style violations and reference
				1339	members, as it is very convenient to do so while checking for
				1340	gcc-2 compliance.
				1341
				1342	Args:
				1343	filename: The name of the current file.
				1344	clean_lines: A CleansedLines instance containing the file.
				1345	linenum: The number of the line to check.
				1346	class_state: A _ClassState instance which maintains information about
				1347	the current stack of nested class declarations being parsed.
				1348	error: A callable to which errors are reported, which takes 4 arguments:
				1349	filename, line number, error level, and message
				1350	"""
				1351
				1352	# Remove comments from the line, but leave in strings for now.
				1353	line = clean_lines.lines[linenum]
				1354
				1355	if Search(r'printf\s\(.".%[-+ ]?\dq', line):
				1356	error(filename, linenum, 'runtime/printf_format', 3,
				1357	'%q in format strings is deprecated. Use %ll instead.')
				1358
				1359	if Search(r'printf\s\(.".*%\d+\$', line):
				1360	error(filename, linenum, 'runtime/printf_format', 2,
				1361	'%N$ formats are unconventional. Try rewriting to avoid them.')
				1362
				1363	# Remove escaped backslashes before looking for undefined escapes.
				1364	line = line.replace('\\\\', '')
				1365
				1366	if Search(r'("\|\').*\\(%\|\[\|\(\|{)', line):
				1367	error(filename, linenum, 'build/printf_format', 3,
				1368	'%, [, (, and { are undefined character escapes. Unescape them.')
				1369
				1370	# For the rest, work with both comments and strings removed.
				1371	line = clean_lines.elided[linenum]
				1372
				1373	if Search(r'\b(const\|volatile\|void\|char\|short\|int\|long'
				1374	r'\|float\|double\|signed\|unsigned'
				1375	r'\|schar\|u?int8\|u?int16\|u?int32\|u?int64)'
				1376	r'\s+(auto\|register\|static\|extern\|typedef)\b',
				1377	line):
				1378	error(filename, linenum, 'build/storage_class', 5,
				1379	'Storage class (static, extern, typedef, etc) should be first.')
				1380
				1381	if Match(r'\s#\sendif\s*[^/\s]+', line):
				1382	error(filename, linenum, 'build/endif_comment', 5,
				1383	'Uncommented text after #endif is non-standard. Use a comment.')
				1384
				1385	if Match(r'\sclass\s+(\w+\s::\s)+\w+\s;', line):
				1386	error(filename, linenum, 'build/forward_decl', 5,
				1387	'Inner-style forward declarations are invalid. Remove this line.')
				1388
				1389	if Search(r'(\w+\|[+-]?\d+(\.\d)?)\s(<\|>)\?=?\s(\w+\|[+-]?\d+)(\.\d)?',
				1390	line):
				1391	error(filename, linenum, 'build/deprecated', 3,
				1392	'>? and <? (max and min) operators are non-standard and deprecated.')
				1393
				1394	if Search(r'^\sconst\sstring\s&\s\w+\s*;', line):
				1395	# TODO(unknown): Could it be expanded safely to arbitrary references,
				1396	# without triggering too many false positives? The first
				1397	# attempt triggered 5 warnings for mostly benign code in the regtest, hence
				1398	# the restriction.
				1399	# Here's the original regexp, for the reference:
				1400	# type_name = r'\w+((\s::\s\w+)\|(\s<\s\w+?\s*>))?'
				1401	# r'\sconst\s' + type_name + '\s&\s\w+\s*;'
				1402	error(filename, linenum, 'runtime/member_string_references', 2,
				1403	'const string& members are dangerous. It is much better to use '
				1404	'alternatives, such as pointers or simple constants.')
				1405
				1406	# Track class entry and exit, and attempt to find cases within the
				1407	# class declaration that don't meet the C++ style
				1408	# guidelines. Tracking is very dependent on the code matching Google
				1409	# style guidelines, but it seems to perform well enough in testing
				1410	# to be a worthwhile addition to the checks.
				1411	classinfo_stack = class_state.classinfo_stack
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1412	# Look for a class declaration. The regexp accounts for decorated classes
				1413	# such as in:
				1414	# class LOCKABLE API Object {
				1415	# };
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1416	class_decl_match = Match(
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1417	r'\s(template\s<[\w\s<>,:]>\s)?'
				1418	'(class\|struct)\s+([A-Z_]+\s+)(\w+(::\w+))', line)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1419	if class_decl_match:
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1420	classinfo_stack.append(_ClassInfo(
				1421	class_decl_match.group(4), clean_lines, linenum))
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1422
				1423	# Everything else in this function uses the top of the stack if it's
				1424	# not empty.
				1425	if not classinfo_stack:
				1426	return
				1427
				1428	classinfo = classinfo_stack[-1]
				1429
				1430	# If the opening brace hasn't been seen look for it and also
				1431	# parent class declarations.
				1432	if not classinfo.seen_open_brace:
				1433	# If the line has a ';' in it, assume it's a forward declaration or
				1434	# a single-line class declaration, which we won't process.
				1435	if line.find(';') != -1:
				1436	classinfo_stack.pop()
				1437	return
				1438	classinfo.seen_open_brace = (line.find('{') != -1)
				1439	# Look for a bare ':'
				1440	if Search('(^\|[^:]):($\|[^:])', line):
				1441	classinfo.is_derived = True
				1442	if not classinfo.seen_open_brace:
				1443	return # Everything else in this function is for after open brace
				1444
				1445	# The class may have been declared with namespace or classname qualifiers.
				1446	# The constructor and destructor will not have those qualifiers.
				1447	base_classname = classinfo.name.split('::')[-1]
				1448
				1449	# Look for single-argument constructors that aren't marked explicit.
				1450	# Technically a valid construct, but against style.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1451	args = Match(r'\s+(?:inline\s+)?%s\s*$([^,()]+)$'
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1452	% re.escape(base_classname),
				1453	line)
				1454	if (args and
				1455	args.group(1) != 'void' and
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1456	not Match(r'(const\s+)?%s\s(?:<\w+>\s)?&' % re.escape(base_classname),
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1457	args.group(1).strip())):
				1458	error(filename, linenum, 'runtime/explicit', 5,
				1459	'Single-argument constructors should be marked explicit.')
				1460
				1461	# Look for methods declared virtual.
				1462	if Search(r'\bvirtual\b', line):
				1463	classinfo.virtual_method_linenumber = linenum
				1464	# Only look for a destructor declaration on the same line. It would
				1465	# be extremely unlikely for the destructor declaration to occupy
				1466	# more than one line.
				1467	if Search(r'~%s\s*\(' % base_classname, line):
				1468	classinfo.has_virtual_destructor = True
				1469
				1470	# Look for class end.
				1471	brace_depth = classinfo.brace_depth
				1472	brace_depth = brace_depth + line.count('{') - line.count('}')
				1473	if brace_depth <= 0:
				1474	classinfo = classinfo_stack.pop()
				1475	# Try to detect missing virtual destructor declarations.
				1476	# For now, only warn if a non-derived class with virtual methods lacks
				1477	# a virtual destructor. This is to make it less likely that people will
				1478	# declare derived virtual destructors without declaring the base
				1479	# destructor virtual.
				1480	if ((classinfo.virtual_method_linenumber is not None) and
				1481	(not classinfo.has_virtual_destructor) and
				1482	(not classinfo.is_derived)): # Only warn for base classes
				1483	error(filename, classinfo.linenum, 'runtime/virtual', 4,
				1484	'The class %s probably needs a virtual destructor due to '
				1485	'having virtual method(s), one declared at line %d.'
				1486	% (classinfo.name, classinfo.virtual_method_linenumber))
				1487	else:
				1488	classinfo.brace_depth = brace_depth
				1489
				1490
				1491	def CheckSpacingForFunctionCall(filename, line, linenum, error):
				1492	"""Checks for the correctness of various spacing around function calls.
				1493
				1494	Args:
				1495	filename: The name of the current file.
				1496	line: The text of the line to check.
				1497	linenum: The number of the line to check.
				1498	error: The function to call with any errors found.
				1499	"""
				1500
				1501	# Since function calls often occur inside if/for/while/switch
				1502	# expressions - which have their own, more liberal conventions - we
				1503	# first see if we should be looking inside such an expression for a
				1504	# function call, to which we can apply more strict standards.
				1505	fncall = line # if there's no control flow construct, look at whole line
				1506	for pattern in (r'\bif\s$(.)$\s*{',
				1507	r'\bfor\s$(.)$\s*{',
				1508	r'\bwhile\s$(.)$\s*[{;]',
				1509	r'\bswitch\s$(.)$\s*{'):
				1510	match = Search(pattern, line)
				1511	if match:
				1512	fncall = match.group(1) # look inside the parens for function calls
				1513	break
				1514
				1515	# Except in if/for/while/switch, there should never be space
				1516	# immediately inside parens (eg "f( 3, 4 )"). We make an exception
				1517	# for nested parens ( (a+b) + c ). Likewise, there should never be
				1518	# a space before a ( when it's a function argument. I assume it's a
				1519	# function argument when the char before the whitespace is legal in
				1520	# a function name (alnum + _) and we're not starting a macro. Also ignore
				1521	# pointers and references to arrays and functions coz they're too tricky:
				1522	# we use a very simple way to recognize these:
				1523	# " (something)(maybe-something)" or
				1524	# " (something)(maybe-something," or
				1525	# " (something)[something]"
				1526	# Note that we assume the contents of [] to be short enough that
				1527	# they'll never need to wrap.
				1528	if ( # Ignore control structures.
				1529	not Search(r'\b(if\|for\|while\|switch\|return\|delete)\b', fncall) and
				1530	# Ignore pointers/references to functions.
				1531	not Search(r' $[^)]+$$[^)]*($\|,$)', fncall) and
				1532	# Ignore pointers/references to arrays.
				1533	not Search(r' $[^)]+$\[[^\]]+\]', fncall)):
				1534	if Search(r'\w\s\(\s(?!\s\\$)', fncall): # a ( used for a fn call
				1535	error(filename, linenum, 'whitespace/parens', 4,
				1536	'Extra space after ( in function call')
				1537	elif Search(r'$\s+(?!(\s*\$\|\()', fncall):
				1538	error(filename, linenum, 'whitespace/parens', 2,
				1539	'Extra space after (')
				1540	if (Search(r'\w\s+\(', fncall) and
				1541	not Search(r'#\s*define\|typedef', fncall)):
				1542	error(filename, linenum, 'whitespace/parens', 4,
				1543	'Extra space before ( in function call')
				1544	# If the ) is followed only by a newline or a { + newline, assume it's
				1545	# part of a control statement (if/while/etc), and don't complain
				1546	if Search(r'[^)]\s+\)\s*[^{\s]', fncall):
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1547	# If the closing parenthesis is preceded by only whitespaces,
				1548	# try to give a more descriptive error message.
				1549	if Search(r'^\s+\)', fncall):
				1550	error(filename, linenum, 'whitespace/parens', 2,
				1551	'Closing ) should be moved to the previous line')
				1552	else:
				1553	error(filename, linenum, 'whitespace/parens', 2,
				1554	'Extra space before )')
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1555
				1556
				1557	def IsBlankLine(line):
				1558	"""Returns true if the given line is blank.
				1559
				1560	We consider a line to be blank if the line is empty or consists of
				1561	only white spaces.
				1562
				1563	Args:
				1564	line: A line of a string.
				1565
				1566	Returns:
				1567	True, if the given line is blank.
				1568	"""
				1569	return not line or line.isspace()
				1570
				1571
				1572	def CheckForFunctionLengths(filename, clean_lines, linenum,
				1573	function_state, error):
				1574	"""Reports for long function bodies.
				1575
				1576	For an overview why this is done, see:
				1577	http://google-styleguide.googlecode.com/svn/trunk/cppguide.xml#Write_Short_Functions
				1578
				1579	Uses a simplistic algorithm assuming other style guidelines
				1580	(especially spacing) are followed.
				1581	Only checks unindented functions, so class members are unchecked.
				1582	Trivial bodies are unchecked, so constructors with huge initializer lists
				1583	may be missed.
				1584	Blank/comment lines are not counted so as to avoid encouraging the removal
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1585	of vertical space and comments just to get through a lint check.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1586	NOLINT on the last line of a function disables this check.
				1587
				1588	Args:
				1589	filename: The name of the current file.
				1590	clean_lines: A CleansedLines instance containing the file.
				1591	linenum: The number of the line to check.
				1592	function_state: Current function name and lines in body so far.
				1593	error: The function to call with any errors found.
				1594	"""
				1595	lines = clean_lines.lines
				1596	line = lines[linenum]
				1597	raw = clean_lines.raw_lines
				1598	raw_line = raw[linenum]
				1599	joined_line = ''
				1600
				1601	starting_func = False
				1602	regexp = r'(\w(\w\|::\|\\|\&\|\s))\(' # decls * & space::name( ...
				1603	match_result = Match(regexp, line)
				1604	if match_result:
				1605	# If the name is all caps and underscores, figure it's a macro and
				1606	# ignore it, unless it's TEST or TEST_F.
				1607	function_name = match_result.group(1).split()[-1]
				1608	if function_name == 'TEST' or function_name == 'TEST_F' or (
				1609	not Match(r'[A-Z_]+$', function_name)):
				1610	starting_func = True
				1611
				1612	if starting_func:
				1613	body_found = False
				1614	for start_linenum in xrange(linenum, clean_lines.NumLines()):
				1615	start_line = lines[start_linenum]
				1616	joined_line += ' ' + start_line.lstrip()
				1617	if Search(r'(;\|})', start_line): # Declarations and trivial functions
				1618	body_found = True
				1619	break # ... ignore
				1620	elif Search(r'{', start_line):
				1621	body_found = True
				1622	function = Search(r'((\w\|:)*)\(', line).group(1)
				1623	if Match(r'TEST', function): # Handle TEST... macros
				1624	parameter_regexp = Search(r'($.*$)', joined_line)
				1625	if parameter_regexp: # Ignore bad syntax
				1626	function += parameter_regexp.group(1)
				1627	else:
				1628	function += '()'
				1629	function_state.Begin(function)
				1630	break
				1631	if not body_found:
				1632	# No body for the function (or evidence of a non-function) was found.
				1633	error(filename, linenum, 'readability/fn_size', 5,
				1634	'Lint failed to find start of function body.')
				1635	elif Match(r'^\}\s*$', line): # function end
				1636	function_state.Check(error, filename, linenum)
				1637	function_state.End()
				1638	elif not Match(r'^\s*$', line):
				1639	function_state.Count() # Count non-blank/non-comment lines.
				1640
				1641
				1642	_RE_PATTERN_TODO = re.compile(r'^//(\s*)TODO($.+?$)?:?(\s\|$)?')
				1643
				1644
				1645	def CheckComment(comment, filename, linenum, error):
				1646	"""Checks for common mistakes in TODO comments.
				1647
				1648	Args:
				1649	comment: The text of the comment from the line in question.
				1650	filename: The name of the current file.
				1651	linenum: The number of the line to check.
				1652	error: The function to call with any errors found.
				1653	"""
				1654	match = _RE_PATTERN_TODO.match(comment)
				1655	if match:
				1656	# One whitespace is correct; zero whitespace is handled elsewhere.
				1657	leading_whitespace = match.group(1)
				1658	if len(leading_whitespace) > 1:
				1659	error(filename, linenum, 'whitespace/todo', 2,
				1660	'Too many spaces before TODO')
				1661
				1662	username = match.group(2)
				1663	if not username:
				1664	error(filename, linenum, 'readability/todo', 2,
				1665	'Missing username in TODO; it should look like '
				1666	'"// TODO(my_username): Stuff."')
				1667
				1668	middle_whitespace = match.group(3)
				1669	# Comparisons made explicit for correctness -- pylint: disable-msg=C6403
				1670	if middle_whitespace != ' ' and middle_whitespace != '':
				1671	error(filename, linenum, 'whitespace/todo', 2,
				1672	'TODO(my_username) should be followed by a space')
				1673
				1674
				1675	def CheckSpacing(filename, clean_lines, linenum, error):
				1676	"""Checks for the correctness of various spacing issues in the code.
				1677
				1678	Things we check for: spaces around operators, spaces after
				1679	if/for/while/switch, no spaces around parens in function calls, two
				1680	spaces between code and comment, don't start a block with a blank
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1681	line, don't end a function with a blank line, don't add a blank line
				1682	after public/protected/private, don't have too many blank lines in a row.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1683
				1684	Args:
				1685	filename: The name of the current file.
				1686	clean_lines: A CleansedLines instance containing the file.
				1687	linenum: The number of the line to check.
				1688	error: The function to call with any errors found.
				1689	"""
				1690
				1691	raw = clean_lines.raw_lines
				1692	line = raw[linenum]
				1693
				1694	# Before nixing comments, check if the line is blank for no good
				1695	# reason. This includes the first line after a block is opened, and
				1696	# blank lines at the end of a function (ie, right before a line like '}'
				1697	if IsBlankLine(line):
				1698	elided = clean_lines.elided
				1699	prev_line = elided[linenum - 1]
				1700	prevbrace = prev_line.rfind('{')
				1701	# TODO(unknown): Don't complain if line before blank line, and line after,
				1702	# both start with alnums and are indented the same amount.
				1703	# This ignores whitespace at the start of a namespace block
				1704	# because those are not usually indented.
				1705	if (prevbrace != -1 and prev_line[prevbrace:].find('}') == -1
				1706	and prev_line[:prevbrace].find('namespace') == -1):
				1707	# OK, we have a blank line at the start of a code block. Before we
				1708	# complain, we check if it is an exception to the rule: The previous
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1709	# non-empty line has the parameters of a function header that are indented
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1710	# 4 spaces (because they did not fit in a 80 column line when placed on
				1711	# the same line as the function name). We also check for the case where
				1712	# the previous line is indented 6 spaces, which may happen when the
				1713	# initializers of a constructor do not fit into a 80 column line.
				1714	exception = False
				1715	if Match(r' {6}\w', prev_line): # Initializer list?
				1716	# We are looking for the opening column of initializer list, which
				1717	# should be indented 4 spaces to cause 6 space indentation afterwards.
				1718	search_position = linenum-2
				1719	while (search_position >= 0
				1720	and Match(r' {6}\w', elided[search_position])):
				1721	search_position -= 1
				1722	exception = (search_position >= 0
				1723	and elided[search_position][:5] == ' :')
				1724	else:
				1725	# Search for the function arguments or an initializer list. We use a
				1726	# simple heuristic here: If the line is indented 4 spaces; and we have a
				1727	# closing paren, without the opening paren, followed by an opening brace
				1728	# or colon (for initializer lists) we assume that it is the last line of
				1729	# a function header. If we have a colon indented 4 spaces, it is an
				1730	# initializer list.
				1731	exception = (Match(r' {4}\w[^$]$\s(const\s)?(\{\s$\|:)',
				1732	prev_line)
				1733	or Match(r' {4}:', prev_line))
				1734
				1735	if not exception:
				1736	error(filename, linenum, 'whitespace/blank_line', 2,
				1737	'Blank line at the start of a code block. Is this needed?')
				1738	# This doesn't ignore whitespace at the end of a namespace block
				1739	# because that is too hard without pairing open/close braces;
				1740	# however, a special exception is made for namespace closing
				1741	# brackets which have a comment containing "namespace".
				1742	#
				1743	# Also, ignore blank lines at the end of a block in a long if-else
				1744	# chain, like this:
				1745	# if (condition1) {
				1746	# // Something followed by a blank line
				1747	#
				1748	# } else if (condition2) {
				1749	# // Something else
				1750	# }
				1751	if linenum + 1 < clean_lines.NumLines():
				1752	next_line = raw[linenum + 1]
				1753	if (next_line
				1754	and Match(r'\s*}', next_line)
				1755	and next_line.find('namespace') == -1
				1756	and next_line.find('} else ') == -1):
				1757	error(filename, linenum, 'whitespace/blank_line', 3,
				1758	'Blank line at the end of a code block. Is this needed?')
				1759
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1760	matched = Match(r'\s*(public\|protected\|private):', prev_line)
				1761	if matched:
				1762	error(filename, linenum, 'whitespace/blank_line', 3,
				1763	'Do not leave a blank line after "%s:"' % matched.group(1))
				1764
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1765	# Next, we complain if there's a comment too near the text
				1766	commentpos = line.find('//')
				1767	if commentpos != -1:
				1768	# Check if the // may be in quotes. If so, ignore it
				1769	# Comparisons made explicit for clarity -- pylint: disable-msg=C6403
				1770	if (line.count('"', 0, commentpos) -
				1771	line.count('\\"', 0, commentpos)) % 2 == 0: # not in quotes
				1772	# Allow one space for new scopes, two spaces otherwise:
				1773	if (not Match(r'^\s*{ //', line) and
				1774	((commentpos >= 1 and
				1775	line[commentpos-1] not in string.whitespace) or
				1776	(commentpos >= 2 and
				1777	line[commentpos-2] not in string.whitespace))):
				1778	error(filename, linenum, 'whitespace/comments', 2,
				1779	'At least two spaces is best between code and comments')
				1780	# There should always be a space between the // and the comment
				1781	commentend = commentpos + 2
				1782	if commentend < len(line) and not line[commentend] == ' ':
				1783	# but some lines are exceptions -- e.g. if they're big
				1784	# comment delimiters like:
				1785	# //----------------------------------------------------------
				1786	# or are an empty C++ style Doxygen comment, like:
				1787	# ///
				1788	# or they begin with multiple slashes followed by a space:
				1789	# //////// Header comment
				1790	match = (Search(r'[=/-]{4,}\s*$', line[commentend:]) or
				1791	Search(r'^/$', line[commentend:]) or
				1792	Search(r'^/+ ', line[commentend:]))
				1793	if not match:
				1794	error(filename, linenum, 'whitespace/comments', 4,
				1795	'Should have a space between // and comment')
				1796	CheckComment(line[commentpos:], filename, linenum, error)
				1797
				1798	line = clean_lines.elided[linenum] # get rid of comments and strings
				1799
				1800	# Don't try to do spacing checks for operator methods
				1801	line = re.sub(r'operator(==\|!=\|<\|<<\|<=\|>=\|>>\|>)\(', 'operator\(', line)
				1802
				1803	# We allow no-spaces around = within an if: "if ( (a=Foo()) == 0 )".
				1804	# Otherwise not. Note we only check for non-spaces on both sides;
				1805	# sometimes people put non-spaces on one side when aligning ='s among
				1806	# many lines (not that this is behavior that I approve of...)
				1807	if Search(r'[\w.]=[\w.]', line) and not Search(r'\b(if\|while) ', line):
				1808	error(filename, linenum, 'whitespace/operators', 4,
				1809	'Missing spaces around =')
				1810
				1811	# It's ok not to have spaces around binary operators like + - * /, but if
				1812	# there's too little whitespace, we get concerned. It's hard to tell,
				1813	# though, so we punt on this one for now. TODO.
				1814
				1815	# You should always have whitespace around binary operators.
				1816	# Alas, we can't test < or > because they're legitimately used sans spaces
				1817	# (a->b, vector<int> a). The only time we can tell is a < with no >, and
				1818	# only if it's not template params list spilling into the next line.
				1819	match = Search(r'[^<>=!\s](==\|!=\|<=\|>=)[^<>=!\s]', line)
				1820	if not match:
				1821	# Note that while it seems that the '<[^<]*' term in the following
				1822	# regexp could be simplified to '<.*', which would indeed match
				1823	# the same class of strings, the [^<] means that searching for the
				1824	# regexp takes linear rather than quadratic time.
				1825	if not Search(r'<[^<],\s$', line): # template params spill
				1826	match = Search(r'[^<>=!\s](<)[^<>=!\s]([^>]\|->)*$', line)
				1827	if match:
				1828	error(filename, linenum, 'whitespace/operators', 3,
				1829	'Missing spaces around %s' % match.group(1))
				1830	# We allow no-spaces around << and >> when used like this: 10<<20, but
				1831	# not otherwise (particularly, not when used as streams)
				1832	match = Search(r'[^0-9\s](<<\|>>)[^0-9\s]', line)
				1833	if match:
				1834	error(filename, linenum, 'whitespace/operators', 3,
				1835	'Missing spaces around %s' % match.group(1))
				1836
				1837	# There shouldn't be space around unary operators
				1838	match = Search(r'(!\s\|~\s\|[\s]--[\s;]\|[\s]\+\+[\s;])', line)
				1839	if match:
				1840	error(filename, linenum, 'whitespace/operators', 4,
				1841	'Extra space for operator %s' % match.group(1))
				1842
				1843	# A pet peeve of mine: no spaces after an if, while, switch, or for
				1844	match = Search(r' (if\(\|for\(\|while\(\|switch\()', line)
				1845	if match:
				1846	error(filename, linenum, 'whitespace/parens', 5,
				1847	'Missing space before ( in %s' % match.group(1))
				1848
				1849	# For if/for/while/switch, the left and right parens should be
				1850	# consistent about how many spaces are inside the parens, and
				1851	# there should either be zero or one spaces inside the parens.
				1852	# We don't want: "if ( foo)" or "if ( foo )".
				1853	# Exception: "for ( ; foo; bar)" and "for (foo; bar; )" are allowed.
				1854	match = Search(r'\b(if\|for\|while\|switch)\s*'
				1855	r'$([ ])(.).[^ ]+([ ])$\s{\s*$',
				1856	line)
				1857	if match:
				1858	if len(match.group(2)) != len(match.group(4)):
				1859	if not (match.group(3) == ';' and
				1860	len(match.group(2)) == 1 + len(match.group(4)) or
				1861	not match.group(2) and Search(r'\bfor\s$.; $', line)):
				1862	error(filename, linenum, 'whitespace/parens', 5,
				1863	'Mismatching spaces inside () in %s' % match.group(1))
				1864	if not len(match.group(2)) in [0, 1]:
				1865	error(filename, linenum, 'whitespace/parens', 5,
				1866	'Should have zero or one spaces inside ( and ) in %s' %
				1867	match.group(1))
				1868
				1869	# You should always have a space after a comma (either as fn arg or operator)
				1870	if Search(r',[^\s]', line):
				1871	error(filename, linenum, 'whitespace/comma', 3,
				1872	'Missing space after ,')
				1873
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1874	# You should always have a space after a semicolon
				1875	# except for few corner cases
				1876	# TODO(unknown): clarify if 'if (1) { return 1;}' is requires one more
				1877	# space after ;
				1878	if Search(r';[^\s};\\)/]', line):
				1879	error(filename, linenum, 'whitespace/semicolon', 3,
				1880	'Missing space after ;')
				1881
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1882	# Next we will look for issues with function calls.
				1883	CheckSpacingForFunctionCall(filename, line, linenum, error)
				1884
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	1885	# Except after an opening paren, or after another opening brace (in case of
				1886	# an initializer list, for instance), you should have spaces before your
				1887	# braces. And since you should never have braces at the beginning of a line,
				1888	# this is an easy test.
				1889	if Search(r'[^ ({]{', line):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	1890	error(filename, linenum, 'whitespace/braces', 5,
				1891	'Missing space before {')
				1892
				1893	# Make sure '} else {' has spaces.
				1894	if Search(r'}else', line):
				1895	error(filename, linenum, 'whitespace/braces', 5,
				1896	'Missing space before else')
				1897
				1898	# You shouldn't have spaces before your brackets, except maybe after
				1899	# 'delete []' or 'new char * []'.
				1900	if Search(r'\w\s+\[', line) and not Search(r'delete\s+\[', line):
				1901	error(filename, linenum, 'whitespace/braces', 5,
				1902	'Extra space before [')
				1903
				1904	# You shouldn't have a space before a semicolon at the end of the line.
				1905	# There's a special case for "for" since the style guide allows space before
				1906	# the semicolon there.
				1907	if Search(r':\s;\s$', line):
				1908	error(filename, linenum, 'whitespace/semicolon', 5,
				1909	'Semicolon defining empty statement. Use { } instead.')
				1910	elif Search(r'^\s;\s$', line):
				1911	error(filename, linenum, 'whitespace/semicolon', 5,
				1912	'Line contains only semicolon. If this should be an empty statement, '
				1913	'use { } instead.')
				1914	elif (Search(r'\s+;\s*$', line) and
				1915	not Search(r'\bfor\b', line)):
				1916	error(filename, linenum, 'whitespace/semicolon', 5,
				1917	'Extra space before last semicolon. If this should be an empty '
				1918	'statement, use { } instead.')
				1919
				1920
def CheckSectionSpacing(filename, clean_lines, class_info, linenum, error):
  """Checks for additional blank line issues related to sections.

  Currently the only thing checked here is blank line before protected/private.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    class_info: A _ClassInfo objects.
    linenum: The number of the line to check.
    error: The function to call with any errors found.
  """
  # Skip checks if the class is small, where small means 25 lines or less.
  # 25 lines seems like a good cutoff since that's the usual height of
  # terminals, and any class that can't fit in one screen can't really
  # be considered "small".
  #
  # Also skip checks if we are on the first line.  This accounts for
  # classes that look like
  #   class Foo { public: ... };
  #
  # If we didn't find the end of the class, last_line would be zero,
  # and the check will be skipped by the first condition.
  if (class_info.last_line - class_info.linenum <= 24 or
      linenum <= class_info.linenum):
    return

  matched = Match(r'\s*(public|protected|private):', clean_lines.lines[linenum])
  if matched:
    # Issue warning if the line before public/protected/private was
    # not a blank line, but don't do this if the previous line contains
    # "class" or "struct".  This can happen two ways:
    #  - We are at the beginning of the class.
    #  - We are forward-declaring an inner class that is semantically
    #    private, but needed to be public for implementation reasons.
    prev_line = clean_lines.lines[linenum - 1]
    if (not IsBlankLine(prev_line) and
        not Search(r'\b(class|struct)\b', prev_line)):
      # Try a bit harder to find the beginning of the class.  This is to
      # account for multi-line base-specifier lists, e.g.:
      #   class Derived
      #       : public Base {
      end_class_head = class_info.linenum
      for i in range(class_info.linenum, linenum):
        if Search(r'\{\s*$', clean_lines.lines[i]):
          end_class_head = i
          break
      # Only complain when the access specifier is not the first line
      # directly after the class head.
      if end_class_head < linenum - 1:
        error(filename, linenum, 'whitespace/blank_line', 3,
              '"%s:" should be preceded by a blank line' % matched.group(1))
				1971
				1972
def GetPreviousNonBlankLine(clean_lines, linenum):
  """Finds the closest non-blank line above the given line.

  The search walks upwards through clean_lines.elided, starting at the line
  just before linenum.

  Args:
    clean_lines: A CleansedLines instance containing the file contents.
    linenum: The number of the line to check.

  Returns:
    A tuple with two elements.  The first element is the contents of the last
    non-blank line before the current line, or the empty string if this is the
    first non-blank line.  The second is the line number of that line, or -1
    if this is the first non-blank line.
  """
  index = linenum
  while index > 0:
    index -= 1
    candidate = clean_lines.elided[index]
    if IsBlankLine(candidate):
      continue
    return (candidate, index)
  # Ran off the top of the file without finding any content.
  return ('', -1)
				1994
				1995
				1996	def CheckBraces(filename, clean_lines, linenum, error):
				1997	"""Looks for misplaced braces (e.g. at the end of line).
				1998
				1999	Args:
				2000	filename: The name of the current file.
				2001	clean_lines: A CleansedLines instance containing the file.
				2002	linenum: The number of the line to check.
				2003	error: The function to call with any errors found.
				2004	"""
				2005
				2006	line = clean_lines.elided[linenum] # get rid of comments and strings
				2007
				2008	if Match(r'\s{\s$', line):
				2009	# We allow an open brace to start a line in the case where someone
				2010	# is using braces in a block to explicitly create a new scope,
				2011	# which is commonly used to control the lifetime of
				2012	# stack-allocated variables. We don't detect this perfectly: we
				2013	# just don't complain if the last non-whitespace character on the
				2014	# previous non-blank line is ';', ':', '{', or '}'.
				2015	prevline = GetPreviousNonBlankLine(clean_lines, linenum)[0]
				2016	if not Search(r'[;:}{]\s*$', prevline):
				2017	error(filename, linenum, 'whitespace/braces', 4,
				2018	'{ should almost always be at the end of the previous line')
				2019
				2020	# An else clause should be on the same line as the preceding closing brace.
				2021	if Match(r'\selse\s', line):
				2022	prevline = GetPreviousNonBlankLine(clean_lines, linenum)[0]
				2023	if Match(r'\s}\s$', prevline):
				2024	error(filename, linenum, 'whitespace/newline', 4,
				2025	'An else should appear on the same line as the preceding }')
				2026
				2027	# If braces come on one side of an else, they should be on both.
				2028	# However, we have to worry about "else if" that spans multiple lines!
				2029	if Search(r'}\selse[^{]$', line) or Match(r'[^}]else\s{', line):
				2030	if Search(r'}\selse if([^{])$', line): # could be multi-line if
				2031	# find the ( after the if
				2032	pos = line.find('else if')
				2033	pos = line.find('(', pos)
				2034	if pos > 0:
				2035	(endline, _, endpos) = CloseExpression(clean_lines, linenum, pos)
				2036	if endline[endpos:].find('{') == -1: # must be brace after if
				2037	error(filename, linenum, 'readability/braces', 5,
				2038	'If an else has a brace on one side, it should have it on both')
				2039	else: # common case: else not followed by a multi-line if
				2040	error(filename, linenum, 'readability/braces', 5,
				2041	'If an else has a brace on one side, it should have it on both')
				2042
				2043	# Likewise, an else should never have the else clause on the same line
				2044	if Search(r'\belse [^\s{]', line) and not Search(r'\belse if\b', line):
				2045	error(filename, linenum, 'whitespace/newline', 4,
				2046	'Else clause should never be on same line as else (use 2 lines)')
				2047
				2048	# In the same way, a do/while should never be on one line
				2049	if Match(r'\s*do [^\s{]', line):
				2050	error(filename, linenum, 'whitespace/newline', 4,
				2051	'do/while clauses should not be on a single line')
				2052
				2053	# Braces shouldn't be followed by a ; unless they're defining a struct
				2054	# or initializing an array.
				2055	# We can't tell in general, but we can for some common cases.
				2056	prevlinenum = linenum
				2057	while True:
				2058	(prevline, prevlinenum) = GetPreviousNonBlankLine(clean_lines, prevlinenum)
				2059	if Match(r'\s+{.}\s;', line) and not prevline.count(';'):
				2060	line = prevline + line
				2061	else:
				2062	break
				2063	if (Search(r'{.}\s;', line) and
				2064	line.count('{') == line.count('}') and
				2065	not Search(r'struct\|class\|enum\|\s=\s{', line)):
				2066	error(filename, linenum, 'readability/braces', 4,
				2067	"You don't need a ; after a }")
				2068
				2069
				2070	def ReplaceableCheck(operator, macro, line):
				2071	"""Determine whether a basic CHECK can be replaced with a more specific one.
				2072
				2073	For example suggest using CHECK_EQ instead of CHECK(a == b) and
				2074	similarly for CHECK_GE, CHECK_GT, CHECK_LE, CHECK_LT, CHECK_NE.
				2075
				2076	Args:
				2077	operator: The C++ operator used in the CHECK.
				2078	macro: The CHECK or EXPECT macro being called.
				2079	line: The current source line.
				2080
				2081	Returns:
				2082	True if the CHECK can be replaced with a more specific one.
				2083	"""
				2084
				2085	# This matches decimal and hex integers, strings, and chars (in that order).
				2086	match_constant = r'([-+]?(\d+\|0[xX][0-9a-fA-F]+)[lLuU]{0,3}\|"."\|\'.\')'
				2087
				2088	# Expression to match two sides of the operator with something that
				2089	# looks like a literal, since CHECK(x == iterator) won't compile.
				2090	# This means we can't catch all the cases where a more specific
				2091	# CHECK is possible, but it's less annoying than dealing with
				2092	# extraneous warnings.
				2093	match_this = (r'\s' + macro + r'\((\s' +
				2094	match_constant + r'\s' + operator + r'[^<>].\|'
				2095	r'.[^<>]' + operator + r'\s' + match_constant +
				2096	r'\s*\))')
				2097
				2098	# Don't complain about CHECK(x == NULL) or similar because
				2099	# CHECK_EQ(x, NULL) won't compile (requires a cast).
				2100	# Also, don't complain about more complex boolean expressions
				2101	# involving && or \|\| such as CHECK(a == b \|\| c == d).
				2102	return Match(match_this, line) and not Search(r'NULL\|&&\|\\|\\|', line)
				2103
				2104
				2105	def CheckCheck(filename, clean_lines, linenum, error):
				2106	"""Checks the use of CHECK and EXPECT macros.
				2107
				2108	Args:
				2109	filename: The name of the current file.
				2110	clean_lines: A CleansedLines instance containing the file.
				2111	linenum: The number of the line to check.
				2112	error: The function to call with any errors found.
				2113	"""
				2114
				2115	# Decide the set of replacement macros that should be suggested
				2116	raw_lines = clean_lines.raw_lines
				2117	current_macro = ''
				2118	for macro in _CHECK_MACROS:
				2119	if raw_lines[linenum].find(macro) >= 0:
				2120	current_macro = macro
				2121	break
				2122	if not current_macro:
				2123	# Don't waste time here if line doesn't contain 'CHECK' or 'EXPECT'
				2124	return
				2125
				2126	line = clean_lines.elided[linenum] # get rid of comments and strings
				2127
				2128	# Encourage replacing plain CHECKs with CHECK_EQ/CHECK_NE/etc.
				2129	for operator in ['==', '!=', '>=', '>', '<=', '<']:
				2130	if ReplaceableCheck(operator, current_macro, line):
				2131	error(filename, linenum, 'readability/check', 2,
				2132	'Consider using %s instead of %s(a %s b)' % (
				2133	_CHECK_REPLACEMENT[current_macro][operator],
				2134	current_macro, operator))
				2135	break
				2136
				2137
				2138	def GetLineWidth(line):
				2139	"""Determines the width of the line in column positions.
				2140
				2141	Args:
				2142	line: A string, which may be a Unicode string.
				2143
				2144	Returns:
				2145	The width of the line in column positions, accounting for Unicode
				2146	combining characters and wide characters.
				2147	"""
				2148	if isinstance(line, unicode):
				2149	width = 0
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2150	for uc in unicodedata.normalize('NFC', line):
				2151	if unicodedata.east_asian_width(uc) in ('W', 'F'):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2152	width += 2
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2153	elif not unicodedata.combining(uc):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2154	width += 1
				2155	return width
				2156	else:
				2157	return len(line)
				2158
				2159
def CheckStyle(filename, clean_lines, linenum, file_extension, class_state,
               error):
  """Checks rules from the 'C++ style rules' section of cppguide.html.

  Most of these rules are hard to test (naming, comment style), but we
  do what we can. In particular we check for 2-space indents, line lengths,
  tab usage, spaces inside code, etc.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    file_extension: The extension (without the dot) of the filename.
    class_state: Class-tracking state. When it is truthy and its
      classinfo_stack is non-empty, the innermost entry is handed to
      CheckSectionSpacing.
    error: The function to call with any errors found.
  """

  raw_lines = clean_lines.raw_lines
  line = raw_lines[linenum]

  if line.find('\t') != -1:
    error(filename, linenum, 'whitespace/tab', 1,
          'Tab found; better to use spaces')

  # One or three blank spaces at the beginning of the line is weird; it's
  # hard to reconcile that with 2-space indents.
  # NOTE: here are the conditions rob pike used for his tests. Mine aren't
  # as sophisticated, but it may be worth becoming so: RLENGTH==initial_spaces
  # if(RLENGTH > 20) complain = 0;
  # if(match($0, " +(error|private|public|protected):")) complain = 0;
  # if(match(prev, "&& *$")) complain = 0;
  # if(match(prev, "\\|\\| *$")) complain = 0;
  # if(match(prev, "[\",=><] *$")) complain = 0;
  # if(match($0, " <<")) complain = 0;
  # if(match(prev, " +for \\(")) complain = 0;
  # if(prevodd && match(prevprev, " +for \\(")) complain = 0;
  initial_spaces = 0
  cleansed_line = clean_lines.elided[linenum]
  while initial_spaces < len(line) and line[initial_spaces] == ' ':
    initial_spaces += 1
  if line and line[-1].isspace():
    error(filename, linenum, 'whitespace/end_of_line', 4,
          'Line ends in whitespace. Consider deleting these extra spaces.')
  # There are certain situations we allow one space, notably for labels
  elif ((initial_spaces == 1 or initial_spaces == 3) and
        not Match(r'\s*\w+\s*:\s*$', cleansed_line)):
    error(filename, linenum, 'whitespace/indent', 3,
          'Weird number of spaces at line-start. '
          'Are you using a 2-space indent?')
  # Labels should always be indented at least one space.
  elif not initial_spaces and line[:2] != '//' and Search(r'[^:]:\s*$',
                                                          line):
    error(filename, linenum, 'whitespace/labels', 4,
          'Labels should always be indented at least one space. '
          'If this is a member-initializer list in a constructor or '
          'the base class list in a class definition, the colon should '
          'be on the following line.')

  # Check if the line is a header guard.
  is_header_guard = False
  if file_extension == 'h':
    cppvar = GetHeaderGuardCPPVariable(filename)
    if (line.startswith('#ifndef %s' % cppvar) or
        line.startswith('#define %s' % cppvar) or
        line.startswith('#endif // %s' % cppvar)):
      is_header_guard = True
  # #include lines and header guards can be long, since there's no clean way to
  # split them.
  #
  # URLs can be long too. It's possible to split these, but it makes them
  # harder to cut&paste.
  #
  # The "$Id:...$" comment may also get very long without it being the
  # developer's fault.
  if (not line.startswith('#include') and not is_header_guard and
      not Match(r'^\s*//.*http(s?)://\S*$', line) and
      not Match(r'^// \$Id:.*#[0-9]+ \$$', line)):
    line_width = GetLineWidth(line)
    # Two thresholds: a low-confidence nudge above 80 columns and a
    # higher-confidence complaint above 100.
    if line_width > 100:
      error(filename, linenum, 'whitespace/line_length', 4,
            'Lines should very rarely be longer than 100 characters')
    elif line_width > 80:
      error(filename, linenum, 'whitespace/line_length', 2,
            'Lines should be <= 80 characters long')

  if (cleansed_line.count(';') > 1 and
      # for loops are allowed two ;'s (and may run over two lines).
      cleansed_line.find('for') == -1 and
      (GetPreviousNonBlankLine(clean_lines, linenum)[0].find('for') == -1 or
       GetPreviousNonBlankLine(clean_lines, linenum)[0].find(';') != -1) and
      # It's ok to have many commands in a switch case that fits in 1 line
      not ((cleansed_line.find('case ') != -1 or
            cleansed_line.find('default:') != -1) and
           cleansed_line.find('break;') != -1)):
    error(filename, linenum, 'whitespace/newline', 4,
          'More than one command on the same line')

  # Some more style checks
  CheckBraces(filename, clean_lines, linenum, error)
  CheckSpacing(filename, clean_lines, linenum, error)
  CheckCheck(filename, clean_lines, linenum, error)
  if class_state and class_state.classinfo_stack:
    CheckSectionSpacing(filename, clean_lines,
                        class_state.classinfo_stack[-1], linenum, error)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2264
				2265
				2266	_RE_PATTERN_INCLUDE_NEW_STYLE = re.compile(r'#include +"[^/]+\.h"')
				2267	_RE_PATTERN_INCLUDE = re.compile(r'^\s#\sinclude\s([<"])([^>"])[>"].*$')
				2268	# Matches the first component of a filename delimited by -s and _s. That is:
				2269	# _RE_FIRST_COMPONENT.match('foo').group(0) == 'foo'
				2270	# _RE_FIRST_COMPONENT.match('foo.cc').group(0) == 'foo'
				2271	# _RE_FIRST_COMPONENT.match('foo-bar_baz.cc').group(0) == 'foo'
				2272	# _RE_FIRST_COMPONENT.match('foo_bar-baz.cc').group(0) == 'foo'
				2273	_RE_FIRST_COMPONENT = re.compile(r'^[^-_.]+')
				2274
				2275
				2276	def _DropCommonSuffixes(filename):
				2277	"""Drops common suffixes like _test.cc or -inl.h from filename.
				2278
				2279	For example:
				2280	>>> _DropCommonSuffixes('foo/foo-inl.h')
				2281	'foo/foo'
				2282	>>> _DropCommonSuffixes('foo/bar/foo.cc')
				2283	'foo/bar/foo'
				2284	>>> _DropCommonSuffixes('foo/foo_internal.h')
				2285	'foo/foo'
				2286	>>> _DropCommonSuffixes('foo/foo_unusualinternal.h')
				2287	'foo/foo_unusualinternal'
				2288
				2289	Args:
				2290	filename: The input filename.
				2291
				2292	Returns:
				2293	The filename with the common suffix removed.
				2294	"""
				2295	for suffix in ('test.cc', 'regtest.cc', 'unittest.cc',
				2296	'inl.h', 'impl.h', 'internal.h'):
				2297	if (filename.endswith(suffix) and len(filename) > len(suffix) and
				2298	filename[-len(suffix) - 1] in ('-', '_')):
				2299	return filename[:-len(suffix) - 1]
				2300	return os.path.splitext(filename)[0]
				2301
				2302
				2303	def _IsTestFilename(filename):
				2304	"""Determines if the given filename has a suffix that identifies it as a test.
				2305
				2306	Args:
				2307	filename: The input filename.
				2308
				2309	Returns:
				2310	True if 'filename' looks like a test, False otherwise.
				2311	"""
				2312	if (filename.endswith('_test.cc') or
				2313	filename.endswith('_unittest.cc') or
				2314	filename.endswith('_regtest.cc')):
				2315	return True
				2316	else:
				2317	return False
				2318
				2319
				2320	def _ClassifyInclude(fileinfo, include, is_system):
				2321	"""Figures out what kind of header 'include' is.
				2322
				2323	Args:
				2324	fileinfo: The current file cpplint is running over. A FileInfo instance.
				2325	include: The path to a #included file.
				2326	is_system: True if the #include used <> rather than "".
				2327
				2328	Returns:
				2329	One of the _XXX_HEADER constants.
				2330
				2331	For example:
				2332	>>> _ClassifyInclude(FileInfo('foo/foo.cc'), 'stdio.h', True)
				2333	_C_SYS_HEADER
				2334	>>> _ClassifyInclude(FileInfo('foo/foo.cc'), 'string', True)
				2335	_CPP_SYS_HEADER
				2336	>>> _ClassifyInclude(FileInfo('foo/foo.cc'), 'foo/foo.h', False)
				2337	_LIKELY_MY_HEADER
				2338	>>> _ClassifyInclude(FileInfo('foo/foo_unknown_extension.cc'),
				2339	... 'bar/foo_other_ext.h', False)
				2340	_POSSIBLE_MY_HEADER
				2341	>>> _ClassifyInclude(FileInfo('foo/foo.cc'), 'foo/bar.h', False)
				2342	_OTHER_HEADER
				2343	"""
				2344	# This is a list of all standard c++ header files, except
				2345	# those already checked for above.
				2346	is_stl_h = include in _STL_HEADERS
				2347	is_cpp_h = is_stl_h or include in _CPP_HEADERS
				2348
				2349	if is_system:
				2350	if is_cpp_h:
				2351	return _CPP_SYS_HEADER
				2352	else:
				2353	return _C_SYS_HEADER
				2354
				2355	# If the target file and the include we're checking share a
				2356	# basename when we drop common extensions, and the include
				2357	# lives in . , then it's likely to be owned by the target file.
				2358	target_dir, target_base = (
				2359	os.path.split(_DropCommonSuffixes(fileinfo.RepositoryName())))
				2360	include_dir, include_base = os.path.split(_DropCommonSuffixes(include))
				2361	if target_base == include_base and (
				2362	include_dir == target_dir or
				2363	include_dir == os.path.normpath(target_dir + '/../public')):
				2364	return _LIKELY_MY_HEADER
				2365
				2366	# If the target and include share some initial basename
				2367	# component, it's possible the target is implementing the
				2368	# include, so it's allowed to be first, but we'll never
				2369	# complain if it's not there.
				2370	target_first_component = _RE_FIRST_COMPONENT.match(target_base)
				2371	include_first_component = _RE_FIRST_COMPONENT.match(include_base)
				2372	if (target_first_component and include_first_component and
				2373	target_first_component.group(0) ==
				2374	include_first_component.group(0)):
				2375	return _POSSIBLE_MY_HEADER
				2376
				2377	return _OTHER_HEADER
				2378
				2379
				2380
				2381	def CheckIncludeLine(filename, clean_lines, linenum, include_state, error):
				2382	"""Check rules that are applicable to #include lines.
				2383
				2384	Strings on #include lines are NOT removed from elided line, to make
				2385	certain tasks easier. However, to prevent false positives, checks
				2386	applicable to #include lines in CheckLanguage must be put here.
				2387
				2388	Args:
				2389	filename: The name of the current file.
				2390	clean_lines: A CleansedLines instance containing the file.
				2391	linenum: The number of the line to check.
				2392	include_state: An _IncludeState instance in which the headers are inserted.
				2393	error: The function to call with any errors found.
				2394	"""
				2395	fileinfo = FileInfo(filename)
				2396
				2397	line = clean_lines.lines[linenum]
				2398
				2399	# "include" should use the new style "foo/bar.h" instead of just "bar.h"
				2400	if _RE_PATTERN_INCLUDE_NEW_STYLE.search(line):
				2401	error(filename, linenum, 'build/include', 4,
				2402	'Include the directory when naming .h files')
				2403
				2404	# we shouldn't include a file more than once. actually, there are a
				2405	# handful of instances where doing so is okay, but in general it's
				2406	# not.
				2407	match = _RE_PATTERN_INCLUDE.search(line)
				2408	if match:
				2409	include = match.group(2)
				2410	is_system = (match.group(1) == '<')
				2411	if include in include_state:
				2412	error(filename, linenum, 'build/include', 4,
				2413	'"%s" already included at %s:%s' %
				2414	(include, filename, include_state[include]))
				2415	else:
				2416	include_state[include] = linenum
				2417
				2418	# We want to ensure that headers appear in the right order:
				2419	# 1) for foo.cc, foo.h (preferred location)
				2420	# 2) c system files
				2421	# 3) cpp system files
				2422	# 4) for foo.cc, foo.h (deprecated location)
				2423	# 5) other google headers
				2424	#
				2425	# We classify each include statement as one of those 5 types
				2426	# using a number of techniques. The include_state object keeps
				2427	# track of the highest type seen, and complains if we see a
				2428	# lower type after that.
				2429	error_message = include_state.CheckNextIncludeOrder(
				2430	_ClassifyInclude(fileinfo, include, is_system))
				2431	if error_message:
				2432	error(filename, linenum, 'build/include_order', 4,
				2433	'%s. Should be: %s.h, c system, c++ system, other.' %
				2434	(error_message, fileinfo.BaseName()))
				2435	if not include_state.IsInAlphabeticalOrder(include):
				2436	error(filename, linenum, 'build/include_alpha', 4,
				2437	'Include "%s" not in alphabetical order' % include)
				2438
				2439	# Look for any of the stream classes that are part of standard C++.
				2440	match = _RE_PATTERN_INCLUDE.match(line)
				2441	if match:
				2442	include = match.group(2)
				2443	if Match(r'(f\|ind\|io\|i\|o\|parse\|pf\|stdio\|str\|)?stream$', include):
				2444	# Many unit tests use cout, so we exempt them.
				2445	if not _IsTestFilename(filename):
				2446	error(filename, linenum, 'readability/streams', 3,
				2447	'Streams are highly discouraged.')
				2448
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2449
				2450	def _GetTextInside(text, start_pattern):
				2451	"""Retrieves all the text between matching open and close parentheses.
				2452
				2453	Given a string of lines and a regular expression string, retrieve all the text
				2454	following the expression and between opening punctuation symbols like
				2455	(, [, or {, and the matching close-punctuation symbol. This properly nested
				2456	occurrences of the punctuations, so for the text like
				2457	printf(a(), b(c()));
				2458	a call to _GetTextInside(text, r'printf\(') will return 'a(), b(c())'.
				2459	start_pattern must match string having an open punctuation symbol at the end.
				2460
				2461	Args:
				2462	text: The lines to extract text. Its comments and strings must be elided.
				2463	It can be single line and can span multiple lines.
				2464	start_pattern: The regexp string indicating where to start extracting
				2465	the text.
				2466	Returns:
				2467	The extracted text.
				2468	None if either the opening string or ending punctuation could not be found.
				2469	"""
				2470	# TODO(sugawarayu): Audit cpplint.py to see what places could be profitably
				2471	# rewritten to use _GetTextInside (and use inferior regexp matching today).
				2472
				2473	# Give opening punctuations to get the matching close-punctuations.
				2474	matching_punctuation = {'(': ')', '{': '}', '[': ']'}
				2475	closing_punctuation = set(matching_punctuation.itervalues())
				2476
				2477	# Find the position to start extracting text.
				2478	match = re.search(start_pattern, text, re.M)
				2479	if not match: # start_pattern not found in text.
				2480	return None
				2481	start_position = match.end(0)
				2482
				2483	assert start_position > 0, (
				2484	'start_pattern must ends with an opening punctuation.')
				2485	assert text[start_position - 1] in matching_punctuation, (
				2486	'start_pattern must ends with an opening punctuation.')
				2487	# Stack of closing punctuations we expect to have in text after position.
				2488	punctuation_stack = [matching_punctuation[text[start_position - 1]]]
				2489	position = start_position
				2490	while punctuation_stack and position < len(text):
				2491	if text[position] == punctuation_stack[-1]:
				2492	punctuation_stack.pop()
				2493	elif text[position] in closing_punctuation:
				2494	# A closing punctuation without matching opening punctuations.
				2495	return None
				2496	elif text[position] in matching_punctuation:
				2497	punctuation_stack.append(matching_punctuation[text[position]])
				2498	position += 1
				2499	if punctuation_stack:
				2500	# Opening punctuations left without matching close-punctuations.
				2501	return None
				2502	# punctuations match.
				2503	return text[start_position:position - 1]
				2504
				2505
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2506	def CheckLanguage(filename, clean_lines, linenum, file_extension, include_state,
				2507	error):
				2508	"""Checks rules from the 'C++ language rules' section of cppguide.html.
				2509
				2510	Some of these rules are hard to test (function overloading, using
				2511	uint32 inappropriately), but we do the best we can.
				2512
				2513	Args:
				2514	filename: The name of the current file.
				2515	clean_lines: A CleansedLines instance containing the file.
				2516	linenum: The number of the line to check.
				2517	file_extension: The extension (without the dot) of the filename.
				2518	include_state: An _IncludeState instance in which the headers are inserted.
				2519	error: The function to call with any errors found.
				2520	"""
				2521	# If the line is empty or consists of entirely a comment, no need to
				2522	# check it.
				2523	line = clean_lines.elided[linenum]
				2524	if not line:
				2525	return
				2526
				2527	match = _RE_PATTERN_INCLUDE.search(line)
				2528	if match:
				2529	CheckIncludeLine(filename, clean_lines, linenum, include_state, error)
				2530	return
				2531
				2532	# Create an extended_line, which is the concatenation of the current and
				2533	# next lines, for more effective checking of code that may span more than one
				2534	# line.
				2535	if linenum + 1 < clean_lines.NumLines():
				2536	extended_line = line + clean_lines.elided[linenum + 1]
				2537	else:
				2538	extended_line = line
				2539
				2540	# Make Windows paths like Unix.
				2541	fullname = os.path.abspath(filename).replace('\\', '/')
				2542
				2543	# TODO(unknown): figure out if they're using default arguments in fn proto.
				2544
				2545	# Check for non-const references in functions. This is tricky because &
				2546	# is also used to take the address of something. We allow <> for templates,
				2547	# (ignoring whatever is between the braces) and : for classes.
				2548	# These are complicated re's. They try to capture the following:
				2549	# paren (for fn-prototype start), typename, &, varname. For the const
				2550	# version, we're willing for const to be before typename or after
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2551	# Don't check the implementation on same line.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2552	fnline = line.split('{', 1)[0]
				2553	if (len(re.findall(r'\([^()]\b(?:[\w:]\|<[^()]>)+(\s?&\|&\s?)\w+', fnline)) >
				2554	len(re.findall(r'\([^()]*\bconst\s+(?:typename\s+)?(?:struct\s+)?'
				2555	r'(?:[\w:]\|<[^()]*>)+(\s?&\|&\s?)\w+', fnline)) +
				2556	len(re.findall(r'\([^()]\b(?:[\w:]\|<[^()]>)+\s+const(\s?&\|&\s?)[\w]+',
				2557	fnline))):
				2558
				2559	# We allow non-const references in a few standard places, like functions
				2560	# called "swap()" or iostream operators like "<<" or ">>".
				2561	if not Search(
				2562	r'(swap\|Swap\|operator[<>][<>])\s\(\s(?:[\w:]\|<.>)+\s&',
				2563	fnline):
				2564	error(filename, linenum, 'runtime/references', 2,
				2565	'Is this a non-const reference? '
				2566	'If so, make const or use a pointer.')
				2567
				2568	# Check to see if they're using an conversion function cast.
				2569	# I just try to capture the most common basic types, though there are more.
				2570	# Parameterless conversion functions, such as bool(), are allowed as they are
				2571	# probably a member operator declaration or default constructor.
				2572	match = Search(
				2573	r'(\bnew\s+)?\b' # Grab 'new' operator, if it's there
Elliott Hughes	08fc03a	2012-06-26 17:34:00 -0700	[diff] [blame]	2574	r'(int\|float\|double\|bool\|char\|u?int(8\|16\|32\|64)_t)\([^)]', line) # TODO(enh): upstream change to handle all stdint types.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2575	if match:
				2576	# gMock methods are defined using some variant of MOCK_METHODx(name, type)
				2577	# where type may be float(), int(string), etc. Without context they are
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2578	# virtually indistinguishable from int(x) casts. Likewise, gMock's
				2579	# MockCallback takes a template parameter of the form return_type(arg_type),
				2580	# which looks much like the cast we're trying to detect.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2581	if (match.group(1) is None and # If new operator, then this isn't a cast
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2582	not (Match(r'^\s*MOCK_(CONST_)?METHOD\d+(_T)?\(', line) or
				2583	Match(r'^\sMockCallback<.>', line))):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2584	error(filename, linenum, 'readability/casting', 4,
				2585	'Using deprecated casting style. '
				2586	'Use static_cast<%s>(...) instead' %
				2587	match.group(2))
				2588
				2589	CheckCStyleCast(filename, linenum, line, clean_lines.raw_lines[linenum],
				2590	'static_cast',
Elliott Hughes	08fc03a	2012-06-26 17:34:00 -0700	[diff] [blame]	2591	r'$(int\|float\|double\|bool\|char\|u?int(8\|16\|32\|64))$', error) # TODO(enh): upstream change to handle all stdint types.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2592
				2593	# This doesn't catch all cases. Consider (const char * const)"hello".
				2594	#
				2595	# (char *) "foo" should always be a const_cast (reinterpret_cast won't
				2596	# compile).
				2597	if CheckCStyleCast(filename, linenum, line, clean_lines.raw_lines[linenum],
				2598	'const_cast', r'$(char\s?\+\s?)$\s"', error):
				2599	pass
				2600	else:
				2601	# Check pointer casts for other than string constants
				2602	CheckCStyleCast(filename, linenum, line, clean_lines.raw_lines[linenum],
				2603	'reinterpret_cast', r'$(\w+\s?\*+\s?)$', error)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2604
				2605	# In addition, we look for people taking the address of a cast. This
				2606	# is dangerous -- casts can assign to temporaries, so the pointer doesn't
				2607	# point where you think.
				2608	if Search(
				2609	r'(&$[^)]+$[\w(])\|(&(static\|dynamic\|reinterpret)_cast\b)', line):
				2610	error(filename, linenum, 'runtime/casting', 4,
				2611	('Are you taking an address of a cast? '
				2612	'This is dangerous: could be a temp var. '
				2613	'Take the address before doing the cast, rather than after'))
				2614
				2615	# Check for people declaring static/global STL strings at the top level.
				2616	# This is dangerous because the C++ language does not guarantee that
				2617	# globals with constructors are initialized before the first access.
				2618	match = Match(
				2619	r'((?:\|static +)(?:\|const +))string +([a-zA-Z0-9_:]+)\b(.*)',
				2620	line)
				2621	# Make sure it's not a function.
				2622	# Function template specialization looks like: "string foo<Type>(...".
				2623	# Class template definitions look like: "string Foo<Type>::Method(...".
				2624	if match and not Match(r'\s(<.>)?(::[a-zA-Z0-9_]+)?\s*\(([^"]\|$)',
				2625	match.group(3)):
				2626	error(filename, linenum, 'runtime/string', 4,
				2627	'For a static/global string constant, use a C style string instead: '
				2628	'"%schar %s[]".' %
				2629	(match.group(1), match.group(2)))
				2630
				2631	# Check that we're not using RTTI outside of testing code.
				2632	if Search(r'\bdynamic_cast<', line) and not _IsTestFilename(filename):
				2633	error(filename, linenum, 'runtime/rtti', 5,
				2634	'Do not use dynamic_cast<>. If you need to cast within a class '
				2635	"hierarchy, use static_cast<> to upcast. Google doesn't support "
				2636	'RTTI.')
				2637
				2638	if Search(r'\b([A-Za-z0-9_]*_)$\1$', line):
				2639	error(filename, linenum, 'runtime/init', 4,
				2640	'You seem to be initializing a member variable with itself.')
				2641
				2642	if file_extension == 'h':
				2643	# TODO(unknown): check that 1-arg constructors are explicit.
				2644	# How to tell it's a constructor?
				2645	# (handled in CheckForNonStandardConstructs for now)
				2646	# TODO(unknown): check that classes have DISALLOW_EVIL_CONSTRUCTORS
				2647	# (level 1 error)
				2648	pass
				2649
				2650	# Check if people are using the verboten C basic types. The only exception
				2651	# we regularly allow is "unsigned short port" for port.
				2652	if Search(r'\bshort port\b', line):
				2653	if not Search(r'\bunsigned short port\b', line):
				2654	error(filename, linenum, 'runtime/int', 4,
				2655	'Use "unsigned short" for ports, not "short"')
				2656	else:
				2657	match = Search(r'\b(short\|long(?! +double)\|long long)\b', line)
				2658	if match:
				2659	error(filename, linenum, 'runtime/int', 4,
				2660	'Use int16/int64/etc, rather than the C type %s' % match.group(1))
				2661
				2662	# When snprintf is used, the second argument shouldn't be a literal.
				2663	match = Search(r'snprintf\s\(([^,]),\s([0-9])\s*,', line)
				2664	if match and match.group(2) != '0':
				2665	# If 2nd arg is zero, snprintf is used to calculate size.
				2666	error(filename, linenum, 'runtime/printf', 3,
				2667	'If you can, use sizeof(%s) instead of %s as the 2nd arg '
				2668	'to snprintf.' % (match.group(1), match.group(2)))
				2669
				2670	# Check if some verboten C functions are being used.
				2671	if Search(r'\bsprintf\b', line):
				2672	error(filename, linenum, 'runtime/printf', 5,
				2673	'Never use sprintf. Use snprintf instead.')
				2674	match = Search(r'\b(strcpy\|strcat)\b', line)
				2675	if match:
				2676	error(filename, linenum, 'runtime/printf', 4,
				2677	'Almost always, snprintf is better than %s' % match.group(1))
				2678
				2679	if Search(r'\bsscanf\b', line):
				2680	error(filename, linenum, 'runtime/printf', 1,
				2681	'sscanf can be ok, but is slow and can overflow buffers.')
				2682
				2683	# Check if some verboten operator overloading is going on
				2684	# TODO(unknown): catch out-of-line unary operator&:
				2685	# class X {};
				2686	# int operator&(const X& x) { return 42; } // unary operator&
				2687	# The trick is it's hard to tell apart from binary operator&:
				2688	# class Y { int operator&(const Y& x) { return 23; } }; // binary operator&
				2689	if Search(r'\boperator\s&\s$\s*$', line):
				2690	error(filename, linenum, 'runtime/operator', 4,
				2691	'Unary operator& is dangerous. Do not use it.')
				2692
				2693	# Check for suspicious usage of "if" like
				2694	# } if (a == b) {
				2695	if Search(r'\}\sif\s\(', line):
				2696	error(filename, linenum, 'readability/braces', 4,
				2697	'Did you mean "else if"? If not, start a new line for "if".')
				2698
				2699	# Check for potential format string bugs like printf(foo).
				2700	# We constrain the pattern not to pick things like DocidForPrintf(foo).
				2701	# Not perfect but it can catch printf(foo.c_str()) and printf(foo->c_str())
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2702	# TODO(sugawarayu): Catch the following case. Need to change the calling
				2703	# convention of the whole function to process multiple line to handle it.
				2704	# printf(
				2705	# boy_this_is_a_really_long_variable_that_cannot_fit_on_the_prev_line);
				2706	printf_args = _GetTextInside(line, r'(?i)\b(string)?printf\s*\(')
				2707	if printf_args:
				2708	match = Match(r'([\w.\->()]+)$', printf_args)
				2709	if match:
				2710	function_name = re.search(r'\b((?:string)?printf)\s*\(',
				2711	line, re.I).group(1)
				2712	error(filename, linenum, 'runtime/printf', 4,
				2713	'Potential format string bug. Do %s("%%s", %s) instead.'
				2714	% (function_name, match.group(1)))
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2715
				2716	# Check for potential memset bugs like memset(buf, sizeof(buf), 0).
				2717	match = Search(r'memset\s$([^,]),\s([^,]),\s0\s$', line)
				2718	if match and not Match(r"^''\|-?[0-9]+\|0x[0-9A-Fa-f]$", match.group(2)):
				2719	error(filename, linenum, 'runtime/memset', 4,
				2720	'Did you mean "memset(%s, 0, %s)"?'
				2721	% (match.group(1), match.group(2)))
				2722
				2723	if Search(r'\busing namespace\b', line):
				2724	error(filename, linenum, 'build/namespaces', 5,
				2725	'Do not use namespace using-directives. '
				2726	'Use using-declarations instead.')
				2727
				2728	# Detect variable-length arrays.
				2729	match = Match(r'\s(.+::)?(\w+) [a-z]\w\[(.+)];', line)
				2730	if (match and match.group(2) != 'return' and match.group(2) != 'delete' and
				2731	match.group(3).find(']') == -1):
				2732	# Split the size using space and arithmetic operators as delimiters.
				2733	# If any of the resulting tokens are not compile time constants then
				2734	# report the error.
				2735	tokens = re.split(r'\s\|\+\|\-\|\*\|\/\|<<\|>>]', match.group(3))
				2736	is_const = True
				2737	skip_next = False
				2738	for tok in tokens:
				2739	if skip_next:
				2740	skip_next = False
				2741	continue
				2742
				2743	if Search(r'sizeof$.+$', tok): continue
				2744	if Search(r'arraysize$\w+$', tok): continue
				2745
				2746	tok = tok.lstrip('(')
				2747	tok = tok.rstrip(')')
				2748	if not tok: continue
				2749	if Match(r'\d+', tok): continue
				2750	if Match(r'0[xX][0-9a-fA-F]+', tok): continue
				2751	if Match(r'k[A-Z0-9]\w*', tok): continue
				2752	if Match(r'(.+::)?k[A-Z0-9]\w*', tok): continue
				2753	if Match(r'(.+::)?[A-Z][A-Z0-9_]*', tok): continue
				2754	# A catch all for tricky sizeof cases, including 'sizeof expression',
				2755	# 'sizeof(*type)', 'sizeof(const type)', 'sizeof(struct StructName)'
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2756	# requires skipping the next token because we split on ' ' and '*'.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2757	if tok.startswith('sizeof'):
				2758	skip_next = True
				2759	continue
				2760	is_const = False
				2761	break
				2762	if not is_const:
				2763	error(filename, linenum, 'runtime/arrays', 1,
				2764	'Do not use variable-length arrays. Use an appropriately named '
				2765	"('k' followed by CamelCase) compile-time constant for the size.")
				2766
				2767	# If DISALLOW_EVIL_CONSTRUCTORS, DISALLOW_COPY_AND_ASSIGN, or
				2768	# DISALLOW_IMPLICIT_CONSTRUCTORS is present, then it should be the last thing
				2769	# in the class declaration.
				2770	match = Match(
				2771	(r'\s*'
				2772	r'(DISALLOW_(EVIL_CONSTRUCTORS\|COPY_AND_ASSIGN\|IMPLICIT_CONSTRUCTORS))'
				2773	r'$.*$;$'),
				2774	line)
				2775	if match and linenum + 1 < clean_lines.NumLines():
				2776	next_line = clean_lines.elided[linenum + 1]
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2777	# We allow some, but not all, declarations of variables to be present
				2778	# in the statement that defines the class. The [\w\,\s] fragment of
				2779	# the regular expression below allows users to declare instances of
				2780	# the class or pointers to instances, but not less common types such
				2781	# as function pointers or arrays. It's a tradeoff between allowing
				2782	# reasonable code and avoiding trying to parse more C++ using regexps.
				2783	if not Search(r'^\s}[\w\,\s]*;', next_line):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2784	error(filename, linenum, 'readability/constructors', 3,
				2785	match.group(1) + ' should be the last thing in the class')
				2786
				2787	# Check for use of unnamed namespaces in header files. Registration
				2788	# macros are typically OK, so we allow use of "namespace {" on lines
				2789	# that end with backslashes.
				2790	if (file_extension == 'h'
				2791	and Search(r'\bnamespace\s*{', line)
				2792	and line[-1] != '\\'):
				2793	error(filename, linenum, 'build/namespaces', 4,
				2794	'Do not use unnamed namespaces in header files. See '
				2795	'http://google-styleguide.googlecode.com/svn/trunk/cppguide.xml#Namespaces'
				2796	' for more information.')
				2797
				2798
				2799	def CheckCStyleCast(filename, linenum, line, raw_line, cast_type, pattern,
				2800	error):
				2801	"""Checks for a C-style cast by looking for the pattern.
				2802
				2803	This also handles sizeof(type) warnings, due to similarity of content.
				2804
				2805	Args:
				2806	filename: The name of the current file.
				2807	linenum: The number of the line to check.
				2808	line: The line of code to check.
				2809	raw_line: The raw line of code to check, with comments.
				2810	cast_type: The string for the C++ cast to recommend. This is either
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2811	reinterpret_cast, static_cast, or const_cast, depending.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2812	pattern: The regular expression used to find C-style casts.
				2813	error: The function to call with any errors found.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2814
				2815	Returns:
				2816	True if an error was emitted.
				2817	False otherwise.
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2818	"""
				2819	match = Search(pattern, line)
				2820	if not match:
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2821	return False
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2822
				2823	# e.g., sizeof(int)
				2824	sizeof_match = Match(r'.sizeof\s$', line[0:match.start(1) - 1])
				2825	if sizeof_match:
				2826	error(filename, linenum, 'runtime/sizeof', 1,
				2827	'Using sizeof(type). Use sizeof(varname) instead if possible')
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2828	return True
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2829
				2830	remainder = line[match.end(0):]
				2831
				2832	# The close paren is for function pointers as arguments to a function.
				2833	# eg, void foo(void (*bar)(int));
				2834	# The semicolon check is a more basic function check; also possibly a
				2835	# function pointer typedef.
				2836	# eg, void foo(int); or void foo(int) const;
				2837	# The equals check is for function pointer assignment.
				2838	# eg, void (foo)(int) = ...
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2839	# The > is for MockCallback<...> ...
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2840	#
				2841	# Right now, this will only catch cases where there's a single argument, and
				2842	# it's unnamed. It should probably be expanded to check for multiple
				2843	# arguments with some unnamed.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2844	function_match = Match(r'\s(\)\|=\|(const)?\s(;\|\{\|throw\|>))', remainder)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2845	if function_match:
				2846	if (not function_match.group(3) or
				2847	function_match.group(3) == ';' or
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2848	('MockCallback<' not in raw_line and
				2849	'/*' not in raw_line)):
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2850	error(filename, linenum, 'readability/function', 3,
				2851	'All parameters should be named in a function')
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2852	return True
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2853
				2854	# At this point, all that should be left is actual casts.
				2855	error(filename, linenum, 'readability/casting', 4,
				2856	'Using C-style cast. Use %s<%s>(...) instead' %
				2857	(cast_type, match.group(1)))
				2858
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	2859	return True
				2860
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	2861
				2862	_HEADERS_CONTAINING_TEMPLATES = (
				2863	('<deque>', ('deque',)),
				2864	('<functional>', ('unary_function', 'binary_function',
				2865	'plus', 'minus', 'multiplies', 'divides', 'modulus',
				2866	'negate',
				2867	'equal_to', 'not_equal_to', 'greater', 'less',
				2868	'greater_equal', 'less_equal',
				2869	'logical_and', 'logical_or', 'logical_not',
				2870	'unary_negate', 'not1', 'binary_negate', 'not2',
				2871	'bind1st', 'bind2nd',
				2872	'pointer_to_unary_function',
				2873	'pointer_to_binary_function',
				2874	'ptr_fun',
				2875	'mem_fun_t', 'mem_fun', 'mem_fun1_t', 'mem_fun1_ref_t',
				2876	'mem_fun_ref_t',
				2877	'const_mem_fun_t', 'const_mem_fun1_t',
				2878	'const_mem_fun_ref_t', 'const_mem_fun1_ref_t',
				2879	'mem_fun_ref',
				2880	)),
				2881	('<limits>', ('numeric_limits',)),
				2882	('<list>', ('list',)),
				2883	('<map>', ('map', 'multimap',)),
				2884	('<memory>', ('allocator',)),
				2885	('<queue>', ('queue', 'priority_queue',)),
				2886	('<set>', ('set', 'multiset',)),
				2887	('<stack>', ('stack',)),
				2888	('<string>', ('char_traits', 'basic_string',)),
				2889	('<utility>', ('pair',)),
				2890	('<vector>', ('vector',)),
				2891
				2892	# gcc extensions.
				2893	# Note: std::hash is their hash, ::hash is our hash
				2894	('<hash_map>', ('hash_map', 'hash_multimap',)),
				2895	('<hash_set>', ('hash_set', 'hash_multiset',)),
				2896	('<slist>', ('slist',)),
				2897	)
				2898
# 'string' is not a template, so it gets its own whole-word pattern.
_RE_PATTERN_STRING = re.compile(r'\bstring\b')

# List of (compiled pattern, function name, header) triples for free
# functions that live in <algorithm>.
_re_pattern_algorithm_header = []
for _template in ('copy', 'max', 'min', 'min_element', 'sort', 'swap',
                  'transform'):
  # Match max<type>(..., ...), max(..., ...), but not foo->max, foo.max or
  # type::max().
  #   [^>.]\b    - the name is not reached through '->' or '.'
  #   (<.*?>)?   - optional explicit template arguments
  #   \([^\)]    - an opening paren followed by at least one argument
  #                character, which rules out the zero-argument type::max()
  _re_pattern_algorithm_header.append(
      (re.compile(r'[^>.]\b' + _template + r'(<.*?>)?\([^\)]'),
       _template,
       '<algorithm>'))
				2910
				2911	_re_pattern_templates = []
				2912	for _header, _templates in _HEADERS_CONTAINING_TEMPLATES:
				2913	for _template in _templates:
				2914	_re_pattern_templates.append(
				2915	(re.compile(r'(\<\|\b)' + _template + r'\s*\<'),
				2916	_template + '<>',
				2917	_header))
				2918
				2919
				2920	def FilesBelongToSameModule(filename_cc, filename_h):
				2921	"""Check if these two filenames belong to the same module.
				2922
				2923	The concept of a 'module' here is a as follows:
				2924	foo.h, foo-inl.h, foo.cc, foo_test.cc and foo_unittest.cc belong to the
				2925	same 'module' if they are in the same directory.
				2926	some/path/public/xyzzy and some/path/internal/xyzzy are also considered
				2927	to belong to the same module here.
				2928
				2929	If the filename_cc contains a longer path than the filename_h, for example,
				2930	'/absolute/path/to/base/sysinfo.cc', and this file would include
				2931	'base/sysinfo.h', this function also produces the prefix needed to open the
				2932	header. This is used by the caller of this function to more robustly open the
				2933	header file. We don't have access to the real include paths in this context,
				2934	so we need this guesswork here.
				2935
				2936	Known bugs: tools/base/bar.cc and base/bar.h belong to the same module
				2937	according to this implementation. Because of this, this function gives
				2938	some false positives. This should be sufficiently rare in practice.
				2939
				2940	Args:
				2941	filename_cc: is the path for the .cc file
				2942	filename_h: is the path for the header path
				2943
				2944	Returns:
				2945	Tuple with a bool and a string:
				2946	bool: True if filename_cc and filename_h belong to the same module.
				2947	string: the additional prefix needed to open the header file.
				2948	"""
				2949
				2950	if not filename_cc.endswith('.cc'):
				2951	return (False, '')
				2952	filename_cc = filename_cc[:-len('.cc')]
				2953	if filename_cc.endswith('_unittest'):
				2954	filename_cc = filename_cc[:-len('_unittest')]
				2955	elif filename_cc.endswith('_test'):
				2956	filename_cc = filename_cc[:-len('_test')]
				2957	filename_cc = filename_cc.replace('/public/', '/')
				2958	filename_cc = filename_cc.replace('/internal/', '/')
				2959
				2960	if not filename_h.endswith('.h'):
				2961	return (False, '')
				2962	filename_h = filename_h[:-len('.h')]
				2963	if filename_h.endswith('-inl'):
				2964	filename_h = filename_h[:-len('-inl')]
				2965	filename_h = filename_h.replace('/public/', '/')
				2966	filename_h = filename_h.replace('/internal/', '/')
				2967
				2968	files_belong_to_same_module = filename_cc.endswith(filename_h)
				2969	common_path = ''
				2970	if files_belong_to_same_module:
				2971	common_path = filename_cc[:-len(filename_h)]
				2972	return files_belong_to_same_module, common_path
				2973
				2974
				2975	def UpdateIncludeState(filename, include_state, io=codecs):
				2976	"""Fill up the include_state with new includes found from the file.
				2977
				2978	Args:
				2979	filename: the name of the header to read.
				2980	include_state: an _IncludeState instance in which the headers are inserted.
				2981	io: The io factory to use to read the file. Provided for testability.
				2982
				2983	Returns:
				2984	True if a header was succesfully added. False otherwise.
				2985	"""
				2986	headerfile = None
				2987	try:
				2988	headerfile = io.open(filename, 'r', 'utf8', 'replace')
				2989	except IOError:
				2990	return False
				2991	linenum = 0
				2992	for line in headerfile:
				2993	linenum += 1
				2994	clean_line = CleanseComments(line)
				2995	match = _RE_PATTERN_INCLUDE.search(clean_line)
				2996	if match:
				2997	include = match.group(2)
				2998	# The value formatting is cute, but not really used right now.
				2999	# What matters here is that the key is in include_state.
				3000	include_state.setdefault(include, '%s:%d' % (filename, linenum))
				3001	return True
				3002
				3003
				3004	def CheckForIncludeWhatYouUse(filename, clean_lines, include_state, error,
				3005	io=codecs):
				3006	"""Reports for missing stl includes.
				3007
				3008	This function will output warnings to make sure you are including the headers
				3009	necessary for the stl containers and functions that you use. We only give one
				3010	reason to include a header. For example, if you use both equal_to<> and
				3011	less<> in a .h file, only one (the latter in the file) of these will be
				3012	reported as a reason to include the <functional>.
				3013
				3014	Args:
				3015	filename: The name of the current file.
				3016	clean_lines: A CleansedLines instance containing the file.
				3017	include_state: An _IncludeState instance.
				3018	error: The function to call with any errors found.
				3019	io: The IO factory to use to read the header file. Provided for unittest
				3020	injection.
				3021	"""
				3022	required = {} # A map of header name to linenumber and the template entity.
				3023	# Example of required: { '<functional>': (1219, 'less<>') }
				3024
				3025	for linenum in xrange(clean_lines.NumLines()):
				3026	line = clean_lines.elided[linenum]
				3027	if not line or line[0] == '#':
				3028	continue
				3029
				3030	# String is special -- it is a non-templatized type in STL.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	3031	matched = _RE_PATTERN_STRING.search(line)
				3032	if matched:
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3033	# Don't warn about strings in non-STL namespaces:
				3034	# (We check only the first match per line; good enough.)
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	3035	prefix = line[:matched.start()]
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3036	if prefix.endswith('std::') or not prefix.endswith('::'):
				3037	required['<string>'] = (linenum, 'string')
				3038
				3039	for pattern, template, header in _re_pattern_algorithm_header:
				3040	if pattern.search(line):
				3041	required[header] = (linenum, template)
				3042
				3043	# The following function is just a speed up, no semantics are changed.
				3044	if not '<' in line: # Reduces the cpu time usage by skipping lines.
				3045	continue
				3046
				3047	for pattern, template, header in _re_pattern_templates:
				3048	if pattern.search(line):
				3049	required[header] = (linenum, template)
				3050
				3051	# The policy is that if you #include something in foo.h you don't need to
				3052	# include it again in foo.cc. Here, we will look at possible includes.
				3053	# Let's copy the include_state so it is only messed up within this function.
				3054	include_state = include_state.copy()
				3055
				3056	# Did we find the header for this file (if any) and succesfully load it?
				3057	header_found = False
				3058
				3059	# Use the absolute path so that matching works properly.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	3060	abs_filename = FileInfo(filename).FullName()
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3061
				3062	# For Emacs's flymake.
				3063	# If cpplint is invoked from Emacs's flymake, a temporary file is generated
				3064	# by flymake and that file name might end with '_flymake.cc'. In that case,
				3065	# restore original file name here so that the corresponding header file can be
				3066	# found.
				3067	# e.g. If the file name is 'foo_flymake.cc', we should search for 'foo.h'
				3068	# instead of 'foo_flymake.h'
				3069	abs_filename = re.sub(r'_flymake\.cc$', '.cc', abs_filename)
				3070
				3071	# include_state is modified during iteration, so we iterate over a copy of
				3072	# the keys.
Elliott Hughes	db38570	2012-06-21 10:41:20 -0700	[diff] [blame]	3073	header_keys = include_state.keys()
				3074	for header in header_keys:
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3075	(same_module, common_path) = FilesBelongToSameModule(abs_filename, header)
				3076	fullpath = common_path + header
				3077	if same_module and UpdateIncludeState(fullpath, include_state, io):
				3078	header_found = True
				3079
				3080	# If we can't find the header file for a .cc, assume it's because we don't
				3081	# know where to look. In that case we'll give up as we're not sure they
				3082	# didn't include it in the .h file.
				3083	# TODO(unknown): Do a better job of finding .h files so we are confident that
				3084	# not having the .h file means there isn't one.
				3085	if filename.endswith('.cc') and not header_found:
				3086	return
				3087
				3088	# All the lines have been processed, report the errors found.
				3089	for required_header_unstripped in required:
				3090	template = required[required_header_unstripped][1]
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3091	if required_header_unstripped.strip('<>"') not in include_state:
				3092	error(filename, required[required_header_unstripped][0],
				3093	'build/include_what_you_use', 4,
				3094	'Add #include ' + required_header_unstripped + ' for ' + template)
				3095
				3096
# Matches make_pair followed (after optional whitespace) by an explicit
# template argument list.
_RE_PATTERN_EXPLICIT_MAKEPAIR = re.compile(r'\bmake_pair\s*<')


def CheckMakePairUsesDeduction(filename, clean_lines, linenum, error):
  """Warn when make_pair is called with explicit template arguments.

  G++ 4.6 in C++0x mode fails badly if make_pair's template arguments are
  specified explicitly, and such use isn't intended in any case.  The check
  runs on the raw (uncleansed) line.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    error: The function to call with any errors found.
  """
  raw_line = clean_lines.raw_lines[linenum]
  if not _RE_PATTERN_EXPLICIT_MAKEPAIR.search(raw_line):
    return
  error(filename, linenum, 'build/explicit_make_pair',
        4,  # 4 = high confidence
        'Omit template arguments from make_pair OR use pair directly OR'
        ' if appropriate, construct a pair directly')
				3120
				3121
def ProcessLine(filename, file_extension,
                clean_lines, line, include_state, function_state,
                class_state, error, extra_check_functions=None):
  """Processes a single line in the file.

  Runs every per-line check, in a fixed order, on line number `line`.

  Args:
    filename: Filename of the file that is being processed.
    file_extension: The extension (dot not included) of the file.
    clean_lines: A CleansedLines instance holding the lines of the file, with
                 comments stripped (its raw_lines attribute keeps the
                 originals).
    line: Number of line being processed.
    include_state: An _IncludeState instance in which the headers are inserted.
    function_state: A _FunctionState instance which counts function lines, etc.
    class_state: A _ClassState instance which maintains information about
                 the current stack of nested class declarations being parsed.
    error: A callable to which errors are reported, which takes 5 arguments:
           filename, line number, category, confidence level, and message
    extra_check_functions: An optional sequence of additional check functions
                           that will be run on each source line. Each function
                           takes 4 arguments: filename, clean_lines, line,
                           error.  None (the default) means no extra checks.
  """
  # None instead of a shared mutable [] default.
  if extra_check_functions is None:
    extra_check_functions = []

  raw_lines = clean_lines.raw_lines
  # NOLINT markers are read from the raw line, before any check can report.
  ParseNolintSuppressions(filename, raw_lines[line], line, error)
  CheckForFunctionLengths(filename, clean_lines, line, function_state, error)
  CheckForMultilineCommentsAndStrings(filename, clean_lines, line, error)
  CheckStyle(filename, clean_lines, line, file_extension, class_state, error)
  CheckLanguage(filename, clean_lines, line, file_extension, include_state,
                error)
  CheckForNonStandardConstructs(filename, clean_lines, line,
                                class_state, error)
  CheckPosixThreading(filename, clean_lines, line, error)
  CheckInvalidIncrement(filename, clean_lines, line, error)
  CheckMakePairUsesDeduction(filename, clean_lines, line, error)
  for check_fn in extra_check_functions:
    check_fn(filename, clean_lines, line, error)
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3157
def ProcessFileData(filename, file_extension, lines, error,
                    extra_check_functions=None):
  """Performs lint checks and reports any errors to the given error function.

  Args:
    filename: Filename of the file that is being processed.
    file_extension: The extension (dot not included) of the file.
    lines: An array of strings, each representing a line of the file, with the
           last element being empty if the file is terminated with a newline.
           The caller's list is not modified.
    error: A callable to which errors are reported, which takes 5 arguments:
           filename, line number, category, confidence level, and message
    extra_check_functions: An optional sequence of additional check functions
                           that will be run on each source line. Each function
                           takes 4 arguments: filename, clean_lines, line,
                           error.  None (the default) means no extra checks.
  """
  # None instead of a shared mutable [] default.
  if extra_check_functions is None:
    extra_check_functions = []

  # Sentinel lines at both ends; this builds a new list, so the argument
  # passed in by the caller stays as it was.
  lines = (['// marker so line numbers and indices both start at 1'] + lines +
           ['// marker so line numbers end in a known way'])

  include_state = _IncludeState()
  function_state = _FunctionState()
  class_state = _ClassState()

  ResetNolintSuppressions()

  CheckForCopyright(filename, lines, error)

  if file_extension == 'h':
    CheckForHeaderGuard(filename, lines, error)

  RemoveMultiLineComments(filename, lines, error)
  clean_lines = CleansedLines(lines)
  for line in xrange(clean_lines.NumLines()):
    ProcessLine(filename, file_extension, clean_lines, line,
                include_state, function_state, class_state, error,
                extra_check_functions)
  class_state.CheckFinished(filename, error)

  CheckForIncludeWhatYouUse(filename, clean_lines, include_state, error)

  # We check here rather than inside ProcessLine so that we see raw
  # lines rather than "cleaned" lines.
  CheckForUnicodeReplacementCharacters(filename, lines, error)

  CheckForNewlineAtEOF(filename, lines, error)
				3202
def ProcessFile(filename, vlevel, extra_check_functions=None):
  """Does google-lint on a single file.

  Reads the file (or stdin when filename is '-'), strips trailing carriage
  returns, and runs ProcessFileData on it when the extension is cc, h or cpp.
  Progress and skip messages are written to sys.stderr.

  Args:
    filename: The name of the file to parse.

    vlevel: The level of errors to report.  Every error of confidence
    >= verbose_level will be reported.  0 is a good default.

    extra_check_functions: An optional sequence of additional check functions
                           that will be run on each source line. Each function
                           takes 4 arguments: filename, clean_lines, line,
                           error.  None (the default) means no extra checks.
  """
  # None instead of a shared mutable [] default.
  if extra_check_functions is None:
    extra_check_functions = []

  _SetVerboseLevel(vlevel)

  try:
    # Support the UNIX convention of using "-" for stdin.  Note that
    # we are not opening the file with universal newline support
    # (which codecs doesn't support anyway), so the resulting lines do
    # contain trailing '\r' characters if we are reading a file that
    # has CRLF endings.
    # If after the split a trailing '\r' is present, it is removed
    # below. If it is not expected to be present (i.e. os.linesep !=
    # '\r\n' as in Windows), a warning is issued below if this file
    # is processed.

    if filename == '-':
      lines = codecs.StreamReaderWriter(sys.stdin,
                                        codecs.getreader('utf8'),
                                        codecs.getwriter('utf8'),
                                        'replace').read().split('\n')
    else:
      source = codecs.open(filename, 'r', 'utf8', 'replace')
      try:
        lines = source.read().split('\n')
      finally:
        # Do not leak the handle when many files are linted in one run.
        source.close()

    carriage_return_found = False
    # Remove trailing '\r'.
    for linenum, text in enumerate(lines):
      if text.endswith('\r'):
        lines[linenum] = text.rstrip('\r')
        carriage_return_found = True

  except IOError:
    sys.stderr.write(
        "Skipping input '%s': Can't open for reading\n" % filename)
    return

  # Note, if no dot is found, this will give the entire filename as the ext.
  file_extension = filename[filename.rfind('.') + 1:]

  # When reading from stdin, the extension is unknown, so no cpplint tests
  # should rely on the extension.
  if (filename != '-' and file_extension != 'cc' and file_extension != 'h'
      and file_extension != 'cpp'):
    sys.stderr.write('Ignoring %s; not a .cc or .h file\n' % filename)
  else:
    ProcessFileData(filename, file_extension, lines, Error,
                    extra_check_functions)
    if carriage_return_found and os.linesep != '\r\n':
      # Use 0 for linenum since outputting only one error for potentially
      # several lines.
      Error(filename, 0, 'whitespace/newline', 1,
            'One or more unexpected \\r (^M) found;'
            'better to use only a \\n')

  sys.stderr.write('Done processing %s\n' % filename)
				3269
				3270
				3271	def PrintUsage(message):
				3272	"""Prints a brief usage string and exits, optionally with an error message.
				3273
				3274	Args:
				3275	message: The optional error message.
				3276	"""
				3277	sys.stderr.write(_USAGE)
				3278	if message:
				3279	sys.exit('\nFATAL ERROR: ' + message)
				3280	else:
				3281	sys.exit(1)
				3282
				3283
				3284	def PrintCategories():
				3285	"""Prints a list of all the error-categories used by error messages.
				3286
				3287	These are the categories used to filter messages via --filter.
				3288	"""
				3289	sys.stderr.write(''.join(' %s\n' % cat for cat in _ERROR_CATEGORIES))
				3290	sys.exit(0)
				3291
				3292
				3293	def ParseArguments(args):
				3294	"""Parses the command line arguments.
				3295
				3296	This may set the output format and verbosity level as side-effects.
				3297
				3298	Args:
				3299	args: The command line arguments:
				3300
				3301	Returns:
				3302	The list of filenames to lint.
				3303	"""
				3304	try:
				3305	(opts, filenames) = getopt.getopt(args, '', ['help', 'output=', 'verbose=',
Elliott Hughes	08fc03a	2012-06-26 17:34:00 -0700	[diff] [blame]	3306	'stdout', # TODO(enh): added --stdout
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3307	'counting=',
				3308	'filter='])
				3309	except getopt.GetoptError:
				3310	PrintUsage('Invalid arguments.')
				3311
				3312	verbosity = _VerboseLevel()
				3313	output_format = _OutputFormat()
Elliott Hughes	08fc03a	2012-06-26 17:34:00 -0700	[diff] [blame]	3314	output_stream = sys.stderr # TODO(enh): added --stdout
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3315	filters = ''
				3316	counting_style = ''
				3317
				3318	for (opt, val) in opts:
				3319	if opt == '--help':
				3320	PrintUsage(None)
Elliott Hughes	08fc03a	2012-06-26 17:34:00 -0700	[diff] [blame]	3321	elif opt == '--stdout': # TODO(enh): added --stdout
				3322	output_stream = sys.stdout # TODO(enh): added --stdout
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3323	elif opt == '--output':
				3324	if not val in ('emacs', 'vs7'):
				3325	PrintUsage('The only allowed output formats are emacs and vs7.')
				3326	output_format = val
				3327	elif opt == '--verbose':
				3328	verbosity = int(val)
				3329	elif opt == '--filter':
				3330	filters = val
				3331	if not filters:
				3332	PrintCategories()
				3333	elif opt == '--counting':
				3334	if val not in ('total', 'toplevel', 'detailed'):
				3335	PrintUsage('Valid counting options are total, toplevel, and detailed')
				3336	counting_style = val
				3337
				3338	if not filenames:
				3339	PrintUsage('No files were specified.')
				3340
				3341	_SetOutputFormat(output_format)
				3342	_SetVerboseLevel(verbosity)
				3343	_SetFilters(filters)
				3344	_SetCountingStyle(counting_style)
				3345
Elliott Hughes	08fc03a	2012-06-26 17:34:00 -0700	[diff] [blame]	3346	sys.stderr = output_stream # TODO(enh): added --stdout
				3347
Brian Carlstrom	59848da	2011-07-23 20:35:19 -0700	[diff] [blame]	3348	return filenames
				3349
				3350
				3351	def main():
				3352	filenames = ParseArguments(sys.argv[1:])
				3353
				3354	# Change stderr to write with replacement characters so we don't die
				3355	# if we try to print something containing non-ASCII characters.
				3356	sys.stderr = codecs.StreamReaderWriter(sys.stderr,
				3357	codecs.getreader('utf8'),
				3358	codecs.getwriter('utf8'),
				3359	'replace')
				3360
				3361	_cpplint_state.ResetErrorCounts()
				3362	for filename in filenames:
				3363	ProcessFile(filename, _cpplint_state.verbose_level)
				3364	_cpplint_state.PrintErrorCounts()
				3365
				3366	sys.exit(_cpplint_state.error_count > 0)
				3367
				3368
				3369	if __name__ == '__main__':
				3370	main()