Blame - cpplint.py - chromium.googlesource.com/chromium/tools/depot_tools

blob: 92384dc37181f6e982d0e6f74afe93d393c5de19 [file] [log] [blame]

erg@chromium.org	d528f8b	2012-05-11 17:31:08 +0000	[diff] [blame]	1	#!/usr/bin/env python
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2	#
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	3	# Copyright (c) 2009 Google Inc. All rights reserved.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4	#
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	5	# Redistribution and use in source and binary forms, with or without
				6	# modification, are permitted provided that the following conditions are
				7	# met:
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	8	#
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	9	# * Redistributions of source code must retain the above copyright
				10	# notice, this list of conditions and the following disclaimer.
				11	# * Redistributions in binary form must reproduce the above
				12	# copyright notice, this list of conditions and the following disclaimer
				13	# in the documentation and/or other materials provided with the
				14	# distribution.
				15	# * Neither the name of Google Inc. nor the names of its
				16	# contributors may be used to endorse or promote products derived from
				17	# this software without specific prior written permission.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	18	#
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	19	# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
				20	# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
				21	# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
				22	# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
				23	# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
				24	# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
				25	# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
				26	# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
				27	# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
				28	# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
				29	# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	30
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	31	"""Does google-lint on c++ files.
				32
				33	The goal of this script is to identify places in the code that may
				34	be in non-compliance with google style. It does not attempt to fix
				35	up these problems -- the point is to educate. It does also not
				36	attempt to find all problems, or to ensure that everything it does
				37	find is legitimately a problem.
				38
				39	In particular, we can get very confused by /* and // inside strings!
				40	We do a small hack, which is to ignore //'s with "'s after them on the
				41	same line, but it is far from perfect (in either direction).
				42	"""
				43
				44	import codecs
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	45	import copy
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	46	import getopt
				47	import math # for log
				48	import os
				49	import re
				50	import sre_compile
				51	import string
				52	import sys
				53	import unicodedata
				54
				55
				56	_USAGE = """
				57	Syntax: cpplint.py [--verbose=#] [--output=vs7] [--filter=-x,+y,...]
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	58	[--counting=total\|toplevel\|detailed] [--root=subdir]
				59	[--linelength=digits]
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	60	<file> [file] ...
				61
				62	The style guidelines this tries to follow are those in
				63	http://google-styleguide.googlecode.com/svn/trunk/cppguide.xml
				64
				65	Every problem is given a confidence score from 1-5, with 5 meaning we are
				66	certain of the problem, and 1 meaning it could be a legitimate construct.
				67	This will miss some errors, and is not a substitute for a code review.
				68
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	69	To suppress false-positive errors of a certain category, add a
				70	'NOLINT(category)' comment to the line. NOLINT or NOLINT(*)
				71	suppresses errors of all categories on that line.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	72
				73	The files passed in will be linted; at least one file must be provided.
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	74	Default linted extensions are .cc, .cpp, .cu, .cuh and .h. Change the
				75	extensions with the --extensions flag.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	76
				77	Flags:
				78
				79	output=vs7
				80	By default, the output is formatted to ease emacs parsing. Visual Studio
				81	compatible output (vs7) may also be used. Other formats are unsupported.
				82
				83	verbose=#
				84	Specify a number 0-5 to restrict errors to certain verbosity levels.
				85
				86	filter=-x,+y,...
				87	Specify a comma-separated list of category-filters to apply: only
				88	error messages whose category names pass the filters will be printed.
				89	(Category names are printed with the message and look like
				90	"[whitespace/indent]".) Filters are evaluated left to right.
				91	"-FOO" and "FOO" means "do not print categories that start with FOO".
				92	"+FOO" means "do print categories that start with FOO".
				93
				94	Examples: --filter=-whitespace,+whitespace/braces
				95	--filter=whitespace,runtime/printf,+runtime/printf_format
				96	--filter=-,+build/include_what_you_use
				97
				98	To see a list of all the categories used in cpplint, pass no arg:
				99	--filter=
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	100
				101	counting=total\|toplevel\|detailed
				102	The total number of errors found is always printed. If
				103	'toplevel' is provided, then the count of errors in each of
				104	the top-level categories like 'build' and 'whitespace' will
				105	also be printed. If 'detailed' is provided, then a count
				106	is provided for each category like 'build/class'.
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	107
				108	root=subdir
				109	The root directory used for deriving header guard CPP variable.
				110	By default, the header guard CPP variable is calculated as the relative
				111	path to the directory that contains .git, .hg, or .svn. When this flag
				112	is specified, the relative path is calculated from the specified
				113	directory. If the specified directory does not exist, this flag is
				114	ignored.
				115
				116	Examples:
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	117	Assuming that src/.git exists, the header guard CPP variables for
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	118	src/chrome/browser/ui/browser.h are:
				119
				120	No flag => CHROME_BROWSER_UI_BROWSER_H_
				121	--root=chrome => BROWSER_UI_BROWSER_H_
				122	--root=chrome/browser => UI_BROWSER_H_
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	123
				124	linelength=digits
				125	This is the allowed line length for the project. The default value is
				126	80 characters.
				127
				128	Examples:
				129	--linelength=120
				130
				131	extensions=extension,extension,...
				132	The allowed file extensions that cpplint will check
				133
				134	Examples:
				135	--extensions=hpp,cpp
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	136	"""
				137
				138	# We categorize each error message we print. Here are the categories.
				139	# We want an explicit list so we can list them all in cpplint --filter=.
				140	# If you add a new error message with a new category, add it to the list
				141	# here! cpplint_unittest.py should tell you if you forget to do this.
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	142	_ERROR_CATEGORIES = [
				143	'build/class',
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	144	'build/c++11',
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	145	'build/deprecated',
				146	'build/endif_comment',
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	147	'build/explicit_make_pair',
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	148	'build/forward_decl',
				149	'build/header_guard',
				150	'build/include',
				151	'build/include_alpha',
				152	'build/include_order',
				153	'build/include_what_you_use',
				154	'build/namespaces',
				155	'build/printf_format',
				156	'build/storage_class',
				157	'legal/copyright',
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	158	'readability/alt_tokens',
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	159	'readability/braces',
				160	'readability/casting',
				161	'readability/check',
				162	'readability/constructors',
				163	'readability/fn_size',
				164	'readability/function',
				165	'readability/multiline_comment',
				166	'readability/multiline_string',
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	167	'readability/namespace',
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	168	'readability/nolint',
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	169	'readability/nul',
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	170	'readability/streams',
				171	'readability/todo',
				172	'readability/utf8',
				173	'runtime/arrays',
				174	'runtime/casting',
				175	'runtime/explicit',
				176	'runtime/int',
				177	'runtime/init',
				178	'runtime/invalid_increment',
				179	'runtime/member_string_references',
				180	'runtime/memset',
				181	'runtime/operator',
				182	'runtime/printf',
				183	'runtime/printf_format',
				184	'runtime/references',
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	185	'runtime/string',
				186	'runtime/threadsafe_fn',
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	187	'runtime/vlog',
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	188	'whitespace/blank_line',
				189	'whitespace/braces',
				190	'whitespace/comma',
				191	'whitespace/comments',
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	192	'whitespace/empty_conditional_body',
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	193	'whitespace/empty_loop_body',
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	194	'whitespace/end_of_line',
				195	'whitespace/ending_newline',
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	196	'whitespace/forcolon',
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	197	'whitespace/indent',
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	198	'whitespace/line_length',
				199	'whitespace/newline',
				200	'whitespace/operators',
				201	'whitespace/parens',
				202	'whitespace/semicolon',
				203	'whitespace/tab',
				204	'whitespace/todo'
				205	]
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	206
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	207	# The default state of the category filter. This is overridden by the --filter=
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	208	# flag. By default all errors are on, so only add here categories that should be
				209	# off by default (i.e., categories that must be enabled by the --filter= flags).
				210	# All entries here should start with a '-' or '+', as in the --filter= flag.
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	211	_DEFAULT_FILTERS = ['-build/include_alpha']
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	212
				213	# We used to check for high-bit characters, but after much discussion we
				214	# decided those were OK, as long as they were in UTF-8 and didn't represent
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	215	# hard-coded international strings, which belong in a separate i18n file.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	216
# Names of headers that are treated as C++ headers, grouped by origin.
_CPP_HEADERS = frozenset([
  # Legacy
  'algobase.h', 'algo.h', 'alloc.h', 'builtinbuf.h', 'bvector.h',
  'complex.h', 'defalloc.h', 'deque.h', 'editbuf.h', 'fstream.h',
  'function.h', 'hash_map', 'hash_map.h', 'hash_set', 'hash_set.h',
  'hashtable.h', 'heap.h', 'indstream.h', 'iomanip.h', 'iostream.h',
  'istream.h', 'iterator.h', 'list.h', 'map.h', 'multimap.h',
  'multiset.h', 'ostream.h', 'pair.h', 'parsestream.h', 'pfstream.h',
  'procbuf.h', 'pthread_alloc', 'pthread_alloc.h', 'rope', 'rope.h',
  'ropeimpl.h', 'set.h', 'slist', 'slist.h', 'stack.h',
  'stdiostream.h', 'stl_alloc.h', 'stl_relops.h', 'streambuf.h', 'stream.h',
  'strfile.h', 'strstream.h', 'tempbuf.h', 'tree.h', 'type_traits.h',
  'vector.h',
  # 17.6.1.2 C++ library headers
  'algorithm', 'array', 'atomic', 'bitset', 'chrono',
  'codecvt', 'complex', 'condition_variable', 'deque', 'exception',
  'forward_list', 'fstream', 'functional', 'future', 'initializer_list',
  'iomanip', 'ios', 'iosfwd', 'iostream', 'istream',
  'iterator', 'limits', 'list', 'locale', 'map',
  'memory', 'mutex', 'new', 'numeric', 'ostream',
  'queue', 'random', 'ratio', 'regex', 'set',
  'sstream', 'stack', 'stdexcept', 'streambuf', 'string',
  'strstream', 'system_error', 'thread', 'tuple', 'typeindex',
  'typeinfo', 'type_traits', 'unordered_map', 'unordered_set', 'utility',
  'valarray', 'vector',
  # 17.6.1.2 C++ headers for C library facilities
  'cassert', 'ccomplex', 'cctype', 'cerrno', 'cfenv',
  'cfloat', 'cinttypes', 'ciso646', 'climits', 'clocale',
  'cmath', 'csetjmp', 'csignal', 'cstdalign', 'cstdarg',
  'cstdbool', 'cstddef', 'cstdint', 'cstdio', 'cstdlib',
  'cstring', 'ctgmath', 'ctime', 'cuchar', 'cwchar',
  'cwctype',
])
				352
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	353
# Assertion macros, defined in base/logging.h and testing/base/gunit.h.
# The order matters: the _M variants must precede their plain counterparts
# so that substring matching finds the longer name first.
_CHECK_MACROS = [
  'DCHECK',
  'CHECK',
  'EXPECT_TRUE_M',
  'EXPECT_TRUE',
  'ASSERT_TRUE_M',
  'ASSERT_TRUE',
  'EXPECT_FALSE_M',
  'EXPECT_FALSE',
  'ASSERT_FALSE_M',
  'ASSERT_FALSE',
]

# Maps each macro above to a {comparison operator: replacement macro} dict,
# i.e. the more specific macro to suggest for CHECK(a == b) and friends.
_CHECK_REPLACEMENT = dict((macro_name, {}) for macro_name in _CHECK_MACROS)

# Macros that assert the condition is true keep the operator's own suffix.
for op, replacement in (('==', 'EQ'), ('!=', 'NE'),
                        ('>=', 'GE'), ('>', 'GT'),
                        ('<=', 'LE'), ('<', 'LT')):
  _CHECK_REPLACEMENT['DCHECK'][op] = 'DCHECK_' + replacement
  _CHECK_REPLACEMENT['CHECK'][op] = 'CHECK_' + replacement
  _CHECK_REPLACEMENT['EXPECT_TRUE'][op] = 'EXPECT_' + replacement
  _CHECK_REPLACEMENT['ASSERT_TRUE'][op] = 'ASSERT_' + replacement
  _CHECK_REPLACEMENT['EXPECT_TRUE_M'][op] = 'EXPECT_' + replacement + '_M'
  _CHECK_REPLACEMENT['ASSERT_TRUE_M'][op] = 'ASSERT_' + replacement + '_M'

# Macros that assert the condition is false use the inverse comparison.
for op, inv_replacement in (('==', 'NE'), ('!=', 'EQ'),
                            ('>=', 'LT'), ('>', 'LE'),
                            ('<=', 'GT'), ('<', 'GE')):
  _CHECK_REPLACEMENT['EXPECT_FALSE'][op] = 'EXPECT_' + inv_replacement
  _CHECK_REPLACEMENT['ASSERT_FALSE'][op] = 'ASSERT_' + inv_replacement
  _CHECK_REPLACEMENT['EXPECT_FALSE_M'][op] = 'EXPECT_' + inv_replacement + '_M'
  _CHECK_REPLACEMENT['ASSERT_FALSE_M'][op] = 'ASSERT_' + inv_replacement + '_M'
				385
# Alternative tokens and their replacements.  For full list, see section 2.5
# Alternative tokens [lex.digraph] in the C++ standard.
#
# Digraphs (such as '%:') are not included here since it's a mess to
# match those on a word boundary.
_ALT_TOKEN_REPLACEMENT = {
  'and': '&&',
  'bitor': '|',
  'or': '||',
  'xor': '^',
  'compl': '~',
  'bitand': '&',
  'and_eq': '&=',
  'or_eq': '|=',
  'xor_eq': '^=',
  'not': '!',
  'not_eq': '!=',
}

# Compile regular expression that matches all the above keywords.  The
# "[ =()]" bit is meant to avoid matching these keywords outside of boolean
# expressions.  Group 1 holds the keyword; the trailing lookahead requires a
# space, an opening parenthesis or end of line after it, so a keyword that is
# a prefix of another (e.g. 'and' vs. 'and_eq') cannot match partially.
#
# False positives include C-style multi-line comments and multi-line strings
# but those have always been troublesome for cpplint.
_ALT_TOKEN_REPLACEMENT_PATTERN = re.compile(
    r'[ =()](' + '|'.join(_ALT_TOKEN_REPLACEMENT.keys()) + r')(?=[ (]|$)')
				412
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	413
				414	# These constants define types of headers for use with
				415	# _IncludeState.CheckNextIncludeOrder().
				416	_C_SYS_HEADER = 1
				417	_CPP_SYS_HEADER = 2
				418	_LIKELY_MY_HEADER = 3
				419	_POSSIBLE_MY_HEADER = 4
				420	_OTHER_HEADER = 5
				421
# These constants define the current inline assembly state
_NO_ASM = 0  # Outside of inline assembly block
_INSIDE_ASM = 1  # Inside inline assembly block
_END_ASM = 2  # Last line of inline assembly block
_BLOCK_ASM = 3  # The whole block is an inline assembly block

# Match start of assembly blocks: one of the asm keyword spellings, an
# optional volatile qualifier (captured as group 1), then '{' or '('.
_MATCH_ASM = re.compile(r'^\s*(?:asm|_asm|__asm|__asm__)'
                        r'(?:\s+(volatile|__volatile__))?'
                        r'\s*[{(]')
				432
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	433
				434	_regexp_compile_cache = {}
				435
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	436	# Finds occurrences of NOLINT or NOLINT(...).
				437	_RE_SUPPRESSION = re.compile(r'\bNOLINT\b($[^)]*$)?')
				438
				439	# {str, set(int)}: a map from error categories to sets of linenumbers
				440	# on which those errors are expected and should be suppressed.
				441	_error_suppressions = {}
				442
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	443	# The root directory used for deriving header guard CPP variable.
				444	# This is set by --root flag.
				445	_root = None
				446
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	447	# The allowed line length of files.
				448	# This is set by --linelength flag.
				449	_line_length = 80
				450
				451	# The allowed extensions for file names
				452	# This is set by --extensions flag.
				453	_valid_extensions = set(['cc', 'h', 'cpp', 'cu', 'cuh'])
				454
def ParseNolintSuppressions(filename, raw_line, linenum, error):
  """Records the NOLINT suppression found on a line, if any.

  Looks for the first NOLINT comment in raw_line and adds linenum to the
  global _error_suppressions map: under the key None for a bare NOLINT or
  NOLINT(*), or under the category name for NOLINT(category).  A category
  that is not listed in _ERROR_CATEGORIES is reported through the error
  handler instead of being recorded.

  Args:
    filename: str, the name of the input file.
    raw_line: str, the line of input text, with comments.
    linenum: int, the number of the current line.
    error: function, an error handler.
  """
  # FIXME(adonovan): "NOLINT(" is misparsed as NOLINT(*).
  suppression = _RE_SUPPRESSION.search(raw_line)
  if not suppression:
    return

  category = suppression.group(1)
  if category is None or category == '(*)':
    # Bare NOLINT or NOLINT(*): suppress every category on this line.
    _error_suppressions.setdefault(None, set()).add(linenum)
    return

  if not (category.startswith('(') and category.endswith(')')):
    return

  # Drop the surrounding parentheses to get the bare category name.
  category = category[1:-1]
  if category in _ERROR_CATEGORIES:
    _error_suppressions.setdefault(category, set()).add(linenum)
  else:
    error(filename, linenum, 'readability/nolint', 5,
          'Unknown NOLINT error category: %s' % category)
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	482
				483
				484	def ResetNolintSuppressions():
				485	"Resets the set of NOLINT suppressions to empty."
				486	_error_suppressions.clear()
				487
				488
				489	def IsErrorSuppressedByNolint(category, linenum):
				490	"""Returns true if the specified error category is suppressed on this line.
				491
				492	Consults the global error_suppressions map populated by
				493	ParseNolintSuppressions/ResetNolintSuppressions.
				494
				495	Args:
				496	category: str, the category of the error.
				497	linenum: int, the current line number.
				498	Returns:
				499	bool, True iff the error should be suppressed due to a NOLINT comment.
				500	"""
				501	return (linenum in _error_suppressions.get(category, set()) or
				502	linenum in _error_suppressions.get(None, set()))
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	503
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	504
def Match(pattern, s):
  """Matches the string with the pattern, caching the compiled regexp.

  Args:
    pattern: regex pattern
    s: string to match; matching is anchored at the start of the string.

  Returns:
    The match object, or None when the pattern does not match.
  """
  # The regexp compilation caching is inlined in both Match and Search for
  # performance reasons; factoring it out into a separate function turns out
  # to be noticeably expensive.
  if pattern not in _regexp_compile_cache:
    # Use the public re.compile rather than the internal sre_compile module.
    _regexp_compile_cache[pattern] = re.compile(pattern)
  return _regexp_compile_cache[pattern].match(s)
				513
				514
def ReplaceAll(pattern, rep, s):
  """Replaces instances of pattern in a string with a replacement.

  The compiled regex is kept in a cache shared by Match and Search.

  Args:
    pattern: regex pattern
    rep: replacement text
    s: search string

  Returns:
    string with replacements made (or original string if no replacements)
  """
  if pattern not in _regexp_compile_cache:
    # Use the public re.compile rather than the internal sre_compile module.
    _regexp_compile_cache[pattern] = re.compile(pattern)
  return _regexp_compile_cache[pattern].sub(rep, s)
				531
				532
def Search(pattern, s):
  """Searches the string for the pattern, caching the compiled regexp.

  Args:
    pattern: regex pattern
    s: string to search; the pattern may match anywhere in the string.

  Returns:
    The match object for the first match, or None when there is none.
  """
  if pattern not in _regexp_compile_cache:
    # Use the public re.compile rather than the internal sre_compile module.
    _regexp_compile_cache[pattern] = re.compile(pattern)
  return _regexp_compile_cache[pattern].search(s)
				538
				539
				540	class _IncludeState(dict):
				541	"""Tracks line numbers for includes, and the order in which includes appear.
				542
				543	As a dict, an _IncludeState object serves as a mapping between include
				544	filename and line number on which that file was included.
				545
				546	Call CheckNextIncludeOrder() once for each header in the file, passing
				547	in the type constants defined above. Calls in an illegal order will
				548	raise an _IncludeError with an appropriate error message.
				549
				550	"""
				551	# self._section will move monotonically through this set. If it ever
				552	# needs to move backwards, CheckNextIncludeOrder will raise an error.
				553	_INITIAL_SECTION = 0
				554	_MY_H_SECTION = 1
				555	_C_SECTION = 2
				556	_CPP_SECTION = 3
				557	_OTHER_H_SECTION = 4
				558
				559	_TYPE_NAMES = {
				560	_C_SYS_HEADER: 'C system header',
				561	_CPP_SYS_HEADER: 'C++ system header',
				562	_LIKELY_MY_HEADER: 'header this file implements',
				563	_POSSIBLE_MY_HEADER: 'header this file may implement',
				564	_OTHER_HEADER: 'other header',
				565	}
				566	_SECTION_NAMES = {
				567	_INITIAL_SECTION: "... nothing. (This can't be an error.)",
				568	_MY_H_SECTION: 'a header this file implements',
				569	_C_SECTION: 'C system header',
				570	_CPP_SECTION: 'C++ system header',
				571	_OTHER_H_SECTION: 'other header',
				572	}
				573
				574	def __init__(self):
				575	dict.__init__(self)
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	576	self.ResetSection()
				577
				578	def ResetSection(self):
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	579	# The name of the current section.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	580	self._section = self._INITIAL_SECTION
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	581	# The path of last found header.
				582	self._last_header = ''
				583
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	584	def SetLastHeader(self, header_path):
				585	self._last_header = header_path
				586
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	587	def CanonicalizeAlphabeticalOrder(self, header_path):
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	588	"""Returns a path canonicalized for alphabetical comparison.
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	589
				590	- replaces "-" with "_" so they both cmp the same.
				591	- removes '-inl' since we don't require them to be after the main header.
				592	- lowercase everything, just in case.
				593
				594	Args:
				595	header_path: Path to be canonicalized.
				596
				597	Returns:
				598	Canonicalized path.
				599	"""
				600	return header_path.replace('-inl.h', '.h').replace('-', '_').lower()
				601
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	602	def IsInAlphabeticalOrder(self, clean_lines, linenum, header_path):
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	603	"""Check if a header is in alphabetical order with the previous header.
				604
				605	Args:
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	606	clean_lines: A CleansedLines instance containing the file.
				607	linenum: The number of the line to check.
				608	header_path: Canonicalized header to be checked.
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	609
				610	Returns:
				611	Returns true if the header is in alphabetical order.
				612	"""
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	613	# If previous section is different from current section, _last_header will
				614	# be reset to empty string, so it's always less than current header.
				615	#
				616	# If previous line was a blank line, assume that the headers are
				617	# intentionally sorted the way they are.
				618	if (self._last_header > header_path and
				619	not Match(r'^\s*$', clean_lines.elided[linenum - 1])):
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	620	return False
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	621	return True
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	622
				623	def CheckNextIncludeOrder(self, header_type):
				624	"""Returns a non-empty error message if the next header is out of order.
				625
				626	This function also updates the internal state to be ready to check
				627	the next include.
				628
				629	Args:
				630	header_type: One of the _XXX_HEADER constants defined above.
				631
				632	Returns:
				633	The empty string if the header is in the right order, or an
				634	error message describing what's wrong.
				635
				636	"""
				637	error_message = ('Found %s after %s' %
				638	(self._TYPE_NAMES[header_type],
				639	self._SECTION_NAMES[self._section]))
				640
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	641	last_section = self._section
				642
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	643	if header_type == _C_SYS_HEADER:
				644	if self._section <= self._C_SECTION:
				645	self._section = self._C_SECTION
				646	else:
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	647	self._last_header = ''
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	648	return error_message
				649	elif header_type == _CPP_SYS_HEADER:
				650	if self._section <= self._CPP_SECTION:
				651	self._section = self._CPP_SECTION
				652	else:
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	653	self._last_header = ''
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	654	return error_message
				655	elif header_type == _LIKELY_MY_HEADER:
				656	if self._section <= self._MY_H_SECTION:
				657	self._section = self._MY_H_SECTION
				658	else:
				659	self._section = self._OTHER_H_SECTION
				660	elif header_type == _POSSIBLE_MY_HEADER:
				661	if self._section <= self._MY_H_SECTION:
				662	self._section = self._MY_H_SECTION
				663	else:
				664	# This will always be the fallback because we're not sure
				665	# enough that the header is associated with this file.
				666	self._section = self._OTHER_H_SECTION
				667	else:
				668	assert header_type == _OTHER_HEADER
				669	self._section = self._OTHER_H_SECTION
				670
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	671	if last_section != self._section:
				672	self._last_header = ''
				673
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	674	return ''
				675
				676
				677	class _CppLintState(object):
				678	"""Maintains module-wide state.."""
				679
				680	def __init__(self):
				681	self.verbose_level = 1 # global setting.
				682	self.error_count = 0 # global count of reported errors
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	683	# filters to apply when emitting error messages
				684	self.filters = _DEFAULT_FILTERS[:]
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	685	self.counting = 'total' # In what way are we counting errors?
				686	self.errors_by_category = {} # string to int dict storing error counts
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	687
				688	# output format:
				689	# "emacs" - format that emacs can parse (default)
				690	# "vs7" - format that Microsoft Visual Studio 7 can parse
				691	self.output_format = 'emacs'
				692
				693	def SetOutputFormat(self, output_format):
				694	"""Sets the output format for errors."""
				695	self.output_format = output_format
				696
				697	def SetVerboseLevel(self, level):
				698	"""Sets the module's verbosity, and returns the previous setting."""
				699	last_verbose_level = self.verbose_level
				700	self.verbose_level = level
				701	return last_verbose_level
				702
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	703	def SetCountingStyle(self, counting_style):
				704	"""Sets the module's counting options."""
				705	self.counting = counting_style
				706
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	707	def SetFilters(self, filters):
				708	"""Sets the error-message filters.
				709
				710	These filters are applied when deciding whether to emit a given
				711	error message.
				712
				713	Args:
				714	filters: A string of comma-separated filters (eg "+whitespace/indent").
				715	Each filter should start with + or -; else we die.
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	716
				717	Raises:
				718	ValueError: The comma-separated filters did not all start with '+' or '-'.
				719	E.g. "-,+whitespace,-whitespace/indent,whitespace/badfilter"
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	720	"""
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	721	# Default filters always have less priority than the flag ones.
				722	self.filters = _DEFAULT_FILTERS[:]
				723	for filt in filters.split(','):
				724	clean_filt = filt.strip()
				725	if clean_filt:
				726	self.filters.append(clean_filt)
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	727	for filt in self.filters:
				728	if not (filt.startswith('+') or filt.startswith('-')):
				729	raise ValueError('Every filter in --filters must start with + or -'
				730	' (%s does not)' % filt)
				731
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	732	def ResetErrorCounts(self):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	733	"""Sets the module's error statistic back to zero."""
				734	self.error_count = 0
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	735	self.errors_by_category = {}
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	736
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	737	def IncrementErrorCount(self, category):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	738	"""Bumps the module's error statistic."""
				739	self.error_count += 1
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	740	if self.counting in ('toplevel', 'detailed'):
				741	if self.counting != 'detailed':
				742	category = category.split('/')[0]
				743	if category not in self.errors_by_category:
				744	self.errors_by_category[category] = 0
				745	self.errors_by_category[category] += 1
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	746
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	747	def PrintErrorCounts(self):
				748	"""Print a summary of errors by category, and the total."""
				749	for category, count in self.errors_by_category.iteritems():
				750	sys.stderr.write('Category \'%s\' errors found: %d\n' %
				751	(category, count))
				752	sys.stderr.write('Total errors found: %d\n' % self.error_count)
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	753
# Module-wide singleton holding the lint state; the accessor helpers that
# follow read and update this instance.
_cpplint_state = _CppLintState()
				755
				756
				757	def _OutputFormat():
				758	"""Gets the module's output format."""
				759	return _cpplint_state.output_format
				760
				761
				762	def _SetOutputFormat(output_format):
				763	"""Sets the module's output format."""
				764	_cpplint_state.SetOutputFormat(output_format)
				765
				766
				767	def _VerboseLevel():
				768	"""Returns the module's verbosity setting."""
				769	return _cpplint_state.verbose_level
				770
				771
				772	def _SetVerboseLevel(level):
				773	"""Sets the module's verbosity, and returns the previous setting."""
				774	return _cpplint_state.SetVerboseLevel(level)
				775
				776
def _SetCountingStyle(level):
  """Stores level as the error-counting style of the module-wide state."""
  _cpplint_state.SetCountingStyle(level)
				780
				781
def _Filters():
  """Returns the list of output filters held by the module-wide state."""
  return _cpplint_state.filters
				785
				786
				787	def _SetFilters(filters):
				788	"""Sets the module's error-message filters.
				789
				790	These filters are applied when deciding whether to emit a given
				791	error message.
				792
				793	Args:
				794	filters: A string of comma-separated filters (eg "whitespace/indent").
				795	Each filter should start with + or -; else we die.
				796	"""
				797	_cpplint_state.SetFilters(filters)
				798
				799
				800	class _FunctionState(object):
				801	"""Tracks current function name and the number of lines in its body."""
				802
				803	_NORMAL_TRIGGER = 250 # for --v=0, 500 for --v=1, etc.
				804	_TEST_TRIGGER = 400 # about 50% more than _NORMAL_TRIGGER.
				805
				806	def __init__(self):
				807	self.in_a_function = False
				808	self.lines_in_function = 0
				809	self.current_function = ''
				810
				811	def Begin(self, function_name):
				812	"""Start analyzing function body.
				813
				814	Args:
				815	function_name: The name of the function being tracked.
				816	"""
				817	self.in_a_function = True
				818	self.lines_in_function = 0
				819	self.current_function = function_name
				820
				821	def Count(self):
				822	"""Count line in current function body."""
				823	if self.in_a_function:
				824	self.lines_in_function += 1
				825
				826	def Check(self, error, filename, linenum):
				827	"""Report if too many lines in function body.
				828
				829	Args:
				830	error: The function to call with any errors found.
				831	filename: The name of the current file.
				832	linenum: The number of the line to check.
				833	"""
				834	if Match(r'T(EST\|est)', self.current_function):
				835	base_trigger = self._TEST_TRIGGER
				836	else:
				837	base_trigger = self._NORMAL_TRIGGER
				838	trigger = base_trigger * 2**_VerboseLevel()
				839
				840	if self.lines_in_function > trigger:
				841	error_level = int(math.log(self.lines_in_function / base_trigger, 2))
				842	# 50 => 0, 100 => 1, 200 => 2, 400 => 3, 800 => 4, 1600 => 5, ...
				843	if error_level > 5:
				844	error_level = 5
				845	error(filename, linenum, 'readability/fn_size', error_level,
				846	'Small and focused functions are preferred:'
				847	' %s has %d non-comment lines'
				848	' (error triggered by exceeding %d lines).' % (
				849	self.current_function, self.lines_in_function, trigger))
				850
				851	def End(self):
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	852	"""Stop analyzing function body."""
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	853	self.in_a_function = False
				854
				855
				856	class _IncludeError(Exception):
				857	"""Indicates a problem with the include order in a file."""
				858	pass
				859
				860
				861	class FileInfo:
				862	"""Provides utility functions for filenames.
				863
				864	FileInfo provides easy access to the components of a file's path
				865	relative to the project root.
				866	"""
				867
				868	def __init__(self, filename):
				869	self._filename = filename
				870
				871	def FullName(self):
				872	"""Make Windows paths like Unix."""
				873	return os.path.abspath(self._filename).replace('\\', '/')
				874
				875	def RepositoryName(self):
				876	"""FullName after removing the local path to the repository.
				877
				878	If we have a real absolute path name here we can try to do something smart:
				879	detecting the root of the checkout and truncating /path/to/checkout from
				880	the name so that we get header guards that don't include things like
				881	"C:\Documents and Settings\..." or "/home/username/..." in them and thus
				882	people on different computers who have checked the source out to different
				883	locations won't see bogus errors.
				884	"""
				885	fullname = self.FullName()
				886
				887	if os.path.exists(fullname):
				888	project_dir = os.path.dirname(fullname)
				889
				890	if os.path.exists(os.path.join(project_dir, ".svn")):
				891	# If there's a .svn file in the current directory, we recursively look
				892	# up the directory tree for the top of the SVN checkout
				893	root_dir = project_dir
				894	one_up_dir = os.path.dirname(root_dir)
				895	while os.path.exists(os.path.join(one_up_dir, ".svn")):
				896	root_dir = os.path.dirname(root_dir)
				897	one_up_dir = os.path.dirname(one_up_dir)
				898
				899	prefix = os.path.commonprefix([root_dir, project_dir])
				900	return fullname[len(prefix) + 1:]
				901
erg@chromium.org	7956a87	2011-11-30 01:44:03 +0000	[diff] [blame]	902	# Not SVN <= 1.6? Try to find a git, hg, or svn top level directory by
				903	# searching up from the current path.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	904	root_dir = os.path.dirname(fullname)
				905	while (root_dir != os.path.dirname(root_dir) and
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	906	not os.path.exists(os.path.join(root_dir, ".git")) and
erg@chromium.org	7956a87	2011-11-30 01:44:03 +0000	[diff] [blame]	907	not os.path.exists(os.path.join(root_dir, ".hg")) and
				908	not os.path.exists(os.path.join(root_dir, ".svn"))):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	909	root_dir = os.path.dirname(root_dir)
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	910
				911	if (os.path.exists(os.path.join(root_dir, ".git")) or
erg@chromium.org	7956a87	2011-11-30 01:44:03 +0000	[diff] [blame]	912	os.path.exists(os.path.join(root_dir, ".hg")) or
				913	os.path.exists(os.path.join(root_dir, ".svn"))):
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	914	prefix = os.path.commonprefix([root_dir, project_dir])
				915	return fullname[len(prefix) + 1:]
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	916
				917	# Don't know what to do; header guard warnings may be wrong...
				918	return fullname
				919
				920	def Split(self):
				921	"""Splits the file into the directory, basename, and extension.
				922
				923	For 'chrome/browser/browser.cc', Split() would
				924	return ('chrome/browser', 'browser', '.cc')
				925
				926	Returns:
				927	A tuple of (directory, basename, extension).
				928	"""
				929
				930	googlename = self.RepositoryName()
				931	project, rest = os.path.split(googlename)
				932	return (project,) + os.path.splitext(rest)
				933
				934	def BaseName(self):
				935	"""File base name - text after the final slash, before the final period."""
				936	return self.Split()[1]
				937
				938	def Extension(self):
				939	"""File extension - text following the final period."""
				940	return self.Split()[2]
				941
				942	def NoExtension(self):
				943	"""File has no source file extension."""
				944	return '/'.join(self.Split()[0:2])
				945
				946	def IsSource(self):
				947	"""File has a source file extension."""
				948	return self.Extension()[1:] in ('c', 'cc', 'cpp', 'cxx')
				949
				950
def _ShouldPrintError(category, confidence, linenum):
  """Decides whether an error of this category should be reported.

  An error is dropped when it is suppressed by a NOLINT comment for that
  line, when its confidence is below the current verbosity level, or when
  the last filter matching its category is a '-' filter.

  Args:
    category: The error category, e.g. "whitespace/indent".
    confidence: The confidence score attached to the error.
    linenum: The number of the line the error was found on.

  Returns:
    True if the error should be printed, False otherwise.
  """
  if IsErrorSuppressedByNolint(category, linenum):
    return False

  if confidence < _cpplint_state.verbose_level:
    return False

  # Later filters override earlier ones, so walk them all and remember the
  # verdict of the last one whose prefix matches the category.
  suppressed = False
  for rule in _Filters():
    sign, prefix = rule[:1], rule[1:]
    if sign not in ('-', '+'):
      assert False  # should have been checked for in SetFilter.
    if category.startswith(prefix):
      suppressed = (sign == '-')

  return not suppressed
				977
				978
				979	def Error(filename, linenum, category, confidence, message):
				980	"""Logs the fact we've found a lint error.
				981
				982	We log where the error was found, and also our confidence in the error,
				983	that is, how certain we are this is a legitimate style regression, and
				984	not a misidentification or a use that's sometimes justified.
				985
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	986	False positives can be suppressed by the use of
				987	"cpplint(category)" comments on the offending line. These are
				988	parsed into _error_suppressions.
				989
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	990	Args:
				991	filename: The name of the file containing the error.
				992	linenum: The number of the line containing the error.
				993	category: A string used to describe the "category" this bug
				994	falls under: "whitespace", say, or "runtime". Categories
				995	may have a hierarchy separated by slashes: "whitespace/indent".
				996	confidence: A number from 1-5 representing a confidence score for
				997	the error, with 5 meaning that we are certain of the problem,
				998	and 1 meaning that it could be a legitimate construct.
				999	message: The error message.
				1000	"""
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	1001	if _ShouldPrintError(category, confidence, linenum):
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	1002	_cpplint_state.IncrementErrorCount(category)
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1003	if _cpplint_state.output_format == 'vs7':
				1004	sys.stderr.write('%s(%s): %s [%s] [%d]\n' % (
				1005	filename, linenum, message, category, confidence))
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	1006	elif _cpplint_state.output_format == 'eclipse':
				1007	sys.stderr.write('%s:%s: warning: %s [%s] [%d]\n' % (
				1008	filename, linenum, message, category, confidence))
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1009	else:
				1010	sys.stderr.write('%s:%s: %s [%s] [%d]\n' % (
				1011	filename, linenum, message, category, confidence))
				1012
				1013
# Matches standard C++ escape sequences per 2.13.2.3 of the C++ standard.
_RE_PATTERN_CLEANSE_LINE_ESCAPES = re.compile(
    r'\\([abfnrtv?"\\\']|\d+|x[0-9a-fA-F]+)')
# Match a single C style comment on the same line.
_RE_PATTERN_C_COMMENTS = r'/\*(?:[^*]|\*(?!/))*\*/'
# Matches multi-line C style comments.
# This RE is a little bit more complicated than one might expect, because we
# also have to take care of removing the surrounding spaces, so that comments
# inside statements are handled better.
# The current rule is: We only clear spaces from both sides when we're at the
# end of the line. Otherwise, we try to remove spaces from the right side,
# if this doesn't work we try on left side but only if there's a non-character
# on the right.
_RE_PATTERN_CLEANSE_LINE_C_COMMENTS = re.compile(
    r'(\s*' + _RE_PATTERN_C_COMMENTS + r'\s*$|' +
    _RE_PATTERN_C_COMMENTS + r'\s+|' +
    r'\s+' + _RE_PATTERN_C_COMMENTS + r'(?=\W)|' +
    _RE_PATTERN_C_COMMENTS + r')')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1032
				1033
				1034	def IsCppString(line):
				1035	"""Does line terminate so, that the next symbol is in string constant.
				1036
				1037	This function does not consider single-line nor multi-line comments.
				1038
				1039	Args:
				1040	line: is a partial line of code starting from the 0..n.
				1041
				1042	Returns:
				1043	True, if next character appended to 'line' is inside a
				1044	string constant.
				1045	"""
				1046
				1047	line = line.replace(r'\\', 'XX') # after this, \\" does not match to \"
				1048	return ((line.count('"') - line.count(r'\"') - line.count("'\"'")) & 1) == 1
				1049
				1050
def CleanseRawStrings(raw_lines):
  """Removes C++11 raw strings from lines.

    Before:
      static const char kData[] = R"(
          multi-line string
          )";

    After:
      static const char kData[] = ""
      ""
          "";

  Every line that lies entirely inside a raw string is replaced by an empty
  string literal rather than a blank line, and the closing line keeps its
  leading whitespace.

  Args:
    raw_lines: list of raw lines.

  Returns:
    list of lines with C++11 raw strings replaced by empty strings.
  """

  delimiter = None
  lines_without_raw_strings = []
  for line in raw_lines:
    if delimiter:
      # Inside a raw string, look for the end
      end = line.find(delimiter)
      if end >= 0:
        # Found the end of the string, match leading space for this
        # line and resume copying the original lines, and also insert
        # a "" on the last line.
        leading_space = Match(r'^(\s*)\S', line)
        line = leading_space.group(1) + '""' + line[end + len(delimiter):]
        delimiter = None
      else:
        # Haven't found the end yet, append an empty string literal.
        line = '""'

    # Look for beginning of a raw string, and replace them with
    # empty strings.  This is done in a loop to handle multiple raw
    # strings on the same line.
    while delimiter is None:
      # Look for beginning of a raw string.
      # See 2.14.15 [lex.string] for syntax.
      # Groups: text before the literal, the optional user delimiter, and
      # everything after the opening parenthesis.
      matched = Match(r'^(.*)\b(?:R|u8R|uR|UR|LR)"([^\s\\()]*)\((.*)$', line)
      if matched:
        delimiter = ')' + matched.group(2) + '"'

        end = matched.group(3).find(delimiter)
        if end >= 0:
          # Raw string ended on same line
          line = (matched.group(1) + '""' +
                  matched.group(3)[end + len(delimiter):])
          delimiter = None
        else:
          # Start of a multi-line raw string
          line = matched.group(1) + '""'
      else:
        break

    lines_without_raw_strings.append(line)

  # TODO(unknown): if delimiter is not None here, we might want to
  # emit a warning for unterminated string.
  return lines_without_raw_strings
				1115
				1116
def FindNextMultiLineCommentStart(lines, lineix):
  """Returns the index of the next line opening a multi-line comment.

  Args:
    lines: The list of lines to scan.
    lineix: The index at which scanning starts.

  Returns:
    The index of the first line at or after lineix that starts with '/*'
    (ignoring surrounding whitespace) and does not close the comment on the
    same line, or len(lines) if there is none.
  """
  for index in range(lineix, len(lines)):
    stripped = lines[index].strip()
    # A comment closed on its own line is not a multi-line comment.
    if stripped.startswith('/*') and '*/' not in stripped[2:]:
      return index
  return len(lines)
				1126
				1127
				1128	def FindNextMultiLineCommentEnd(lines, lineix):
				1129	"""We are inside a comment, find the end marker."""
				1130	while lineix < len(lines):
				1131	if lines[lineix].strip().endswith('*/'):
				1132	return lineix
				1133	lineix += 1
				1134	return len(lines)
				1135
				1136
				1137	def RemoveMultiLineCommentsFromRange(lines, begin, end):
				1138	"""Clears a range of lines for multi-line comments."""
				1139	# Having // dummy comments makes the lines non-empty, so we will not get
				1140	# unnecessary blank line warnings later in the code.
				1141	for i in range(begin, end):
				1142	lines[i] = '// dummy'
				1143
				1144
				1145	def RemoveMultiLineComments(filename, lines, error):
				1146	"""Removes multiline (c-style) comments from lines."""
				1147	lineix = 0
				1148	while lineix < len(lines):
				1149	lineix_begin = FindNextMultiLineCommentStart(lines, lineix)
				1150	if lineix_begin >= len(lines):
				1151	return
				1152	lineix_end = FindNextMultiLineCommentEnd(lines, lineix_begin)
				1153	if lineix_end >= len(lines):
				1154	error(filename, lineix_begin + 1, 'readability/multiline_comment', 5,
				1155	'Could not find end of multi-line comment')
				1156	return
				1157	RemoveMultiLineCommentsFromRange(lines, lineix_begin, lineix_end + 1)
				1158	lineix = lineix_end + 1
				1159
				1160
				1161	def CleanseComments(line):
				1162	"""Removes //-comments and single-line C-style /* */ comments.
				1163
				1164	Args:
				1165	line: A line of C++ source.
				1166
				1167	Returns:
				1168	The line with single-line comments removed.
				1169	"""
				1170	commentpos = line.find('//')
				1171	if commentpos != -1 and not IsCppString(line[:commentpos]):
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	1172	line = line[:commentpos].rstrip()
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1173	# get rid of /* ... */
				1174	return _RE_PATTERN_CLEANSE_LINE_C_COMMENTS.sub('', line)
				1175
				1176
class CleansedLines(object):
  """Holds 4 copies of all lines with different preprocessing applied to them.

  1) elided member contains lines without strings and comments.
  2) lines member contains lines without comments.
  3) raw_lines member contains all the lines without processing.
  4) lines_without_raw_strings member is same as raw_lines, but with C++11 raw
     strings removed.
  All these members are lists, and of the same length.
  """

  def __init__(self, lines):
    self.elided = []
    self.lines = []
    self.raw_lines = lines
    self.num_lines = len(lines)
    self.lines_without_raw_strings = CleanseRawStrings(lines)
    for line in self.lines_without_raw_strings:
      self.lines.append(CleanseComments(line))
      self.elided.append(CleanseComments(self._CollapseStrings(line)))

  def NumLines(self):
    """Returns the number of lines represented."""
    return self.num_lines

  @staticmethod
  def _CollapseStrings(elided):
    """Collapses strings and chars on a line to simple "" or '' blocks.

    We nix strings first so we're not fooled by text like '"http://"'

    Args:
      elided: The line being processed.

    Returns:
      The line with collapsed strings.
    """
    # Lines matching the include pattern are returned untouched.
    if _RE_PATTERN_INCLUDE.match(elided):
      return elided

    # Remove escaped characters first to make quote/single quote collapsing
    # basic.  Things that look like escaped characters shouldn't occur
    # outside of strings and chars.
    elided = _RE_PATTERN_CLEANSE_LINE_ESCAPES.sub('', elided)

    # Replace quoted strings and digit separators.  Both single quotes
    # and double quotes are processed in the same loop, otherwise
    # nested quotes wouldn't work.
    collapsed = ''
    while True:
      # Find the first quote character
      match = Match(r'^([^\'"]*)([\'"])(.*)$', elided)
      if not match:
        collapsed += elided
        break
      head, quote, tail = match.groups()

      if quote == '"':
        # Collapse double quoted strings
        second_quote = tail.find('"')
        if second_quote >= 0:
          collapsed += head + '""'
          elided = tail[second_quote + 1:]
        else:
          # Unmatched double quote, don't bother processing the rest
          # of the line since this is probably a multiline string.
          collapsed += elided
          break
      else:
        # Found single quote, check nearby text to eliminate digit separators.
        #
        # There is no special handling for floating point here, because
        # the integer/fractional/exponent parts would all be parsed
        # correctly as long as there are digits on both sides of the
        # separator.  So we are fine as long as we don't see something
        # like "0.'3" (gcc 4.9.0 will not allow this literal).
        if Search(r'\b(?:0[bBxX]?|[1-9])[0-9a-fA-F]*$', head):
          # The group is starred, so this always matches (possibly empty).
          match_literal = Match(r'^((?:\'?[0-9a-zA-Z_])*)(.*)$', "'" + tail)
          collapsed += head + match_literal.group(1).replace("'", '')
          elided = match_literal.group(2)
        else:
          second_quote = tail.find('\'')
          if second_quote >= 0:
            collapsed += head + "''"
            elided = tail[second_quote + 1:]
          else:
            # Unmatched single quote
            collapsed += elided
            break

    return collapsed
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1268
				1269
def FindEndOfExpressionInLine(line, startpos, stack):
  """Find the position just after the end of current parenthesized expression.

  Args:
    line: a CleansedLines line.
    startpos: start searching at this position.
    stack: nesting stack at startpos. The list is modified in place.

  Returns:
    On finding matching end: (index just after matching end, None)
    On finding an unclosed expression: (-1, None)
    Otherwise: (-1, new stack at end of this line)
  """
  # range() rather than xrange() so this runs on Python 2 and Python 3.
  for i in range(startpos, len(line)):
    char = line[i]
    if char in '([{':
      # Found start of parenthesized expression, push to expression stack
      stack.append(char)
    elif char == '<':
      # Found potential start of template argument list
      if i > 0 and line[i - 1] == '<':
        # Left shift operator
        if stack and stack[-1] == '<':
          stack.pop()
          if not stack:
            return (-1, None)
      elif i > 0 and Search(r'\boperator\s*$', line[0:i]):
        # operator<, don't add to stack
        continue
      else:
        # Tentative start of template argument list
        stack.append('<')
    elif char in ')]}':
      # Found end of parenthesized expression.
      #
      # If we are currently expecting a matching '>', the pending '<'
      # must have been an operator.  Remove them from expression stack.
      while stack and stack[-1] == '<':
        stack.pop()
      if not stack:
        return (-1, None)
      if ((stack[-1] == '(' and char == ')') or
          (stack[-1] == '[' and char == ']') or
          (stack[-1] == '{' and char == '}')):
        stack.pop()
        if not stack:
          return (i + 1, None)
      else:
        # Mismatched parentheses
        return (-1, None)
    elif char == '>':
      # Found potential end of template argument list.

      # Ignore "->" and operator functions
      if (i > 0 and
          (line[i - 1] == '-' or Search(r'\boperator\s*$', line[0:i - 1]))):
        continue

      # Pop the stack if there is a matching '<'.  Otherwise, ignore
      # this '>' since it must be an operator.
      if stack:
        if stack[-1] == '<':
          stack.pop()
          if not stack:
            return (i + 1, None)
    elif char == ';':
      # Found something that look like end of statements.  If we are currently
      # expecting a '>', the matching '<' must have been an operator, since
      # template argument list should not contain statements.
      while stack and stack[-1] == '<':
        stack.pop()
      if not stack:
        return (-1, None)

  # Did not find end of expression or unbalanced parentheses on this line
  return (-1, stack)
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	1346
				1347
def CloseExpression(clean_lines, linenum, pos):
  """Locates the position closing the ( or { or [ or < found at the input.

  When clean_lines.elided[linenum][pos] is a '(' or '{' or '[' or '<', the
  following lines are scanned for the linenum/pos that closes the expression.

  TODO(unknown): cpplint spends a fair bit of time matching parentheses.
  Ideally we would want to index all opening and closing parentheses once
  and have CloseExpression be just a simple lookup, but due to preprocessor
  tricks, this is not so easy.

  Args:
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    pos: A position on the line.

  Returns:
    A tuple (line, linenum, pos) pointer *past* the closing brace, or
    (line, len(lines), -1) if we never find a close.  Note we ignore
    strings and comments when matching; and the line we return is the
    'cleansed' line at linenum.
  """
  line = clean_lines.elided[linenum]

  # Only an opening bracket that is not part of '<<' or '<=' can be closed.
  is_opener = line[pos] in '({[<' and not Match(r'<[<=]', line[pos:])
  if not is_opener:
    return (line, clean_lines.NumLines(), -1)

  # Scan the first line from pos, every following line from its beginning.
  scan_from = pos
  pending = []
  while True:
    end_pos, pending = FindEndOfExpressionInLine(line, scan_from, pending)
    if end_pos > -1:
      return (line, linenum, end_pos)
    if not pending or linenum >= clean_lines.NumLines() - 1:
      # Nothing left to match, or the end of the file was reached: give up.
      return (line, clean_lines.NumLines(), -1)
    linenum += 1
    line = clean_lines.elided[linenum]
    scan_from = 0
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1390
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	1391
def FindStartOfExpressionInLine(line, endpos, stack):
  """Scans a line right-to-left for the start of the current expression.

  This is almost the reverse of FindEndOfExpressionInLine, but note
  that the input position and returned position differs by 1.

  The stack argument is modified in place while scanning.

  Args:
    line: a CleansedLines line.
    endpos: start searching at this position.
    stack: nesting stack at endpos.

  Returns:
    On finding matching start: (index at matching start, None)
    On finding an unclosed expression: (-1, None)
    Otherwise: (-1, new stack at beginning of this line)
  """
  # Closing character that each opening bracket has to pair with.
  expected_closer = {'(': ')', '[': ']', '{': '}'}

  i = endpos
  while i >= 0:
    char = line[i]
    if char in ')]}':
      # A closer seen while walking backwards opens a nesting level.
      stack.append(char)
    elif char == '>':
      # Possibly the end of a template argument list, unless it is part
      # of "->", ">=" or "operator>".
      is_operator = i > 0 and (
          line[i - 1] == '-' or
          Match(r'\s>=\s', line[i - 1:]) or
          Search(r'\boperator\s*$', line[0:i]))
      if is_operator:
        # Step over the preceding character as well.
        i -= 1
      else:
        stack.append('>')
    elif char == '<':
      if i > 0 and line[i - 1] == '<':
        # Left shift operator: skip both characters.
        i -= 1
      elif stack and stack[-1] == '>':
        # This '<' pairs with a pending '>'.  A '<' with no pending '>'
        # must be an operator and is ignored.
        stack.pop()
        if not stack:
          return (i, None)
    elif char in '([{':
      # Any '>' still pending here cannot be template brackets, so they
      # must have been operators.  Discard them.
      while stack and stack[-1] == '>':
        stack.pop()
      if not stack:
        return (-1, None)
      if stack[-1] != expected_closer[char]:
        # Mismatched parentheses
        return (-1, None)
      stack.pop()
      if not stack:
        return (i, None)
    elif char == ';':
      # Looks like the end of a statement.  A template argument list
      # should not contain statements, so pending '>' entries must have
      # been operators.
      while stack and stack[-1] == '>':
        stack.pop()
      if not stack:
        return (-1, None)

    i -= 1

  return (-1, stack)
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	1467
				1468
				1469	def ReverseCloseExpression(clean_lines, linenum, pos):
				1470	"""If input points to ) or } or ] or >, finds the position that opens it.
				1471
				1472	If lines[linenum][pos] points to a ')' or '}' or ']' or '>', finds the
				1473	linenum/pos that correspond to the opening of the expression.
				1474
				1475	Args:
				1476	clean_lines: A CleansedLines instance containing the file.
				1477	linenum: The number of the line to check.
				1478	pos: A position on the line.
				1479
				1480	Returns:
				1481	A tuple (line, linenum, pos) pointer at the opening brace, or
				1482	(line, 0, -1) if we never find the matching opening brace. Note
				1483	we ignore strings and comments when matching; and the line we
				1484	return is the 'cleansed' line at linenum.
				1485	"""
				1486	line = clean_lines.elided[linenum]
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	1487	if line[pos] not in ')}]>':
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	1488	return (line, 0, -1)
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	1489
				1490	# Check last line
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	1491	(start_pos, stack) = FindStartOfExpressionInLine(line, pos, [])
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	1492	if start_pos > -1:
				1493	return (line, linenum, start_pos)
				1494
				1495	# Continue scanning backward
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	1496	while stack and linenum > 0:
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	1497	linenum -= 1
				1498	line = clean_lines.elided[linenum]
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	1499	(start_pos, stack) = FindStartOfExpressionInLine(line, len(line) - 1, stack)
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	1500	if start_pos > -1:
				1501	return (line, linenum, start_pos)
				1502
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	1503	# Did not find start of expression before beginning of file, give up
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	1504	return (line, 0, -1)
				1505
				1506
def CheckForCopyright(filename, lines, error):
  """Logs an error if no Copyright message appears at the top of the file.

  Args:
    filename: The name of the current file.
    lines: An array of strings, each representing a line of the file.
      Index 0 is a dummy line and is not inspected.
    error: The function to call with any errors found.
  """
  # We'll say it should occur by line 10.  Index 0 is skipped because
  # there's a dummy line at the front.  range() is used rather than
  # xrange() so that the check also runs on Python 3.
  limit = min(len(lines), 11)
  if any(re.search(r'Copyright', lines[i], re.I) for i in range(1, limit)):
    return

  # No copyright line was found in the inspected range.
  error(filename, 0, 'legal/copyright', 5,
        'No copyright message found. '
        'You should have a line: "Copyright [year] <Copyright Owner>"')
				1518
				1519
def GetIndentLevel(line):
  """Counts the space characters that lead up to the first non-blank one.

  Only ' ' characters are counted.  If the pattern does not match (for
  example the line is empty or contains only spaces), the result is zero.

  Args:
    line: A string to check.

  Returns:
    An integer count of leading spaces, possibly zero.
  """
  leading = Match(r'^( *)\S', line)
  return len(leading.group(1)) if leading else 0
				1534
				1535
def GetHeaderGuardCPPVariable(filename):
  """Returns the CPP variable that should be used as a header guard.

  The variable is built from the repository-relative path of the file,
  with '-', '.', '/' and whitespace replaced by '_', upper-cased, and a
  trailing '_' appended.

  Args:
    filename: The name of a C++ header file.

  Returns:
    The CPP variable that should be used as a header guard in the
    named file.
  """

  # Restores original filename in case that cpplint is invoked from Emacs's
  # flymake.
  filename = re.sub(r'_flymake\.h$', '.h', filename)
  filename = re.sub(r'/\.flymake/([^/]*)$', r'/\1', filename)

  fileinfo = FileInfo(filename)
  file_path_from_root = fileinfo.RepositoryName()
  if _root:
    # Strip the root prefix as plain text.  Building a regular expression
    # from it would treat characters such as '.' or '+' in the root as
    # metacharacters, and a backslash path separator would produce an
    # invalid pattern.
    prefix = _root + os.sep
    if file_path_from_root.startswith(prefix):
      file_path_from_root = file_path_from_root[len(prefix):]
  return re.sub(r'[-./\s]', '_', file_path_from_root).upper() + '_'
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1558
				1559
				1560	def CheckForHeaderGuard(filename, lines, error):
				1561	"""Checks that the file contains a header guard.
				1562
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	1563	Logs an error if no #ifndef header guard is present. For other
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1564	headers, checks that the full pathname is used.
				1565
				1566	Args:
				1567	filename: The name of the C++ header file.
				1568	lines: An array of strings, each representing a line of the file.
				1569	error: The function to call with any errors found.
				1570	"""
				1571
				1572	cppvar = GetHeaderGuardCPPVariable(filename)
				1573
				1574	ifndef = None
				1575	ifndef_linenum = 0
				1576	define = None
				1577	endif = None
				1578	endif_linenum = 0
				1579	for linenum, line in enumerate(lines):
				1580	linesplit = line.split()
				1581	if len(linesplit) >= 2:
				1582	# find the first occurrence of #ifndef and #define, save arg
				1583	if not ifndef and linesplit[0] == '#ifndef':
				1584	# set ifndef to the header guard presented on the #ifndef line.
				1585	ifndef = linesplit[1]
				1586	ifndef_linenum = linenum
				1587	if not define and linesplit[0] == '#define':
				1588	define = linesplit[1]
				1589	# find the last occurrence of #endif, save entire line
				1590	if line.startswith('#endif'):
				1591	endif = line
				1592	endif_linenum = linenum
				1593
erg@chromium.org	c452fea	2012-01-26 21:10:45 +0000	[diff] [blame]	1594	if not ifndef:
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1595	error(filename, 0, 'build/header_guard', 5,
				1596	'No #ifndef header guard found, suggested CPP variable is: %s' %
				1597	cppvar)
				1598	return
				1599
erg@chromium.org	c452fea	2012-01-26 21:10:45 +0000	[diff] [blame]	1600	if not define:
				1601	error(filename, 0, 'build/header_guard', 5,
				1602	'No #define header guard found, suggested CPP variable is: %s' %
				1603	cppvar)
				1604	return
				1605
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1606	# The guard should be PATH_FILE_H_, but we also allow PATH_FILE_H__
				1607	# for backward compatibility.
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	1608	if ifndef != cppvar:
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1609	error_level = 0
				1610	if ifndef != cppvar + '_':
				1611	error_level = 5
				1612
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	1613	ParseNolintSuppressions(filename, lines[ifndef_linenum], ifndef_linenum,
				1614	error)
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1615	error(filename, ifndef_linenum, 'build/header_guard', error_level,
				1616	'#ifndef header guard has wrong style, please use: %s' % cppvar)
				1617
erg@chromium.org	c452fea	2012-01-26 21:10:45 +0000	[diff] [blame]	1618	if define != ifndef:
				1619	error(filename, 0, 'build/header_guard', 5,
				1620	'#ifndef and #define don\'t match, suggested CPP variable is: %s' %
				1621	cppvar)
				1622	return
				1623
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	1624	if endif != ('#endif // %s' % cppvar):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1625	error_level = 0
				1626	if endif != ('#endif // %s' % (cppvar + '_')):
				1627	error_level = 5
				1628
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	1629	ParseNolintSuppressions(filename, lines[endif_linenum], endif_linenum,
				1630	error)
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1631	error(filename, endif_linenum, 'build/header_guard', error_level,
				1632	'#endif line should be "#endif // %s"' % cppvar)
				1633
				1634
def CheckForBadCharacters(filename, lines, error):
  """Reports every line that contains a bad character.

  Two kinds of bad characters:

  1. Unicode replacement characters: These indicate that either the file
  contained invalid UTF-8 (likely) or Unicode replacement characters (which
  it shouldn't).  Note that it's possible for this to throw off line
  numbering if the invalid UTF-8 occurred adjacent to a newline.

  2. NUL bytes.  These are problematic for some tools.

  A line containing both kinds is reported twice, once per category.

  Args:
    filename: The name of the current file.
    lines: An array of strings, each representing a line of the file.
    error: The function to call with any errors found.
  """
  replacement_char = u'\ufffd'
  nul_char = '\0'
  for linenum, text in enumerate(lines):
    if replacement_char in text:
      error(filename, linenum, 'readability/utf8', 5,
            'Line contains invalid UTF-8 (or Unicode replacement character).')
    if nul_char in text:
      error(filename, linenum, 'readability/nul', 5, 'Line contains NUL byte.')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1658
				1659
				1660	def CheckForNewlineAtEOF(filename, lines, error):
				1661	"""Logs an error if there is no newline char at the end of the file.
				1662
				1663	Args:
				1664	filename: The name of the current file.
				1665	lines: An array of strings, each representing a line of the file.
				1666	error: The function to call with any errors found.
				1667	"""
				1668
				1669	# The array lines() was created by adding two newlines to the
				1670	# original file (go figure), then splitting on \n.
				1671	# To verify that the file ends in \n, we just have to make sure the
				1672	# last-but-two element of lines() exists and is empty.
				1673	if len(lines) < 3 or lines[-2]:
				1674	error(filename, len(lines) - 2, 'whitespace/ending_newline', 5,
				1675	'Could not find a newline character at the end of the file.')
				1676
				1677
				1678	def CheckForMultilineCommentsAndStrings(filename, clean_lines, linenum, error):
				1679	"""Logs an error if we see /* ... */ or "..." that extend past one line.
				1680
				1681	/* ... */ comments are legit inside macros, for one line.
				1682	Otherwise, we prefer // comments, so it's ok to warn about the
				1683	other. Likewise, it's ok for strings to extend across multiple
				1684	lines, as long as a line continuation character (backslash)
				1685	terminates each line. Although not currently prohibited by the C++
				1686	style guide, it's ugly and unnecessary. We don't do well with either
				1687	in this lint program, so we warn about both.
				1688
				1689	Args:
				1690	filename: The name of the current file.
				1691	clean_lines: A CleansedLines instance containing the file.
				1692	linenum: The number of the line to check.
				1693	error: The function to call with any errors found.
				1694	"""
				1695	line = clean_lines.elided[linenum]
				1696
				1697	# Remove all \\ (escaped backslashes) from the line. They are OK, and the
				1698	# second (escaped) slash may trigger later \" detection erroneously.
				1699	line = line.replace('\\\\', '')
				1700
				1701	if line.count('/') > line.count('/'):
				1702	error(filename, linenum, 'readability/multiline_comment', 5,
				1703	'Complex multi-line /.../-style comment found. '
				1704	'Lint may give bogus warnings. '
				1705	'Consider replacing these with //-style comments, '
				1706	'with #if 0...#endif, '
				1707	'or with more clearly structured multi-line comments.')
				1708
				1709	if (line.count('"') - line.count('\\"')) % 2:
				1710	error(filename, linenum, 'readability/multiline_string', 5,
				1711	'Multi-line string ("...") found. This lint script doesn\'t '
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	1712	'do well with such strings, and may give bogus warnings. '
				1713	'Use C++11 raw strings or concatenation instead.')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1714
				1715
# (non-threadsafe name, thread-safe alternative, validation pattern)
#
# The validation pattern is used to eliminate false positives such as:
#  _rand();               // false positive due to substring match.
#  ->rand();              // some member function rand().
#  ACMRandom rand(seed);  // some variable named rand.
#  ISAACRandom rand();    // another variable named rand.
#
# Basically we require the return value of these functions to be used
# in some expression context on the same line by matching on some
# operator before the function name.  This eliminates constructors and
# member function calls.
#
# The prefix accepts either one operator character followed by optional
# whitespace, or '>' followed by at least one whitespace character (so
# that "->name(" does not match).
_UNSAFE_FUNC_PREFIX = r'(?:[-+*/=%^&|(<]\s*|>\s+)'
_THREADING_LIST = (
    ('asctime(', 'asctime_r(', _UNSAFE_FUNC_PREFIX + r'asctime\([^)]+\)'),
    ('ctime(', 'ctime_r(', _UNSAFE_FUNC_PREFIX + r'ctime\([^)]+\)'),
    ('getgrgid(', 'getgrgid_r(', _UNSAFE_FUNC_PREFIX + r'getgrgid\([^)]+\)'),
    ('getgrnam(', 'getgrnam_r(', _UNSAFE_FUNC_PREFIX + r'getgrnam\([^)]+\)'),
    # getlogin() and rand() are matched with an empty argument list.
    ('getlogin(', 'getlogin_r(', _UNSAFE_FUNC_PREFIX + r'getlogin\(\)'),
    ('getpwnam(', 'getpwnam_r(', _UNSAFE_FUNC_PREFIX + r'getpwnam\([^)]+\)'),
    ('getpwuid(', 'getpwuid_r(', _UNSAFE_FUNC_PREFIX + r'getpwuid\([^)]+\)'),
    ('gmtime(', 'gmtime_r(', _UNSAFE_FUNC_PREFIX + r'gmtime\([^)]+\)'),
    ('localtime(', 'localtime_r(', _UNSAFE_FUNC_PREFIX + r'localtime\([^)]+\)'),
    ('rand(', 'rand_r(', _UNSAFE_FUNC_PREFIX + r'rand\(\)'),
    ('strtok(', 'strtok_r(',
     _UNSAFE_FUNC_PREFIX + r'strtok\([^)]+\)'),
    ('ttyname(', 'ttyname_r(', _UNSAFE_FUNC_PREFIX + r'ttyname\([^)]+\)'),
    )
				1744
				1745
				1746	def CheckPosixThreading(filename, clean_lines, linenum, error):
				1747	"""Checks for calls to thread-unsafe functions.
				1748
				1749	Much code has been originally written without consideration of
				1750	multi-threading. Also, engineers are relying on their old experience;
				1751	they have learned posix before threading extensions were added. These
				1752	tests guide the engineers to use thread-safe functions (when using
				1753	posix directly).
				1754
				1755	Args:
				1756	filename: The name of the current file.
				1757	clean_lines: A CleansedLines instance containing the file.
				1758	linenum: The number of the line to check.
				1759	error: The function to call with any errors found.
				1760	"""
				1761	line = clean_lines.elided[linenum]
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	1762	for single_thread_func, multithread_safe_func, pattern in _THREADING_LIST:
				1763	# Additional pattern matching check to confirm that this is the
				1764	# function we are looking for
				1765	if Search(pattern, line):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1766	error(filename, linenum, 'runtime/threadsafe_fn', 2,
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	1767	'Consider using ' + multithread_safe_func +
				1768	'...) instead of ' + single_thread_func +
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1769	'...) for improved thread safety.')
				1770
				1771
def CheckVlogArguments(filename, clean_lines, linenum, error):
  """Checks that VLOG() is only used for defining a logging level.

  For example, VLOG(2) is correct. VLOG(INFO), VLOG(WARNING), VLOG(ERROR), and
  VLOG(FATAL) are not.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    error: The function to call with any errors found.
  """
  line = clean_lines.elided[linenum]
  # Literal parentheses around an alternation of the symbolic severity
  # names; any of them as the sole VLOG argument is reported.
  if Search(r'\bVLOG\((INFO|ERROR|WARNING|DFATAL|FATAL)\)', line):
    error(filename, linenum, 'runtime/vlog', 5,
          'VLOG() should be used with numeric verbosity level. '
          'Use LOG() if you want symbolic severity levels.')
				1789
# Matches invalid increment: *count++, which moves pointer instead of
# incrementing a value.  The pattern is anchored at the start of the line
# and requires the statement to begin with '*' (after optional
# whitespace) and to end the increment/decrement with ';'.
_RE_PATTERN_INVALID_INCREMENT = re.compile(
    r'^\s*\*\w+(\+\+|--);')


def CheckInvalidIncrement(filename, clean_lines, linenum, error):
  """Checks for invalid increment *count++.

  For example following function:
  void increment_counter(int* count) {
    *count++;
  }
  is invalid, because it effectively does count++, moving pointer, and should
  be replaced with ++*count, (*count)++ or *count += 1.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    error: The function to call with any errors found.
  """
  line = clean_lines.elided[linenum]
  if _RE_PATTERN_INVALID_INCREMENT.match(line):
    error(filename, linenum, 'runtime/invalid_increment', 5,
          'Changing pointer instead of value (or unused value of operator*).')
				1816
				1817
class _BlockInfo(object):
  """Holds the state tracked for a generic block of code."""

  def __init__(self, seen_open_brace):
    """Records the initial state of the block.

    Args:
      seen_open_brace: Stored as-is on the instance as seen_open_brace.
    """
    self.inline_asm = _NO_ASM
    self.open_parentheses = 0
    self.seen_open_brace = seen_open_brace

  def CheckBegin(self, filename, clean_lines, linenum, error):
    """Run checks that applies to text up to the opening brace.

    This is mostly for checking the text after the class identifier
    and the "{", usually where the base class is specified.  For other
    blocks, there isn't much to check, so we always pass.

    Args:
      filename: The name of the current file.
      clean_lines: A CleansedLines instance containing the file.
      linenum: The number of the line to check.
      error: The function to call with any errors found.
    """

  def CheckEnd(self, filename, clean_lines, linenum, error):
    """Run checks that applies to text after the closing brace.

    This is mostly used for checking end of namespace comments.  The
    implementation in this class does nothing.

    Args:
      filename: The name of the current file.
      clean_lines: A CleansedLines instance containing the file.
      linenum: The number of the line to check.
      error: The function to call with any errors found.
    """

  def IsBlockInfo(self):
    """Returns true if this block is a _BlockInfo.

    This is convenient for verifying that an object is an instance of
    a _BlockInfo, but not an instance of any of the derived classes.

    Returns:
      True for this class, False for derived classes.
    """
    return self.__class__ is _BlockInfo
				1864
				1865
				1866	class _ExternCInfo(_BlockInfo):
				1867	"""Stores information about an 'extern "C"' block."""
				1868
				1869	def __init__(self):
				1870	_BlockInfo.__init__(self, True)
				1871
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	1872
				1873	class _ClassInfo(_BlockInfo):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1874	"""Stores information about a class."""
				1875
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	1876	def __init__(self, name, class_or_struct, clean_lines, linenum):
				1877	_BlockInfo.__init__(self, False)
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1878	self.name = name
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	1879	self.starting_linenum = linenum
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1880	self.is_derived = False
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	1881	if class_or_struct == 'struct':
				1882	self.access = 'public'
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	1883	self.is_struct = True
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	1884	else:
				1885	self.access = 'private'
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	1886	self.is_struct = False
				1887
				1888	# Remember initial indentation level for this class. Using raw_lines here
				1889	# instead of elided to account for leading comments.
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	1890	self.class_indent = GetIndentLevel(clean_lines.raw_lines[linenum])
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1891
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	1892	# Try to find the end of the class. This will be confused by things like:
				1893	# class A {
				1894	# } *x = { ...
				1895	#
				1896	# But it's still good enough for CheckSectionSpacing.
				1897	self.last_line = 0
				1898	depth = 0
				1899	for i in range(linenum, clean_lines.NumLines()):
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	1900	line = clean_lines.elided[i]
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	1901	depth += line.count('{') - line.count('}')
				1902	if not depth:
				1903	self.last_line = i
				1904	break
				1905
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	1906	def CheckBegin(self, filename, clean_lines, linenum, error):
				1907	# Look for a bare ':'
				1908	if Search('(^\|[^:]):($\|[^:])', clean_lines.elided[linenum]):
				1909	self.is_derived = True
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1910
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	1911	def CheckEnd(self, filename, clean_lines, linenum, error):
				1912	# Check that closing brace is aligned with beginning of the class.
				1913	# Only do this if the closing brace is indented by only whitespaces.
				1914	# This means we will not check single-line class definitions.
				1915	indent = Match(r'^( *)\}', clean_lines.elided[linenum])
				1916	if indent and len(indent.group(1)) != self.class_indent:
				1917	if self.is_struct:
				1918	parent = 'struct ' + self.name
				1919	else:
				1920	parent = 'class ' + self.name
				1921	error(filename, linenum, 'whitespace/indent', 3,
				1922	'Closing brace should be aligned with beginning of %s' % parent)
				1923
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	1924
class _NamespaceInfo(_BlockInfo):
  """Stores information about a namespace."""

  def __init__(self, name, linenum):
    """Records the namespace name and the line it starts on.

    Args:
      name: The namespace name; a falsy value is stored as '' and the
        namespace is then treated as anonymous by CheckEnd.
      linenum: The number of the line where the namespace starts.
    """
    _BlockInfo.__init__(self, False)
    self.name = name or ''
    self.starting_linenum = linenum

  def CheckEnd(self, filename, clean_lines, linenum, error):
    """Check end of namespace comments.

    Args:
      filename: The name of the current file.
      clean_lines: A CleansedLines instance containing the file.
      linenum: The number of the line holding the closing brace.
      error: The function to call with any errors found.
    """
    # The raw line is used because the terminating comment is what is
    # being inspected.
    line = clean_lines.raw_lines[linenum]

    # Check how many lines is enclosed in this namespace.  Don't issue
    # warning for missing namespace comments if there aren't enough
    # lines.  However, do apply checks if there is already an end of
    # namespace comment and it's incorrect.
    #
    # TODO(unknown): We always want to check end of namespace comments
    # if a namespace is large, but sometimes we also want to apply the
    # check if a short namespace contained nontrivial things (something
    # other than forward declarations).  There is currently no logic on
    # deciding what these nontrivial things are, so this check is
    # triggered by namespace size only, which works most of the time.
    if (linenum - self.starting_linenum < 10
        and not Match(r'};*\s*(//|/\*).*\bnamespace\b', line)):
      return

    # Look for matching comment at end of namespace.
    #
    # Note that we accept C style "/* */" comments for terminating
    # namespaces, so that code that terminate namespaces inside
    # preprocessor macros can be cpplint clean.
    #
    # We also accept stuff like "// end of namespace <name>." with the
    # period at the end.
    #
    # Besides these, we don't accept anything else, otherwise we might
    # get false negatives when existing comment is a substring of the
    # expected namespace.
    if self.name:
      # Named namespace
      if not Match((r'};*\s*(//|/\*).*\bnamespace\s+' + re.escape(self.name) +
                    r'[\*/\.\\\s]*$'),
                   line):
        error(filename, linenum, 'readability/namespace', 5,
              'Namespace should be terminated with "// namespace %s"' %
              self.name)
    else:
      # Anonymous namespace
      if not Match(r'};*\s*(//|/\*).*\bnamespace[\*/\.\\\s]*$', line):
        # If "// namespace anonymous" or "// anonymous namespace (more text)",
        # mention "// anonymous namespace" as an acceptable form
        if Match(r'}.*\b(namespace anonymous|anonymous namespace)\b', line):
          error(filename, linenum, 'readability/namespace', 5,
                'Anonymous namespace should be terminated with "// namespace"'
                ' or "// anonymous namespace"')
        else:
          error(filename, linenum, 'readability/namespace', 5,
                'Anonymous namespace should be terminated with "// namespace"')
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	1984
				1985
				1986	class _PreprocessorInfo(object):
				1987	"""Stores checkpoints of nesting stacks when #if/#else is seen."""
				1988
				1989	def __init__(self, stack_before_if):
				1990	# The entire nesting stack before #if
				1991	self.stack_before_if = stack_before_if
				1992
				1993	# The entire nesting stack up to #else
				1994	self.stack_before_else = []
				1995
				1996	# Whether we have already seen #else or #elif
				1997	self.seen_else = False
				1998
				1999
class NestingState(object):
  """Holds states related to parsing braces."""

  def __init__(self):
    # Stack for tracking all braces.  An object is pushed whenever we
    # see a "{", and popped when we see a "}".  Update() pushes these
    # kinds of objects:
    # - _ClassInfo: a class or struct.
    # - _NamespaceInfo: a namespace.
    # - _ExternCInfo: an 'extern "..."' block.
    # - _BlockInfo: some other type of block.
    self.stack = []

    # Top of the previous stack before each Update().
    #
    # Because the nesting_stack is updated at the end of each line, we
    # had to do some convoluted checks to find out what is the current
    # scope at the beginning of the line.  This check is simplified by
    # saving the previous top of nesting stack.
    #
    # We could save the full stack, but we only need the top.  Copying
    # the full nesting stack would slow down cpplint by ~10%.
    self.previous_stack_top = []

    # Stack of _PreprocessorInfo objects.
    self.pp_stack = []

  def SeenOpenBrace(self):
    """Check if we have seen the opening brace for the innermost block.

    Returns:
      True if we have seen the opening brace, False if the innermost
      block is still expecting an opening brace.
    """
    return (not self.stack) or self.stack[-1].seen_open_brace

  def InNamespaceBody(self):
    """Check if we are currently one level inside a namespace body.

    Returns:
      True if top of the stack is a namespace block, False otherwise.
      (A falsy empty list is returned when the stack is empty.)
    """
    return self.stack and isinstance(self.stack[-1], _NamespaceInfo)

  def InExternC(self):
    """Check if we are currently one level inside an 'extern "C"' block.

    Returns:
      True if top of the stack is an extern block, False otherwise.
      (A falsy empty list is returned when the stack is empty.)
    """
    return self.stack and isinstance(self.stack[-1], _ExternCInfo)

  def InClassDeclaration(self):
    """Check if we are currently one level inside a class or struct declaration.

    Returns:
      True if top of the stack is a class/struct, False otherwise.
      (A falsy empty list is returned when the stack is empty.)
    """
    return self.stack and isinstance(self.stack[-1], _ClassInfo)

  def InAsmBlock(self):
    """Check if we are currently one level inside an inline ASM block.

    Returns:
      True if the top of the stack is a block containing inline ASM.
      (A falsy empty list is returned when the stack is empty.)
    """
    return self.stack and self.stack[-1].inline_asm != _NO_ASM

  def InTemplateArgumentList(self, clean_lines, linenum, pos):
    """Check if current position is inside template argument list.

    Args:
      clean_lines: A CleansedLines instance containing the file.
      linenum: The number of the line to check.
      pos: position just after the suspected template argument.
    Returns:
      True if (linenum, pos) is inside template arguments.
    """
    while linenum < clean_lines.NumLines():
      # Find the earliest character that might indicate a template argument
      line = clean_lines.elided[linenum]
      match = Match(r'^[^{};=\[\]\.<>]*(.)', line[pos:])
      if not match:
        # Nothing interesting on the rest of this line, try the next one.
        linenum += 1
        pos = 0
        continue
      token = match.group(1)
      pos += len(match.group(0))

      # These things do not look like template argument list:
      #   class Suspect {
      #   class Suspect x; }
      if token in ('{', '}', ';'): return False

      # These things look like template argument list:
      #   template <class Suspect>
      #   template <class Suspect = default_value>
      #   template <class Suspect[]>
      #   template <class Suspect...>
      if token in ('>', '=', '[', ']', '.'): return True

      # Check if token is an unmatched '<'.
      # If not, move on to the next character.
      if token != '<':
        pos += 1
        if pos >= len(line):
          linenum += 1
          pos = 0
        continue

      # We can't be sure if we just find a single '<', and need to
      # find the matching '>'.
      (_, end_line, end_pos) = CloseExpression(clean_lines, linenum, pos - 1)
      if end_pos < 0:
        # Not sure if template argument list or syntax error in file
        return False
      linenum = end_line
      pos = end_pos
    return False

  def UpdatePreprocessor(self, line):
    """Update preprocessor stack.

    We need to handle preprocessors due to classes like this:
      #ifdef SWIG
      struct ResultDetailsPageElementExtensionPoint {
      #else
      struct ResultDetailsPageElementExtensionPoint : public Extension {
      #endif

    We make the following assumptions (good enough for most files):
    - Preprocessor condition evaluates to true from #if up to first
      #else/#elif/#endif.

    - Preprocessor condition evaluates to false from #else/#elif up
      to #endif.  We still perform lint checks on these lines, but
      these do not affect nesting stack.

    Args:
      line: current line to check.
    """
    if Match(r'^\s*#\s*(if|ifdef|ifndef)\b', line):
      # Beginning of #if block, save the nesting stack here.  The saved
      # stack will allow us to restore the parsing state in the #else case.
      self.pp_stack.append(_PreprocessorInfo(copy.deepcopy(self.stack)))
    elif Match(r'^\s*#\s*(else|elif)\b', line):
      # Beginning of #else block
      if self.pp_stack:
        if not self.pp_stack[-1].seen_else:
          # This is the first #else or #elif block.  Remember the
          # whole nesting stack up to this point.  This is what we
          # keep after the #endif.
          self.pp_stack[-1].seen_else = True
          self.pp_stack[-1].stack_before_else = copy.deepcopy(self.stack)

        # Restore the stack to how it was before the #if
        self.stack = copy.deepcopy(self.pp_stack[-1].stack_before_if)
      else:
        # TODO(unknown): unexpected #else, issue warning?
        pass
    elif Match(r'^\s*#\s*endif\b', line):
      # End of #if or #else blocks.
      if self.pp_stack:
        # If we saw an #else, we will need to restore the nesting
        # stack to its former state before the #else, otherwise we
        # will just continue from where we left off.
        if self.pp_stack[-1].seen_else:
          # Here we can just use a shallow copy since we are the last
          # reference to it.
          self.stack = self.pp_stack[-1].stack_before_else
        # Drop the corresponding #if
        self.pp_stack.pop()
      else:
        # TODO(unknown): unexpected #endif, issue warning?
        pass

  # TODO(unknown): Update() is too long, but we will refactor later.
  def Update(self, filename, clean_lines, linenum, error):
    """Update nesting state with current line.

    Args:
      filename: The name of the current file.
      clean_lines: A CleansedLines instance containing the file.
      linenum: The number of the line to check.
      error: The function to call with any errors found.
    """
    line = clean_lines.elided[linenum]

    # Remember top of the previous nesting stack.
    #
    # The stack is always pushed/popped and not modified in place, so
    # we can just do a shallow copy instead of copy.deepcopy.  Using
    # deepcopy would slow down cpplint by ~28%.
    if self.stack:
      self.previous_stack_top = self.stack[-1]
    else:
      self.previous_stack_top = None

    # Update pp_stack
    self.UpdatePreprocessor(line)

    # Count parentheses.  This is to avoid adding struct arguments to
    # the nesting stack.
    if self.stack:
      inner_block = self.stack[-1]
      depth_change = line.count('(') - line.count(')')
      inner_block.open_parentheses += depth_change

      # Also check if we are starting or ending an inline assembly block.
      if inner_block.inline_asm in (_NO_ASM, _END_ASM):
        if (depth_change != 0 and
            inner_block.open_parentheses == 1 and
            _MATCH_ASM.match(line)):
          # Enter assembly block
          inner_block.inline_asm = _INSIDE_ASM
        else:
          # Not entering assembly block.  If previous line was _END_ASM,
          # we will now shift to _NO_ASM state.
          inner_block.inline_asm = _NO_ASM
      elif (inner_block.inline_asm == _INSIDE_ASM and
            inner_block.open_parentheses == 0):
        # Exit assembly block
        inner_block.inline_asm = _END_ASM

    # Consume namespace declaration at the beginning of the line.  Do
    # this in a loop so that we catch same line declarations like this:
    #   namespace proto2 { namespace bridge { class MessageSet; } }
    while True:
      # Match start of namespace.  The "\b\s*" below catches namespace
      # declarations even if it weren't followed by a whitespace, this
      # is so that we don't confuse our namespace checker.  The
      # missing spaces will be flagged by CheckSpacing.
      namespace_decl_match = Match(r'^\s*namespace\b\s*([:\w]+)?(.*)$', line)
      if not namespace_decl_match:
        break

      new_namespace = _NamespaceInfo(namespace_decl_match.group(1), linenum)
      self.stack.append(new_namespace)

      line = namespace_decl_match.group(2)
      if line.find('{') != -1:
        new_namespace.seen_open_brace = True
        line = line[line.find('{') + 1:]

    # Look for a class declaration in whatever is left of the line
    # after parsing namespaces.  The regexp accounts for decorated classes
    # such as in:
    #   class LOCKABLE API Object {
    #   };
    class_decl_match = Match(
        r'^(\s*(?:template\s*<[\w\s<>,:]*>\s*)?'
        r'(class|struct)\s+(?:[A-Z_]+\s+)*(\w+(?:::\w+)*))'
        r'(.*)$', line)
    if (class_decl_match and
        (not self.stack or self.stack[-1].open_parentheses == 0)):
      # We do not want to accept classes that are actually template arguments:
      #   template <class Ignore1,
      #             class Ignore2 = Default<Args>,
      #             template <Args> class Ignore3>
      #   void Function() {};
      #
      # To avoid template argument cases, we scan forward and look for
      # an unmatched '>'.  If we see one, assume we are inside a
      # template argument list.
      end_declaration = len(class_decl_match.group(1))
      if not self.InTemplateArgumentList(clean_lines, linenum, end_declaration):
        self.stack.append(_ClassInfo(
            class_decl_match.group(3), class_decl_match.group(2),
            clean_lines, linenum))
        line = class_decl_match.group(4)

    # If we have not yet seen the opening brace for the innermost block,
    # run checks here.
    if not self.SeenOpenBrace():
      self.stack[-1].CheckBegin(filename, clean_lines, linenum, error)

    # Update access control if we are inside a class/struct
    if self.stack and isinstance(self.stack[-1], _ClassInfo):
      classinfo = self.stack[-1]
      access_match = Match(
          r'^(.*)\b(public|private|protected|signals)(\s+(?:slots\s*)?)?'
          r':(?:[^:]|$)',
          line)
      if access_match:
        classinfo.access = access_match.group(2)

        # Check that access keywords are indented +1 space.  Skip this
        # check if the keywords are not preceded by whitespaces.
        indent = access_match.group(1)
        if (len(indent) != classinfo.class_indent + 1 and
            Match(r'^\s*$', indent)):
          if classinfo.is_struct:
            parent = 'struct ' + classinfo.name
          else:
            parent = 'class ' + classinfo.name
          slots = ''
          if access_match.group(3):
            slots = access_match.group(3)
          error(filename, linenum, 'whitespace/indent', 3,
                '%s%s: should be indented +1 space inside %s' % (
                    access_match.group(2), slots, parent))

    # Consume braces or semicolons from what's left of the line
    while True:
      # Match first brace, semicolon, or closed parenthesis.
      matched = Match(r'^[^{;)}]*([{;)}])(.*)$', line)
      if not matched:
        break

      token = matched.group(1)
      if token == '{':
        # If namespace or class hasn't seen a opening brace yet, mark
        # namespace/class head as complete.  Push a new block onto the
        # stack otherwise.
        if not self.SeenOpenBrace():
          self.stack[-1].seen_open_brace = True
        elif Match(r'^extern\s*"[^"]*"\s*\{', line):
          self.stack.append(_ExternCInfo())
        else:
          self.stack.append(_BlockInfo(True))
          if _MATCH_ASM.match(line):
            self.stack[-1].inline_asm = _BLOCK_ASM

      elif token == ';' or token == ')':
        # If we haven't seen an opening brace yet, but we already saw
        # a semicolon, this is probably a forward declaration.  Pop
        # the stack for these.
        #
        # Similarly, if we haven't seen an opening brace yet, but we
        # already saw a closing parenthesis, then these are probably
        # function arguments with extra "class" or "struct" keywords.
        # Also pop these stack for these.
        if not self.SeenOpenBrace():
          self.stack.pop()
      else:  # token == '}'
        # Perform end of block checks and pop the stack.
        if self.stack:
          self.stack[-1].CheckEnd(filename, clean_lines, linenum, error)
          self.stack.pop()
      line = matched.group(2)

  def InnermostClass(self):
    """Get class info on the top of the stack.

    Returns:
      A _ClassInfo object if we are inside a class, or None otherwise.
    """
    # Walk from the innermost block outwards.
    for i in range(len(self.stack), 0, -1):
      classinfo = self.stack[i - 1]
      if isinstance(classinfo, _ClassInfo):
        return classinfo
    return None

  def CheckCompletedBlocks(self, filename, error):
    """Checks that all classes and namespaces have been completely parsed.

    Call this when all lines in a file have been processed.
    Args:
      filename: The name of the current file.
      error: The function to call with any errors found.
    """
    # Note: This test can result in false positives if #ifdef constructs
    # get in the way of brace matching. See the testBuildClass test in
    # cpplint_unittest.py for an example of this.
    for obj in self.stack:
      if isinstance(obj, _ClassInfo):
        error(filename, obj.starting_linenum, 'build/class', 5,
              'Failed to find complete declaration of class %s' %
              obj.name)
      elif isinstance(obj, _NamespaceInfo):
        error(filename, obj.starting_linenum, 'build/namespaces', 5,
              'Failed to find complete declaration of namespace %s' %
              obj.name)
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2372
				2373
				2374	def CheckForNonStandardConstructs(filename, clean_lines, linenum,
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	2375	nesting_state, error):
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	2376	r"""Logs an error if we see certain non-ANSI constructs ignored by gcc-2.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2377
				2378	Complain about several constructs which gcc-2 accepts, but which are
				2379	not standard C++. Warning about these in lint is one way to ease the
				2380	transition to new compilers.
				2381	- put storage class first (e.g. "static const" instead of "const static").
				2382	- "%lld" instead of %qd" in printf-type functions.
				2383	- "%1$d" is non-standard in printf-type functions.
				2384	- "\%" is an undefined character escape sequence.
				2385	- text after #endif is not allowed.
				2386	- invalid inner-style forward declaration.
				2387	- >? and <? operators, and their >?= and <?= cousins.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2388
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	2389	Additionally, check for constructor/destructor style violations and reference
				2390	members, as it is very convenient to do so while checking for
				2391	gcc-2 compliance.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2392
				2393	Args:
				2394	filename: The name of the current file.
				2395	clean_lines: A CleansedLines instance containing the file.
				2396	linenum: The number of the line to check.
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	2397	nesting_state: A NestingState instance which maintains information about
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	2398	the current stack of nested blocks being parsed.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2399	error: A callable to which errors are reported, which takes 4 arguments:
				2400	filename, line number, error level, and message
				2401	"""
				2402
				2403	# Remove comments from the line, but leave in strings for now.
				2404	line = clean_lines.lines[linenum]
				2405
				2406	if Search(r'printf\s\(.".%[-+ ]?\dq', line):
				2407	error(filename, linenum, 'runtime/printf_format', 3,
				2408	'%q in format strings is deprecated. Use %ll instead.')
				2409
				2410	if Search(r'printf\s\(.".*%\d+\$', line):
				2411	error(filename, linenum, 'runtime/printf_format', 2,
				2412	'%N$ formats are unconventional. Try rewriting to avoid them.')
				2413
				2414	# Remove escaped backslashes before looking for undefined escapes.
				2415	line = line.replace('\\\\', '')
				2416
				2417	if Search(r'("\|\').*\\(%\|\[\|\(\|{)', line):
				2418	error(filename, linenum, 'build/printf_format', 3,
				2419	'%, [, (, and { are undefined character escapes. Unescape them.')
				2420
				2421	# For the rest, work with both comments and strings removed.
				2422	line = clean_lines.elided[linenum]
				2423
				2424	if Search(r'\b(const\|volatile\|void\|char\|short\|int\|long'
				2425	r'\|float\|double\|signed\|unsigned'
				2426	r'\|schar\|u?int8\|u?int16\|u?int32\|u?int64)'
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	2427	r'\s+(register\|static\|extern\|typedef)\b',
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2428	line):
				2429	error(filename, linenum, 'build/storage_class', 5,
				2430	'Storage class (static, extern, typedef, etc) should be first.')
				2431
				2432	if Match(r'\s#\sendif\s*[^/\s]+', line):
				2433	error(filename, linenum, 'build/endif_comment', 5,
				2434	'Uncommented text after #endif is non-standard. Use a comment.')
				2435
				2436	if Match(r'\sclass\s+(\w+\s::\s)+\w+\s;', line):
				2437	error(filename, linenum, 'build/forward_decl', 5,
				2438	'Inner-style forward declarations are invalid. Remove this line.')
				2439
				2440	if Search(r'(\w+\|[+-]?\d+(\.\d)?)\s(<\|>)\?=?\s(\w+\|[+-]?\d+)(\.\d)?',
				2441	line):
				2442	error(filename, linenum, 'build/deprecated', 3,
				2443	'>? and <? (max and min) operators are non-standard and deprecated.')
				2444
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	2445	if Search(r'^\sconst\sstring\s&\s\w+\s*;', line):
				2446	# TODO(unknown): Could it be expanded safely to arbitrary references,
				2447	# without triggering too many false positives? The first
				2448	# attempt triggered 5 warnings for mostly benign code in the regtest, hence
				2449	# the restriction.
				2450	# Here's the original regexp, for the reference:
				2451	# type_name = r'\w+((\s::\s\w+)\|(\s<\s\w+?\s*>))?'
				2452	# r'\sconst\s' + type_name + '\s&\s\w+\s*;'
				2453	error(filename, linenum, 'runtime/member_string_references', 2,
				2454	'const string& members are dangerous. It is much better to use '
				2455	'alternatives, such as pointers or simple constants.')
				2456
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	2457	# Everything else in this function operates on class declarations.
				2458	# Return early if the top of the nesting stack is not a class, or if
				2459	# the class head is not completed yet.
				2460	classinfo = nesting_state.InnermostClass()
				2461	if not classinfo or not classinfo.seen_open_brace:
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2462	return
				2463
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2464	# The class may have been declared with namespace or classname qualifiers.
				2465	# The constructor and destructor will not have those qualifiers.
				2466	base_classname = classinfo.name.split('::')[-1]
				2467
				2468	# Look for single-argument constructors that aren't marked explicit.
				2469	# Technically a valid construct, but against style.
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	2470	args = Match(r'\s+(?:inline\s+)?%s\s*$([^,()]+)$'
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2471	% re.escape(base_classname),
				2472	line)
				2473	if (args and
				2474	args.group(1) != 'void' and
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	2475	not Search(r'\bstd::initializer_list\b', args.group(1)) and
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	2476	not Match(r'(const\s+)?%s(\s+const)?\s(?:<\w+>\s)?&'
				2477	% re.escape(base_classname), args.group(1).strip())):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2478	error(filename, linenum, 'runtime/explicit', 5,
				2479	'Single-argument constructors should be marked explicit.')
				2480
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2481
def CheckSpacingForFunctionCall(filename, clean_lines, linenum, error):
  """Checks for the correctness of various spacing around function calls.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    error: The function to call with any errors found.
  """
  line = clean_lines.elided[linenum]

  # Since function calls often occur inside if/for/while/switch
  # expressions - which have their own, more liberal conventions - we
  # first see if we should be looking inside such an expression for a
  # function call, to which we can apply more strict standards.
  fncall = line    # if there's no control flow construct, look at whole line
  for pattern in (r'\bif\s*\((.*)\)\s*{',
                  r'\bfor\s*\((.*)\)\s*{',
                  r'\bwhile\s*\((.*)\)\s*[{;]',
                  r'\bswitch\s*\((.*)\)\s*{'):
    match = Search(pattern, line)
    if match:
      fncall = match.group(1)    # look inside the parens for function calls
      break

  # Except in if/for/while/switch, there should never be space
  # immediately inside parens (eg "f( 3, 4 )").  We make an exception
  # for nested parens ( (a+b) + c ).  Likewise, there should never be
  # a space before a ( when it's a function argument.  I assume it's a
  # function argument when the char before the whitespace is legal in
  # a function name (alnum + _) and we're not starting a macro. Also ignore
  # pointers and references to arrays and functions coz they're too tricky:
  # we use a very simple way to recognize these:
  # " (something)(maybe-something)" or
  # " (something)(maybe-something," or
  # " (something)[something]"
  # Note that we assume the contents of [] to be short enough that
  # they'll never need to wrap.
  if (  # Ignore control structures.
      not Search(r'\b(if|for|while|switch|return|new|delete|catch|sizeof)\b',
                 fncall) and
      # Ignore pointers/references to functions.
      not Search(r' \([^)]+\)\([^)]*(\)|,$)', fncall) and
      # Ignore pointers/references to arrays.
      not Search(r' \([^)]+\)\[[^\]]+\]', fncall)):
    if Search(r'\w\s*\(\s(?!\s*\\$)', fncall):      # a ( used for a fn call
      error(filename, linenum, 'whitespace/parens', 4,
            'Extra space after ( in function call')
    elif Search(r'\(\s+(?!(\s*\\)|\()', fncall):
      error(filename, linenum, 'whitespace/parens', 2,
            'Extra space after (')
    if (Search(r'\w\s+\(', fncall) and
        not Search(r'#\s*define|typedef|using\s+\w+\s*=', fncall) and
        not Search(r'\w\s+\((\w+::)*\*\w+\)\(', fncall)):
      # TODO(unknown): Space after an operator function seem to be a common
      # error, silence those for now by restricting them to highest verbosity.
      if Search(r'\boperator_*\b', line):
        error(filename, linenum, 'whitespace/parens', 0,
              'Extra space before ( in function call')
      else:
        error(filename, linenum, 'whitespace/parens', 4,
              'Extra space before ( in function call')
    # If the ) is followed only by a newline or a { + newline, assume it's
    # part of a control statement (if/while/etc), and don't complain
    if Search(r'[^)]\s+\)\s*[^{\s]', fncall):
      # If the closing parenthesis is preceded by only whitespaces,
      # try to give a more descriptive error message.
      if Search(r'^\s+\)', fncall):
        error(filename, linenum, 'whitespace/parens', 2,
              'Closing ) should be moved to the previous line')
      else:
        error(filename, linenum, 'whitespace/parens', 2,
              'Extra space before )')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2555
				2556
				2557	def IsBlankLine(line):
				2558	"""Returns true if the given line is blank.
				2559
				2560	We consider a line to be blank if the line is empty or consists of
				2561	only white spaces.
				2562
				2563	Args:
				2564	line: A line of a string.
				2565
				2566	Returns:
				2567	True, if the given line is blank.
				2568	"""
				2569	return not line or line.isspace()
				2570
				2571
				2572	def CheckForFunctionLengths(filename, clean_lines, linenum,
				2573	function_state, error):
				2574	"""Reports for long function bodies.
				2575
				2576	For an overview why this is done, see:
				2577	http://google-styleguide.googlecode.com/svn/trunk/cppguide.xml#Write_Short_Functions
				2578
				2579	Uses a simplistic algorithm assuming other style guidelines
				2580	(especially spacing) are followed.
				2581	Only checks unindented functions, so class members are unchecked.
				2582	Trivial bodies are unchecked, so constructors with huge initializer lists
				2583	may be missed.
				2584	Blank/comment lines are not counted so as to avoid encouraging the removal
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	2585	of vertical space and comments just to get through a lint check.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2586	NOLINT on the last line of a function disables this check.
				2587
				2588	Args:
				2589	filename: The name of the current file.
				2590	clean_lines: A CleansedLines instance containing the file.
				2591	linenum: The number of the line to check.
				2592	function_state: Current function name and lines in body so far.
				2593	error: The function to call with any errors found.
				2594	"""
				2595	lines = clean_lines.lines
				2596	line = lines[linenum]
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2597	joined_line = ''
				2598
				2599	starting_func = False
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	2600	regexp = r'(\w(\w\|::\|\\|\&\|\s))\(' # decls * & space::name( ...
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2601	match_result = Match(regexp, line)
				2602	if match_result:
				2603	# If the name is all caps and underscores, figure it's a macro and
				2604	# ignore it, unless it's TEST or TEST_F.
				2605	function_name = match_result.group(1).split()[-1]
				2606	if function_name == 'TEST' or function_name == 'TEST_F' or (
				2607	not Match(r'[A-Z_]+$', function_name)):
				2608	starting_func = True
				2609
				2610	if starting_func:
				2611	body_found = False
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	2612	for start_linenum in xrange(linenum, clean_lines.NumLines()):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2613	start_line = lines[start_linenum]
				2614	joined_line += ' ' + start_line.lstrip()
				2615	if Search(r'(;\|})', start_line): # Declarations and trivial functions
				2616	body_found = True
				2617	break # ... ignore
				2618	elif Search(r'{', start_line):
				2619	body_found = True
				2620	function = Search(r'((\w\|:)*)\(', line).group(1)
				2621	if Match(r'TEST', function): # Handle TEST... macros
				2622	parameter_regexp = Search(r'($.*$)', joined_line)
				2623	if parameter_regexp: # Ignore bad syntax
				2624	function += parameter_regexp.group(1)
				2625	else:
				2626	function += '()'
				2627	function_state.Begin(function)
				2628	break
				2629	if not body_found:
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	2630	# No body for the function (or evidence of a non-function) was found.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2631	error(filename, linenum, 'readability/fn_size', 5,
				2632	'Lint failed to find start of function body.')
				2633	elif Match(r'^\}\s*$', line): # function end
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	2634	function_state.Check(error, filename, linenum)
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2635	function_state.End()
				2636	elif not Match(r'^\s*$', line):
				2637	function_state.Count() # Count non-blank/non-comment lines.
				2638
				2639
				2640	_RE_PATTERN_TODO = re.compile(r'^//(\s*)TODO($.+?$)?:?(\s\|$)?')
				2641
				2642
def CheckComment(line, filename, linenum, next_line_start, error):
  """Checks for common mistakes in comments.

  Reports missing spacing between code and a trailing '//' comment,
  malformed TODO comments, and a missing space right after '//'.

  Args:
    line: The line in question.
    filename: The name of the current file.
    linenum: The number of the line to check.
    next_line_start: The first non-whitespace column of the next line.
    error: The function to call with any errors found.
  """
  commentpos = line.find('//')
  if commentpos != -1:
    # Check if the // may be in quotes.  If so, ignore it
    # Comparisons made explicit for clarity -- pylint: disable=g-explicit-bool-comparison
    if (line.count('"', 0, commentpos) -
        line.count('\\"', 0, commentpos)) % 2 == 0:   # not in quotes
      # Allow one space for new scopes, two spaces otherwise:
      if (not (Match(r'^.*{ *//', line) and next_line_start == commentpos) and
          ((commentpos >= 1 and
            line[commentpos-1] not in string.whitespace) or
           (commentpos >= 2 and
            line[commentpos-2] not in string.whitespace))):
        error(filename, linenum, 'whitespace/comments', 2,
              'At least two spaces is best between code and comments')

      # Checks for common mistakes in TODO comments.
      comment = line[commentpos:]
      match = _RE_PATTERN_TODO.match(comment)
      if match:
        # One whitespace is correct; zero whitespace is handled elsewhere.
        leading_whitespace = match.group(1)
        if len(leading_whitespace) > 1:
          error(filename, linenum, 'whitespace/todo', 2,
                'Too many spaces before TODO')

        username = match.group(2)
        if not username:
          error(filename, linenum, 'readability/todo', 2,
                'Missing username in TODO; it should look like '
                '"// TODO(my_username): Stuff."')

        # group(3) is None when a non-space character directly follows the
        # TODO marker, ' ' or '' (end of comment) when the spacing is fine.
        middle_whitespace = match.group(3)
        # Comparisons made explicit for correctness -- pylint: disable=g-explicit-bool-comparison
        if middle_whitespace != ' ' and middle_whitespace != '':
          error(filename, linenum, 'whitespace/todo', 2,
                'TODO(my_username) should be followed by a space')

      # If the comment contains an alphanumeric character, there
      # should be a space somewhere between it and the //.
      if Match(r'//[^ ]*\w', comment):
        error(filename, linenum, 'whitespace/comments', 4,
              'Should have a space between // and comment')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2695
def CheckAccess(filename, clean_lines, linenum, nesting_state, error):
  """Checks for improper use of DISALLOW* macros.

  Reports a DISALLOW* macro that appears inside a class whose current
  access section is not 'private'.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    nesting_state: A NestingState instance which maintains information about
                   the current stack of nested blocks being parsed.
    error: The function to call with any errors found.
  """
  line = clean_lines.elided[linenum]  # get rid of comments and strings

  matched = Match((r'\s*(DISALLOW_COPY_AND_ASSIGN|'
                   r'DISALLOW_EVIL_CONSTRUCTORS|'
                   r'DISALLOW_IMPLICIT_CONSTRUCTORS)'), line)
  if not matched:
    return
  if nesting_state.stack and isinstance(nesting_state.stack[-1], _ClassInfo):
    if nesting_state.stack[-1].access != 'private':
      error(filename, linenum, 'readability/constructors', 3,
            '%s must be in the private: section' % matched.group(1))

  else:
    # Found DISALLOW* macro outside a class declaration, or perhaps it
    # was used inside a function when it should have been part of the
    # class declaration.  We could issue a warning here, but it
    # probably resulted in a compiler error already.
    pass
				2725
				2726
def CheckSpacing(filename, clean_lines, linenum, nesting_state, error):
  """Checks for the correctness of various spacing issues in the code.

  Things we check for: spaces around operators, spaces after
  if/for/while/switch, no spaces around parens in function calls, two
  spaces between code and comment, don't start a block with a blank
  line, don't end a function with a blank line, don't add a blank line
  after public/protected/private, don't have too many blank lines in a row.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    nesting_state: A NestingState instance which maintains information about
                   the current stack of nested blocks being parsed.
    error: The function to call with any errors found.
  """

  # Don't use "elided" lines here, otherwise we can't check commented lines.
  # Don't want to use "raw" either, because we don't want to check inside C++11
  # raw strings,
  raw = clean_lines.lines_without_raw_strings
  line = raw[linenum]

  # Before nixing comments, check if the line is blank for no good
  # reason.  This includes the first line after a block is opened, and
  # blank lines at the end of a function (ie, right before a line like '}'
  #
  # Skip all the blank line checks if we are immediately inside a
  # namespace body.  In other words, don't issue blank line warnings
  # for this block:
  #   namespace {
  #
  #   }
  #
  # A warning about missing end of namespace comments will be issued instead.
  #
  # Also skip blank line checks for 'extern "C"' blocks, which are formatted
  # like namespaces.
  if (IsBlankLine(line) and
      not nesting_state.InNamespaceBody() and
      not nesting_state.InExternC()):
    elided = clean_lines.elided
    prev_line = elided[linenum - 1]
    prevbrace = prev_line.rfind('{')
    # TODO(unknown): Don't complain if line before blank line, and line after,
    #                both start with alnums and are indented the same amount.
    #                This ignores whitespace at the start of a namespace block
    #                because those are not usually indented.
    if prevbrace != -1 and prev_line[prevbrace:].find('}') == -1:
      # OK, we have a blank line at the start of a code block.  Before we
      # complain, we check if it is an exception to the rule: The previous
      # non-empty line has the parameters of a function header that are indented
      # 4 spaces (because they did not fit in a 80 column line when placed on
      # the same line as the function name).  We also check for the case where
      # the previous line is indented 6 spaces, which may happen when the
      # initializers of a constructor do not fit into a 80 column line.
      exception = False
      if Match(r' {6}\w', prev_line):  # Initializer list?
        # We are looking for the opening column of initializer list, which
        # should be indented 4 spaces to cause 6 space indentation afterwards.
        search_position = linenum-2
        while (search_position >= 0
               and Match(r' {6}\w', elided[search_position])):
          search_position -= 1
        exception = (search_position >= 0
                     and elided[search_position][:5] == '    :')
      else:
        # Search for the function arguments or an initializer list.  We use a
        # simple heuristic here: If the line is indented 4 spaces; and we have a
        # closing paren, without the opening paren, followed by an opening brace
        # or colon (for initializer lists) we assume that it is the last line of
        # a function header.  If we have a colon indented 4 spaces, it is an
        # initializer list.
        exception = (Match(r' {4}\w[^\(]*\)\s*(const\s*)?(\{\s*$|:)',
                           prev_line)
                     or Match(r' {4}:', prev_line))

      if not exception:
        error(filename, linenum, 'whitespace/blank_line', 2,
              'Redundant blank line at the start of a code block '
              'should be deleted.')
    # Ignore blank lines at the end of a block in a long if-else
    # chain, like this:
    #   if (condition1) {
    #     // Something followed by a blank line
    #
    #   } else if (condition2) {
    #     // Something else
    #   }
    if linenum + 1 < clean_lines.NumLines():
      next_line = raw[linenum + 1]
      if (next_line
          and Match(r'\s*}', next_line)
          and next_line.find('} else ') == -1):
        error(filename, linenum, 'whitespace/blank_line', 3,
              'Redundant blank line at the end of a code block '
              'should be deleted.')

    matched = Match(r'\s*(public|protected|private):', prev_line)
    if matched:
      error(filename, linenum, 'whitespace/blank_line', 3,
            'Do not leave a blank line after "%s:"' % matched.group(1))

  # Next, check comments
  next_line_start = 0
  if linenum + 1 < clean_lines.NumLines():
    next_line = raw[linenum + 1]
    # Column of the first non-whitespace character on the next line.
    next_line_start = len(next_line) - len(next_line.lstrip())
  CheckComment(line, filename, linenum, next_line_start, error)

  # get rid of comments and strings
  line = clean_lines.elided[linenum]

  # You shouldn't have spaces before your brackets, except maybe after
  # 'delete []' or 'return []() {};'
  if Search(r'\w\s+\[', line) and not Search(r'(?:delete|return)\s+\[', line):
    error(filename, linenum, 'whitespace/braces', 5,
          'Extra space before [')

  # In range-based for, we wanted spaces before and after the colon, but
  # not around "::" tokens that might appear.
  if (Search(r'for *\(.*[^:]:[^: ]', line) or
      Search(r'for *\(.*[^: ]:[^:]', line)):
    error(filename, linenum, 'whitespace/forcolon', 2,
          'Missing space around colon in range-based for loop')
				2853
				2854
				2855	def CheckOperatorSpacing(filename, clean_lines, linenum, error):
				2856	"""Checks for horizontal spacing around operators.
				2857
				2858	Args:
				2859	filename: The name of the current file.
				2860	clean_lines: A CleansedLines instance containing the file.
				2861	linenum: The number of the line to check.
				2862	error: The function to call with any errors found.
				2863	"""
				2864	line = clean_lines.elided[linenum]
				2865
				2866	# Don't try to do spacing checks for operator methods. Do this by
				2867	# replacing the troublesome characters with something else,
				2868	# preserving column position for all other characters.
				2869	#
				2870	# The replacement is done repeatedly to avoid false positives from
				2871	# operators that call operators.
				2872	while True:
				2873	match = Match(r'^(.\boperator\b)(\S+)(\s\(.*)$', line)
				2874	if match:
				2875	line = match.group(1) + ('_' * len(match.group(2))) + match.group(3)
				2876	else:
				2877	break
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2878
				2879	# We allow no-spaces around = within an if: "if ( (a=Foo()) == 0 )".
				2880	# Otherwise not. Note we only check for non-spaces on both sides;
				2881	# sometimes people put non-spaces on one side when aligning ='s among
				2882	# many lines (not that this is behavior that I approve of...)
				2883	if Search(r'[\w.]=[\w.]', line) and not Search(r'\b(if\|while) ', line):
				2884	error(filename, linenum, 'whitespace/operators', 4,
				2885	'Missing spaces around =')
				2886
				2887	# It's ok not to have spaces around binary operators like + - * /, but if
				2888	# there's too little whitespace, we get concerned. It's hard to tell,
				2889	# though, so we punt on this one for now. TODO.
				2890
				2891	# You should always have whitespace around binary operators.
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	2892	#
				2893	# Check <= and >= first to avoid false positives with < and >, then
				2894	# check non-include lines for spacing around < and >.
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	2895	#
				2896	# If the operator is followed by a comma, assume it's be used in a
				2897	# macro context and don't do any checks. This avoids false
				2898	# positives.
				2899	#
				2900	# Note that && is not included here. Those are checked separately
				2901	# in CheckRValueReference
				2902	match = Search(r'[^<>=!\s](==\|!=\|<=\|>=\|\\|\\|)[^<>=!\s,;\)]', line)
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2903	if match:
				2904	error(filename, linenum, 'whitespace/operators', 3,
				2905	'Missing spaces around %s' % match.group(1))
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	2906	elif not Match(r'#.*include', line):
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	2907	# Look for < that is not surrounded by spaces. This is only
				2908	# triggered if both sides are missing spaces, even though
				2909	# technically should should flag if at least one side is missing a
				2910	# space. This is done to avoid some false positives with shifts.
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	2911	match = Match(r'^(.*[^\s<])<[^\s=<,]', line)
				2912	if match:
				2913	(_, _, end_pos) = CloseExpression(
				2914	clean_lines, linenum, len(match.group(1)))
				2915	if end_pos <= -1:
				2916	error(filename, linenum, 'whitespace/operators', 3,
				2917	'Missing spaces around <')
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	2918
				2919	# Look for > that is not surrounded by spaces. Similar to the
				2920	# above, we only trigger if both sides are missing spaces to avoid
				2921	# false positives with shifts.
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	2922	match = Match(r'^(.*[^-\s>])>[^\s=>,]', line)
				2923	if match:
				2924	(_, _, start_pos) = ReverseCloseExpression(
				2925	clean_lines, linenum, len(match.group(1)))
				2926	if start_pos <= -1:
				2927	error(filename, linenum, 'whitespace/operators', 3,
				2928	'Missing spaces around >')
				2929
				2930	# We allow no-spaces around << when used like this: 10<<20, but
				2931	# not otherwise (particularly, not when used as streams)
				2932	# We also allow operators following an opening parenthesis, since
				2933	# those tend to be macros that deal with operators.
				2934	match = Search(r'(operator\|\S)(?:L\|UL\|ULL\|l\|ul\|ull)?<<([^\s,=])', line)
				2935	if (match and match.group(1) != '(' and
				2936	not (match.group(1).isdigit() and match.group(2).isdigit()) and
				2937	not (match.group(1) == 'operator' and match.group(2) == ';')):
				2938	error(filename, linenum, 'whitespace/operators', 3,
				2939	'Missing spaces around <<')
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	2940
				2941	# We allow no-spaces around >> for almost anything. This is because
				2942	# C++11 allows ">>" to close nested templates, which accounts for
				2943	# most cases when ">>" is not followed by a space.
				2944	#
				2945	# We still warn on ">>" followed by alpha character, because that is
				2946	# likely due to ">>" being used for right shifts, e.g.:
				2947	# value >> alpha
				2948	#
				2949	# When ">>" is used to close templates, the alphanumeric letter that
				2950	# follows would be part of an identifier, and there should still be
				2951	# a space separating the template type and the identifier.
				2952	# type<type<type>> alpha
				2953	match = Search(r'>>[a-zA-Z_]', line)
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2954	if match:
				2955	error(filename, linenum, 'whitespace/operators', 3,
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	2956	'Missing spaces around >>')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2957
				2958	# There shouldn't be space around unary operators
				2959	match = Search(r'(!\s\|~\s\|[\s]--[\s;]\|[\s]\+\+[\s;])', line)
				2960	if match:
				2961	error(filename, linenum, 'whitespace/operators', 4,
				2962	'Extra space for operator %s' % match.group(1))
				2963
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	2964
				2965	def CheckParenthesisSpacing(filename, clean_lines, linenum, error):
				2966	"""Checks for horizontal spacing around parentheses.
				2967
				2968	Args:
				2969	filename: The name of the current file.
				2970	clean_lines: A CleansedLines instance containing the file.
				2971	linenum: The number of the line to check.
				2972	error: The function to call with any errors found.
				2973	"""
				2974	line = clean_lines.elided[linenum]
				2975
				2976	# No spaces after an if, while, switch, or for
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2977	match = Search(r' (if\(\|for\(\|while\(\|switch\()', line)
				2978	if match:
				2979	error(filename, linenum, 'whitespace/parens', 5,
				2980	'Missing space before ( in %s' % match.group(1))
				2981
				2982	# For if/for/while/switch, the left and right parens should be
				2983	# consistent about how many spaces are inside the parens, and
				2984	# there should either be zero or one spaces inside the parens.
				2985	# We don't want: "if ( foo)" or "if ( foo )".
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	2986	# Exception: "for ( ; foo; bar)" and "for (foo; bar; )" are allowed.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2987	match = Search(r'\b(if\|for\|while\|switch)\s*'
				2988	r'$([ ])(.).[^ ]+([ ])$\s{\s*$',
				2989	line)
				2990	if match:
				2991	if len(match.group(2)) != len(match.group(4)):
				2992	if not (match.group(3) == ';' and
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	2993	len(match.group(2)) == 1 + len(match.group(4)) or
				2994	not match.group(2) and Search(r'\bfor\s$.; $', line)):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2995	error(filename, linenum, 'whitespace/parens', 5,
				2996	'Mismatching spaces inside () in %s' % match.group(1))
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	2997	if len(match.group(2)) not in [0, 1]:
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	2998	error(filename, linenum, 'whitespace/parens', 5,
				2999	'Should have zero or one spaces inside ( and ) in %s' %
				3000	match.group(1))
				3001
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	3002
				3003	def CheckCommaSpacing(filename, clean_lines, linenum, error):
				3004	"""Checks for horizontal spacing near commas and semicolons.
				3005
				3006	Args:
				3007	filename: The name of the current file.
				3008	clean_lines: A CleansedLines instance containing the file.
				3009	linenum: The number of the line to check.
				3010	error: The function to call with any errors found.
				3011	"""
				3012	raw = clean_lines.lines_without_raw_strings
				3013	line = clean_lines.elided[linenum]
				3014
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3015	# You should always have a space after a comma (either as fn arg or operator)
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	3016	#
				3017	# This does not apply when the non-space character following the
				3018	# comma is another comma, since the only time when that happens is
				3019	# for empty macro arguments.
				3020	#
				3021	# We run this check in two passes: first pass on elided lines to
				3022	# verify that lines contain missing whitespaces, second pass on raw
				3023	# lines to confirm that those missing whitespaces are not due to
				3024	# elided comments.
				3025	if Search(r',[^,\s]', line) and Search(r',[^,\s]', raw[linenum]):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3026	error(filename, linenum, 'whitespace/comma', 3,
				3027	'Missing space after ,')
				3028
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	3029	# You should always have a space after a semicolon
				3030	# except for few corner cases
				3031	# TODO(unknown): clarify if 'if (1) { return 1;}' is requires one more
				3032	# space after ;
				3033	if Search(r';[^\s};\\)/]', line):
				3034	error(filename, linenum, 'whitespace/semicolon', 3,
				3035	'Missing space after ;')
				3036
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	3037
				3038	def CheckBracesSpacing(filename, clean_lines, linenum, error):
				3039	"""Checks for horizontal spacing near commas.
				3040
				3041	Args:
				3042	filename: The name of the current file.
				3043	clean_lines: A CleansedLines instance containing the file.
				3044	linenum: The number of the line to check.
				3045	error: The function to call with any errors found.
				3046	"""
				3047	line = clean_lines.elided[linenum]
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3048
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	3049	# Except after an opening paren, or after another opening brace (in case of
				3050	# an initializer list, for instance), you should have spaces before your
				3051	# braces. And since you should never have braces at the beginning of a line,
				3052	# this is an easy test.
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	3053	match = Match(r'^(.*[^ ({]){', line)
				3054	if match:
				3055	# Try a bit harder to check for brace initialization. This
				3056	# happens in one of the following forms:
				3057	# Constructor() : initializer_list_{} { ... }
				3058	# Constructor{}.MemberFunction()
				3059	# Type variable{};
				3060	# FunctionCall(type{}, ...);
				3061	# LastArgument(..., type{});
				3062	# LOG(INFO) << type{} << " ...";
				3063	# map_of_type[{...}] = ...;
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	3064	# ternary = expr ? new type{} : nullptr;
				3065	# OuterTemplate<InnerTemplateConstructor<Type>{}>
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	3066	#
				3067	# We check for the character following the closing brace, and
				3068	# silence the warning if it's one of those listed above, i.e.
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	3069	# "{.;,)<>]:".
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	3070	#
				3071	# To account for nested initializer list, we allow any number of
				3072	# closing braces up to "{;,)<". We can't simply silence the
				3073	# warning on first sight of closing brace, because that would
				3074	# cause false negatives for things that are not initializer lists.
				3075	# Silence this: But not this:
				3076	# Outer{ if (...) {
				3077	# Inner{...} if (...){ // Missing space before {
				3078	# }; }
				3079	#
				3080	# There is a false negative with this approach if people inserted
				3081	# spurious semicolons, e.g. "if (cond){};", but we will catch the
				3082	# spurious semicolon with a separate check.
				3083	(endline, endlinenum, endpos) = CloseExpression(
				3084	clean_lines, linenum, len(match.group(1)))
				3085	trailing_text = ''
				3086	if endpos > -1:
				3087	trailing_text = endline[endpos:]
				3088	for offset in xrange(endlinenum + 1,
				3089	min(endlinenum + 3, clean_lines.NumLines() - 1)):
				3090	trailing_text += clean_lines.elided[offset]
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	3091	if not Match(r'^[\s}]*[{.;,)<>\]:]', trailing_text):
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	3092	error(filename, linenum, 'whitespace/braces', 5,
				3093	'Missing space before {')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3094
				3095	# Make sure '} else {' has spaces.
				3096	if Search(r'}else', line):
				3097	error(filename, linenum, 'whitespace/braces', 5,
				3098	'Missing space before else')
				3099
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3100	# You shouldn't have a space before a semicolon at the end of the line.
				3101	# There's a special case for "for" since the style guide allows space before
				3102	# the semicolon there.
				3103	if Search(r':\s;\s$', line):
				3104	error(filename, linenum, 'whitespace/semicolon', 5,
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	3105	'Semicolon defining empty statement. Use {} instead.')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3106	elif Search(r'^\s;\s$', line):
				3107	error(filename, linenum, 'whitespace/semicolon', 5,
				3108	'Line contains only semicolon. If this should be an empty statement, '
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	3109	'use {} instead.')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3110	elif (Search(r'\s+;\s*$', line) and
				3111	not Search(r'\bfor\b', line)):
				3112	error(filename, linenum, 'whitespace/semicolon', 5,
				3113	'Extra space before last semicolon. If this should be an empty '
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	3114	'statement, use {} instead.')
				3115
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	3116
				3117	def IsDecltype(clean_lines, linenum, column):
				3118	"""Check if the token ending on (linenum, column) is decltype().
				3119
				3120	Args:
				3121	clean_lines: A CleansedLines instance containing the file.
				3122	linenum: the number of the line to check.
				3123	column: end column of the token to check.
				3124	Returns:
				3125	True if this token is decltype() expression, False otherwise.
				3126	"""
				3127	(text, _, start_col) = ReverseCloseExpression(clean_lines, linenum, column)
				3128	if start_col < 0:
				3129	return False
				3130	if Search(r'\bdecltype\s*$', text[0:start_col]):
				3131	return True
				3132	return False
				3133
				3134
				3135	def IsTemplateParameterList(clean_lines, linenum, column):
				3136	"""Check if the token ending on (linenum, column) is the end of template<>.
				3137
				3138	Args:
				3139	clean_lines: A CleansedLines instance containing the file.
				3140	linenum: the number of the line to check.
				3141	column: end column of the token to check.
				3142	Returns:
				3143	True if this token is end of a template parameter list, False otherwise.
				3144	"""
				3145	(_, startline, startpos) = ReverseCloseExpression(
				3146	clean_lines, linenum, column)
				3147	if (startpos > -1 and
				3148	Search(r'\btemplate\s*$', clean_lines.elided[startline][0:startpos])):
				3149	return True
				3150	return False
				3151
				3152
				3153	def IsRValueType(clean_lines, nesting_state, linenum, column):
				3154	"""Check if the token ending on (linenum, column) is a type.
				3155
				3156	Assumes that text to the right of the column is "&&" or a function
				3157	name.
				3158
				3159	Args:
				3160	clean_lines: A CleansedLines instance containing the file.
				3161	nesting_state: A NestingState instance which maintains information about
				3162	the current stack of nested blocks being parsed.
				3163	linenum: the number of the line to check.
				3164	column: end column of the token to check.
				3165	Returns:
				3166	True if this token is a type, False if we are not sure.
				3167	"""
				3168	prefix = clean_lines.elided[linenum][0:column]
				3169
				3170	# Get one word to the left. If we failed to do so, this is most
				3171	# likely not a type, since it's unlikely that the type name and "&&"
				3172	# would be split across multiple lines.
				3173	match = Match(r'^(.)(\b\w+\|[>)&])\s*$', prefix)
				3174	if not match:
				3175	return False
				3176
				3177	# Check text following the token. If it's "&&>" or "&&," or "&&...", it's
				3178	# most likely a rvalue reference used inside a template.
				3179	suffix = clean_lines.elided[linenum][column:]
				3180	if Match(r'&&\s*(?:[>,]\|\.\.\.)', suffix):
				3181	return True
				3182
				3183	# Check for simple type and end of templates:
				3184	# int&& variable
				3185	# vector<int>&& variable
				3186	#
				3187	# Because this function is called recursively, we also need to
				3188	# recognize pointer and reference types:
				3189	# int* Function()
				3190	# int& Function()
				3191	if match.group(2) in ['char', 'char16_t', 'char32_t', 'wchar_t', 'bool',
				3192	'short', 'int', 'long', 'signed', 'unsigned',
				3193	'float', 'double', 'void', 'auto', '>', '*', '&']:
				3194	return True
				3195
				3196	# If we see a close parenthesis, look for decltype on the other side.
				3197	# decltype would unambiguously identify a type, anything else is
				3198	# probably a parenthesized expression and not a type.
				3199	if match.group(2) == ')':
				3200	return IsDecltype(
				3201	clean_lines, linenum, len(match.group(1)) + len(match.group(2)) - 1)
				3202
				3203	# Check for casts and cv-qualifiers.
				3204	# match.group(1) remainder
				3205	# -------------- ---------
				3206	# const_cast< type&&
				3207	# const type&&
				3208	# type const&&
				3209	if Search(r'\b(?:const_cast\s<\|static_cast\s<\|dynamic_cast\s*<\|'
				3210	r'reinterpret_cast\s<\|\w+\s)\s$',
				3211	match.group(1)):
				3212	return True
				3213
				3214	# Look for a preceding symbol that might help differentiate the context.
				3215	# These are the cases that would be ambiguous:
				3216	# match.group(1) remainder
				3217	# -------------- ---------
				3218	# Call ( expression &&
				3219	# Declaration ( type&&
				3220	# sizeof ( type&&
				3221	# if ( expression &&
				3222	# while ( expression &&
				3223	# for ( type&&
				3224	# for( ; expression &&
				3225	# statement ; type&&
				3226	# block { type&&
				3227	# constructor { expression &&
				3228	start = linenum
				3229	line = match.group(1)
				3230	match_symbol = None
				3231	while start >= 0:
				3232	# We want to skip over identifiers and commas to get to a symbol.
				3233	# Commas are skipped so that we can find the opening parenthesis
				3234	# for function parameter lists.
				3235	match_symbol = Match(r'^(.)([^\w\s,])[\w\s,]$', line)
				3236	if match_symbol:
				3237	break
				3238	start -= 1
				3239	line = clean_lines.elided[start]
				3240
				3241	if not match_symbol:
				3242	# Probably the first statement in the file is an rvalue reference
				3243	return True
				3244
				3245	if match_symbol.group(2) == '}':
				3246	# Found closing brace, probably an indicate of this:
				3247	# block{} type&&
				3248	return True
				3249
				3250	if match_symbol.group(2) == ';':
				3251	# Found semicolon, probably one of these:
				3252	# for(; expression &&
				3253	# statement; type&&
				3254
				3255	# Look for the previous 'for(' in the previous lines.
				3256	before_text = match_symbol.group(1)
				3257	for i in xrange(start - 1, max(start - 6, 0), -1):
				3258	before_text = clean_lines.elided[i] + before_text
				3259	if Search(r'for\s\([^{};]$', before_text):
				3260	# This is the condition inside a for-loop
				3261	return False
				3262
				3263	# Did not find a for-init-statement before this semicolon, so this
				3264	# is probably a new statement and not a condition.
				3265	return True
				3266
				3267	if match_symbol.group(2) == '{':
				3268	# Found opening brace, probably one of these:
				3269	# block{ type&& = ... ; }
				3270	# constructor{ expression && expression }
				3271
				3272	# Look for a closing brace or a semicolon. If we see a semicolon
				3273	# first, this is probably a rvalue reference.
				3274	line = clean_lines.elided[start][0:len(match_symbol.group(1)) + 1]
				3275	end = start
				3276	depth = 1
				3277	while True:
				3278	for ch in line:
				3279	if ch == ';':
				3280	return True
				3281	elif ch == '{':
				3282	depth += 1
				3283	elif ch == '}':
				3284	depth -= 1
				3285	if depth == 0:
				3286	return False
				3287	end += 1
				3288	if end >= clean_lines.NumLines():
				3289	break
				3290	line = clean_lines.elided[end]
				3291	# Incomplete program?
				3292	return False
				3293
				3294	if match_symbol.group(2) == '(':
				3295	# Opening parenthesis. Need to check what's to the left of the
				3296	# parenthesis. Look back one extra line for additional context.
				3297	before_text = match_symbol.group(1)
				3298	if linenum > 1:
				3299	before_text = clean_lines.elided[linenum - 1] + before_text
				3300	before_text = match_symbol.group(1)
				3301
				3302	# Patterns that are likely to be types:
				3303	# [](type&&
				3304	# for (type&&
				3305	# sizeof(type&&
				3306	# operator=(type&&
				3307	#
				3308	if Search(r'(?:\]\|\bfor\|\bsizeof\|\boperator\s\S+\s)\s*$', before_text):
				3309	return True
				3310
				3311	# Patterns that are likely to be expressions:
				3312	# if (expression &&
				3313	# while (expression &&
				3314	# : initializer(expression &&
				3315	# , initializer(expression &&
				3316	# ( FunctionCall(expression &&
				3317	# + FunctionCall(expression &&
				3318	# + (expression &&
				3319	#
				3320	# The last '+' represents operators such as '+' and '-'.
				3321	if Search(r'(?:\bif\|\bwhile\|[-+=%^(<!?:,&]\s)$', before_text):
				3322	return False
				3323
				3324	# Something else. Check that tokens to the left look like
				3325	# return_type function_name
				3326	match_func = Match(r'^(.)\s+\w(?:\w\|::)(?:<[^<>]>)?\s$',
				3327	match_symbol.group(1))
				3328	if match_func:
				3329	# Check for constructors, which don't have return types.
				3330	if Search(r'\bexplicit$', match_func.group(1)):
				3331	return True
				3332	implicit_constructor = Match(r'\s*(\w+)\((?:const\s+)?(\w+)', prefix)
				3333	if (implicit_constructor and
				3334	implicit_constructor.group(1) == implicit_constructor.group(2)):
				3335	return True
				3336	return IsRValueType(clean_lines, nesting_state, linenum,
				3337	len(match_func.group(1)))
				3338
				3339	# Nothing before the function name. If this is inside a block scope,
				3340	# this is probably a function call.
				3341	return not (nesting_state.previous_stack_top and
				3342	nesting_state.previous_stack_top.IsBlockInfo())
				3343
				3344	if match_symbol.group(2) == '>':
				3345	# Possibly a closing bracket, check that what's on the other side
				3346	# looks like the start of a template.
				3347	return IsTemplateParameterList(
				3348	clean_lines, start, len(match_symbol.group(1)))
				3349
				3350	# Some other symbol, usually something like "a=b&&c". This is most
				3351	# likely not a type.
				3352	return False
				3353
				3354
				3355	def IsRValueAllowed(clean_lines, linenum):
				3356	"""Check if RValue reference is allowed within some range of lines.
				3357
				3358	Args:
				3359	clean_lines: A CleansedLines instance containing the file.
				3360	linenum: The number of the line to check.
				3361	Returns:
				3362	True if line is within the region where RValue references are allowed.
				3363	"""
				3364	for i in xrange(linenum, 0, -1):
				3365	line = clean_lines.elided[i]
				3366	if Match(r'GOOGLE_ALLOW_RVALUE_REFERENCES_(?:PUSH\|POP)', line):
				3367	if not line.endswith('PUSH'):
				3368	return False
				3369	for j in xrange(linenum, clean_lines.NumLines(), 1):
				3370	line = clean_lines.elided[j]
				3371	if Match(r'GOOGLE_ALLOW_RVALUE_REFERENCES_(?:PUSH\|POP)', line):
				3372	return line.endswith('POP')
				3373	return False
				3374
				3375
				3376	def CheckRValueReference(filename, clean_lines, linenum, nesting_state, error):
				3377	"""Check for rvalue references.
				3378
				3379	Args:
				3380	filename: The name of the current file.
				3381	clean_lines: A CleansedLines instance containing the file.
				3382	linenum: The number of the line to check.
				3383	nesting_state: A NestingState instance which maintains information about
				3384	the current stack of nested blocks being parsed.
				3385	error: The function to call with any errors found.
				3386	"""
				3387	# Find lines missing spaces around &&.
				3388	# TODO(unknown): currently we don't check for rvalue references
				3389	# with spaces surrounding the && to avoid false positives with
				3390	# boolean expressions.
				3391	line = clean_lines.elided[linenum]
				3392	match = Match(r'^(.*\S)&&', line)
				3393	if not match:
				3394	match = Match(r'(.*)&&\S', line)
				3395	if (not match) or '(&&)' in line or Search(r'\boperator\s*$', match.group(1)):
				3396	return
				3397
				3398	# Either poorly formed && or an rvalue reference, check the context
				3399	# to get a more accurate error message. Mostly we want to determine
				3400	# if what's to the left of "&&" is a type or not.
				3401	and_pos = len(match.group(1))
				3402	if IsRValueType(clean_lines, nesting_state, linenum, and_pos):
				3403	if not IsRValueAllowed(clean_lines, linenum):
				3404	error(filename, linenum, 'build/c++11', 3,
				3405	'RValue references are an unapproved C++ feature.')
				3406	else:
				3407	error(filename, linenum, 'whitespace/operators', 3,
				3408	'Missing spaces around &&')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3409
				3410
def CheckSectionSpacing(filename, clean_lines, class_info, linenum, error):
  """Checks for additional blank line issues related to sections.

  Currently the only thing checked here is that an access specifier
  (public/protected/private) is preceded by a blank line.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    class_info: A _ClassInfo object.
    linenum: The number of the line to check.
    error: The function to call with any errors found.
  """
  # Skip checks if the class is small, where small means 25 lines or less.
  # 25 lines seems like a good cutoff since that's the usual height of
  # terminals, and any class that can't fit in one screen can't really
  # be considered "small".
  #
  # Also skip checks if we are on the first line.  This accounts for
  # classes that look like
  #   class Foo { public: ... };
  #
  # If we didn't find the end of the class, last_line would be zero,
  # and the check will be skipped by the first condition.
  if (class_info.last_line - class_info.starting_linenum <= 24 or
      linenum <= class_info.starting_linenum):
    return

  matched = Match(r'\s*(public|protected|private):', clean_lines.lines[linenum])
  if not matched:
    return

  # Issue warning if the line before public/protected/private was
  # not a blank line, but don't do this if the previous line contains
  # "class" or "struct".  This can happen two ways:
  #  - We are at the beginning of the class.
  #  - We are forward-declaring an inner class that is semantically
  #    private, but needed to be public for implementation reasons.
  # Also ignores cases where the previous line ends with a backslash as can be
  # common when defining classes in C macros.
  prev_line = clean_lines.lines[linenum - 1]
  if (IsBlankLine(prev_line) or
      Search(r'\b(class|struct)\b', prev_line) or
      Search(r'\\$', prev_line)):
    return

  # Try a bit harder to find the beginning of the class.  This is to
  # account for multi-line base-specifier lists, e.g.:
  #   class Derived
  #       : public Base {
  end_class_head = class_info.starting_linenum
  for i in range(class_info.starting_linenum, linenum):
    if Search(r'\{\s*$', clean_lines.lines[i]):
      end_class_head = i
      break
  # No warning when the specifier directly follows the class head.
  if end_class_head < linenum - 1:
    error(filename, linenum, 'whitespace/blank_line', 3,
          '"%s:" should be preceded by a blank line' % matched.group(1))
				3464
				3465
def GetPreviousNonBlankLine(clean_lines, linenum):
  """Locate the closest non-blank line above the given line.

  Args:
    clean_lines: A CleansedLines instance containing the file contents.
    linenum: The number of the line to check.

  Returns:
    A (text, line number) tuple for the last non-blank line before the
    current line.  When no such line exists (the current line is the first
    non-blank one) the tuple is ('', -1).
  """
  elided = clean_lines.elided
  candidate = linenum - 1
  # Step upwards past every blank line.
  while candidate >= 0 and IsBlankLine(elided[candidate]):
    candidate -= 1
  if candidate < 0:
    return ('', -1)
  return (elided[candidate], candidate)
				3487
				3488
				3489	def CheckBraces(filename, clean_lines, linenum, error):
				3490	"""Looks for misplaced braces (e.g. at the end of line).
				3491
				3492	Args:
				3493	filename: The name of the current file.
				3494	clean_lines: A CleansedLines instance containing the file.
				3495	linenum: The number of the line to check.
				3496	error: The function to call with any errors found.
				3497	"""
				3498
				3499	line = clean_lines.elided[linenum] # get rid of comments and strings
				3500
				3501	if Match(r'\s{\s$', line):
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	3502	# We allow an open brace to start a line in the case where someone is using
				3503	# braces in a block to explicitly create a new scope, which is commonly used
				3504	# to control the lifetime of stack-allocated variables. Braces are also
				3505	# used for brace initializers inside function calls. We don't detect this
				3506	# perfectly: we just don't complain if the last non-whitespace character on
				3507	# the previous non-blank line is ',', ';', ':', '(', '{', or '}', or if the
				3508	# previous line starts a preprocessor block.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3509	prevline = GetPreviousNonBlankLine(clean_lines, linenum)[0]
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	3510	if (not Search(r'[,;:}{(]\s*$', prevline) and
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	3511	not Match(r'\s*#', prevline)):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3512	error(filename, linenum, 'whitespace/braces', 4,
				3513	'{ should almost always be at the end of the previous line')
				3514
				3515	# An else clause should be on the same line as the preceding closing brace.
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	3516	if Match(r'\selse\b\s(?:if\b\|\{\|$)', line):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3517	prevline = GetPreviousNonBlankLine(clean_lines, linenum)[0]
				3518	if Match(r'\s}\s$', prevline):
				3519	error(filename, linenum, 'whitespace/newline', 4,
				3520	'An else should appear on the same line as the preceding }')
				3521
				3522	# If braces come on one side of an else, they should be on both.
				3523	# However, we have to worry about "else if" that spans multiple lines!
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	3524	if Search(r'else if\s*\(', line): # could be multi-line if
				3525	brace_on_left = bool(Search(r'}\selse if\s\(', line))
				3526	# find the ( after the if
				3527	pos = line.find('else if')
				3528	pos = line.find('(', pos)
				3529	if pos > 0:
				3530	(endline, _, endpos) = CloseExpression(clean_lines, linenum, pos)
				3531	brace_on_right = endline[endpos:].find('{') != -1
				3532	if brace_on_left != brace_on_right: # must be brace after if
				3533	error(filename, linenum, 'readability/braces', 5,
				3534	'If an else has a brace on one side, it should have it on both')
				3535	elif Search(r'}\selse[^{]$', line) or Match(r'[^}]else\s{', line):
				3536	error(filename, linenum, 'readability/braces', 5,
				3537	'If an else has a brace on one side, it should have it on both')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3538
				3539	# Likewise, an else should never have the else clause on the same line
				3540	if Search(r'\belse [^\s{]', line) and not Search(r'\belse if\b', line):
				3541	error(filename, linenum, 'whitespace/newline', 4,
				3542	'Else clause should never be on same line as else (use 2 lines)')
				3543
				3544	# In the same way, a do/while should never be on one line
				3545	if Match(r'\s*do [^\s{]', line):
				3546	error(filename, linenum, 'whitespace/newline', 4,
				3547	'do/while clauses should not be on a single line')
				3548
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	3549	# Check single-line if/else bodies. The style guide says 'curly braces are not
				3550	# required for single-line statements'. We additionally allow multi-line,
				3551	# single statements, but we reject anything with more than one semicolon in
				3552	# it. This means that the first semicolon after the if should be at the end of
				3553	# its line, and the line after that should have an indent level equal to or
				3554	# lower than the if. We also check for ambiguous if/else nesting without
				3555	# braces.
				3556	if_else_match = Search(r'\b(if\s*\(\|else\b)', line)
				3557	if if_else_match and not Match(r'\s*#', line):
				3558	if_indent = GetIndentLevel(line)
				3559	endline, endlinenum, endpos = line, linenum, if_else_match.end()
				3560	if_match = Search(r'\bif\s*\(', line)
				3561	if if_match:
				3562	# This could be a multiline if condition, so find the end first.
				3563	pos = if_match.end() - 1
				3564	(endline, endlinenum, endpos) = CloseExpression(clean_lines, linenum, pos)
				3565	# Check for an opening brace, either directly after the if or on the next
				3566	# line. If found, this isn't a single-statement conditional.
				3567	if (not Match(r'\s*{', endline[endpos:])
				3568	and not (Match(r'\s*$', endline[endpos:])
				3569	and endlinenum < (len(clean_lines.elided) - 1)
				3570	and Match(r'\s*{', clean_lines.elided[endlinenum + 1]))):
				3571	while (endlinenum < len(clean_lines.elided)
				3572	and ';' not in clean_lines.elided[endlinenum][endpos:]):
				3573	endlinenum += 1
				3574	endpos = 0
				3575	if endlinenum < len(clean_lines.elided):
				3576	endline = clean_lines.elided[endlinenum]
				3577	# We allow a mix of whitespace and closing braces (e.g. for one-liner
				3578	# methods) and a single \ after the semicolon (for macros)
				3579	endpos = endline.find(';')
				3580	if not Match(r';[\s}]*(\\?)$', endline[endpos:]):
				3581	# Semicolon isn't the last character, there's something trailing
				3582	error(filename, linenum, 'readability/braces', 4,
				3583	'If/else bodies with multiple statements require braces')
				3584	elif endlinenum < len(clean_lines.elided) - 1:
				3585	# Make sure the next line is dedented
				3586	next_line = clean_lines.elided[endlinenum + 1]
				3587	next_indent = GetIndentLevel(next_line)
				3588	# With ambiguous nested if statements, this will error out on the
				3589	# if that doesn't match the else, regardless of whether it's the
				3590	# inner one or outer one.
				3591	if (if_match and Match(r'\s*else\b', next_line)
				3592	and next_indent != if_indent):
				3593	error(filename, linenum, 'readability/braces', 4,
				3594	'Else clause should be indented at the same level as if. '
				3595	'Ambiguous nested if/else chains require braces.')
				3596	elif next_indent > if_indent:
				3597	error(filename, linenum, 'readability/braces', 4,
				3598	'If/else bodies with multiple statements require braces')
				3599
				3600
				3601	def CheckTrailingSemicolon(filename, clean_lines, linenum, error):
				3602	"""Looks for redundant trailing semicolon.
				3603
				3604	Args:
				3605	filename: The name of the current file.
				3606	clean_lines: A CleansedLines instance containing the file.
				3607	linenum: The number of the line to check.
				3608	error: The function to call with any errors found.
				3609	"""
				3610
				3611	line = clean_lines.elided[linenum]
				3612
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	3613	# Block bodies should not be followed by a semicolon. Due to C++11
				3614	# brace initialization, there are more places where semicolons are
				3615	# required than not, so we use a whitelist approach to check these
				3616	# rather than a blacklist. These are the places where "};" should
				3617	# be replaced by just "}":
				3618	# 1. Some flavor of block following closing parenthesis:
				3619	# for (;;) {};
				3620	# while (...) {};
				3621	# switch (...) {};
				3622	# Function(...) {};
				3623	# if (...) {};
				3624	# if (...) else if (...) {};
				3625	#
				3626	# 2. else block:
				3627	# if (...) else {};
				3628	#
				3629	# 3. const member function:
				3630	# Function(...) const {};
				3631	#
				3632	# 4. Block following some statement:
				3633	# x = 42;
				3634	# {};
				3635	#
				3636	# 5. Block at the beginning of a function:
				3637	# Function(...) {
				3638	# {};
				3639	# }
				3640	#
				3641	# Note that naively checking for the preceding "{" will also match
				3642	# braces inside multi-dimensional arrays, but this is fine since
				3643	# that expression will not contain semicolons.
				3644	#
				3645	# 6. Block following another block:
				3646	# while (true) {}
				3647	# {};
				3648	#
				3649	# 7. End of namespaces:
				3650	# namespace {};
				3651	#
				3652	# These semicolons seems far more common than other kinds of
				3653	# redundant semicolons, possibly due to people converting classes
				3654	# to namespaces. For now we do not warn for this case.
				3655	#
				3656	# Try matching case 1 first.
				3657	match = Match(r'^(.\)\s)\{', line)
				3658	if match:
				3659	# Matched closing parenthesis (case 1). Check the token before the
				3660	# matching opening parenthesis, and don't warn if it looks like a
				3661	# macro. This avoids these false positives:
				3662	# - macro that defines a base class
				3663	# - multi-line macro that defines a base class
				3664	# - macro that defines the whole class-head
				3665	#
				3666	# But we still issue warnings for macros that we know are safe to
				3667	# warn, specifically:
				3668	# - TEST, TEST_F, TEST_P, MATCHER, MATCHER_P
				3669	# - TYPED_TEST
				3670	# - INTERFACE_DEF
				3671	# - EXCLUSIVE_LOCKS_REQUIRED, SHARED_LOCKS_REQUIRED, LOCKS_EXCLUDED:
				3672	#
				3673	# We implement a whitelist of safe macros instead of a blacklist of
				3674	# unsafe macros, even though the latter appears less frequently in
				3675	# google code and would have been easier to implement. This is because
				3676	# the downside for getting the whitelist wrong means some extra
				3677	# semicolons, while the downside for getting the blacklist wrong
				3678	# would result in compile errors.
				3679	#
				3680	# In addition to macros, we also don't want to warn on compound
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	3681	# literals and lambdas.
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	3682	closing_brace_pos = match.group(1).rfind(')')
				3683	opening_parenthesis = ReverseCloseExpression(
				3684	clean_lines, linenum, closing_brace_pos)
				3685	if opening_parenthesis[2] > -1:
				3686	line_prefix = opening_parenthesis[0][0:opening_parenthesis[2]]
				3687	macro = Search(r'\b([A-Z_]+)\s*$', line_prefix)
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	3688	func = Match(r'^(.\])\s$', line_prefix)
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	3689	if ((macro and
				3690	macro.group(1) not in (
				3691	'TEST', 'TEST_F', 'MATCHER', 'MATCHER_P', 'TYPED_TEST',
				3692	'EXCLUSIVE_LOCKS_REQUIRED', 'SHARED_LOCKS_REQUIRED',
				3693	'LOCKS_EXCLUDED', 'INTERFACE_DEF')) or
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	3694	(func and not Search(r'\boperator\s\[\s\]', func.group(1))) or
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	3695	Search(r'\s+=\s*$', line_prefix)):
				3696	match = None
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	3697	if (match and
				3698	opening_parenthesis[1] > 1 and
				3699	Search(r'\]\s*$', clean_lines.elided[opening_parenthesis[1] - 1])):
				3700	# Multi-line lambda-expression
				3701	match = None
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	3702
				3703	else:
				3704	# Try matching cases 2-3.
				3705	match = Match(r'^(.(?:else\|\)\sconst)\s*)\{', line)
				3706	if not match:
				3707	# Try matching cases 4-6. These are always matched on separate lines.
				3708	#
				3709	# Note that we can't simply concatenate the previous line to the
				3710	# current line and do a single match, otherwise we may output
				3711	# duplicate warnings for the blank line case:
				3712	# if (cond) {
				3713	# // blank line
				3714	# }
				3715	prevline = GetPreviousNonBlankLine(clean_lines, linenum)[0]
				3716	if prevline and Search(r'[;{}]\s*$', prevline):
				3717	match = Match(r'^(\s*)\{', line)
				3718
				3719	# Check matching closing brace
				3720	if match:
				3721	(endline, endlinenum, endpos) = CloseExpression(
				3722	clean_lines, linenum, len(match.group(1)))
				3723	if endpos > -1 and Match(r'^\s*;', endline[endpos:]):
				3724	# Current {} pair is eligible for semicolon check, and we have found
				3725	# the redundant semicolon, output warning here.
				3726	#
				3727	# Note: because we are scanning forward for opening braces, and
				3728	# outputting warnings for the matching closing brace, if there are
				3729	# nested blocks with trailing semicolons, we will get the error
				3730	# messages in reversed order.
				3731	error(filename, endlinenum, 'readability/braces', 4,
				3732	"You don't need a ; after a }")
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3733
				3734
def CheckEmptyBlockBody(filename, clean_lines, linenum, error):
  """Look for empty loop/conditional body with only a single semicolon.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    error: The function to call with any errors found.
  """

  # Search for loop keywords at the beginning of the line.  Because only
  # whitespaces are allowed before the keywords, this will also ignore most
  # do-while-loops, since those lines should start with closing brace.
  #
  # We also check "if" blocks here, since an empty conditional block
  # is likely an error.
  line = clean_lines.elided[linenum]
  matched = Match(r'\s*(for|while|if)\s*\(', line)
  if not matched:
    return

  # Find the end of the conditional expression
  (end_line, end_linenum, end_pos) = CloseExpression(
      clean_lines, linenum, line.find('('))

  # Output warning if what follows the condition expression is a semicolon.
  # No warning for all other cases, including whitespace or newline, since we
  # have a separate check for semicolons preceded by whitespace.
  if end_pos >= 0 and Match(r';', end_line[end_pos:]):
    if matched.group(1) == 'if':
      error(filename, end_linenum, 'whitespace/empty_conditional_body', 5,
            'Empty conditional bodies should use {}')
    else:
      error(filename, end_linenum, 'whitespace/empty_loop_body', 5,
            'Empty loop bodies should use {} or continue')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3768
				3769
def FindCheckMacro(line):
  """Find a replaceable CHECK-like macro.

  Args:
    line: line to search on.
  Returns:
    (macro name, start position), or (None, -1) if no replaceable
    macro is found.  The start position is the index of the macro's
    opening parenthesis.
  """
  for macro in _CHECK_MACROS:
    # Cheap substring test before running the regular expression.
    if macro not in line:
      continue
    # Find opening parenthesis.  Do a regular expression match here
    # to make sure that we are matching the expected CHECK macro, as
    # opposed to some other macro that happens to contain the CHECK
    # substring.
    matched = Match(r'^(.*\b' + macro + r'\s*)\(', line)
    if matched:
      return (macro, len(matched.group(1)))
  return (None, -1)
				3791
				3792
def CheckCheck(filename, clean_lines, linenum, error):
  """Checks the use of CHECK and EXPECT macros.

  Looks for a CHECK-like macro whose argument is a single relational
  comparison with a constant literal on at least one side, and suggests
  the dedicated comparison macro taken from _CHECK_REPLACEMENT.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    error: The function to call with any errors found.
  """

  # Decide the set of replacement macros that should be suggested
  lines = clean_lines.elided
  (check_macro, start_pos) = FindCheckMacro(lines[linenum])
  if not check_macro:
    return

  # Find end of the boolean expression by matching parentheses
  (last_line, end_line, end_pos) = CloseExpression(
      clean_lines, linenum, start_pos)
  if end_pos < 0:
    return

  # Collect the text between the macro's parentheses.  The "end_pos - 1"
  # slices drop the closing parenthesis -- presumably end_pos is one past
  # it; confirm against CloseExpression.
  if linenum == end_line:
    expression = lines[linenum][start_pos + 1:end_pos - 1]
  else:
    expression = (lines[linenum][start_pos + 1:] +
                  ''.join(lines[linenum + 1:end_line]) +
                  last_line[0:end_pos - 1])

  # Parse expression so that we can take parentheses into account.
  # This avoids false positives for inputs like "CHECK((a < 4) == b)",
  # which is not replaceable by CHECK_LE.
  lhs = ''
  rhs = ''
  operator = None
  while expression:
    matched = Match(r'^\s*(<<|<<=|>>|>>=|->\*|->|&&|\|\||'
                    r'==|!=|>=|>|<=|<|\()(.*)$', expression)
    if matched:
      token = matched.group(1)
      if token == '(':
        # Parenthesized operand
        expression = matched.group(2)
        (end, _) = FindEndOfExpressionInLine(expression, 0, ['('])
        if end < 0:
          return  # Unmatched parenthesis
        lhs += '(' + expression[0:end]
        expression = expression[end:]
      elif token in ('&&', '||'):
        # Logical and/or operators.  This means the expression
        # contains more than one term, for example:
        #   CHECK(42 < a && a < b);
        #
        # These are not replaceable with CHECK_LE, so bail out early.
        return
      elif token in ('<<', '<<=', '>>', '>>=', '->*', '->'):
        # Non-relational operator
        lhs += token
        expression = matched.group(2)
      else:
        # Relational operator
        operator = token
        rhs = matched.group(2)
        break
    else:
      # Unparenthesized operand.  Instead of appending to lhs one character
      # at a time, we do another regular expression match to consume several
      # characters at once if possible.  Trivial benchmark shows that this
      # is more efficient when the operands are longer than a single
      # character, which is generally the case.
      matched = Match(r'^([^-=!<>()&|]+)(.*)$', expression)
      if not matched:
        # Fall back to consuming a single non-space character so the loop
        # always makes progress.
        matched = Match(r'^(\s*\S)(.*)$', expression)
        if not matched:
          break
      lhs += matched.group(1)
      expression = matched.group(2)

  # Only apply checks if we got all parts of the boolean expression
  if not (lhs and operator and rhs):
    return

  # Check that rhs do not contain logical operators.  We already know
  # that lhs is fine since the loop above parses out && and ||.
  if '&&' in rhs or '||' in rhs:
    return

  # At least one of the operands must be a constant literal.  This is
  # to avoid suggesting replacements for unprintable things like
  #   CHECK(variable != iterator)
  #
  # The following pattern matches decimal, hex integers, strings, and
  # characters (in that order).
  lhs = lhs.strip()
  rhs = rhs.strip()
  match_constant = r'^([-+]?(\d+|0[xX][0-9a-fA-F]+)[lLuU]{0,3}|".*"|\'.*\')$'
  if Match(match_constant, lhs) or Match(match_constant, rhs):
    # Note: since we know both lhs and rhs, we can provide a more
    # descriptive error message like:
    #   Consider using CHECK_EQ(x, 42) instead of CHECK(x == 42)
    # Instead of:
    #   Consider using CHECK_EQ instead of CHECK(a == b)
    #
    # We are still keeping the less descriptive message because if lhs
    # or rhs gets long, the error message might become unreadable.
    error(filename, linenum, 'readability/check', 2,
          'Consider using %s instead of %s(a %s b)' % (
              _CHECK_REPLACEMENT[check_macro][operator],
              check_macro, operator))
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	3902
				3903
def CheckAltTokens(filename, clean_lines, linenum, error):
  """Check alternative keywords being used in boolean expressions.

  Reports one 'readability/alt_tokens' error for every match of
  _ALT_TOKEN_REPLACEMENT_PATTERN on the line, naming the operator from
  _ALT_TOKEN_REPLACEMENT that should be used instead.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    error: The function to call with any errors found.
  """
  line = clean_lines.elided[linenum]

  # Avoid preprocessor lines
  if Match(r'^\s*#', line):
    return

  # Last ditch effort to avoid multi-line comments.  This will not help
  # if the comment started before the current line or ended after the
  # current line, but it catches most of the false positives.  At least,
  # it provides a way to workaround this warning for people who use
  # multi-line comments in preprocessor macros.
  #
  # TODO(unknown): remove this once cpplint has better support for
  # multi-line comments.
  if '/*' in line or '*/' in line:
    return

  for match in _ALT_TOKEN_REPLACEMENT_PATTERN.finditer(line):
    error(filename, linenum, 'readability/alt_tokens', 2,
          'Use operator %s instead of %s' % (
              _ALT_TOKEN_REPLACEMENT[match.group(1)], match.group(1)))
				3934
				3935
def GetLineWidth(line):
  """Determines the width of the line in column positions.

  Args:
    line: A string, which may be a Unicode string.

  Returns:
    The width of the line in column positions, accounting for Unicode
    combining characters and wide characters.  Non-Unicode strings are
    measured with len().
  """
  # The name "unicode" only exists on Python 2; on Python 3 every str is
  # already Unicode text, so fall back to str instead of raising NameError.
  try:
    text_type = unicode
  except NameError:
    text_type = str

  if not isinstance(line, text_type):
    return len(line)

  width = 0
  # Normalize first so that base character + combining mark sequences that
  # have a precomposed form are counted as a single character.
  for uc in unicodedata.normalize('NFC', line):
    if unicodedata.east_asian_width(uc) in ('W', 'F'):
      # Wide and fullwidth characters occupy two columns.
      width += 2
    elif not unicodedata.combining(uc):
      # Combining marks that survive normalization take no column.
      width += 1
  return width
				3956
				3957
def CheckStyle(filename, clean_lines, linenum, file_extension, nesting_state,
               error):
  """Checks rules from the 'C++ style rules' section of cppguide.html.

  Most of these rules are hard to test (naming, comment style), but we
  do what we can.  In particular we check for 2-space indents, line lengths,
  tab usage, spaces inside code, etc.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    file_extension: The extension (without the dot) of the filename.
    nesting_state: A NestingState instance which maintains information about
                   the current stack of nested blocks being parsed.
    error: The function to call with any errors found.
  """

  # Don't use "elided" lines here, otherwise we can't check commented lines.
  # Don't want to use "raw" either, because we don't want to check inside C++11
  # raw strings.
  raw_lines = clean_lines.lines_without_raw_strings
  line = raw_lines[linenum]

  if '\t' in line:
    error(filename, linenum, 'whitespace/tab', 1,
          'Tab found; better to use spaces')

  # One or three blank spaces at the beginning of the line is weird; it's
  # hard to reconcile that with 2-space indents.
  # NOTE: here are the conditions rob pike used for his tests.  Mine aren't
  # as sophisticated, but it may be worth becoming so:  RLENGTH==initial_spaces
  # if(RLENGTH > 20) complain = 0;
  # if(match($0, " +(error|private|public|protected):")) complain = 0;
  # if(match(prev, "&& *$")) complain = 0;
  # if(match(prev, "\\|\\| *$")) complain = 0;
  # if(match(prev, "[\",=><] *$")) complain = 0;
  # if(match($0, " <<")) complain = 0;
  # if(match(prev, " +for \\(")) complain = 0;
  # if(prevodd && match(prevprev, " +for \\(")) complain = 0;
  scope_or_label_pattern = r'\s*\w+\s*:\s*\\?$'
  classinfo = nesting_state.InnermostClass()
  cleansed_line = clean_lines.elided[linenum]
  # Number of leading space characters (tabs are deliberately not counted).
  initial_spaces = len(line) - len(line.lstrip(' '))
  if line and line[-1].isspace():
    error(filename, linenum, 'whitespace/end_of_line', 4,
          'Line ends in whitespace. Consider deleting these extra spaces.')
  # There are certain situations we allow one space, notably for
  # section labels, and also lines containing multi-line raw strings.
  elif (initial_spaces in (1, 3) and
        not Match(scope_or_label_pattern, cleansed_line) and
        not (clean_lines.raw_lines[linenum] != line and
             Match(r'^\s*""', line))):
    error(filename, linenum, 'whitespace/indent', 3,
          'Weird number of spaces at line-start. '
          'Are you using a 2-space indent?')

  # Check if the line is a header guard.
  is_header_guard = False
  if file_extension == 'h':
    cppvar = GetHeaderGuardCPPVariable(filename)
    # NOTE(review): the listing this was recovered from collapses runs of
    # spaces; the '#endif // %s' literal may originally have had two spaces
    # before '//' -- confirm against upstream.
    if (line.startswith('#ifndef %s' % cppvar) or
        line.startswith('#define %s' % cppvar) or
        line.startswith('#endif // %s' % cppvar)):
      is_header_guard = True
  # #include lines and header guards can be long, since there's no clean way to
  # split them.
  #
  # URLs can be long too.  It's possible to split these, but it makes them
  # harder to cut&paste.
  #
  # The "$Id:...$" comment may also get very long without it being the
  # developers fault.
  if (not line.startswith('#include') and not is_header_guard and
      not Match(r'^\s*//.*http(s?)://\S*$', line) and
      not Match(r'^// \$Id:.*#[0-9]+ \$$', line)):
    line_width = GetLineWidth(line)
    # Lines up to 25% over the limit get the milder (level 2) warning.
    extended_length = int(_line_length * 1.25)
    if line_width > extended_length:
      error(filename, linenum, 'whitespace/line_length', 4,
            'Lines should very rarely be longer than %i characters' %
            extended_length)
    elif line_width > _line_length:
      error(filename, linenum, 'whitespace/line_length', 2,
            'Lines should be <= %i characters long' % _line_length)

  if (cleansed_line.count(';') > 1 and
      # for loops are allowed two ;'s (and may run over two lines).
      'for' not in cleansed_line and
      ('for' not in GetPreviousNonBlankLine(clean_lines, linenum)[0] or
       ';' in GetPreviousNonBlankLine(clean_lines, linenum)[0]) and
      # It's ok to have many commands in a switch case that fits in 1 line
      not (('case ' in cleansed_line or 'default:' in cleansed_line) and
           'break;' in cleansed_line)):
    error(filename, linenum, 'whitespace/newline', 0,
          'More than one command on the same line')

  # Some more style checks
  CheckBraces(filename, clean_lines, linenum, error)
  CheckTrailingSemicolon(filename, clean_lines, linenum, error)
  CheckEmptyBlockBody(filename, clean_lines, linenum, error)
  CheckAccess(filename, clean_lines, linenum, nesting_state, error)
  CheckSpacing(filename, clean_lines, linenum, nesting_state, error)
  CheckOperatorSpacing(filename, clean_lines, linenum, error)
  CheckParenthesisSpacing(filename, clean_lines, linenum, error)
  CheckCommaSpacing(filename, clean_lines, linenum, error)
  CheckBracesSpacing(filename, clean_lines, linenum, error)
  CheckSpacingForFunctionCall(filename, clean_lines, linenum, error)
  CheckRValueReference(filename, clean_lines, linenum, nesting_state, error)
  CheckCheck(filename, clean_lines, linenum, error)
  CheckAltTokens(filename, clean_lines, linenum, error)
  classinfo = nesting_state.InnermostClass()
  if classinfo:
    CheckSectionSpacing(filename, clean_lines, classinfo, linenum, error)
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4075
				4076
				4077	_RE_PATTERN_INCLUDE_NEW_STYLE = re.compile(r'#include +"[^/]+\.h"')
				4078	_RE_PATTERN_INCLUDE = re.compile(r'^\s#\sinclude\s([<"])([^>"])[>"].*$')
				4079	# Matches the first component of a filename delimited by -s and _s. That is:
				4080	# _RE_FIRST_COMPONENT.match('foo').group(0) == 'foo'
				4081	# _RE_FIRST_COMPONENT.match('foo.cc').group(0) == 'foo'
				4082	# _RE_FIRST_COMPONENT.match('foo-bar_baz.cc').group(0) == 'foo'
				4083	# _RE_FIRST_COMPONENT.match('foo_bar-baz.cc').group(0) == 'foo'
				4084	_RE_FIRST_COMPONENT = re.compile(r'^[^-_.]+')
				4085
				4086
				4087	def _DropCommonSuffixes(filename):
				4088	"""Drops common suffixes like _test.cc or -inl.h from filename.
				4089
				4090	For example:
				4091	>>> _DropCommonSuffixes('foo/foo-inl.h')
				4092	'foo/foo'
				4093	>>> _DropCommonSuffixes('foo/bar/foo.cc')
				4094	'foo/bar/foo'
				4095	>>> _DropCommonSuffixes('foo/foo_internal.h')
				4096	'foo/foo'
				4097	>>> _DropCommonSuffixes('foo/foo_unusualinternal.h')
				4098	'foo/foo_unusualinternal'
				4099
				4100	Args:
				4101	filename: The input filename.
				4102
				4103	Returns:
				4104	The filename with the common suffix removed.
				4105	"""
				4106	for suffix in ('test.cc', 'regtest.cc', 'unittest.cc',
				4107	'inl.h', 'impl.h', 'internal.h'):
				4108	if (filename.endswith(suffix) and len(filename) > len(suffix) and
				4109	filename[-len(suffix) - 1] in ('-', '_')):
				4110	return filename[:-len(suffix) - 1]
				4111	return os.path.splitext(filename)[0]
				4112
				4113
				4114	def _IsTestFilename(filename):
				4115	"""Determines if the given filename has a suffix that identifies it as a test.
				4116
				4117	Args:
				4118	filename: The input filename.
				4119
				4120	Returns:
				4121	True if 'filename' looks like a test, False otherwise.
				4122	"""
				4123	if (filename.endswith('_test.cc') or
				4124	filename.endswith('_unittest.cc') or
				4125	filename.endswith('_regtest.cc')):
				4126	return True
				4127	else:
				4128	return False
				4129
				4130
				4131	def _ClassifyInclude(fileinfo, include, is_system):
				4132	"""Figures out what kind of header 'include' is.
				4133
				4134	Args:
				4135	fileinfo: The current file cpplint is running over. A FileInfo instance.
				4136	include: The path to a #included file.
				4137	is_system: True if the #include used <> rather than "".
				4138
				4139	Returns:
				4140	One of the _XXX_HEADER constants.
				4141
				4142	For example:
				4143	>>> _ClassifyInclude(FileInfo('foo/foo.cc'), 'stdio.h', True)
				4144	_C_SYS_HEADER
				4145	>>> _ClassifyInclude(FileInfo('foo/foo.cc'), 'string', True)
				4146	_CPP_SYS_HEADER
				4147	>>> _ClassifyInclude(FileInfo('foo/foo.cc'), 'foo/foo.h', False)
				4148	_LIKELY_MY_HEADER
				4149	>>> _ClassifyInclude(FileInfo('foo/foo_unknown_extension.cc'),
				4150	... 'bar/foo_other_ext.h', False)
				4151	_POSSIBLE_MY_HEADER
				4152	>>> _ClassifyInclude(FileInfo('foo/foo.cc'), 'foo/bar.h', False)
				4153	_OTHER_HEADER
				4154	"""
				4155	# This is a list of all standard c++ header files, except
				4156	# those already checked for above.
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	4157	is_cpp_h = include in _CPP_HEADERS
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4158
				4159	if is_system:
				4160	if is_cpp_h:
				4161	return _CPP_SYS_HEADER
				4162	else:
				4163	return _C_SYS_HEADER
				4164
				4165	# If the target file and the include we're checking share a
				4166	# basename when we drop common extensions, and the include
				4167	# lives in . , then it's likely to be owned by the target file.
				4168	target_dir, target_base = (
				4169	os.path.split(_DropCommonSuffixes(fileinfo.RepositoryName())))
				4170	include_dir, include_base = os.path.split(_DropCommonSuffixes(include))
				4171	if target_base == include_base and (
				4172	include_dir == target_dir or
				4173	include_dir == os.path.normpath(target_dir + '/../public')):
				4174	return _LIKELY_MY_HEADER
				4175
				4176	# If the target and include share some initial basename
				4177	# component, it's possible the target is implementing the
				4178	# include, so it's allowed to be first, but we'll never
				4179	# complain if it's not there.
				4180	target_first_component = _RE_FIRST_COMPONENT.match(target_base)
				4181	include_first_component = _RE_FIRST_COMPONENT.match(include_base)
				4182	if (target_first_component and include_first_component and
				4183	target_first_component.group(0) ==
				4184	include_first_component.group(0)):
				4185	return _POSSIBLE_MY_HEADER
				4186
				4187	return _OTHER_HEADER
				4188
				4189
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4190
def CheckIncludeLine(filename, clean_lines, linenum, include_state, error):
  """Check rules that are applicable to #include lines.

  Strings on #include lines are NOT removed from elided line, to make
  certain tasks easier. However, to prevent false positives, checks
  applicable to #include lines in CheckLanguage must be put here.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    include_state: An _IncludeState instance in which the headers are inserted.
    error: The function to call with any errors found.
  """
  fileinfo = FileInfo(filename)
  line = clean_lines.lines[linenum]

  # "include" should use the new style "foo/bar.h" instead of just "bar.h"
  if _RE_PATTERN_INCLUDE_NEW_STYLE.search(line):
    error(filename, linenum, 'build/include', 4,
          'Include the directory when naming .h files')

  # we shouldn't include a file more than once. actually, there are a
  # handful of instances where doing so is okay, but in general it's
  # not.
  match = _RE_PATTERN_INCLUDE.search(line)
  if match:
    include = match.group(2)
    is_system = (match.group(1) == '<')
    if include in include_state:
      error(filename, linenum, 'build/include', 4,
            '"%s" already included at %s:%s' %
            (include, filename, include_state[include]))
    else:
      # NOTE(review): indentation was lost in the listing this was recovered
      # from; the ordering checks below are placed under this "else" (first
      # sighting of the header only) -- confirm against upstream.
      include_state[include] = linenum

      # We want to ensure that headers appear in the right order:
      # 1) for foo.cc, foo.h  (preferred location)
      # 2) c system files
      # 3) cpp system files
      # 4) for foo.cc, foo.h  (deprecated location)
      # 5) other google headers
      #
      # We classify each include statement as one of those 5 types
      # using a number of techniques. The include_state object keeps
      # track of the highest type seen, and complains if we see a
      # lower type after that.
      error_message = include_state.CheckNextIncludeOrder(
          _ClassifyInclude(fileinfo, include, is_system))
      if error_message:
        error(filename, linenum, 'build/include_order', 4,
              '%s. Should be: %s.h, c system, c++ system, other.' %
              (error_message, fileinfo.BaseName()))
      canonical_include = include_state.CanonicalizeAlphabeticalOrder(include)
      if not include_state.IsInAlphabeticalOrder(
          clean_lines, linenum, canonical_include):
        error(filename, linenum, 'build/include_alpha', 4,
              'Include "%s" not in alphabetical order' % include)
      include_state.SetLastHeader(canonical_include)

  # Look for any of the stream classes that are part of standard C++.
  match = _RE_PATTERN_INCLUDE.match(line)
  if match:
    include = match.group(2)
    if Match(r'(f|ind|io|i|o|parse|pf|stdio|str|)?stream$', include):
      # Many unit tests use cout, so we exempt them.
      if not _IsTestFilename(filename):
        # Suggest a different header for ostream
        if include == 'ostream':
          error(filename, linenum, 'readability/streams', 3,
                'For logging, include "base/logging.h" instead of <ostream>.')
        else:
          error(filename, linenum, 'readability/streams', 3,
                'Streams are highly discouraged.')
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	4265
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	4266
				4267	def _GetTextInside(text, start_pattern):
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	4268	r"""Retrieves all the text between matching open and close parentheses.
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	4269
				4270	Given a string of lines and a regular expression string, retrieve all the text
				4271	following the expression and between opening punctuation symbols like
				4272	(, [, or {, and the matching close-punctuation symbol. This properly nested
				4273	occurrences of the punctuations, so for the text like
				4274	printf(a(), b(c()));
				4275	a call to _GetTextInside(text, r'printf\(') will return 'a(), b(c())'.
				4276	start_pattern must match string having an open punctuation symbol at the end.
				4277
				4278	Args:
				4279	text: The lines to extract text. Its comments and strings must be elided.
				4280	It can be single line and can span multiple lines.
				4281	start_pattern: The regexp string indicating where to start extracting
				4282	the text.
				4283	Returns:
				4284	The extracted text.
				4285	None if either the opening string or ending punctuation could not be found.
				4286	"""
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	4287	# TODO(unknown): Audit cpplint.py to see what places could be profitably
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	4288	# rewritten to use _GetTextInside (and use inferior regexp matching today).
				4289
				4290	# Give opening punctuations to get the matching close-punctuations.
				4291	matching_punctuation = {'(': ')', '{': '}', '[': ']'}
				4292	closing_punctuation = set(matching_punctuation.itervalues())
				4293
				4294	# Find the position to start extracting text.
				4295	match = re.search(start_pattern, text, re.M)
				4296	if not match: # start_pattern not found in text.
				4297	return None
				4298	start_position = match.end(0)
				4299
				4300	assert start_position > 0, (
				4301	'start_pattern must ends with an opening punctuation.')
				4302	assert text[start_position - 1] in matching_punctuation, (
				4303	'start_pattern must ends with an opening punctuation.')
				4304	# Stack of closing punctuations we expect to have in text after position.
				4305	punctuation_stack = [matching_punctuation[text[start_position - 1]]]
				4306	position = start_position
				4307	while punctuation_stack and position < len(text):
				4308	if text[position] == punctuation_stack[-1]:
				4309	punctuation_stack.pop()
				4310	elif text[position] in closing_punctuation:
				4311	# A closing punctuation without matching opening punctuations.
				4312	return None
				4313	elif text[position] in matching_punctuation:
				4314	punctuation_stack.append(matching_punctuation[text[position]])
				4315	position += 1
				4316	if punctuation_stack:
				4317	# Opening punctuations left without matching close-punctuations.
				4318	return None
				4319	# punctuations match.
				4320	return text[start_position:position - 1]
				4321
				4322
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	4323	# Patterns for matching call-by-reference parameters.
				4324	#
				4325	# Supports nested templates up to 2 levels deep using this messy pattern:
				4326	# < (?: < (?: < [^<>]*
				4327	# >
				4328	# \| [^<>] )*
				4329	# >
				4330	# \| [^<>] )*
				4331	# >
				4332	_RE_PATTERN_IDENT = r'[_a-zA-Z]\w' # =~ [[:alpha:]][[:alnum:]]
				4333	_RE_PATTERN_TYPE = (
				4334	r'(?:const\s+)?(?:typename\s+\|class\s+\|struct\s+\|union\s+\|enum\s+)?'
				4335	r'(?:\w\|'
				4336	r'\s<(?:<(?:<[^<>]>\|[^<>])>\|[^<>])>\|'
				4337	r'::)+')
				4338	# A call-by-reference parameter ends with '& identifier'.
				4339	_RE_PATTERN_REF_PARAM = re.compile(
				4340	r'(' + _RE_PATTERN_TYPE + r'(?:\s(?:\bconst\b\|[]))\s'
				4341	r'&\s' + _RE_PATTERN_IDENT + r')\s(?:=[^,()]+)?[,)]')
				4342	# A call-by-const-reference parameter either ends with 'const& identifier'
				4343	# or looks like 'const type& identifier' when 'type' is atomic.
				4344	_RE_PATTERN_CONST_REF_PARAM = (
				4345	r'(?:.\s\bconst\s&\s' + _RE_PATTERN_IDENT +
				4346	r'\|const\s+' + _RE_PATTERN_TYPE + r'\s&\s' + _RE_PATTERN_IDENT + r')')
				4347
				4348
				4349	def CheckLanguage(filename, clean_lines, linenum, file_extension,
				4350	include_state, nesting_state, error):
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	4351	"""Checks rules from the 'C++ language rules' section of cppguide.html.
				4352
				4353	Some of these rules are hard to test (function overloading, using
				4354	uint32 inappropriately), but we do the best we can.
				4355
				4356	Args:
				4357	filename: The name of the current file.
				4358	clean_lines: A CleansedLines instance containing the file.
				4359	linenum: The number of the line to check.
				4360	file_extension: The extension (without the dot) of the filename.
				4361	include_state: An _IncludeState instance in which the headers are inserted.
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	4362	nesting_state: A NestingState instance which maintains information about
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	4363	the current stack of nested blocks being parsed.
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	4364	error: The function to call with any errors found.
				4365	"""
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4366	# If the line is empty or consists of entirely a comment, no need to
				4367	# check it.
				4368	line = clean_lines.elided[linenum]
				4369	if not line:
				4370	return
				4371
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	4372	match = _RE_PATTERN_INCLUDE.search(line)
				4373	if match:
				4374	CheckIncludeLine(filename, clean_lines, linenum, include_state, error)
				4375	return
				4376
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	4377	# Reset include state across preprocessor directives. This is meant
				4378	# to silence warnings for conditional includes.
				4379	if Match(r'^\s#\s(?:ifdef\|elif\|else\|endif)\b', line):
				4380	include_state.ResetSection()
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4381
				4382	# Make Windows paths like Unix.
				4383	fullname = os.path.abspath(filename).replace('\\', '/')
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	4384
				4385	# Perform other checks now that we are sure that this is not an include line
				4386	CheckCasts(filename, clean_lines, linenum, error)
				4387	CheckGlobalStatic(filename, clean_lines, linenum, error)
				4388	CheckPrintf(filename, clean_lines, linenum, error)
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4389
				4390	if file_extension == 'h':
				4391	# TODO(unknown): check that 1-arg constructors are explicit.
				4392	# How to tell it's a constructor?
				4393	# (handled in CheckForNonStandardConstructs for now)
				4394	# TODO(unknown): check that classes have DISALLOW_EVIL_CONSTRUCTORS
				4395	# (level 1 error)
				4396	pass
				4397
				4398	# Check if people are using the verboten C basic types. The only exception
				4399	# we regularly allow is "unsigned short port" for port.
				4400	if Search(r'\bshort port\b', line):
				4401	if not Search(r'\bunsigned short port\b', line):
				4402	error(filename, linenum, 'runtime/int', 4,
				4403	'Use "unsigned short" for ports, not "short"')
				4404	else:
				4405	match = Search(r'\b(short\|long(?! +double)\|long long)\b', line)
				4406	if match:
				4407	error(filename, linenum, 'runtime/int', 4,
				4408	'Use int16/int64/etc, rather than the C type %s' % match.group(1))
				4409
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	4410	# Check if some verboten operator overloading is going on
				4411	# TODO(unknown): catch out-of-line unary operator&:
				4412	# class X {};
				4413	# int operator&(const X& x) { return 42; } // unary operator&
				4414	# The trick is it's hard to tell apart from binary operator&:
				4415	# class Y { int operator&(const Y& x) { return 23; } }; // binary operator&
				4416	if Search(r'\boperator\s&\s$\s*$', line):
				4417	error(filename, linenum, 'runtime/operator', 4,
				4418	'Unary operator& is dangerous. Do not use it.')
				4419
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4420	# Check for suspicious usage of "if" like
				4421	# } if (a == b) {
				4422	if Search(r'\}\sif\s\(', line):
				4423	error(filename, linenum, 'readability/braces', 4,
				4424	'Did you mean "else if"? If not, start a new line for "if".')
				4425
				4426	# Check for potential format string bugs like printf(foo).
				4427	# We constrain the pattern not to pick things like DocidForPrintf(foo).
				4428	# Not perfect but it can catch printf(foo.c_str()) and printf(foo->c_str())
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	4429	# TODO(unknown): Catch the following case. Need to change the calling
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	4430	# convention of the whole function to process multiple line to handle it.
				4431	# printf(
				4432	# boy_this_is_a_really_long_variable_that_cannot_fit_on_the_prev_line);
				4433	printf_args = _GetTextInside(line, r'(?i)\b(string)?printf\s*\(')
				4434	if printf_args:
				4435	match = Match(r'([\w.\->()]+)$', printf_args)
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	4436	if match and match.group(1) != '__VA_ARGS__':
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	4437	function_name = re.search(r'\b((?:string)?printf)\s*\(',
				4438	line, re.I).group(1)
				4439	error(filename, linenum, 'runtime/printf', 4,
				4440	'Potential format string bug. Do %s("%%s", %s) instead.'
				4441	% (function_name, match.group(1)))
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4442
				4443	# Check for potential memset bugs like memset(buf, sizeof(buf), 0).
				4444	match = Search(r'memset\s$([^,]),\s([^,]),\s0\s$', line)
				4445	if match and not Match(r"^''\|-?[0-9]+\|0x[0-9A-Fa-f]$", match.group(2)):
				4446	error(filename, linenum, 'runtime/memset', 4,
				4447	'Did you mean "memset(%s, 0, %s)"?'
				4448	% (match.group(1), match.group(2)))
				4449
				4450	if Search(r'\busing namespace\b', line):
				4451	error(filename, linenum, 'build/namespaces', 5,
				4452	'Do not use namespace using-directives. '
				4453	'Use using-declarations instead.')
				4454
				4455	# Detect variable-length arrays.
				4456	match = Match(r'\s(.+::)?(\w+) [a-z]\w\[(.+)];', line)
				4457	if (match and match.group(2) != 'return' and match.group(2) != 'delete' and
				4458	match.group(3).find(']') == -1):
				4459	# Split the size using space and arithmetic operators as delimiters.
				4460	# If any of the resulting tokens are not compile time constants then
				4461	# report the error.
				4462	tokens = re.split(r'\s\|\+\|\-\|\*\|\/\|<<\|>>]', match.group(3))
				4463	is_const = True
				4464	skip_next = False
				4465	for tok in tokens:
				4466	if skip_next:
				4467	skip_next = False
				4468	continue
				4469
				4470	if Search(r'sizeof$.+$', tok): continue
				4471	if Search(r'arraysize$\w+$', tok): continue
				4472
				4473	tok = tok.lstrip('(')
				4474	tok = tok.rstrip(')')
				4475	if not tok: continue
				4476	if Match(r'\d+', tok): continue
				4477	if Match(r'0[xX][0-9a-fA-F]+', tok): continue
				4478	if Match(r'k[A-Z0-9]\w*', tok): continue
				4479	if Match(r'(.+::)?k[A-Z0-9]\w*', tok): continue
				4480	if Match(r'(.+::)?[A-Z][A-Z0-9_]*', tok): continue
				4481	# A catch all for tricky sizeof cases, including 'sizeof expression',
				4482	# 'sizeof(*type)', 'sizeof(const type)', 'sizeof(struct StructName)'
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	4483	# requires skipping the next token because we split on ' ' and '*'.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4484	if tok.startswith('sizeof'):
				4485	skip_next = True
				4486	continue
				4487	is_const = False
				4488	break
				4489	if not is_const:
				4490	error(filename, linenum, 'runtime/arrays', 1,
				4491	'Do not use variable-length arrays. Use an appropriately named '
				4492	"('k' followed by CamelCase) compile-time constant for the size.")
				4493
				4494	# If DISALLOW_EVIL_CONSTRUCTORS, DISALLOW_COPY_AND_ASSIGN, or
				4495	# DISALLOW_IMPLICIT_CONSTRUCTORS is present, then it should be the last thing
				4496	# in the class declaration.
				4497	match = Match(
				4498	(r'\s*'
				4499	r'(DISALLOW_(EVIL_CONSTRUCTORS\|COPY_AND_ASSIGN\|IMPLICIT_CONSTRUCTORS))'
				4500	r'$.*$;$'),
				4501	line)
				4502	if match and linenum + 1 < clean_lines.NumLines():
				4503	next_line = clean_lines.elided[linenum + 1]
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	4504	# We allow some, but not all, declarations of variables to be present
				4505	# in the statement that defines the class. The [\w\,\s] fragment of
				4506	# the regular expression below allows users to declare instances of
				4507	# the class or pointers to instances, but not less common types such
				4508	# as function pointers or arrays. It's a tradeoff between allowing
				4509	# reasonable code and avoiding trying to parse more C++ using regexps.
				4510	if not Search(r'^\s}[\w\,\s]*;', next_line):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4511	error(filename, linenum, 'readability/constructors', 3,
				4512	match.group(1) + ' should be the last thing in the class')
				4513
				4514	# Check for use of unnamed namespaces in header files. Registration
				4515	# macros are typically OK, so we allow use of "namespace {" on lines
				4516	# that end with backslashes.
				4517	if (file_extension == 'h'
				4518	and Search(r'\bnamespace\s*{', line)
				4519	and line[-1] != '\\'):
				4520	error(filename, linenum, 'build/namespaces', 4,
				4521	'Do not use unnamed namespaces in header files. See '
				4522	'http://google-styleguide.googlecode.com/svn/trunk/cppguide.xml#Namespaces'
				4523	' for more information.')
				4524
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	4525
				4526	def CheckGlobalStatic(filename, clean_lines, linenum, error):
				4527	"""Check for unsafe global or static objects.
				4528
				4529	Args:
				4530	filename: The name of the current file.
				4531	clean_lines: A CleansedLines instance containing the file.
				4532	linenum: The number of the line to check.
				4533	error: The function to call with any errors found.
				4534	"""
				4535	line = clean_lines.elided[linenum]
				4536
				4537	# Check for people declaring static/global STL strings at the top level.
				4538	# This is dangerous because the C++ language does not guarantee that
				4539	# globals with constructors are initialized before the first access.
				4540	match = Match(
				4541	r'((?:\|static +)(?:\|const +))string +([a-zA-Z0-9_:]+)\b(.*)',
				4542	line)
				4543	# Remove false positives:
				4544	# - String pointers (as opposed to values).
				4545	# string *pointer
				4546	# const string *pointer
				4547	# string const *pointer
				4548	# string *const pointer
				4549	#
				4550	# - Functions and template specializations.
				4551	# string Function<Type>(...
				4552	# string Class<Type>::Method(...
				4553	#
				4554	# - Operators. These are matched separately because operator names
				4555	# cross non-word boundaries, and trying to match both operators
				4556	# and functions at the same time would decrease accuracy of
				4557	# matching identifiers.
				4558	# string Class::operator*()
				4559	if (match and
				4560	not Search(r'\bstring\b(\s+const)?\s\\s*(const\s+)?\w', line) and
				4561	not Search(r'\boperator\W', line) and
				4562	not Match(r'\s(<.>)?(::[a-zA-Z0-9_]+)?\s*\(([^"]\|$)', match.group(3))):
				4563	error(filename, linenum, 'runtime/string', 4,
				4564	'For a static/global string constant, use a C style string instead: '
				4565	'"%schar %s[]".' %
				4566	(match.group(1), match.group(2)))
				4567
				4568	if Search(r'\b([A-Za-z0-9_]*_)$\1$', line):
				4569	error(filename, linenum, 'runtime/init', 4,
				4570	'You seem to be initializing a member variable with itself.')
				4571
				4572
				4573	def CheckPrintf(filename, clean_lines, linenum, error):
				4574	"""Check for printf related issues.
				4575
				4576	Args:
				4577	filename: The name of the current file.
				4578	clean_lines: A CleansedLines instance containing the file.
				4579	linenum: The number of the line to check.
				4580	error: The function to call with any errors found.
				4581	"""
				4582	line = clean_lines.elided[linenum]
				4583
				4584	# When snprintf is used, the second argument shouldn't be a literal.
				4585	match = Search(r'snprintf\s\(([^,]),\s([0-9])\s*,', line)
				4586	if match and match.group(2) != '0':
				4587	# If 2nd arg is zero, snprintf is used to calculate size.
				4588	error(filename, linenum, 'runtime/printf', 3,
				4589	'If you can, use sizeof(%s) instead of %s as the 2nd arg '
				4590	'to snprintf.' % (match.group(1), match.group(2)))
				4591
				4592	# Check if some verboten C functions are being used.
				4593	if Search(r'\bsprintf\b', line):
				4594	error(filename, linenum, 'runtime/printf', 5,
				4595	'Never use sprintf. Use snprintf instead.')
				4596	match = Search(r'\b(strcpy\|strcat)\b', line)
				4597	if match:
				4598	error(filename, linenum, 'runtime/printf', 4,
				4599	'Almost always, snprintf is better than %s' % match.group(1))
				4600
				4601
				4602	def IsDerivedFunction(clean_lines, linenum):
				4603	"""Check if current line contains an inherited function.
				4604
				4605	Args:
				4606	clean_lines: A CleansedLines instance containing the file.
				4607	linenum: The number of the line to check.
				4608	Returns:
				4609	True if current line contains a function with "override"
				4610	virt-specifier.
				4611	"""
				4612	# Look for leftmost opening parenthesis on current line
				4613	opening_paren = clean_lines.elided[linenum].find('(')
				4614	if opening_paren < 0: return False
				4615
				4616	# Look for "override" after the matching closing parenthesis
				4617	line, _, closing_paren = CloseExpression(clean_lines, linenum, opening_paren)
				4618	return closing_paren >= 0 and Search(r'\boverride\b', line[closing_paren:])
				4619
				4620
				4621	def IsInitializerList(clean_lines, linenum):
				4622	"""Check if current line is inside constructor initializer list.
				4623
				4624	Args:
				4625	clean_lines: A CleansedLines instance containing the file.
				4626	linenum: The number of the line to check.
				4627	Returns:
				4628	True if current line appears to be inside constructor initializer
				4629	list, False otherwise.
				4630	"""
				4631	for i in xrange(linenum, 1, -1):
				4632	line = clean_lines.elided[i]
				4633	if i == linenum:
				4634	remove_function_body = Match(r'^(.)\{\s$', line)
				4635	if remove_function_body:
				4636	line = remove_function_body.group(1)
				4637
				4638	if Search(r'\s:\s*\w+[({]', line):
				4639	# A lone colon tend to indicate the start of a constructor
				4640	# initializer list. It could also be a ternary operator, which
				4641	# also tend to appear in constructor initializer lists as
				4642	# opposed to parameter lists.
				4643	return True
				4644	if Search(r'\}\s,\s$', line):
				4645	# A closing brace followed by a comma is probably the end of a
				4646	# brace-initialized member in constructor initializer list.
				4647	return True
				4648	if Search(r'[{};]\s*$', line):
				4649	# Found one of the following:
				4650	# - A closing brace or semicolon, probably the end of the previous
				4651	# function.
				4652	# - An opening brace, probably the start of current class or namespace.
				4653	#
				4654	# Current line is probably not inside an initializer list since
				4655	# we saw one of those things without seeing the starting colon.
				4656	return False
				4657
				4658	# Got to the beginning of the file without seeing the start of
				4659	# constructor initializer list.
				4660	return False
				4661
				4662
def CheckForNonConstReference(filename, clean_lines, linenum,
                              nesting_state, error):
  """Check for non-const references.

  Separate from CheckLanguage since it scans backwards from current
  line, instead of scanning forward.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    nesting_state: A NestingState instance which maintains information about
                   the current stack of nested blocks being parsed.
    error: The function to call with any errors found.
  """
  # Do nothing if there is no '&' on current line.
  line = clean_lines.elided[linenum]
  if '&' not in line:
    return

  # If a function is inherited, current function doesn't have much of
  # a choice, so any non-const references should not be blamed on
  # derived function.
  if IsDerivedFunction(clean_lines, linenum):
    return

  # Long type names may be broken across multiple lines, usually in one
  # of these forms:
  #   LongType
  #       ::LongTypeContinued &identifier
  #   LongType::
  #       LongTypeContinued &identifier
  #   LongType<
  #       ...>::LongTypeContinued &identifier
  #
  # If we detected a type split across two lines, join the previous
  # line to current line so that we can match const references
  # accordingly.
  #
  # Note that this only scans back one line, since scanning back
  # arbitrary number of lines would be expensive. If you have a type
  # that spans more than 2 lines, please use a typedef.
  if linenum > 1:
    previous = None
    if Match(r'\s*::(?:[\w<>]|::)+\s*&\s*\S', line):
      # previous_line\n + ::current_line
      previous = Search(r'\b((?:const\s*)?(?:[\w<>]|::)+[\w<>])\s*$',
                        clean_lines.elided[linenum - 1])
    elif Match(r'\s*[a-zA-Z_]([\w<>]|::)+\s*&\s*\S', line):
      # previous_line::\n + current_line
      previous = Search(r'\b((?:const\s*)?(?:[\w<>]|::)+::)\s*$',
                        clean_lines.elided[linenum - 1])
    if previous:
      line = previous.group(1) + line.lstrip()
    else:
      # Check for templated parameter that is split across multiple lines
      endpos = line.rfind('>')
      if endpos > -1:
        (_, startline, startpos) = ReverseCloseExpression(
            clean_lines, linenum, endpos)
        if startpos > -1 and startline < linenum:
          # Found the matching < on an earlier line, collect all
          # pieces up to current line.
          line = ''.join(clean_lines.elided[i].strip()
                         for i in xrange(startline, linenum + 1))

  # Check for non-const references in function parameters. A single '&' may
  # be found in the following places:
  #   inside expression: binary & for bitwise AND
  #   inside expression: unary & for taking the address of something
  #   inside declarators: reference parameter
  # We will exclude the first two cases by checking that we are not inside a
  # function body, including one that was just introduced by a trailing '{'.
  # TODO(unknown): Doesn't account for 'catch(Exception& e)' [rare].
  if (nesting_state.previous_stack_top and
      not isinstance(nesting_state.previous_stack_top,
                     (_ClassInfo, _NamespaceInfo))):
    # Not at toplevel, not within a class, and not within a namespace
    return

  # Avoid preprocessors
  if Search(r'\\\s*$', line):
    return

  # Avoid constructor initializer lists
  if IsInitializerList(clean_lines, linenum):
    return

  # We allow non-const references in a few standard places, like functions
  # called "swap()" or iostream operators like "<<" or ">>". Do not check
  # those function parameters.
  #
  # We also accept & in static_assert, which looks like a function but
  # it's actually a declaration expression.
  whitelisted_functions = (r'(?:[sS]wap(?:<\w:+>)?|'
                           r'operator\s*[<>][<>]|'
                           r'static_assert|COMPILE_ASSERT'
                           r')\s*\(')
  if Search(whitelisted_functions, line):
    return
  elif not Search(r'\S+\([^)]*$', line):
    # Don't see a whitelisted function on this line. Actually we
    # didn't see any function name on this line, so this is likely a
    # multi-line parameter list. Try a bit harder to catch this case.
    for i in xrange(2):
      if (linenum > i and
          Search(whitelisted_functions, clean_lines.elided[linenum - i - 1])):
        return

  decls = ReplaceAll(r'{[^}]*}', ' ', line)  # exclude function body
  for parameter in re.findall(_RE_PATTERN_REF_PARAM, decls):
    if not Match(_RE_PATTERN_CONST_REF_PARAM, parameter):
      error(filename, linenum, 'runtime/references', 2,
            'Is this a non-const reference? '
            'If so, make const or use a pointer: ' +
            ReplaceAll(' *<', '<', parameter))
				4780
				4781
				4782	def CheckCasts(filename, clean_lines, linenum, error):
				4783	"""Various cast related checks.
				4784
				4785	Args:
				4786	filename: The name of the current file.
				4787	clean_lines: A CleansedLines instance containing the file.
				4788	linenum: The number of the line to check.
				4789	error: The function to call with any errors found.
				4790	"""
				4791	line = clean_lines.elided[linenum]
				4792
				4793	# Check to see if they're using an conversion function cast.
				4794	# I just try to capture the most common basic types, though there are more.
				4795	# Parameterless conversion functions, such as bool(), are allowed as they are
				4796	# probably a member operator declaration or default constructor.
				4797	match = Search(
				4798	r'(\bnew\s+\|\S<\s*(?:const\s+)?)?\b'
				4799	r'(int\|float\|double\|bool\|char\|int32\|uint32\|int64\|uint64)'
				4800	r'(\([^)].*)', line)
				4801	expecting_function = ExpectingFunctionArgs(clean_lines, linenum)
				4802	if match and not expecting_function:
				4803	matched_type = match.group(2)
				4804
				4805	# matched_new_or_template is used to silence two false positives:
				4806	# - New operators
				4807	# - Template arguments with function types
				4808	#
				4809	# For template arguments, we match on types immediately following
				4810	# an opening bracket without any spaces. This is a fast way to
				4811	# silence the common case where the function type is the first
				4812	# template argument. False negative with less-than comparison is
				4813	# avoided because those operators are usually followed by a space.
				4814	#
				4815	# function<double(double)> // bracket + no space = false positive
				4816	# value < double(42) // bracket + space = true positive
				4817	matched_new_or_template = match.group(1)
				4818
				4819	# Other things to ignore:
				4820	# - Function pointers
				4821	# - Casts to pointer types
				4822	# - Placement new
				4823	# - Alias declarations
				4824	matched_funcptr = match.group(3)
				4825	if (matched_new_or_template is None and
				4826	not (matched_funcptr and
				4827	(Match(r'$(?:[^() ]+::\s\\s)?[^() ]+$\s\(',
				4828	matched_funcptr) or
				4829	matched_funcptr.startswith('(*)'))) and
				4830	not Match(r'\susing\s+\S+\s=\s*' + matched_type, line) and
				4831	not Search(r'new$\S+$\s*' + matched_type, line)):
				4832	error(filename, linenum, 'readability/casting', 4,
				4833	'Using deprecated casting style. '
				4834	'Use static_cast<%s>(...) instead' %
				4835	matched_type)
				4836
				4837	if not expecting_function:
				4838	CheckCStyleCast(filename, linenum, line, clean_lines.raw_lines[linenum],
				4839	'static_cast',
				4840	r'$(int\|float\|double\|bool\|char\|u?int(16\|32\|64))$', error)
				4841
				4842	# This doesn't catch all cases. Consider (const char * const)"hello".
				4843	#
				4844	# (char *) "foo" should always be a const_cast (reinterpret_cast won't
				4845	# compile).
				4846	if CheckCStyleCast(filename, linenum, line, clean_lines.raw_lines[linenum],
				4847	'const_cast', r'$(char\s?\+\s?)$\s"', error):
				4848	pass
				4849	else:
				4850	# Check pointer casts for other than string constants
				4851	CheckCStyleCast(filename, linenum, line, clean_lines.raw_lines[linenum],
				4852	'reinterpret_cast', r'$(\w+\s?\*+\s?)$', error)
				4853
				4854	# In addition, we look for people taking the address of a cast. This
				4855	# is dangerous -- casts can assign to temporaries, so the pointer doesn't
				4856	# point where you think.
				4857	match = Search(
				4858	r'(?:&$([^)]+)$[\w(])\|'
				4859	r'(?:&(static\|dynamic\|down\|reinterpret)_cast\b)', line)
				4860	if match and match.group(1) != '*':
				4861	# Try a better error message when the & is bound to something
				4862	# dereferenced by the casted pointer, as opposed to the casted
				4863	# pointer itself.
				4864	parenthesis_error = False
				4865	match = Match(r'^(.*&(?:static\|dynamic\|down\|reinterpret)_cast\b)<', line)
				4866	if match:
				4867	_, y1, x1 = CloseExpression(clean_lines, linenum, len(match.group(1)))
				4868	if x1 >= 0 and clean_lines.elided[y1][x1] == '(':
				4869	_, y2, x2 = CloseExpression(clean_lines, y1, x1)
				4870	if x2 >= 0:
				4871	extended_line = clean_lines.elided[y2][x2:]
				4872	if y2 < clean_lines.NumLines() - 1:
				4873	extended_line += clean_lines.elided[y2 + 1]
				4874	if Match(r'\s*(?:->\|\[)', extended_line):
				4875	parenthesis_error = True
				4876
				4877	if parenthesis_error:
				4878	error(filename, linenum, 'readability/casting', 4,
				4879	('Are you taking an address of something dereferenced '
				4880	'from a cast? Wrapping the dereferenced expression in '
				4881	'parentheses will make the binding more obvious'))
				4882	else:
				4883	error(filename, linenum, 'runtime/casting', 4,
				4884	('Are you taking an address of a cast? '
				4885	'This is dangerous: could be a temp var. '
				4886	'Take the address before doing the cast, rather than after'))
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	4887
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4888
				4889	def CheckCStyleCast(filename, linenum, line, raw_line, cast_type, pattern,
				4890	error):
				4891	"""Checks for a C-style cast by looking for the pattern.
				4892
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4893	Args:
				4894	filename: The name of the current file.
				4895	linenum: The number of the line to check.
				4896	line: The line of code to check.
				4897	raw_line: The raw line of code to check, with comments.
				4898	cast_type: The string for the C++ cast to recommend. This is either
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	4899	reinterpret_cast, static_cast, or const_cast, depending.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4900	pattern: The regular expression used to find C-style casts.
				4901	error: The function to call with any errors found.
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	4902
				4903	Returns:
				4904	True if an error was emitted.
				4905	False otherwise.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4906	"""
				4907	match = Search(pattern, line)
				4908	if not match:
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	4909	return False
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4910
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	4911	# Exclude lines with keywords that tend to look like casts, and also
				4912	# macros which are generally troublesome.
				4913	if Match(r'.\b(?:sizeof\|alignof\|alignas\|[A-Z_]+)\s$',
				4914	line[0:match.start(1) - 1]):
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	4915	return False
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4916
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	4917	# operator++(int) and operator--(int)
				4918	if (line[0:match.start(1) - 1].endswith(' operator++') or
				4919	line[0:match.start(1) - 1].endswith(' operator--')):
				4920	return False
				4921
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	4922	# A single unnamed argument for a function tends to look like old
				4923	# style cast. If we see those, don't issue warnings for deprecated
				4924	# casts, instead issue warnings for unnamed arguments where
				4925	# appropriate.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4926	#
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	4927	# These are things that we want warnings for, since the style guide
				4928	# explicitly require all parameters to be named:
				4929	# Function(int);
				4930	# Function(int) {
				4931	# ConstMember(int) const;
				4932	# ConstMember(int) const {
				4933	# ExceptionMember(int) throw (...);
				4934	# ExceptionMember(int) throw (...) {
				4935	# PureVirtual(int) = 0;
				4936	#
				4937	# These are functions of some sort, where the compiler would be fine
				4938	# if they had named parameters, but people often omit those
				4939	# identifiers to reduce clutter:
				4940	# (FunctionPointer)(int);
				4941	# (FunctionPointer)(int) = value;
				4942	# Function((function_pointer_arg)(int))
				4943	# <TemplateArgument(int)>;
				4944	# <(FunctionPointerTemplateArgument)(int)>;
				4945	remainder = line[match.end(0):]
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	4946	if Match(r'^\s*(?:;\|const\b\|throw\b\|final\b\|override\b\|=\|>\|\{\|\))',
				4947	remainder):
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	4948	# Looks like an unnamed parameter.
				4949
				4950	# Don't warn on any kind of template arguments.
				4951	if Match(r'^\s*>', remainder):
				4952	return False
				4953
				4954	# Don't warn on assignments to function pointers, but keep warnings for
				4955	# unnamed parameters to pure virtual functions. Note that this pattern
				4956	# will also pass on assignments of "0" to function pointers, but the
				4957	# preferred values for those would be "nullptr" or "NULL".
				4958	matched_zero = Match(r'^\s=\s(\S+)\s;', remainder)
				4959	if matched_zero and matched_zero.group(1) != '0':
				4960	return False
				4961
				4962	# Don't warn on function pointer declarations. For this we need
				4963	# to check what came before the "(type)" string.
				4964	if Match(r'.\)\s$', line[0:match.start(0)]):
				4965	return False
				4966
				4967	# Don't warn if the parameter is named with block comments, e.g.:
				4968	# Function(int /unused_param/);
				4969	if '/*' in raw_line:
				4970	return False
				4971
				4972	# Passed all filters, issue warning here.
				4973	error(filename, linenum, 'readability/function', 3,
				4974	'All parameters should be named in a function')
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	4975	return True
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4976
				4977	# At this point, all that should be left is actual casts.
				4978	error(filename, linenum, 'readability/casting', 4,
				4979	'Using C-style cast. Use %s<%s>(...) instead' %
				4980	(cast_type, match.group(1)))
				4981
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	4982	return True
				4983
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	4984
def ExpectingFunctionArgs(clean_lines, linenum):
  """Checks whether function type arguments are expected on a line.

  This is the case when the line itself starts a MOCK_METHOD-style macro,
  when one of the two preceding lines ends inside the opening of such a
  macro, or when the preceding line ends with 'std::function<' (or
  'std::mfunction<').

  Args:
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.

  Returns:
    A truthy value if the line at 'linenum' is inside something that
    expects arguments of function types, a falsy value otherwise.
  """
  line = clean_lines.elided[linenum]
  return (Match(r'^\s*MOCK_(CONST_)?METHOD\d+(_T)?\(', line) or
          (linenum >= 2 and
           (Match(r'^\s*MOCK_(?:CONST_)?METHOD\d+(?:_T)?\((?:\S+,)?\s*$',
                  clean_lines.elided[linenum - 1]) or
            Match(r'^\s*MOCK_(?:CONST_)?METHOD\d+(?:_T)?\(\s*$',
                  clean_lines.elided[linenum - 2]) or
            Search(r'\bstd::m?function\s*\<\s*$',
                   clean_lines.elided[linenum - 1]))))
				5005
				5006
# Maps each standard header to the template names it provides.  Used to build
# the include-what-you-use patterns below.
_HEADERS_CONTAINING_TEMPLATES = (
    ('<deque>', ('deque',)),
    ('<functional>', ('unary_function', 'binary_function',
                      'plus', 'minus', 'multiplies', 'divides', 'modulus',
                      'negate',
                      'equal_to', 'not_equal_to', 'greater', 'less',
                      'greater_equal', 'less_equal',
                      'logical_and', 'logical_or', 'logical_not',
                      'unary_negate', 'not1', 'binary_negate', 'not2',
                      'bind1st', 'bind2nd',
                      'pointer_to_unary_function',
                      'pointer_to_binary_function',
                      'ptr_fun',
                      'mem_fun_t', 'mem_fun', 'mem_fun1_t', 'mem_fun1_ref_t',
                      'mem_fun_ref_t',
                      'const_mem_fun_t', 'const_mem_fun1_t',
                      'const_mem_fun_ref_t', 'const_mem_fun1_ref_t',
                      'mem_fun_ref',
                     )),
    ('<limits>', ('numeric_limits',)),
    ('<list>', ('list',)),
    ('<map>', ('map', 'multimap',)),
    ('<memory>', ('allocator',)),
    ('<queue>', ('queue', 'priority_queue',)),
    ('<set>', ('set', 'multiset',)),
    ('<stack>', ('stack',)),
    ('<string>', ('char_traits', 'basic_string',)),
    ('<utility>', ('pair',)),
    ('<vector>', ('vector',)),

    # gcc extensions.
    # Note: std::hash is their hash, ::hash is our hash
    ('<hash_map>', ('hash_map', 'hash_multimap',)),
    ('<hash_set>', ('hash_set', 'hash_multiset',)),
    ('<slist>', ('slist',)),
    )

# 'string' is not a template, so it gets its own pattern.
_RE_PATTERN_STRING = re.compile(r'\bstring\b')

# List of (compiled pattern, function name, '<algorithm>') triples.
_re_pattern_algorithm_header = []
for _template in ('copy', 'max', 'min', 'min_element', 'sort', 'swap',
                  'transform'):
  # Match max<type>(..., ...), max(..., ...), but not foo->max, foo.max or
  # type::max().  The tail must be an opening parenthesis followed by at
  # least one argument character; an end-of-line anchor followed by another
  # character could never match anything.
  _re_pattern_algorithm_header.append(
      (re.compile(r'[^>.]\b' + _template + r'(<.*?>)?\([^\)]'),
       _template,
       '<algorithm>'))

# List of (compiled pattern, 'name<>', header) triples, one per template in
# _HEADERS_CONTAINING_TEMPLATES.
_re_pattern_templates = []
for _header, _templates in _HEADERS_CONTAINING_TEMPLATES:
  for _template in _templates:
    # The name must start right after a '<' or at a word boundary and be
    # followed (after optional whitespace) by its own '<'.
    _re_pattern_templates.append(
        (re.compile(r'(<|\b)' + _template + r'\s*<'),
         _template + '<>',
         _header))
				5063
				5064
def FilesBelongToSameModule(filename_cc, filename_h):
  """Decide whether a .cc file and a .h file belong to the same module.

  Two files form a 'module' when, after normalisation, the source path ends
  with the header path.  Normalisation drops the '.cc' / '.h' extension,
  one trailing '_unittest' or '_test' on the source side, a trailing '-inl'
  on the header side, and collapses '/public/' and '/internal/' path
  components to '/'.  Hence foo.h, foo-inl.h, foo.cc, foo_test.cc and
  foo_unittest.cc in one directory are one module, and so are
  some/path/public/xyzzy and some/path/internal/xyzzy.

  When filename_cc carries a longer path than filename_h (for example
  '/absolute/path/to/base/sysinfo.cc' versus 'base/sysinfo.h'), the leading
  part that the header lacks is returned as well so the caller can use it as
  a prefix when opening the header.  Real include paths are not available
  here, so this is guesswork.

  Known bugs: tools/base/bar.cc and base/bar.h are reported as the same
  module, which yields occasional false positives.

  Args:
    filename_cc: is the path for the .cc file
    filename_h: is the path for the header path

  Returns:
    Tuple with a bool and a string:
    bool: True if filename_cc and filename_h belong to the same module.
    string: the additional prefix needed to open the header file.
  """
  # Anything that is not a .cc/.h pair is never the same module.
  if not filename_cc.endswith('.cc'):
    return (False, '')
  if not filename_h.endswith('.h'):
    return (False, '')

  # Source side: drop the extension and at most one test suffix.
  module_stem = filename_cc[:-len('.cc')]
  for test_suffix in ('_unittest', '_test'):
    if module_stem.endswith(test_suffix):
      module_stem = module_stem[:-len(test_suffix)]
      break

  # Header side: drop the extension and an optional '-inl'.
  header_stem = filename_h[:-len('.h')]
  if header_stem.endswith('-inl'):
    header_stem = header_stem[:-len('-inl')]

  # Visibility directories do not separate modules.
  for visibility_dir in ('/public/', '/internal/'):
    module_stem = module_stem.replace(visibility_dir, '/')
    header_stem = header_stem.replace(visibility_dir, '/')

  if not module_stem.endswith(header_stem):
    return False, ''
  return True, module_stem[:-len(header_stem)]
				5118
				5119
				5120	def UpdateIncludeState(filename, include_state, io=codecs):
				5121	"""Fill up the include_state with new includes found from the file.
				5122
				5123	Args:
				5124	filename: the name of the header to read.
				5125	include_state: an _IncludeState instance in which the headers are inserted.
				5126	io: The io factory to use to read the file. Provided for testability.
				5127
				5128	Returns:
				5129	True if a header was succesfully added. False otherwise.
				5130	"""
				5131	headerfile = None
				5132	try:
				5133	headerfile = io.open(filename, 'r', 'utf8', 'replace')
				5134	except IOError:
				5135	return False
				5136	linenum = 0
				5137	for line in headerfile:
				5138	linenum += 1
				5139	clean_line = CleanseComments(line)
				5140	match = _RE_PATTERN_INCLUDE.search(clean_line)
				5141	if match:
				5142	include = match.group(2)
				5143	# The value formatting is cute, but not really used right now.
				5144	# What matters here is that the key is in include_state.
				5145	include_state.setdefault(include, '%s:%d' % (filename, linenum))
				5146	return True
				5147
				5148
				5149	def CheckForIncludeWhatYouUse(filename, clean_lines, include_state, error,
				5150	io=codecs):
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5151	"""Reports for missing stl includes.
				5152
				5153	This function will output warnings to make sure you are including the headers
				5154	necessary for the stl containers and functions that you use. We only give one
				5155	reason to include a header. For example, if you use both equal_to<> and
				5156	less<> in a .h file, only one (the latter in the file) of these will be
				5157	reported as a reason to include the <functional>.
				5158
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5159	Args:
				5160	filename: The name of the current file.
				5161	clean_lines: A CleansedLines instance containing the file.
				5162	include_state: An _IncludeState instance.
				5163	error: The function to call with any errors found.
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	5164	io: The IO factory to use to read the header file. Provided for unittest
				5165	injection.
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5166	"""
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5167	required = {} # A map of header name to linenumber and the template entity.
				5168	# Example of required: { '<functional>': (1219, 'less<>') }
				5169
				5170	for linenum in xrange(clean_lines.NumLines()):
				5171	line = clean_lines.elided[linenum]
				5172	if not line or line[0] == '#':
				5173	continue
				5174
				5175	# String is special -- it is a non-templatized type in STL.
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	5176	matched = _RE_PATTERN_STRING.search(line)
				5177	if matched:
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	5178	# Don't warn about strings in non-STL namespaces:
				5179	# (We check only the first match per line; good enough.)
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	5180	prefix = line[:matched.start()]
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	5181	if prefix.endswith('std::') or not prefix.endswith('::'):
				5182	required['<string>'] = (linenum, 'string')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5183
				5184	for pattern, template, header in _re_pattern_algorithm_header:
				5185	if pattern.search(line):
				5186	required[header] = (linenum, template)
				5187
				5188	# The following function is just a speed up, no semantics are changed.
				5189	if not '<' in line: # Reduces the cpu time usage by skipping lines.
				5190	continue
				5191
				5192	for pattern, template, header in _re_pattern_templates:
				5193	if pattern.search(line):
				5194	required[header] = (linenum, template)
				5195
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	5196	# The policy is that if you #include something in foo.h you don't need to
				5197	# include it again in foo.cc. Here, we will look at possible includes.
				5198	# Let's copy the include_state so it is only messed up within this function.
				5199	include_state = include_state.copy()
				5200
				5201	# Did we find the header for this file (if any) and succesfully load it?
				5202	header_found = False
				5203
				5204	# Use the absolute path so that matching works properly.
erg@chromium.org	8f92756	2012-01-30 19:51:28 +0000	[diff] [blame]	5205	abs_filename = FileInfo(filename).FullName()
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	5206
				5207	# For Emacs's flymake.
				5208	# If cpplint is invoked from Emacs's flymake, a temporary file is generated
				5209	# by flymake and that file name might end with '_flymake.cc'. In that case,
				5210	# restore original file name here so that the corresponding header file can be
				5211	# found.
				5212	# e.g. If the file name is 'foo_flymake.cc', we should search for 'foo.h'
				5213	# instead of 'foo_flymake.h'
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	5214	abs_filename = re.sub(r'_flymake\.cc$', '.cc', abs_filename)
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	5215
				5216	# include_state is modified during iteration, so we iterate over a copy of
				5217	# the keys.
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	5218	header_keys = include_state.keys()
				5219	for header in header_keys:
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	5220	(same_module, common_path) = FilesBelongToSameModule(abs_filename, header)
				5221	fullpath = common_path + header
				5222	if same_module and UpdateIncludeState(fullpath, include_state, io):
				5223	header_found = True
				5224
				5225	# If we can't find the header file for a .cc, assume it's because we don't
				5226	# know where to look. In that case we'll give up as we're not sure they
				5227	# didn't include it in the .h file.
				5228	# TODO(unknown): Do a better job of finding .h files so we are confident that
				5229	# not having the .h file means there isn't one.
				5230	if filename.endswith('.cc') and not header_found:
				5231	return
				5232
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5233	# All the lines have been processed, report the errors found.
				5234	for required_header_unstripped in required:
				5235	template = required[required_header_unstripped][1]
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5236	if required_header_unstripped.strip('<>"') not in include_state:
				5237	error(filename, required[required_header_unstripped][0],
				5238	'build/include_what_you_use', 4,
				5239	'Add #include ' + required_header_unstripped + ' for ' + template)
				5240
				5241
# Finds make_pair spelled with an explicit template argument list.
_RE_PATTERN_EXPLICIT_MAKEPAIR = re.compile(r'\bmake_pair\s*<')


def CheckMakePairUsesDeduction(filename, clean_lines, linenum, error):
  """Warn when make_pair is called with explicit template arguments.

  G++ 4.6 in C++11 mode fails badly if make_pair's template arguments are
  specified explicitly, and such use isn't intended in any case.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    error: The function to call with any errors found.
  """
  elided_line = clean_lines.elided[linenum]
  if _RE_PATTERN_EXPLICIT_MAKEPAIR.search(elided_line) is None:
    return
  message = (
      'For C++11-compatibility, omit template arguments from make_pair'
      ' OR use pair directly OR if appropriate, construct a pair directly')
  # 4 = high confidence
  error(filename, linenum, 'build/explicit_make_pair', 4, message)
def CheckDefaultLambdaCaptures(filename, clean_lines, linenum, error):
  """Check that default lambda captures are not used.

  Args:
    filename: The name of the current file.
    clean_lines: A CleansedLines instance containing the file.
    linenum: The number of the line to check.
    error: The function to call with any errors found.
  """
  line = clean_lines.elided[linenum]

  # A lambda introducer specifies a default capture if it starts with "[="
  # or if it starts with "[&" _not_ followed by an identifier.
  # Group 1 captures everything before the '[' so its length is the column
  # of the bracket; the introducer may sit anywhere on the line and may have
  # whitespace after the '['.
  match = Match(r'^(.*)\[\s*(?:=|&[^\w])', line)
  if match:
    # Found a potential error, check what comes after the lambda-introducer.
    # If it's not open parenthesis (for lambda-declarator) or open brace
    # (for compound-statement), it's not a lambda.
    line, _, pos = CloseExpression(clean_lines, linenum, len(match.group(1)))
    if pos >= 0 and Match(r'^\s*[{(]', line[pos:]):
      error(filename, linenum, 'build/c++11',
            4,  # 4 = high confidence
            'Default lambda captures are an unapproved C++ feature.')
				5287
				5288
asvitkine@chromium.org	8b8d8be	2011-09-08 15:34:45 +0000	[diff] [blame]	5289
				5290
def ProcessLine(filename, file_extension, clean_lines, line,
                include_state, function_state, nesting_state, error,
                extra_check_functions=None):
  """Processes a single line in the file.

  The NOLINT suppressions and the nesting state are updated first; the
  remaining per-line checks are skipped when the nesting state reports that
  the line is inside an asm block.

  Args:
    filename: Filename of the file that is being processed.
    file_extension: The extension (dot not included) of the file.
    clean_lines: The cleansed lines of the file; its raw_lines attribute is
                 read here and the object is handed to every check.
    line: Number of line being processed.
    include_state: An _IncludeState instance in which the headers are inserted.
    function_state: A _FunctionState instance which counts function lines, etc.
    nesting_state: A NestingState instance which maintains information about
                   the current stack of nested blocks being parsed.
    error: A callable to which errors are reported.  The checks in this file
           call it as error(filename, linenum, category, confidence, message).
    extra_check_functions: An optional iterable of additional check functions
                           that will be run on each source line. Each
                           function takes 4 arguments: filename,
                           clean_lines, line, error.  None means no extra
                           checks.
  """
  # A None default avoids sharing one mutable list between all calls.
  if extra_check_functions is None:
    extra_check_functions = []
  raw_lines = clean_lines.raw_lines
  ParseNolintSuppressions(filename, raw_lines[line], line, error)
  nesting_state.Update(filename, clean_lines, line, error)
  if nesting_state.InAsmBlock():
    return
  CheckForFunctionLengths(filename, clean_lines, line, function_state, error)
  CheckForMultilineCommentsAndStrings(filename, clean_lines, line, error)
  CheckStyle(filename, clean_lines, line, file_extension, nesting_state, error)
  CheckLanguage(filename, clean_lines, line, file_extension, include_state,
                nesting_state, error)
  CheckForNonConstReference(filename, clean_lines, line, nesting_state, error)
  CheckForNonStandardConstructs(filename, clean_lines, line,
                                nesting_state, error)
  CheckVlogArguments(filename, clean_lines, line, error)
  CheckPosixThreading(filename, clean_lines, line, error)
  CheckInvalidIncrement(filename, clean_lines, line, error)
  CheckMakePairUsesDeduction(filename, clean_lines, line, error)
  CheckDefaultLambdaCaptures(filename, clean_lines, line, error)
  for check_fn in extra_check_functions:
    check_fn(filename, clean_lines, line, error)
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	5331
				5332	def FlagCxx11Features(filename, clean_lines, linenum, error):
				5333	"""Flag those c++11 features that we only allow in certain places.
				5334
				5335	Args:
				5336	filename: The name of the current file.
				5337	clean_lines: A CleansedLines instance containing the file.
				5338	linenum: The number of the line to check.
				5339	error: The function to call with any errors found.
				5340	"""
				5341	line = clean_lines.elided[linenum]
				5342
				5343	# Flag unapproved C++11 headers.
				5344	include = Match(r'\s#\sinclude\s+[<"]([^<"]+)[">]', line)
				5345	if include and include.group(1) in ('cfenv',
				5346	'condition_variable',
				5347	'fenv.h',
				5348	'future',
				5349	'mutex',
				5350	'thread',
				5351	'chrono',
				5352	'ratio',
				5353	'regex',
				5354	'system_error',
				5355	):
				5356	error(filename, linenum, 'build/c++11', 5,
				5357	('<%s> is an unapproved C++11 header.') % include.group(1))
				5358
				5359	# The only place where we need to worry about C++11 keywords and library
				5360	# features in preprocessor directives is in macro definitions.
				5361	if Match(r'\s#', line) and not Match(r'\s#\s*define\b', line): return
				5362
				5363	# These are classes and free functions. The classes are always
				5364	# mentioned as std::*, but we only catch the free functions if
				5365	# they're not found by ADL. They're alphabetical by header.
				5366	for top_name in (
				5367	# type_traits
				5368	'alignment_of',
				5369	'aligned_union',
				5370
				5371	# utility
				5372	'forward',
				5373	):
				5374	if Search(r'\bstd::%s\b' % top_name, line):
				5375	error(filename, linenum, 'build/c++11', 5,
				5376	('std::%s is an unapproved C++11 class or function. Send c-style '
				5377	'an example of where it would make your code more readable, and '
				5378	'they may let you use it.') % top_name)
				5379
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5380
def ProcessFileData(filename, file_extension, lines, error,
                    extra_check_functions=None):
  """Performs lint checks and reports any errors to the given error function.

  Whole-file checks (copyright, header guard for 'h' files) run on the raw
  lines, then every cleansed line goes through ProcessLine and
  FlagCxx11Features, and finally the include-what-you-use, bad-character and
  newline-at-EOF checks run.

  Args:
    filename: Filename of the file that is being processed.
    file_extension: The extension (dot not included) of the file.
    lines: An array of strings, each representing a line of the file, with the
           last element being empty if the file is terminated with a newline.
           The caller's list is not modified; a new list with marker lines
           added at both ends is built here.
    error: A callable to which errors are reported.  The checks in this file
           call it as error(filename, linenum, category, confidence, message).
    extra_check_functions: An optional iterable of additional check functions
                           that will be run on each source line. Each
                           function takes 4 arguments: filename,
                           clean_lines, line, error.  None means no extra
                           checks.
  """
  # A None default avoids sharing one mutable list between all calls.
  if extra_check_functions is None:
    extra_check_functions = []

  lines = (['// marker so line numbers and indices both start at 1'] + lines +
           ['// marker so line numbers end in a known way'])

  include_state = _IncludeState()
  function_state = _FunctionState()
  nesting_state = NestingState()

  ResetNolintSuppressions()

  CheckForCopyright(filename, lines, error)

  if file_extension == 'h':
    CheckForHeaderGuard(filename, lines, error)

  RemoveMultiLineComments(filename, lines, error)
  clean_lines = CleansedLines(lines)
  for line in xrange(clean_lines.NumLines()):
    ProcessLine(filename, file_extension, clean_lines, line,
                include_state, function_state, nesting_state, error,
                extra_check_functions)
    FlagCxx11Features(filename, clean_lines, line, error)
  nesting_state.CheckCompletedBlocks(filename, error)

  CheckForIncludeWhatYouUse(filename, clean_lines, include_state, error)

  # We check here rather than inside ProcessLine so that we see raw
  # lines rather than "cleaned" lines.
  CheckForBadCharacters(filename, lines, error)

  CheckForNewlineAtEOF(filename, lines, error)
				5426
avakulenko@google.com	d39bbb5	2014-06-04 22:55:20 +0000	[diff] [blame]	5427
def ProcessFile(filename, vlevel, extra_check_functions=None):
  """Does google-lint on a single file.

  Reads the file (or stdin when filename is '-'), strips trailing '\\r'
  characters, runs ProcessFileData on it and finally warns about CR-LF line
  endings when the file mixes LF and CR-LF.  A file that cannot be read, or
  whose extension is not in _valid_extensions, is reported on stderr and
  skipped.

  Args:
    filename: The name of the file to parse.

    vlevel: The level of errors to report.  Every error of confidence
    >= verbose_level will be reported.  0 is a good default.

    extra_check_functions: An optional iterable of additional check functions
                           that will be run on each source line. Each
                           function takes 4 arguments: filename,
                           clean_lines, line, error.  None means no extra
                           checks.
  """
  # A None default avoids sharing one mutable list between all calls.
  if extra_check_functions is None:
    extra_check_functions = []

  _SetVerboseLevel(vlevel)

  # 1-based line numbers, split by the end-of-line sequence they used.
  lf_lines = []
  crlf_lines = []
  try:
    # Support the UNIX convention of using "-" for stdin.  Note that
    # we are not opening the file with universal newline support
    # (which codecs doesn't support anyway), so the resulting lines do
    # contain trailing '\r' characters if we are reading a file that
    # has CRLF endings.
    # If after the split a trailing '\r' is present, it is removed
    # below.
    if filename == '-':
      lines = codecs.StreamReaderWriter(sys.stdin,
                                        codecs.getreader('utf8'),
                                        codecs.getwriter('utf8'),
                                        'replace').read().split('\n')
    else:
      # Close the handle as soon as the content is read instead of leaking it.
      with codecs.open(filename, 'r', 'utf8', 'replace') as source_file:
        lines = source_file.read().split('\n')

    # Remove trailing '\r'.
    # The last element is skipped: it is the extra trailing blank line we get
    # from split().
    for index, text in enumerate(lines[:-1]):
      if text.endswith('\r'):
        lines[index] = text.rstrip('\r')
        crlf_lines.append(index + 1)
      else:
        lf_lines.append(index + 1)

  except IOError:
    sys.stderr.write(
        "Skipping input '%s': Can't open for reading\n" % filename)
    return

  # Note, if no dot is found, this will give the entire filename as the ext.
  file_extension = filename[filename.rfind('.') + 1:]

  # When reading from stdin, the extension is unknown, so no cpplint tests
  # should rely on the extension.
  if filename != '-' and file_extension not in _valid_extensions:
    sys.stderr.write('Ignoring %s; not a valid file name '
                     '(%s)\n' % (filename, ', '.join(_valid_extensions)))
  else:
    ProcessFileData(filename, file_extension, lines, Error,
                    extra_check_functions)

    # If end-of-line sequences are a mix of LF and CR-LF, issue
    # warnings on the lines with CR.
    #
    # Don't issue any warnings if all lines are uniformly LF or CR-LF,
    # since critique can handle these just fine, and the style guide
    # doesn't dictate a particular end of line sequence.
    #
    # We can't depend on os.linesep to determine what the desired
    # end-of-line sequence should be, since that will return the
    # server-side end-of-line sequence.
    if lf_lines and crlf_lines:
      # Warn on every line with CR.  An alternative approach might be to
      # check whether the file is mostly CRLF or just LF, and warn on the
      # minority, we bias toward LF here since most tools prefer LF.
      for linenum in crlf_lines:
        Error(filename, linenum, 'whitespace/newline', 1,
              'Unexpected \\r (^M) found; better to use only \\n')

  sys.stderr.write('Done processing %s\n' % filename)
				5507
				5508
				5509	def PrintUsage(message):
				5510	"""Prints a brief usage string and exits, optionally with an error message.
				5511
				5512	Args:
				5513	message: The optional error message.
				5514	"""
				5515	sys.stderr.write(_USAGE)
				5516	if message:
				5517	sys.exit('\nFATAL ERROR: ' + message)
				5518	else:
				5519	sys.exit(1)
				5520
				5521
				5522	def PrintCategories():
				5523	"""Prints a list of all the error-categories used by error messages.
				5524
				5525	These are the categories used to filter messages via --filter.
				5526	"""
erg@google.com	35589e6	2010-11-17 18:58:16 +0000	[diff] [blame]	5527	sys.stderr.write(''.join(' %s\n' % cat for cat in _ERROR_CATEGORIES))
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5528	sys.exit(0)
				5529
				5530
				5531	def ParseArguments(args):
				5532	"""Parses the command line arguments.
				5533
				5534	This may set the output format and verbosity level as side-effects.
				5535
				5536	Args:
				5537	args: The command line arguments:
				5538
				5539	Returns:
				5540	The list of filenames to lint.
				5541	"""
				5542	try:
				5543	(opts, filenames) = getopt.getopt(args, '', ['help', 'output=', 'verbose=',
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	5544	'counting=',
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	5545	'filter=',
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	5546	'root=',
				5547	'linelength=',
				5548	'extensions='])
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5549	except getopt.GetoptError:
				5550	PrintUsage('Invalid arguments.')
				5551
				5552	verbosity = _VerboseLevel()
				5553	output_format = _OutputFormat()
				5554	filters = ''
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	5555	counting_style = ''
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5556
				5557	for (opt, val) in opts:
				5558	if opt == '--help':
				5559	PrintUsage(None)
				5560	elif opt == '--output':
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	5561	if val not in ('emacs', 'vs7', 'eclipse'):
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	5562	PrintUsage('The only allowed output formats are emacs, vs7 and eclipse.')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5563	output_format = val
				5564	elif opt == '--verbose':
				5565	verbosity = int(val)
				5566	elif opt == '--filter':
				5567	filters = val
erg@google.com	6317a9c	2009-06-25 00:28:19 +0000	[diff] [blame]	5568	if not filters:
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5569	PrintCategories()
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	5570	elif opt == '--counting':
				5571	if val not in ('total', 'toplevel', 'detailed'):
				5572	PrintUsage('Valid counting options are total, toplevel, and detailed')
				5573	counting_style = val
mazda@chromium.org	3fffcec	2013-06-07 01:04:53 +0000	[diff] [blame]	5574	elif opt == '--root':
				5575	global _root
				5576	_root = val
raphael.kubo.da.costa@intel.com	331fbc4	2014-05-09 08:48:20 +0000	[diff] [blame]	5577	elif opt == '--linelength':
				5578	global _line_length
				5579	try:
				5580	_line_length = int(val)
				5581	except ValueError:
				5582	PrintUsage('Line length must be digits.')
				5583	elif opt == '--extensions':
				5584	global _valid_extensions
				5585	try:
				5586	_valid_extensions = set(val.split(','))
				5587	except ValueError:
				5588	PrintUsage('Extensions must be comma seperated list.')
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5589
				5590	if not filenames:
				5591	PrintUsage('No files were specified.')
				5592
				5593	_SetOutputFormat(output_format)
				5594	_SetVerboseLevel(verbosity)
				5595	_SetFilters(filters)
erg@google.com	26970fa	2009-11-17 18:07:32 +0000	[diff] [blame]	5596	_SetCountingStyle(counting_style)
maruel@google.com	fb2b8eb	2009-04-23 21:03:42 +0000	[diff] [blame]	5597
				5598	return filenames
				5599
				5600
				def main():
				  """Lints the files named on the command line and exits.

				  The command line (everything after the program name) is handed to
				  ParseArguments, which returns the filenames to lint.  Each file is then
				  run through ProcessFile at the verbose level currently stored on
				  _cpplint_state, and the error counts are printed afterwards.

				  This function does not return normally: it always finishes by calling
				  sys.exit with the boolean `error_count > 0`, so the process exit status
				  is 1 when at least one error was counted and 0 otherwise.
				  """
				  files_to_lint = ParseArguments(sys.argv[1:])

				  # Swap stderr for a UTF-8 stream wrapper using the 'replace' error
				  # handler, so that printing a message containing non-ASCII characters
				  # does not kill the run.
				  utf8_reader = codecs.getreader('utf8')
				  utf8_writer = codecs.getwriter('utf8')
				  sys.stderr = codecs.StreamReaderWriter(
				      sys.stderr, utf8_reader, utf8_writer, 'replace')

				  # Start from clean counters, lint everything, then report the totals.
				  _cpplint_state.ResetErrorCounts()
				  for path in files_to_lint:
				    ProcessFile(path, _cpplint_state.verbose_level)
				  _cpplint_state.PrintErrorCounts()

				  found_errors = _cpplint_state.error_count > 0
				  sys.exit(found_errors)
				5617
				5618
				# Script entry point: run the linter only when this file is executed
				# directly, not when it is imported as a module.
				if __name__ == '__main__':
				  main()