# Copyright (c) 2009-2011, 2013-2014 LOGILAB S.A. (Paris, FRANCE) # Copyright (c) 2009, 2012, 2014 Google, Inc. # Copyright (c) 2012 Mike Bryant # Copyright (c) 2014 Brett Cannon # Copyright (c) 2014 Arun Persaud # Copyright (c) 2015-2020 Claudiu Popa # Copyright (c) 2015 Ionel Cristian Maries # Copyright (c) 2016, 2019-2020 Ashley Whetter # Copyright (c) 2016 Chris Murray # Copyright (c) 2017 guillaume2 # Copyright (c) 2017 Łukasz Rogalski # Copyright (c) 2018 Alan Chan # Copyright (c) 2018 Yury Gribov # Copyright (c) 2018 Mike Frysinger # Copyright (c) 2018 Mariatta Wijaya # Copyright (c) 2019-2021 Pierre Sassoulas # Copyright (c) 2019 Djailla # Copyright (c) 2019 Svet # Copyright (c) 2020 Anthony Sottile # Copyright (c) 2021 Nick Drozd # Copyright (c) 2021 Daniël van Noord <13665637+DanielNoord@users.noreply.github.com> # Copyright (c) 2021 Marc Mueller <30130371+cdce8p@users.noreply.github.com> # Licensed under the GPL: https://www.gnu.org/licenses/old-licenses/gpl-2.0.html # For details: https://github.com/PyCQA/pylint/blob/main/LICENSE """checker for use of Python logging """ import string from typing import Set import astroid from astroid import nodes from pylint import checkers, interfaces from pylint.checkers import utils from pylint.checkers.utils import check_messages, infer_all MSGS = { # pylint: disable=consider-using-namedtuple-or-dataclass "W1201": ( "Use %s formatting in logging functions", "logging-not-lazy", "Used when a logging statement has a call form of " '"logging.(format_string % (format_args...))". ' "Use another type of string formatting instead. " "You can use % formatting but leave interpolation to " "the logging function by passing the parameters as arguments. " "If logging-fstring-interpolation is disabled then " "you can use fstring formatting. " "If logging-format-interpolation is disabled then " "you can use str.format.", ), "W1202": ( "Use %s formatting in logging functions", "logging-format-interpolation", "Used when a logging statement has a call form of " '"logging.(format_string.format(format_args...))". ' "Use another type of string formatting instead. " "You can use % formatting but leave interpolation to " "the logging function by passing the parameters as arguments. " "If logging-fstring-interpolation is disabled then " "you can use fstring formatting. " "If logging-not-lazy is disabled then " "you can use % formatting as normal.", ), "W1203": ( "Use %s formatting in logging functions", "logging-fstring-interpolation", "Used when a logging statement has a call form of " '"logging.(f"...")".' "Use another type of string formatting instead. " "You can use % formatting but leave interpolation to " "the logging function by passing the parameters as arguments. " "If logging-format-interpolation is disabled then " "you can use str.format. " "If logging-not-lazy is disabled then " "you can use % formatting as normal.", ), "E1200": ( "Unsupported logging format character %r (%#02x) at index %d", "logging-unsupported-format", "Used when an unsupported format character is used in a logging " "statement format string.", ), "E1201": ( "Logging format string ends in middle of conversion specifier", "logging-format-truncated", "Used when a logging statement format string terminates before " "the end of a conversion specifier.", ), "E1205": ( "Too many arguments for logging format string", "logging-too-many-args", "Used when a logging format string is given too many arguments.", ), "E1206": ( "Not enough arguments for logging format string", "logging-too-few-args", "Used when a logging format string is given too few arguments.", ), } CHECKED_CONVENIENCE_FUNCTIONS = { "critical", "debug", "error", "exception", "fatal", "info", "warn", "warning", } def is_method_call(func, types=(), methods=()): """Determines if a BoundMethod node represents a method call. Args: func (astroid.BoundMethod): The BoundMethod AST node to check. types (Optional[String]): Optional sequence of caller type names to restrict check. methods (Optional[String]): Optional sequence of method names to restrict check. Returns: bool: true if the node represents a method call for the given type and method names, False otherwise. """ return ( isinstance(func, astroid.BoundMethod) and isinstance(func.bound, astroid.Instance) and (func.bound.name in types if types else True) and (func.name in methods if methods else True) ) class LoggingChecker(checkers.BaseChecker): """Checks use of the logging module.""" __implements__ = interfaces.IAstroidChecker name = "logging" msgs = MSGS options = ( ( "logging-modules", { "default": ("logging",), "type": "csv", "metavar": "", "help": "Logging modules to check that the string format " "arguments are in logging function parameter format.", }, ), ( "logging-format-style", { "default": "old", "type": "choice", "metavar": "", "choices": ["old", "new"], "help": "The type of string formatting that logging methods do. " "`old` means using % formatting, `new` is for `{}` formatting.", }, ), ) def visit_module(self, _: nodes.Module) -> None: """Clears any state left in this checker from last module checked.""" # The code being checked can just as easily "import logging as foo", # so it is necessary to process the imports and store in this field # what name the logging module is actually given. self._logging_names: Set[str] = set() logging_mods = self.config.logging_modules self._format_style = self.config.logging_format_style self._logging_modules = set(logging_mods) self._from_imports = {} for logging_mod in logging_mods: parts = logging_mod.rsplit(".", 1) if len(parts) > 1: self._from_imports[parts[0]] = parts[1] def visit_importfrom(self, node: nodes.ImportFrom) -> None: """Checks to see if a module uses a non-Python logging module.""" try: logging_name = self._from_imports[node.modname] for module, as_name in node.names: if module == logging_name: self._logging_names.add(as_name or module) except KeyError: pass def visit_import(self, node: nodes.Import) -> None: """Checks to see if this module uses Python's built-in logging.""" for module, as_name in node.names: if module in self._logging_modules: self._logging_names.add(as_name or module) @check_messages(*MSGS) def visit_call(self, node: nodes.Call) -> None: """Checks calls to logging methods.""" def is_logging_name(): return ( isinstance(node.func, nodes.Attribute) and isinstance(node.func.expr, nodes.Name) and node.func.expr.name in self._logging_names ) def is_logger_class(): for inferred in infer_all(node.func): if isinstance(inferred, astroid.BoundMethod): parent = inferred._proxied.parent if isinstance(parent, nodes.ClassDef) and ( parent.qname() == "logging.Logger" or any( ancestor.qname() == "logging.Logger" for ancestor in parent.ancestors() ) ): return True, inferred._proxied.name return False, None if is_logging_name(): name = node.func.attrname else: result, name = is_logger_class() if not result: return self._check_log_method(node, name) def _check_log_method(self, node, name): """Checks calls to logging.log(level, format, *format_args).""" if name == "log": if node.starargs or node.kwargs or len(node.args) < 2: # Either a malformed call, star args, or double-star args. Beyond # the scope of this checker. return format_pos = 1 elif name in CHECKED_CONVENIENCE_FUNCTIONS: if node.starargs or node.kwargs or not node.args: # Either no args, star args, or double-star args. Beyond the # scope of this checker. return format_pos = 0 else: return if isinstance(node.args[format_pos], nodes.BinOp): binop = node.args[format_pos] emit = binop.op == "%" if binop.op == "+": total_number_of_strings = sum( 1 for operand in (binop.left, binop.right) if self._is_operand_literal_str(utils.safe_infer(operand)) ) emit = total_number_of_strings > 0 if emit: self.add_message( "logging-not-lazy", node=node, args=(self._helper_string(node),), ) elif isinstance(node.args[format_pos], nodes.Call): self._check_call_func(node.args[format_pos]) elif isinstance(node.args[format_pos], nodes.Const): self._check_format_string(node, format_pos) elif isinstance(node.args[format_pos], nodes.JoinedStr): self.add_message( "logging-fstring-interpolation", node=node, args=(self._helper_string(node),), ) def _helper_string(self, node): """Create a string that lists the valid types of formatting for this node.""" valid_types = ["lazy %"] if not self.linter.is_message_enabled( "logging-fstring-formatting", node.fromlineno ): valid_types.append("fstring") if not self.linter.is_message_enabled( "logging-format-interpolation", node.fromlineno ): valid_types.append(".format()") if not self.linter.is_message_enabled("logging-not-lazy", node.fromlineno): valid_types.append("%") return " or ".join(valid_types) @staticmethod def _is_operand_literal_str(operand): """ Return True if the operand in argument is a literal string """ return isinstance(operand, nodes.Const) and operand.name == "str" def _check_call_func(self, node: nodes.Call): """Checks that function call is not format_string.format().""" func = utils.safe_infer(node.func) types = ("str", "unicode") methods = ("format",) if ( isinstance(func, astroid.BoundMethod) and is_method_call(func, types, methods) and not is_complex_format_str(func.bound) ): self.add_message( "logging-format-interpolation", node=node, args=(self._helper_string(node),), ) def _check_format_string(self, node, format_arg): """Checks that format string tokens match the supplied arguments. Args: node (nodes.NodeNG): AST node to be checked. format_arg (int): Index of the format string in the node arguments. """ num_args = _count_supplied_tokens(node.args[format_arg + 1 :]) if not num_args: # If no args were supplied the string is not interpolated and can contain # formatting characters - it's used verbatim. Don't check any further. return format_string = node.args[format_arg].value required_num_args = 0 if isinstance(format_string, bytes): format_string = format_string.decode() if isinstance(format_string, str): try: if self._format_style == "old": keyword_args, required_num_args, _, _ = utils.parse_format_string( format_string ) if keyword_args: # Keyword checking on logging strings is complicated by # special keywords - out of scope. return elif self._format_style == "new": ( keyword_arguments, implicit_pos_args, explicit_pos_args, ) = utils.parse_format_method_string(format_string) keyword_args_cnt = len( {k for k, l in keyword_arguments if not isinstance(k, int)} ) required_num_args = ( keyword_args_cnt + implicit_pos_args + explicit_pos_args ) except utils.UnsupportedFormatCharacter as ex: char = format_string[ex.index] self.add_message( "logging-unsupported-format", node=node, args=(char, ord(char), ex.index), ) return except utils.IncompleteFormatString: self.add_message("logging-format-truncated", node=node) return if num_args > required_num_args: self.add_message("logging-too-many-args", node=node) elif num_args < required_num_args: self.add_message("logging-too-few-args", node=node) def is_complex_format_str(node: nodes.NodeNG) -> bool: """Return whether the node represents a string with complex formatting specs.""" inferred = utils.safe_infer(node) if inferred is None or not ( isinstance(inferred, nodes.Const) and isinstance(inferred.value, str) ): return True try: parsed = list(string.Formatter().parse(inferred.value)) except ValueError: # This format string is invalid return False return any(format_spec for (_, _, format_spec, _) in parsed) def _count_supplied_tokens(args): """Counts the number of tokens in an args list. The Python log functions allow for special keyword arguments: func, exc_info and extra. To handle these cases correctly, we only count arguments that aren't keywords. Args: args (list): AST nodes that are arguments for a log format string. Returns: int: Number of AST nodes that aren't keywords. """ return sum(1 for arg in args if not isinstance(arg, nodes.Keyword)) def register(linter): """Required method to auto-register this checker.""" linter.register_checker(LoggingChecker(linter))