# frozen_string_literal: true module RuboCop module AST # `RuboCop::AST::Node` is a subclass of `Parser::AST::Node`. It provides # access to parent nodes and an object-oriented way to traverse an AST with # the power of `Enumerable`. # # It has predicate methods for every node type, like this: # # @example # node.send_type? # Equivalent to: `node.type == :send` # node.op_asgn_type? # Equivalent to: `node.type == :op_asgn` # # # Non-word characters (other than a-zA-Z0-9_) in type names are omitted. # node.defined_type? # Equivalent to: `node.type == :defined?` # # # Find the first lvar node under the receiver node. # lvar_node = node.each_descendant.find(&:lvar_type?) # class Node < Parser::AST::Node # rubocop:disable Metrics/ClassLength include RuboCop::AST::Sexp extend NodePattern::Macros include RuboCop::AST::Descendence # @api private # <=> isn't included here, because it doesn't return a boolean. COMPARISON_OPERATORS = %i[== === != <= >= > <].to_set.freeze # @api private TRUTHY_LITERALS = %i[str dstr xstr int float sym dsym array hash regexp true irange erange complex rational regopt].to_set.freeze # @api private FALSEY_LITERALS = %i[false nil].to_set.freeze # @api private LITERALS = (TRUTHY_LITERALS + FALSEY_LITERALS).freeze # @api private COMPOSITE_LITERALS = %i[dstr xstr dsym array hash irange erange regexp].to_set.freeze # @api private BASIC_LITERALS = (LITERALS - COMPOSITE_LITERALS).freeze # @api private MUTABLE_LITERALS = %i[str dstr xstr array hash regexp irange erange].to_set.freeze # @api private IMMUTABLE_LITERALS = (LITERALS - MUTABLE_LITERALS).freeze # @api private EQUALS_ASSIGNMENTS = %i[lvasgn ivasgn cvasgn gvasgn casgn masgn].to_set.freeze # @api private SHORTHAND_ASSIGNMENTS = %i[op_asgn or_asgn and_asgn].to_set.freeze # @api private ASSIGNMENTS = (EQUALS_ASSIGNMENTS + SHORTHAND_ASSIGNMENTS).freeze # @api private BASIC_CONDITIONALS = %i[if while until].to_set.freeze # @api private CONDITIONALS = (BASIC_CONDITIONALS + %i[case case_match]).freeze # @api private POST_CONDITION_LOOP_TYPES = %i[while_post until_post].to_set.freeze # @api private LOOP_TYPES = (POST_CONDITION_LOOP_TYPES + %i[while until for]).freeze # @api private VARIABLES = %i[ivar gvar cvar lvar].to_set.freeze # @api private REFERENCES = %i[nth_ref back_ref].to_set.freeze # @api private KEYWORDS = %i[alias and break case class def defs defined? kwbegin do else ensure for if module next not or postexe redo rescue retry return self super zsuper then undef until when while yield].to_set.freeze # @api private OPERATOR_KEYWORDS = %i[and or].to_set.freeze # @api private SPECIAL_KEYWORDS = %w[__FILE__ __LINE__ __ENCODING__].to_set.freeze # @api private ARGUMENT_TYPES = %i[arg optarg restarg kwarg kwoptarg kwrestarg blockarg forward_arg shadowarg].to_set.freeze LITERAL_RECURSIVE_METHODS = (COMPARISON_OPERATORS + %i[* ! <=>]).freeze LITERAL_RECURSIVE_TYPES = (OPERATOR_KEYWORDS + COMPOSITE_LITERALS + %i[begin pair]).freeze private_constant :LITERAL_RECURSIVE_METHODS, :LITERAL_RECURSIVE_TYPES EMPTY_CHILDREN = [].freeze EMPTY_PROPERTIES = {}.freeze private_constant :EMPTY_CHILDREN, :EMPTY_PROPERTIES # @see https://www.rubydoc.info/gems/ast/AST/Node:initialize def initialize(type, children = EMPTY_CHILDREN, properties = EMPTY_PROPERTIES) @mutable_attributes = {} # ::AST::Node#initialize freezes itself. super # #parent= may be invoked multiple times for a node because there are # pending nodes while constructing AST and they are replaced later. # For example, `lvar` and `send` type nodes are initially created as an # `ident` type node and fixed to the appropriate type later. # So, the #parent attribute needs to be mutable. each_child_node do |child_node| child_node.parent = self unless child_node.complete? end end (Parser::Meta::NODE_TYPES - [:send]).each do |node_type| method_name = "#{node_type.to_s.gsub(/\W/, '')}_type?" class_eval <<~RUBY, __FILE__, __LINE__ + 1 def #{method_name} # def block_type? @type == :#{node_type} # @type == :block end # end RUBY end # Most nodes are of 'send' type, so this method is defined # separately to make this check as fast as possible. def send_type? false end # Returns the parent node, or `nil` if the receiver is a root node. # # @return [Node, nil] the parent node or `nil` def parent @mutable_attributes[:parent] end def parent=(node) @mutable_attributes[:parent] = node end # @return [Boolean] def parent? !!parent end # @return [Boolean] def root? !parent end def complete! @mutable_attributes.freeze each_child_node(&:complete!) end def complete? @mutable_attributes.frozen? end protected :parent= # Override `AST::Node#updated` so that `AST::Processor` does not try to # mutate our ASTs. Since we keep references from children to parents and # not just the other way around, we cannot update an AST and share # identical subtrees. Rather, the entire AST must be copied any time any # part of it is changed. def updated(type = nil, children = nil, properties = {}) properties[:location] ||= @location klass = RuboCop::AST::Builder::NODE_MAP[type || @type] || Node klass.new(type || @type, children || @children, properties) end # Returns the index of the receiver node in its siblings. (Sibling index # uses zero based numbering.) # Use is discouraged, this is a potentially slow method. # # @return [Integer, nil] the index of the receiver node in its siblings def sibling_index parent&.children&.index { |sibling| sibling.equal?(self) } end # Use is discouraged, this is a potentially slow method and can lead # to even slower algorithms # @return [Node, nil] the right (aka next) sibling def right_sibling return unless parent parent.children[sibling_index + 1].freeze end # Use is discouraged, this is a potentially slow method and can lead # to even slower algorithms # @return [Node, nil] the left (aka previous) sibling def left_sibling i = sibling_index return if i.nil? || i.zero? parent.children[i - 1].freeze end # Use is discouraged, this is a potentially slow method and can lead # to even slower algorithms # @return [Array] the left (aka previous) siblings def left_siblings return [].freeze unless parent parent.children[0...sibling_index].freeze end # Use is discouraged, this is a potentially slow method and can lead # to even slower algorithms # @return [Array] the right (aka next) siblings def right_siblings return [].freeze unless parent parent.children[sibling_index + 1..].freeze end # Common destructuring method. This can be used to normalize # destructuring for different variations of the node. # Some node types override this with their own custom # destructuring method. # # @return [Array] the different parts of the ndde alias node_parts to_a # Calls the given block for each ancestor node from parent to root. # If no block is given, an `Enumerator` is returned. # # @overload each_ancestor # Yield all nodes. # @overload each_ancestor(type) # Yield only nodes matching the type. # @param [Symbol] type a node type # @overload each_ancestor(type_a, type_b, ...) # Yield only nodes matching any of the types. # @param [Symbol] type_a a node type # @param [Symbol] type_b a node type # @yieldparam [Node] node each ancestor node # @return [self] if a block is given # @return [Enumerator] if no block is given def each_ancestor(*types, &block) return to_enum(__method__, *types) unless block visit_ancestors(types, &block) self end # Returns an array of ancestor nodes. # This is a shorthand for `node.each_ancestor.to_a`. # # @return [Array] an array of ancestor nodes def ancestors each_ancestor.to_a end # NOTE: Some rare nodes may have no source, like `s(:args)` in `foo {}` # @return [String, nil] def source loc.expression&.source end def source_range loc.expression end def first_line loc.line end def last_line loc.last_line end def line_count return 0 unless source_range source_range.last_line - source_range.first_line + 1 end def nonempty_line_count source.lines.grep(/\S/).size end def source_length source_range ? source_range.size : 0 end ## Destructuring # @!method receiver(node = self) def_node_matcher :receiver, <<~PATTERN {(send $_ ...) ({block numblock} (call $_ ...) ...)} PATTERN # @!method str_content(node = self) def_node_matcher :str_content, '(str $_)' def const_name return unless const_type? namespace, name = *self if namespace && !namespace.cbase_type? "#{namespace.const_name}::#{name}" else name.to_s end end # @!method defined_module0(node = self) def_node_matcher :defined_module0, <<~PATTERN {(class (const $_ $_) ...) (module (const $_ $_) ...) (casgn $_ $_ (send #global_const?({:Class :Module}) :new ...)) (casgn $_ $_ (block (send #global_const?({:Class :Module}) :new ...) ...))} PATTERN private :defined_module0 def defined_module namespace, name = *defined_module0 s(:const, namespace, name) if name end def defined_module_name (const = defined_module) && const.const_name end ## Searching the AST def parent_module_name # what class or module is this method/constant/etc definition in? # returns nil if answer cannot be determined ancestors = each_ancestor(:class, :module, :sclass, :casgn, :block) result = ancestors.filter_map do |ancestor| parent_module_name_part(ancestor) do |full_name| return nil unless full_name full_name end end.reverse.join('::') result.empty? ? 'Object' : result end ## Predicates def multiline? line_count > 1 end def single_line? line_count == 1 end def empty_source? source_length.zero? end # Some cops treat the shovel operator as a kind of assignment. # @!method assignment_or_similar?(node = self) def_node_matcher :assignment_or_similar?, <<~PATTERN {assignment? (send _recv :<< ...)} PATTERN def literal? LITERALS.include?(type) end def basic_literal? BASIC_LITERALS.include?(type) end def truthy_literal? TRUTHY_LITERALS.include?(type) end def falsey_literal? FALSEY_LITERALS.include?(type) end def mutable_literal? MUTABLE_LITERALS.include?(type) end def immutable_literal? IMMUTABLE_LITERALS.include?(type) end %i[literal basic_literal].each do |kind| recursive_kind = :"recursive_#{kind}?" kind_filter = :"#{kind}?" define_method(recursive_kind) do case type when :send LITERAL_RECURSIVE_METHODS.include?(method_name) && receiver.send(recursive_kind) && arguments.all?(&recursive_kind) when LITERAL_RECURSIVE_TYPES children.compact.all?(&recursive_kind) else send(kind_filter) end end end def variable? VARIABLES.include?(type) end def reference? REFERENCES.include?(type) end def equals_asgn? EQUALS_ASSIGNMENTS.include?(type) end def shorthand_asgn? SHORTHAND_ASSIGNMENTS.include?(type) end def assignment? ASSIGNMENTS.include?(type) end def basic_conditional? BASIC_CONDITIONALS.include?(type) end def conditional? CONDITIONALS.include?(type) end def post_condition_loop? POST_CONDITION_LOOP_TYPES.include?(type) end # NOTE: `loop { }` is a normal method call and thus not a loop keyword. def loop_keyword? LOOP_TYPES.include?(type) end def keyword? return true if special_keyword? || (send_type? && prefix_not?) return false unless KEYWORDS.include?(type) !OPERATOR_KEYWORDS.include?(type) || loc.operator.is?(type.to_s) end def special_keyword? SPECIAL_KEYWORDS.include?(source) end def operator_keyword? OPERATOR_KEYWORDS.include?(type) end def parenthesized_call? loc.respond_to?(:begin) && loc.begin && loc.begin.is?('(') end def call_type? send_type? || csend_type? end def chained? parent&.call_type? && eql?(parent.receiver) end def argument? parent&.send_type? && parent.arguments.include?(self) end def argument_type? ARGUMENT_TYPES.include?(type) end def boolean_type? true_type? || false_type? end def numeric_type? int_type? || float_type? || rational_type? || complex_type? end def range_type? irange_type? || erange_type? end def guard_clause? node = and_type? || or_type? ? rhs : self node.match_guard_clause? end # @!method match_guard_clause?(node = self) def_node_matcher :match_guard_clause?, <<~PATTERN [${(send nil? {:raise :fail} ...) return break next} single_line?] PATTERN # @!method proc?(node = self) def_node_matcher :proc?, <<~PATTERN {(block (send nil? :proc) ...) (block (send #global_const?(:Proc) :new) ...) (send #global_const?(:Proc) :new)} PATTERN # @!method lambda?(node = self) def_node_matcher :lambda?, '({block numblock} (send nil? :lambda) ...)' # @!method lambda_or_proc?(node = self) def_node_matcher :lambda_or_proc?, '{lambda? proc?}' # @!method global_const?(node = self, name) def_node_matcher :global_const?, '(const {nil? cbase} %1)' # @!method class_constructor?(node = self) def_node_matcher :class_constructor?, <<~PATTERN { (send #global_const?({:Class :Module :Struct}) :new ...) (send #global_const?(:Data) :define ...) ({block numblock} { (send #global_const?({:Class :Module :Struct}) :new ...) (send #global_const?(:Data) :define ...) } ...) } PATTERN # @deprecated Use `:class_constructor?` # @!method struct_constructor?(node = self) def_node_matcher :struct_constructor?, <<~PATTERN ({block numblock} (send #global_const?(:Struct) :new ...) _ $_) PATTERN # @!method class_definition?(node = self) def_node_matcher :class_definition?, <<~PATTERN {(class _ _ $_) (sclass _ $_) ({block numblock} (send #global_const?({:Struct :Class}) :new ...) _ $_)} PATTERN # @!method module_definition?(node = self) def_node_matcher :module_definition?, <<~PATTERN {(module _ $_) ({block numblock} (send #global_const?(:Module) :new ...) _ $_)} PATTERN # Some expressions are evaluated for their value, some for their side # effects, and some for both # If we know that an expression is useful only for its side effects, that # means we can transform it in ways which preserve the side effects, but # change the return value # So, does the return value of this node matter? If we changed it to # `(...; nil)`, might that affect anything? # # rubocop:disable Metrics/MethodLength def value_used? # Be conservative and return true if we're not sure. return false if parent.nil? case parent.type when :array, :defined?, :dstr, :dsym, :eflipflop, :erange, :float, :hash, :iflipflop, :irange, :not, :pair, :regexp, :str, :sym, :when, :xstr parent.value_used? when :begin, :kwbegin begin_value_used? when :for for_value_used? when :case, :if case_if_value_used? when :while, :until, :while_post, :until_post while_until_value_used? else true end end # rubocop:enable Metrics/MethodLength # Some expressions are evaluated for their value, some for their side # effects, and some for both. # If we know that expressions are useful only for their return values, # and have no side effects, that means we can reorder them, change the # number of times they are evaluated, or replace them with other # expressions which are equivalent in value. # So, is evaluation of this node free of side effects? # def pure? # Be conservative and return false if we're not sure case type when :__FILE__, :__LINE__, :const, :cvar, :defined?, :false, :float, :gvar, :int, :ivar, :lvar, :nil, :str, :sym, :true, :regopt true when :and, :array, :begin, :case, :dstr, :dsym, :eflipflop, :ensure, :erange, :for, :hash, :if, :iflipflop, :irange, :kwbegin, :not, :or, :pair, :regexp, :until, :until_post, :when, :while, :while_post child_nodes.all?(&:pure?) else false end end private def visit_ancestors(types) last_node = self while (current_node = last_node.parent) yield current_node if types.empty? || types.include?(current_node.type) last_node = current_node end end def begin_value_used? # the last child node determines the value of the parent sibling_index == parent.children.size - 1 ? parent.value_used? : false end def for_value_used? # `for var in enum; body; end` # (for ) sibling_index == 2 ? parent.value_used? : true end def case_if_value_used? # (case ) # (if ) sibling_index.zero? ? true : parent.value_used? end def while_until_value_used? # (while ) -> always evaluates to `nil` sibling_index.zero? end def parent_module_name_part(node) case node.type when :class, :module, :casgn # TODO: if constant name has cbase (leading ::), then we don't need # to keep traversing up through nested classes/modules node.defined_module_name when :sclass yield parent_module_name_for_sclass(node) else # block parent_module_name_for_block(node) { yield nil } end end def parent_module_name_for_sclass(sclass_node) # TODO: look for constant definition and see if it is nested # inside a class or module subject = sclass_node.children[0] if subject.const_type? "#" elsif subject.self_type? "#" end end def parent_module_name_for_block(ancestor) if ancestor.method?(:class_eval) # `class_eval` with no receiver applies to whatever module or class # we are currently in return unless (receiver = ancestor.receiver) yield unless receiver.const_type? receiver.const_name elsif !new_class_or_module_block?(ancestor) yield end end # @!method new_class_or_module_block?(node = self) def_node_matcher :new_class_or_module_block?, <<~PATTERN ^(casgn _ _ (block (send (const _ {:Class :Module}) :new) ...)) PATTERN end end end