module Rouge module Lexers class Ruby < RegexLexer desc "The Ruby programming language (ruby-lang.org)" tag 'ruby' aliases 'rb' filenames '*.rb', '*.ruby', '*.rbw', '*.rake', '*.gemspec', 'Rakefile', 'Guardfile', 'Gemfile', 'Capfile', 'Vagrantfile', '*.ru', '*.prawn' mimetypes 'text/x-ruby', 'application/x-ruby' def self.analyze_text(text) return 1 if text.shebang? 'ruby' end state :strings do # symbols rule %r( : # initial : @{0,2} # optional ivar, for :@foo and :@@foo [a-z_]\w*[!?]? # the symbol )xi, Str::Symbol # special symbols rule %r(:(?:\*\*|[-+]@|[/\%&\|^`~]|\[\]=?|<<|>>|<=?>|<=?|===?)), Str::Symbol rule /:'(\\\\|\\'|[^'])*'/, Str::Symbol rule /\b[a-z_]\w*?:\s+/, Str::Symbol rule /'(\\\\|\\'|[^'])*'/, Str::Single rule /:"/, Str::Symbol, :simple_sym rule /"/, Str::Double, :simple_string rule /(?, %.abc., %r.abc., etc delimiter_map = { '{' => '}', '[' => ']', '(' => ')', '<' => '>' } rule /%([rqswQWxiI])?([^\w\s])/ do |m| open = Regexp.escape(m[2]) close = Regexp.escape(delimiter_map[m[2]] || m[2]) interp = /[rQWxI]/ === m[1] toktype = Str::Other puts " open: #{open.inspect}" if @debug puts " close: #{close.inspect}" if @debug # regexes if m[1] == 'r' toktype = Str::Regex push :regex_flags end token toktype push do rule /\\[##{open}#{close}\\]/, Str::Escape # nesting rules only with asymmetric delimiters if open != close rule /#{open}/ do token toktype push end end rule /#{close}/, toktype, :pop! if interp mixin :string_intp_escaped rule /#/, toktype else rule /[\\#]/, toktype end rule /[^##{open}#{close}\\]+/m, toktype end end end state :regex_flags do rule /[mixounse]*/, Str::Regex, :pop! end # double-quoted string and symbol [[:string, Str::Double, '"'], [:sym, Str::Symbol, '"'], [:backtick, Str::Backtick, '`']].each do |name, tok, fin| state :"simple_#{name}" do mixin :string_intp_escaped rule /[^\\#{fin}#]+/m, tok rule /[\\#]/, tok rule /#{fin}/, tok, :pop! end end keywords = %w( BEGIN END alias begin break case defined\? do else elsif end ensure for if in next redo rescue raise retry return super then undef unless until when while yield ) keywords_pseudo = %w( initialize new loop include extend raise attr_reader attr_writer attr_accessor attr catch throw private module_function public protected true false nil __FILE__ __LINE__ ) builtins_g = %w( Array Float Integer Str __id__ __send__ abort ancestors at_exit autoload binding callcc caller catch chomp chop class_eval class_variables clone const_defined\? const_get const_missing const_set constants display dup eval exec exit extend fail fork format freeze getc gets global_variables gsub hash id included_modules inspect instance_eval instance_method instance_methods instance_variable_get instance_variable_set instance_variables lambda load local_variables loop method method_missing methods module_eval name object_id open p print printf private_class_method private_instance_methods private_methods proc protected_instance_methods protected_methods public_class_method public_instance_methods public_methods putc puts raise rand readline readlines require scan select self send set_trace_func singleton_methods sleep split sprintf srand sub syscall system taint test throw to_a to_s trace_var trap untaint untrace_var warn ) builtins_q = %w( autoload block_given const_defined eql equal frozen include instance_of is_a iterator kind_of method_defined nil private_method_defined protected_method_defined public_method_defined respond_to tainted ) builtins_b = %w(chomp chop exit gsub sub) start do push :expr_start @heredoc_queue = [] end state :root do rule /\n\s*/m, Text, :expr_start rule /\s+/, Text # NB: NOT /m rule /#.*$/, Comment::Single rule %r(=begin\b.*?end\b)m, Comment::Multiline rule /(?:#{keywords.join('|')})\b/, Keyword, :expr_start rule /(?:#{keywords_pseudo.join('|')})\b/, Keyword::Pseudo, :expr_start rule %r( (module) (\s+) ([a-zA-Z_][a-zA-Z0-9_]*(::[a-zA-Z_][a-zA-Z0-9_]*)*) )x do groups Keyword, Text, Name::Namespace end rule /(def\b)(\s*)/ do groups Keyword, Text push :funcname end rule /(class\b)(\s*)/ do groups Keyword, Text push :classname end rule /(?:#{builtins_q.join('|')})\?/, Name::Builtin, :expr_start rule /(?:#{builtins_b.join('|')})!/, Name::Builtin, :expr_start rule /(?_*\$?:"]), Name::Variable::Global rule /\$-[0adFiIlpvw]/, Name::Variable::Global rule /::/, Operator mixin :strings # char operator. ?x evaulates to "x", unless there's a digit # beforehand like x>=0?n[x]:"" rule %r( \?(\\[MC]-)* # modifiers (\\([\\abefnrstv\#"']|x[a-fA-F0-9]{1,2}|[0-7]{1,3})|\S) (?!\w) )x, Str::Char mixin :has_heredocs rule /[A-Z][a-zA-Z0-9_]+/, Name::Constant, :method_call rule /(\.|::)([a-z_]\w*[!?]?|[*%&^`~+-\/\[<>=])/ do groups Punctuation, Name::Function push :expr_start end rule /[a-zA-Z_]\w*[?!]/, Name, :expr_start rule /[a-zA-Z_]\w*/, Name, :method_call rule /\[|\]|\*\*|<>?|>=|<=|<=>|=~|={3}|!~|&&?|\|\||\.{1,3}/, Operator, :expr_start rule /[-+\/*%=<>&!^|~]=?/, Operator, :expr_start rule %r<[({,?:\\;/]>, Punctuation, :expr_start rule %r<[)}]>, Punctuation end state :has_heredocs do rule /(?>? | <=>? | >= | ===? ) )x do |m| puts "matches: #{[m[0], m[1], m[2], m[3]].inspect}" if @debug groups Name::Class, Operator, Name::Function pop! end rule(//) { pop! } end state :classname do rule /\s+/, Text rule /\(/, Punctuation, :defexpr # class << expr rule /<