class RDParser preclow nonassoc DUMMY left ITEMLISTLINE ENUMLISTLINE DESCLISTLINE METHODLISTLINE STRINGLINE prechigh token STRINGLINE ITEMLISTLINE ENUMLISTLINE DESCLISTLINE METHODLISTLINE WHITELINE SUBTREE HEADLINE INCLUDE INDENT DEDENT DUMMY rule document : blocks { result = DocumentElement.new add_children_to_element(result, *val[0]) } | { raise ParseError, "Error: file empty." } ; blocks : blocks block { result.concat(val[1]) } | block ; block : textblock { result = val } | verbatim { result = val } | lists | headline { result = val } | include { result = val } | WHITELINE { result = [] } | SUBTREE { result = val[0].blocks } ; headline : HEADLINE { # val[0] is like [level, title] title = @inline_parser.parse(val[0][1]) result = Headline.new(val[0][0]) add_children_to_element(result, *title) } ; include : INCLUDE { result = Include.new(val[0]) } ; textblock : textblockcontent = DUMMY { # val[0] is Array of String content = cut_off(val[0]).join("") contents = @inline_parser.parse(content) result = TextBlock.new() add_children_to_element(result, *contents) } ; textblockcontent : textblockcontent STRINGLINE { result.push(val[1]) } | STRINGLINE { result = val } ; verbatim : INDENT verbatimcontent DEDENT { # val[1] is Array of String content = cut_off(val[1]) result = Verbatim.new(content) # imform to lexer. @in_verbatim = false } ; verbatim_after_lists : verbatimcontent { # val[0] is Array of String content = cut_off(val[0]) result = Verbatim.new(content) # imform to lexer. @in_verbatim = false } ; verbatimcontent : verbatimcontent STRINGLINE { result.push(val[1]) } | verbatimcontent INDENT verbatimcontent DEDENT { result.concat(val[2]) } | verbatimcontent WHITELINE { result.push("\n") } | STRINGLINE { result = val # imform to lexer. @in_verbatim = true } ; list : itemlist | enumlist | desclist | methodlist ; lists : lists2 = DUMMY | INDENT lists2 DEDENT { result = val[1] } | INDENT lists2 verbatim_after_lists DEDENT { result = val[1].push(val[2]) } ; lists2 : lists2 list { result.push(val[1]) } | list { result = val } ; itemlist : itemlistitems = DUMMY { result = ItemList.new add_children_to_element(result, *val[0]) } ; itemlistitems : itemlistitems itemlistitem { result.push(val[1]) } | itemlistitem { result = val } ; itemlistitem : first_textblock_in_itemlist other_blocks_in_list DEDENT { result = ItemListItem.new add_children_to_element(result, val[0], *val[1]) } ; enumlist : enumlistitems = DUMMY { result = EnumList.new add_children_to_element(result, *val[0]) } ; enumlistitems : enumlistitems enumlistitem { result.push(val[1]) } | enumlistitem { result = val } ; enumlistitem : first_textblock_in_enumlist other_blocks_in_list DEDENT { result = EnumListItem.new add_children_to_element(result, val[0], *val[1]) } ; desclist : desclistitems = DUMMY { result = DescList.new add_children_to_element(result, *val[0]) } ; desclistitems : desclistitems desclistitem { result.push(val[1]) } | desclistitem { result = val } ; desclistitem : DESCLISTLINE description_part DEDENT { term = DescListItem::Term.new term_contents = @inline_parser.parse(val[0].strip) add_children_to_element(term, *term_contents) result = DescListItem.new set_term_to_element(result, term) add_children_to_element(result, *val[1]) } ; methodlist : methodlistitems = DUMMY { result = MethodList.new add_children_to_element(result, *val[0]) } ; methodlistitems : methodlistitems methodlistitem { result.push(val[1]) } | methodlistitem { result = val } ; methodlistitem : METHODLISTLINE description_part DEDENT { term = MethodListItem::Term.new(val[0].strip) result = MethodListItem.new set_term_to_element(result, term) add_children_to_element(result, *val[1]) } ; description_part : whitelines textblock blocks_in_list { result = [val[1]].concat(val[2]) } | whitelines textblock { result = [val[1]] } | whitelines INDENT blocks_in_list DEDENT { result = val[2] } | whitelines { result = [] } ; blocks_in_list : blocks_in_list block_in_list { result.concat(val[1]) } | block_in_list ; block_in_list : textblock { result = val } | verbatim { result = val } | lists | WHITELINE { result = [] } ; whitelines : whitelines2 | ; whitelines2 : WHITELINE whitelines2 | WHITELINE ; first_textblock_in_itemlist : ITEMLISTLINE textblockcontent { content = cut_off([val[0]].concat(val[1])).join("") contents = @inline_parser.parse(content) result = TextBlock.new() add_children_to_element(result, *contents) } | ITEMLISTLINE { content = cut_off([val[0]]).join("") contents = @inline_parser.parse(content) result = TextBlock.new() add_children_to_element(result, *contents) } ; first_textblock_in_enumlist : ENUMLISTLINE textblockcontent { content = cut_off([val[0]].concat(val[1])).join("") contents = @inline_parser.parse(content) result = TextBlock.new() add_children_to_element(result, *contents) } | ENUMLISTLINE { content = cut_off([val[0]]).join("") contents = @inline_parser.parse(content) result = TextBlock.new() add_children_to_element(result, *contents) } ; other_blocks_in_list : verbatim blocks_in_list { result = [val[0]].concat(val[1]) } | lists blocks_in_list { result.concat(val[1]) } | WHITELINE blocks_in_list { result = val[1] } | verbatim { result = val } | lists | WHITELINE { result = [] } | { result = [] } ; end ---- inner include ParserUtility TMPFILE = ["rdtmp", $$, 0] attr_reader :tree def initialize @inline_parser = RDInlineParser.new(self) end def parse(src, tree) @src = src @src.push(false) # RDtree @tree = tree # @i: index(line no.) of src @i = 0 # stack for current indentation @indent_stack = [] # how indented. @current_indent = @indent_stack.join("") # RDParser for tmp src @subparser = nil # which part is in now @in_part = nil @part_content = [] @in_verbatim = false @yydebug = true do_parse end def next_token # preprocessing # if it is not in RD part # => method while @in_part != "rd" line = @src[@i] @i += 1 # next line case line # src end when false return [false, false] # RD part begin when /^=begin\s*(?:\bRD\b.*)?\s*$/ if @in_part # if in non-RD part @part_content.push(line) else @in_part = "rd" return [:WHITELINE, "=begin\n"] # <= for textblockand end # non-RD part begin when /^=begin\s+(\w+)/ part = $1 if @in_part # if in non-RD part @part_content.push(line) else @in_part = part if @tree.filter[part] # if filter exists # p "BEGIN_PART: #{@in_part}" # DEBUG end # non-RD part end when /^=end/ if @in_part # if in non-RD part # p "END_PART: #{@in_part}" # DEBUG # make Part-in object part = RD::Part.new(@part_content.join(""), @tree, "r") @part_content.clear # call filter, part_out is output(Part object) part_out = @tree.filter[@in_part].call(part) if @tree.filter[@in_part].mode == :rd # if output is RD formated subtree = parse_subtree( (RUBY_VERSION >= '1.9.0' ? part_out.lines.to_a : part_out.to_a ) ) else # if output is target formated basename = TMPFILE.join('.') TMPFILE[-1] += 1 tmpfile = open(@tree.tmp_dir + "/" + basename + ".#{@in_part}", "w") tmpfile.print(part_out) tmpfile.close subtree = parse_subtree(["=begin\n", "<<< #{basename}\n", "=end\n"]) end @in_part = nil return [:SUBTREE, subtree] end else if @in_part # if in non-RD part @part_content.push(line) end end end @current_indent = @indent_stack.join("") line = @src[@i] case line when false if_current_indent_equal("") do [false, false] end when /^=end/ if_current_indent_equal("") do @in_part = nil [:WHITELINE, "=end"] # MUST CHANGE?? end when /^\s*$/ @i += 1 # next line return [:WHITELINE, ':WHITELINE'] when /^\#/ # comment line @i += 1 # next line self.next_token() when /^(={1,4})(?!=)\s*(?=\S)/, /^(\+{1,2})(?!\+)\s*(?=\S)/ rest = $' # ' rest.strip! mark = $1 if_current_indent_equal("") do return [:HEADLINE, [Headline.mark_to_level(mark), rest]] end when /^<<<\s*(\S+)/ file = $1 if_current_indent_equal("") do suffix = file[-3 .. -1] if suffix == ".rd" or suffix == ".rb" subtree = parse_subtree(get_included(file)) [:SUBTREE, subtree] else [:INCLUDE, file] end end when /^(\s*)\*(\s*)/ rest = $' # ' newIndent = $2 if_current_indent_equal($1) do if @in_verbatim [:STRINGLINE, line] else @indent_stack.push("\s" << newIndent) [:ITEMLISTLINE, rest] end end when /^(\s*)(\(\d+\))(\s*)/ rest = $' # ' mark = $2 newIndent = $3 if_current_indent_equal($1) do if @in_verbatim [:STRINGLINE, line] else @indent_stack.push("\s" * mark.size << newIndent) [:ENUMLISTLINE, rest] end end when /^(\s*):(\s*)/ rest = $' # ' newIndent = $2 if_current_indent_equal($1) do if @in_verbatim [:STRINGLINE, line] else @indent_stack.push("\s" << $2) [:DESCLISTLINE, rest] end end when /^(\s*)---(?!-|\s*$)/ indent = $1 rest = $' /\s*/ === rest term = $' new_indent = $& if_current_indent_equal(indent) do if @in_verbatim [:STRINGLINE, line] else @indent_stack.push("\s\s\s" + new_indent) [:METHODLISTLINE, term] end end when /^(\s*)/ if_current_indent_equal($1) do [:STRINGLINE, line] end else raise "[BUG] parsing error may occured." end end =begin private --- RDParser#if_current_indent_equal(indent) if (({@current_indent == ((|indent|))})) then yield block, otherwise process indentation. =end # always @current_indent = @indent_stack.join("") def if_current_indent_equal(indent) indent = indent.sub(/\t/, "\s" * 8) if @current_indent == indent @i += 1 # next line yield elsif indent.index(@current_indent) == 0 @indent_stack.push(indent[@current_indent.size .. -1]) [:INDENT, ":INDENT"] else @indent_stack.pop [:DEDENT, ":DEDENT"] end end private :if_current_indent_equal def cut_off(src) ret = [] whiteline_buf = [] line = src.shift /^\s*/ =~ line indent = Regexp.quote($&) ret.push($') # ' while line = src.shift if /^(\s*)$/ =~ line whiteline_buf.push(line) elsif /^#{indent}/ =~ line unless whiteline_buf.empty? ret.concat(whiteline_buf) whiteline_buf.clear end ret.push($') # ' else raise "[BUG]: probably Parser Error while cutting off.\n" end end ret end private :cut_off def set_term_to_element(parent, term) # parent.set_term_under_document_struct(term, @tree.document_struct) parent.set_term_without_document_struct(term) end private :set_term_to_element def on_error( et, ev, _values ) line = @src[@i] prv, cur, nxt = format_line_num(@i, @i+1, @i+2) raise ParseError, <|#{@src[@i].chomp} #{nxt} |#{@src[@i+1].chomp} Msg end def line_index @i end def parse_subtree(src) @subparser = RD::RDParser.new() unless @subparser @subparser.parse(src, @tree) end private :parse_subtree def get_included(file) included = "" @tree.include_path.each do |dir| file_name = dir + "/" + file if test(?e, file_name) included = IO.readlines(file_name) break end end included end private :get_included def format_line_num(*args) width = args.collect{|i| i.to_s.length }.max args.collect{|i| sprintf("%#{width}d", i) } end private :format_line_num ---- header require "rd/rdinlineparser.tab.rb" require "rd/parser-util" module RD ---- footer end # end of module RD