#-- # =============================================================================== # Copyright (c) 2005,2006,2007 Christopher Kleckner # All rights reserved # # This file is part of the Rio library for ruby. # # Rio is free software; you can redistribute it and/or modify # it under the terms of the GNU General Public License as published by # the Free Software Foundation; either version 2 of the License, or # (at your option) any later version. # # Rio is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU General Public License for more details. # # You should have received a copy of the GNU General Public License # along with Rio; if not, write to the Free Software # Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA # =============================================================================== #++ # # To create the documentation for Rio run the command # ruby build_doc.rb # from the distribution directory. # # Suggested Reading # * RIO::Doc::SYNOPSIS # * RIO::Doc::INTRO # * RIO::Doc::HOWTO # * RIO::Doc::EXAMPLES # * RIO::Rio # module RIO module IF module GrandeStream # Calls #lines(*args) but when used with the subscript operator # returns the first element of the returned array instead of the array. # # If afile contains ["line 0\n","line 1\n"] # rio('afile').line[0] #=> "line 0\n" # rio('afile').line[1] #=> "line 1\n" # rio('afile').lines[0] #=> ["line 0\n"] # rio('afile').lines[1] #=> ["line 1\n"] # rio('afile').lines[0][0] #=> "line 0\n" # rio('afile').lines[1][0] #=> "line 1\n" def line(*args,&block) target.line(*args,&block); self end # See #line. def record(*args,&block) target.record(*args,&block); self end # See #line. def row(*args,&block) target.row(*args,&block); self end # Sets the rio to read lines and returns the Rio # # If called with a block behaves as if lines(*args).each(&block) had been called # # +lines+ returns the Rio which called it. This might seem counter-intuitive at first. # One might reasonably assume that # rio('adir').lines(0..10) # would return lines. It does not. It configures the rio to return lines and returns # the Rio. This enables chaining for further configuration so constructs like # rio('afile').lines(0..10).skiplines(/::/) # are possible. # # If args are provided they may be one or more of the following: # Regexp:: any matching record will be processed # Range:: specifies a range of records (zero-based) to be included # Integer:: interpreted as a one element range of lines to be processed # Proc:: a proc which will be called for each record, records are included unless nil or false is returned # Symbol:: a symbol which will _sent_ to each record, records are included unless nil or false is returned # Array:: an array of other selectors. records are selected unless any of the matches fail. # # rio('f.txt').lines(/^\s*#/) { |line| ... } # iterate over comment-only lines # rio('f.txt').lines(/^\s*#/).each { |line| ... } # same as above # # rio('f.txt').lines(1,7..9) > rio('anotherfile.txt') # copy lines 1,7,8 and 9 to anotherfile.txt # # rio('f.txt').lines(1...3).to_a # return an array containing lines 1 and 2 of f.txt # rio('f.txt').lines[1...3] # same thing # def lines(*args,&block) target.lines(*args,&block); self end # Sets the rio to read bytes and returns the rio # # _n_ specifies the number of bytes to be returned on each iteration of IF::Grande#each or by IF::GrandeStream#getrec. If _args_ # are provided, they are treated as record selectors as if ario.bytes(n).records(*args) had been # called. See also #records, #lines, IF::Grande#each, IF::Grande#[] # # If called with a block behaves as if ario.bytes(n,*args).each(&block) had been called # # rio('f.dat').bytes(1024) { |rec| ... } # iterate through f.txt 1024 bytes at a time # rio('f.dat').bytes(1024).each { |rec| ... } # same as above # # rio('f.dat').bytes(1024,0..4) { |rec| ... } # iterate through the first five 1024 byte blocks # # rio('f.dat').bytes(64).to_a # return the contents of f.dat as an array of 64 byte chunks # # rio('f.dat').bytes(512).records(0,7..9) > rio('dfile.dat') # copy 512-byte blocks 0,7,8 and 9 to dfile.dat # # rio('f.dat').bytes(2048).records[0...10] # return an array containing the first 10 2K blocks of f.dat # rio('f.dat').bytes(2048)[0...10] # same thing # # rio('f.dat').bytes { |bytestr| ... } # iterate over f.dat 1 byte at a time. # rio('f.dat').bytes[0...100] # returns an array of the first 100 bytes of f.dat # def bytes(n=1,*args,&block) target.bytes(n,*args,&block); self end # Specifies which records will be iterated through by IF::Grande#each or returned by IF::GrandeStream#getrec # # If called with a block behaves as if records(*args).each(&block) had been called # # Returns the Rio # # If no args are provided, all records are selected. # What constitutes a record is affected by #lines,#bytes, # and extensions such as IF::CSV#csv and IF::YAML#yaml. # # If args are provided they may be one or more of the following: # Regexp:: any matching record will be iterated over by IF::Grande#each or returned by IF::GrandeStream#getrec # Integer:: specifies a record-number (zero-based) to be iterated over by IF::Grande#each or returned by IF::GrandeStream#getrec # Range:: specifies a range of records (zero-based) to included in the iteration # Proc:: a proc which will be called for each record, records are included unless nil or false is returned # Symbol:: a symbol which will _sent_ to each record, records are included unless nil or false is returned # Array:: an array of any of above. All must match for a line to be included # # Any other argument type is compared with the record using its === method. # # If the argument is a ::Proc it may be called with one, two or three paramaters. # 1. the record # 2. the recno (optional) # 3. the rio (optional) # # Note in the following examples that since +lines+ is the default ario.records(*args) # is effectively the same as ario.lines(*args). # # rio('afile').records(0) { |line| ... } # iterate over the first line of 'afile' # rio('afile').records(0,5..7)) { |line| ... } # iterate over lines 0,5,6 and 7 # rio('afile').records(/Zippy/) { |line| ... } # iterate over all lines containing 'Zippy' # # # rio('f.csv').puts!(["h0,h1","f0,f1"]) # Create f.csv # # rio('f.csv').csv.records[] #==>[["h0", "h1"], ["f0", "f1"]] # rio('f.csv').csv.lines[] #==>["h0,h1\n", "f0,f1\n"] # rio('f.csv').csv.records[0] #==>[["h0", "h1"]] # def records(*args,&block) target.records(*args,&block); self end # Specifies records which should *not* be iterated through by IF::Grande#each or returned by IF::GrandeStream#getrec # # If called with a block behaves as if skiprecords(*args).each(&block) # had been called # # Returns the Rio # # See also #records, #skiplines, #lines, IF::Grande#skip # # If no args are provided, no records are rejected. What constitutes a record is affected by #lines,#bytes, # and extensions such as IF::CSV#csv and IF::YAML#yaml. # # If args are provided they may be one or more of the following: # Regexp:: any matching record will not be processed # Integer:: specifies a record-number (zero-based) to be skipped # Range:: specifies a range of records (zero-based) to be excluded # Proc:: a proc which will be called for each record, records are excluded unless nil or false is returned # Symbol:: a symbol which will _sent_ to each record, records are excluded unless nil or false is returned # Array:: an array of any of the above, all of which must match for the array to match. # # Note in the following examples that since +lines+ is the default record # type ario.skiprecords(*args) is effectively # the same as ario.skiplines(*args). # # rio('afile').skiprecords(0) { |line| ... } # iterate over all but the first line of 'afile' # rio('afile').skiprecords(0,5..7)) { |line| ... } # don't iterate over lines 0,5,6 and 7 # rio('afile').skiprecords(/Zippy/) { |line| ... } # skip all lines containing 'Zippy' # rio('afile').chomp.skiplines(:empty?) { |line| ... } # skip empty lines # def skiprecords(*args,&block) target.skiprecords(*args,&block); self end # Sets the Rio to read lines and specifies lines which should *not* be iterated through by IF::Grande#each or # returned by IF::GrandeStream#getrec # # If called with a block behaves as if skiplines(*args).each(&block) had been called # # Returns the Rio # # See also #lines, #records, IF::Grande#skip # # If no args are provided, no lines are rejected. # # If args are provided they may be one or more of the following: # Regexp:: any matching line will not be processed # Integer:: specifies a line-number (zero-based) to be skipped # Range:: specifies a range of lines (zero-based) to be excluded # Proc:: a proc which will be called for each line, lines are excluded unless nil or false is returned # Symbol:: a symbol which will _sent_ to each line, lines are excluded unless nil or false is returned # Array:: an array of any of above. All must match for a line to be included # # rio('afile').skiplines(0) { |line| ... } # iterate over all but the first line of 'afile' # rio('afile').skiplines(0,5..7)) { |line| ... } # don't iterate over lines 0,5,6 and 7 # rio('afile').skiplines(/Zippy/) { |line| ... } # skip all lines containing 'Zippy' # rio('afile').chomp.skiplines(:empty?) { |line| ... } # skip empty lines # def skiplines(*args,&block) target.skiplines(*args,&block); self end # Sets the Rio to read rows and specifies rows which should be iterated through # by IF::Grande#each or returned by IF::GrandeStream#getrec. # #rows is intended for use by extensions, where the concept of a row is reasonable. # In the absensence of an extension behaves like #records. def rows(*args,&block) target.rows(*args,&block); self end # Sets the Rio to read rows and specifies lines which should *not* be iterated # through by IF::Grande#each or returned by IF::GrandeStream#getrec # #skiprows is intended for use by extensions, where the concept of a row is # reasonable. In the absence of an extension behaves like #skiprecords def skiprows(*args,&block) target.skiprows(*args,&block); self end # Temporarily set the Rio to read records, and call IF::Grande#get # # See also IF::GrandeStream#records, IF::GrandeStream#lines, IF::Grande#each, IF::Grande#[] # def getrec() target.getrec() end # Temporarily set the Rio to read rows, and call IF::Grande#get # # See also IF::GrandeStream#rows, IF::GrandeStream#lines, IF::Grande#each, IF::Grande#[] # def getrow() target.getrow() end # Temporarily set the Rio to read lines, and call IF::Grande#get # # See also IF::GrandeStream#records, IF::GrandeStream#lines, IF::Grande#each, IF::Grande#[] # def getline() target.getline() end # Slurps the contents of the rio into a string. # # astring = rio('afile.txt').contents # slurp the entire contents of afile.txt into astring # def contents() target.contents() end # Writes a single record to a Rio def putrec(el) target.putrec(el) end # Sets the implicit output mode to 'a'. # # This is the mode Rio will use for output when no mode is specified # # Rios normally don't need to be opened or have their open mode specified. A Rio determines the mode # based on the file system object and on the action specified. For instance when a Rio encounters # a +read+ on a file it opens the file for reading using File#open and calls IO#read; when it encounters # a +read+ on a directory it knows to use Dir#open and call Dir#read. When it encounters a IF::RubyIO#puts, it knows # to perform a File#open, and call IO#puts on the returned handle. By default when a method requires # a file be opened for writing the file is opened with a mode of 'w'. #a changes this implicit # output mode to 'a'. # # Note that this is not the same as setting the output mode *explicitly*, as in rio('afile').mode('a'). # When the mode is set explicitly using IF::RubyIO#mode, the mode specified will be used regardless of # the operation being performed. The #a method only affects how Rio opens a file when # it sees an operator that requires writing, and must determine for itself how to open it. # # rio('afile').puts!('Hello World') # call IO#puts on a file handle opened in 'w' mode # rio('afile').a.puts!('Hello World') # call IO#puts on a file handle opened in 'a' mode # # See also #a!, #w! for setting the implicit output mode 'a+' and 'w+' respectively # # The methods #a, #a!, #w, #w!, #r, #r! set the +implicit+ open mode # to 'a','a+','w','w+','r' and 'r+' respectively. # # See also #+@ def a() target.a(); self end # Unary Plus. Alternate form of #a # rio('f1') > rio('f2') # copy f1 to f2 # rio('f1') > rio('f2').a # append f1 to f2 # rio('f1') > +rio('f2') # same thing # rio('f1') >> rio('f2') # same thing # def +@() RIO::no_warn { +target } self end # Sets the implicit output mode to 'a+'. # # The implicit output mode is the mode Rio will use for output when no mode is specified. # # Returns the Rio # # See the discussion for #a. # def a!() target.a!(); self end # Sets the implicit input mode to 'r'. # # The implicit input mode is the mode Rio will use for input when no mode is specified. # # Returns the Rio # # See the discussion for #a. # # Since 'r' is the implicit input mode used by default, this method # is probably uneeded. # def r() target.r(); self end # Sets the implicit input mode to 'r+'. # # The implicit input mode is the mode Rio will use for input when no mode is specified. # # Returns the Rio # # See the discussion for #a. # def r!() target.r!(); self end # Sets the implicit output mode to 'w'. # # The implicit output mode is the mode Rio will use for output when no mode is specified. # # Returns the Rio # # See the discussion for #a. # # Since 'w' is the implicit output mode used by default, this method # is uneeded, but is provided for completeness.. # def w() target.w(); self end # Sets the implicit output mode to 'w+'. # # The implicit output mode is the mode Rio will use for output when no mode is specified. # # Returns the Rio # # rio(?-,'cat').w!.puts!("Hello Kitty").readline #=> "Hello Kitty" # # See the discussion for #a. # def w!() target.w!(); self end # Set the Rio's closeoneof mode. # # ario.closeoneof(&block) => ario # # +closeoneof+ causes a Rio to be closed automatically whenever the end of # file is reached. This affects# all methods that read from # a rio (IF::RubyIO#readlines, #to_a, IF::Grande#each IF::RubyIO#gets etc.) # Because +closeoneof+ must be on for many of Rio's most useful idioms, # it is on by default. +closeoneof+ can be turned off using #nocloseoneof. # # If a block is given behaves like ario.closeoneof.each(&block) had been called # # Returns the Rio # # ario = rio('afile') # lines = ario.readlines # ario.closed? #=> true # # ario = rio('afile').nocloseoneof # lines = ario.readlines # ario.closed? #=> false # ario.close # must be explicitly closed # # +closeoneof+ is ignored by directory Rios, however, setting it on a directory Rio # causes each file Rio returned while iterating to inherit the directory's setting # # rio('adir').files do |file| # file.closeoneof? #=> true # end # # rio('adir').files.nocloseoneof do |file| # file.closeoneof? #=> false # end # # rio('adir').files.nocloseoneof['*.rb'] # array of .rb file Rios in adir with closeoneof off # # drio = rio('adir').files # frio1 = drio.read # frio1.closeoneof? #=> true # drio.nocloseoneof # frio2 = drio.read # frio2.closeoneof? #=> false # # def closeoneof(arg=true,&block) target.closeoneof(arg,&block); self end # Set the Rio's closeoneof mode to false # ario.nocloseoneof(&block) => ario # See #closeoneof # # If a block is given behaves like # ario.nocloseoneof.each(&block) # # Returns the Rio # # ario = rio('afile') # lines = ario.to_a # ario.closed? #=> true # # ario = rio('afile').nocloseoneof # lines = ario.to_a # ario.closed? #=> false # ario.close # must be explicitly closed def nocloseoneof(arg=false,&block) target.nocloseoneof(arg,&block); self end # Query a Rio's closeoneof mode # ario.closeoneof? => true or false # # See #closeoneof and #nocloseoneof # # ario = rio('afile') # ario.closeoneof? #=> true # lines = ario.to_a # ario.closed? #=> true # # ario = rio('afile').nocloseoneof # ario.closeoneof? #=> false # lines = ario.to_a # ario.closed? #=> false # ario.close # must be explicitly closed def closeoneof?() target.closeoneof?() end # Set a Rio's closeoncopy mode # # ario.closeoncopy(&block) => ario # # #closeoncopy causes the Rio being written to to be closed when using # a grande copy operator. While #closeoneof causes all Rio's to be closed # when reading to the end of file, it does not affect Rios being written to. # #closeoncopy only affects the Rio being written to and only when a # grande copy operator is used. +closeoncopy+ is on by default, with one exception. # # dest = rio('destfile') # dest < rio('srcfile') # dest.closed? #=> true # # dest = rio('destfile').nocloseoncopy # dest < rio('srcfile') # dest.closed? #=> false # dest.close # must be explicitly closed # # dest = rio('destfile') # dest.print(rio('srcfile').contents) # dest.closed? #=> false (IF::RubyIO#print is not a copy operator) # dest.close # # # ==== The Exception # # When a block is passed directly to the rio constructor +closeoncopy+ is turned off. # # rio('afile') { |file| # file.closeoncopy? #=> false # file < a_string # file.closed? #=> false # } # # The file is now closed. See IF::GrandeStream#rio for more informatioin # # ==== Why? # # Some of my favorite Rio idioms are its copy one-liners # # rio('afile') < a_string # put a string into a file # rio('afile') < an_array # put an array into a file # rio('afile') < rio('anotherfile').lines(0..9) # copy the first 10 lines of anotherfile into afile # rio('afile.gz').gzip < rio('anotherfile').lines(0..9) # same thing into a gzipped file # # In each of these cases, 'afile' would remain open after the copy and furthermore # since the destination Rio was not saved in a variable, There is no way to close file. # Without closeoncopy Something like this would be required: # # ario = rio('afile') # ario < something_else # ario.close # # Or this... # # ario = rio('afile') < something_else # ario.close # # Or this... # # (rio('afile') < something_else).close # One line, but ugly, and prone to error. # # What I want is this: # # rio('afile') < something_else # # Simple. I want to copy this to that, I point the arrow and it works. # # In perl the rio's destructor would be called, because there are no remaining references to the Rio # However, it my understanding and experience that in Ruby the finalizer will not necessarily be # called at this point. # def closeoncopy(arg=true,&block) target.closeoncopy(arg,&block); self end # Set a Rio's closeoncopy mode to false # # ario.nocloseoncopy(&block) => ario # # See #closeoncopy # def nocloseoncopy(arg=false,&block) target.nocloseoncopy(arg,&block); self end # Query a Rio's closeoncopy mode # # ario.closeoncopy? => true or false # # See #closeoncopy # def closeoncopy?() target.closeoncopy?() end # Turns off both closeoneof and closeoncopy. # Equivelent to: # ario.nocloseoneof.nocloseoncopy # Returns the Rio # ario.noautoclose(&block) => ario # If a block is given, acts as if # ario.noautoclose.each(&block) # had been called. # # See #nocloseoneof and #nocloseoncopy # def noautoclose(arg=false,&block) target.noautoclose(arg,&block); self end # Queries the Rio's chomp-mode. # See #chomp. # def chomp?() target.chomp?() end # Sets the Rio to chomp lines and returns the Rio # # When called with a block, behaves as if chomp.each(&block) had been called # # chomp causes lines returned by each, to_a, readlines, readline, gets, each_line etc. # to be chomped before iterated over or assigned # # rio('f.txt').chomp.each { |line| ... } # Block is called with lines already chomped # # rio('f.txt').chomp { |line| ... } # same as above # # rio('f.txt').chomp.to_a # returns the lines of f.txt chomped # # rio('f.txt').chomp.lines(1..2).to_a # returns an array containg lines 1 and 2 of the file after being chomped # # This would have similar results to rio('f.txt').lines(1..2).to_a.map{ |line| line.chomp} # # rio('f.txt').lines(1..2).chomp.to_a # same as above # # rio('f.txt').chomp.readlines # returns the lines of f.txt chomped # # rio('f.txt').chomp.gets # returns the first line of 'f.txt' chomped # # rio('f.txt').chomp > an_array # copies the chomped lines of f.txt into an_array # # # fill an array with all the 'require' lines in all the .rb files (recursively) in adir # # chomping each line # # an_array = [] # rio('adir').chomp.all.files("*.rb") { |file| # an_array += file.lines[/^\s*require/] # } # # or simply # # an_array = rio('adir').chomp.all.files("*.rb").lines[/^\s*require/] # def chomp(arg=true,&block) target.chomp(arg,&block); self end # Queries the Rio's strip-mode. # See #strip. # def strip?() target.strip?() end # Sets the Rio to strip lines and returns the Rio # # When called with a block, behaves as if strip.each(&block) had been called # # +strip+ causes lines returned by each, to_a, readlines, readline, gets, each_line etc. # to be stripped with String#strip before iterated over or assigned # # ans = rio(?-).print("A Prompt> ").strip.gets # prompt the user # # See also #chomp def strip(arg=true,&block) target.strip(arg,&block); self end # Sets the Rio to gzip mode. # ario.gzip #=> ario # If applied to a Rio that is being read from Reads # through a Zlib::GzipReader; If applied to a Rio that is being written to # writes through a Zlib::GzipWriter. # # Returns the Rio # # If a block is given, acts like ario.gzip.each(&block) # # rio('afile') > rio('afile.gz').gzip # gzip a file # rio('afile.gz').gzip < rio('afile') # same thing # # rio('afile.gz').gzip > rio('afile') # ungzip a file # rio('afile') < rio('afile.gz').gzip # same thing # # rio('afile.gz').gzip.chomp { |line| ...} # process each chomped line of a gzipped file # rio('afile.gz').gzip[0..9] # an array containing the first 10 lines of a gzipped file # def gzip(&block) target.gzip(true,&block); self end # Queries the Rio's gzip-mode # ario.gzip? #=> true or false # See #gzip # def gzip?() target.gzip?() end # #inputmode? # # #def inputmode?() target.inputmode?() end # This causes String#split(arg) to be called on every line # before it is returned. An array of the split lines is # returned when iterating # # rio('/etc/passwd').split(':').columns(0,2) { |ary| # username,uid = ary # } # # rio('/etc/passwd').split(':').columns(0,2).to_a #=> [[user1,uid1],[user2,uid2]] # # See also IF::Grande#split # def splitlines(*args,&block) target.splitlines(*args,&block) end # #outputmode? # # #def outputmode?() target.outputmode?() end end end end module RIO class Rio include RIO::IF::GrandeStream end end