require 'imw/utils/has_uri'
module IMW
# A resource can be anything addressable via a URI. Examples
# include local files, remote files, webpages, &c.
#
# The IMW::Resource class takes a URI as input and then dynamically
# extends itself with appropriate modules from IMW. As an example,
# calling
#
# my_archive = IMW::Resource.new('/path/to/my/archive.tar.bz2')
#
# would return an IMW::Resource extended by
# IMW::Archives::Tarbz2 (among other modules) which
# therefore has methods for extracting, listing, and appending to
# the archive.
#
# Modules are so extended based on handlers defined in the
# imw/resources directory and accessible via
# IMW::Resource.handlers. You can define your own handlers by
# defining the constant IMW::Resource::USER_DEFINED_HANDLERS in your
# configuration file.
#
# The modules extending a particular IMW::Resource instance can be
# listed as follows
#
# my_archive.modules #=> [IMW::Local::Base, IMW::Local::File, IMW::Local::Compressible, IMW::Archives::Tarbz2]
#
# By default, resources are opened for reading. Passing in the
# appropriate :mode option changes this:
#
# IMW::Resource.new('/path/to/my_new_file', :mode => 'w')
#
# If the :skip_modules option is passed in then the
# resource will not extend itself with any modules and will
# essentially only retain the bare functionality of a URI. This can
# be useful when subclassing IMW::Resource or dealing with a very
# strange kind of resource.
#
# Read the documentation for modules in IMW::Resources to learn more
# about the various behaviors an IMW::Resource can acquire.
#
# You can also instantiate an IMW::Resource using IMW.open, which
# accepts all the same arguments as IMW::Resource.new.
class Resource
# The mode in which to access this resource.
attr_accessor :mode
# A copy of the options passed to this resource on initialization.
attr_accessor :resource_options
# Create a new resource representing +uri+.
#
# IMW will automatically extend the resulting IMW::Resource
# instance with modules appropriate for the given URI:
#
# r = IMW::Resource.new("http://www.infochimps.com")
# r.modules
# => [IMW::Schemes::Remote::Base, IMW::Schemes::Remote::RemoteFile, IMW::Schemes::HTTP, IMW::Formats::Html]
#
# You can prevent this altogether by passing in
# :no_modules:
#
# r = IMW::Resource.new("http://www.infochimps.com", :no_modules => true)
# r.modules
# => []
#
# And you can exert more fine-grained control with the
# :use_modules and :skip_modules options, see
# IMW::Resource.extend_instance! for details.
#
# @param [String, Addressable::URI] uri
# @param [Hash] options
# @option options [true, false] no_modules
# @option options [String] mode the mode to open the resource in (will be ignored when inapplicable)
# @option options [IMW::Metadata::Record, Array] schema the schema of this resource
# @return [IMW::Resource]
def initialize uri, options={}
self.uri = uri
self.resource_options = options
self.mode = options[:mode] || 'r'
self.schema = options[:schema] if options[:schema]
extend_appropriately!(options)
end
# Provides resources with a wrapped Addressable::URI object.
include IMW::Utils::HasURI
# Provides resources with a schema.
include IMW::Metadata::Schematized
# Gives IMW::Resource instances with the ability to dynamically
# extend themselves with modules chosen from a set of handlers
# stored by the IMW::Resource class.
include IMW::Utils::DynamicallyExtendable
[IMW::Schemes::HANDLERS, IMW::CompressedFiles::HANDLERS, IMW::Archives::HANDLERS, IMW::Formats::HANDLERS].each do |handlers|
register_handlers *handlers
end
# Raise an error unless this resource exists.
#
# @param [String] message an optional message to include
def should_exist!(message=nil)
raise IMW::Error.new([message, "No path defined for #{self.inspect} extended by #{modules.join(' ')}"].compact.join(', ')) unless respond_to?(:path)
raise IMW::Error.new([message, "No exist? method defined for #{self.inspect} extended by #{modules.join(' ')}"].compact.join(', ')) unless respond_to?(:exist?)
raise IMW::PathError.new([message, "#{path} does not exist"].compact.join(', ')) unless exist?
self
end
# Close this resource.
#
# Modules should hook into super() as they need to redefine this
# method.
def close
end
# Open a copy of this resource.
#
# This is useful when wanting to reset file handles. Though -- be
# warned -- it does not close any file handles itself...
#
# @return [IMW::Resource] the new (old) resource
def reopen
IMW.open(uri.to_s)
end
# If +method+ begins with the strings +is+, +on+, or +via+ and
# ends with a question mark then we interpret it as a question
# this resource doesn't know how to answer -- so we have it answer
# +false+.
#
# As an example, consider the following loop:
#
# IMW.open('/tmp').all_contents.each do |obj|
# if obj.is_archive?
# # ... do something
# end
# end
#
# When +obj+ is initialized and it _isn't_ an archive, then it
# doesn't know about the is_archive? method -- but it
# should therefore answer false anyway.
#
# This lets a basic text file answer questions about whether it's
# an archive (or on S3, or accessed via some user-defined scheme,
# &c.) without needing to know anything about archives (or S3 or
# the user-defined scheme).
def method_missing method, *args
if args.empty? && method.to_s =~ /(is|on|via)_.*\?$/
# querying for a boolean response so answer false
return false
else
raise IMW::NoMethodError, "undefined method `#{method}' for #{self}, extended by #{modules.join(', ')}"
end
end
end
end