module SitemapGenerator module Builder class SitemapIndexFile < SitemapFile # === Options # # * location - a SitemapGenerator::SitemapIndexLocation instance or a Hash of options # from which a SitemapLocation will be created for you. def initialize(opts={}) @location = opts.is_a?(Hash) ? SitemapGenerator::SitemapIndexLocation.new(opts) : opts @link_count = 0 @sitemaps_link_count = 0 @xml_content = '' # XML urlset content @xml_wrapper_start = <<-HTML HTML @xml_wrapper_start.gsub!(/\s+/, ' ').gsub!(/ *> */, '>').strip! @xml_wrapper_end = %q[] @filesize = SitemapGenerator::Utilities.bytesize(@xml_wrapper_start) + SitemapGenerator::Utilities.bytesize(@xml_wrapper_end) @written = false @reserved_name = nil # holds the name reserved from the namer @frozen = false # rather than actually freeze, use this boolean @first_sitemap = nil # reference to the first thing added to this index # Store the URL of the first sitemap added because if create_index is # false this is the "index" URL @first_sitemap_url = nil end # Finalize sitemaps as they are added to the index. # If it's the first sitemap, finalize it but don't # write it out, because we don't yet know if we need an index. If it's # the second sitemap, we know we need an index, so reserve a name for the # index, and go and write out the first sitemap. If it's the third or # greater sitemap, just finalize and write it out as usual, nothing more # needs to be done. # # If a link is being added to the index manually as a string, then we # can assume that the index is required (unless create_index is false of course). # This seems like the logical thing to do. alias_method :super_add, :add def add(link, options={}) if file = link.is_a?(SitemapFile) && link @sitemaps_link_count += file.link_count file.finalize! unless file.finalized? # First link. If it's a SitemapFile store a reference to it and the options # so that we can create a URL from it later. We can't create the URL yet # because doing so fixes the sitemap file's name, and we have to wait to see # if we have more than one link in the index before we can know who gets the # first name (the index, or the sitemap). If the item is not a SitemapFile, # then it has been manually added and we can be sure that the user intends # for there to be an index. if @link_count == 0 @first_sitemap = SitemapGenerator::Builder::LinkHolder.new(file, options) @link_count += 1 # pretend it's added, but don't add it yet else # need an index so make sure name is reserved and first sitemap is written out reserve_name unless @location.create_index == false write_first_sitemap file.write super(SitemapGenerator::Builder::SitemapIndexUrl.new(file, options)) end else # A link is being added manually. Obviously the user wants an index. # This overrides the create_index setting. unless @location.create_index == false @create_index = true reserve_name end # Use the host from the location if none provided options[:host] ||= @location.host super(SitemapGenerator::Builder::SitemapIndexUrl.new(link, options)) end end # Return a boolean indicating whether the sitemap file can fit another link # of bytes bytes in size. You can also pass a string and the # bytesize will be calculated for you. def file_can_fit?(bytes) bytes = bytes.is_a?(String) ? SitemapGenerator::Utilities.bytesize(bytes) : bytes (@filesize + bytes) < SitemapGenerator::MAX_SITEMAP_FILESIZE && @link_count < SitemapGenerator::MAX_SITEMAP_FILES end # Return the total number of links in all sitemaps reference by this index file def total_link_count @sitemaps_link_count end def stats_summary(opts={}) str = "Sitemap stats: #{number_with_delimiter(@sitemaps_link_count)} links / #{@link_count} sitemaps" str += " / %dm%02ds" % opts[:time_taken].divmod(60) if opts[:time_taken] end def finalize! raise SitemapGenerator::SitemapFinalizedError if finalized? reserve_name if create_index? write_first_sitemap @frozen = true end # Write out the index if an index is needed def write super if create_index? end # Whether or not we need to create an index file. True if create_index is true # or if create_index is :auto and we have more than one link in the index. # If a link is added manually and create_index is not false, we force index # creation because they obviously intend for there to be an index. False otherwise. def create_index? @create_index || @location.create_index == true || @location.create_index == :auto && @link_count > 1 end # Return the index file URL. If create_index is true, this is the URL # of the actual index file. If create_index is false, this is the URL # of the first sitemap that was written out. Only call this method # *after* the files have been finalized. def index_url if create_index? || !@first_sitemap_url @location.url else @first_sitemap_url end end protected # Make sure the first sitemap has been written out and added to the index def write_first_sitemap if @first_sitemap @first_sitemap.link.write unless @first_sitemap.link.written? super_add(SitemapGenerator::Builder::SitemapIndexUrl.new(@first_sitemap.link, @first_sitemap.options)) @link_count -= 1 # we already counted it, don't count it twice # Store the URL because if create_index is false, this is the # "index" URL @first_sitemap_url = @first_sitemap.link.location.url @first_sitemap = nil end end end end end