Sha256: 6d476c55916f62fb30b807dab61c6cae3d2ff02b0cc9de8df636272337b650c4
Contents?: true
Size: 1.64 KB
Versions: 4
Compression:
Stored size: 1.64 KB
Contents
# frozen_string_literal: true require 'iecbib/hit' require "addressable/uri" module Iecbib # Page of hit collection. class HitCollection < Array DOMAIN = 'https://webstore.iec.ch' # @return [TrueClass, FalseClass] attr_reader :fetched # @return [String] attr_reader :text # @return [String] attr_reader :year # @param ref_nbr [String] # @param year [String] def initialize(ref_nbr, year = nil) #(text, hit_pages = nil) @text = ref_nbr @year = year from, to = nil if year from = Date.strptime year, '%Y' to = from.next_year.prev_day end url = "#{DOMAIN}/searchkey&RefNbr=#{ref_nbr}&From=#{from}&To=#{to}&start=1" doc = Nokogiri::HTML OpenURI.open_uri(::Addressable::URI.parse(url).normalize) hits = doc.css('ul.search-results > li').map do |h| link = h.at('a[@href!="#"]') code = link.text.tr [194, 160].pack('c*').force_encoding('UTF-8'), '' title = h.xpath('text()').text.gsub(/[\r\n]/, '') url = DOMAIN + link[:href] Hit.new({ code: code, title: title, url: url }, self) end concat hits # concat(hits.map { |h| Hit.new(h, self) }) @fetched = false # @hit_pages = hit_pages end # @return [Iecbib::HitCollection] def fetch workers = WorkersPool.new 4 workers.worker(&:fetch) each do |hit| workers << hit end workers.end workers.result @fetched = true self end def to_s inspect end def inspect "<#{self.class}:#{format('%#.14x', object_id << 1)} @fetched=#{@fetched}>" end end end
Version data entries
4 entries across 4 versions & 1 rubygems
Version | Path |
---|---|
iecbib-0.2.2 | lib/iecbib/hit_collection.rb |
iecbib-0.2.1 | lib/iecbib/hit_collection.rb |
iecbib-0.2.0 | lib/iecbib/hit_collection.rb |
iecbib-0.1.2 | lib/iecbib/hit_collection.rb |