module Eco module API class Session class Batch < Common::Session::BaseSession DEFAULT_BATCH_BLOCK = 50 VALID_METHODS = [:get, :create, :update, :upsert, :delete] class << self # @return [Boolean] `true` if the method is supported, `false` otherwise. def valid_method?(value) VALID_METHODS.include?(value) end end # Gets the _people_ of the organization according `params`. # If `people` is not `nil`, scopes to only the people specified. # @note # - If `people` is given keys `page:` and `q` of `params:`. # @param people [Nil, People, Enumerable, Enumerable] target _People_ to launch the batch against. # @param params [Hash] api request options. # @option params [String] :page the page number `page` based on `:per_page`. # @option params [String] :per_page the number of people included per each batch api request. # @option params [String] :q some text to search. Omit this parameter to target all the people. # @return [Array] all the people based on `params` def get_people(people = nil, params: {}, silent: false) return launch(people, method: :get, params: params, silent: silent).people if people.is_a?(Enumerable) return get(params: params, silent: silent) end # launches a batch of `method` type using `people` and the specified `params` # @raise Exception # - if `people` is `nil` or is not an `Enumerable`. # - if there's no `api` connection linked to the current `Batch`. # @param people [People, Enumerable, Enumerable] target _People_ to launch the batch against. # @param method [Symbol] the method to launch the batch api request with. # @param params [Hash] api request options. # @option params [String] :per_page the number of people included per each batch api request. # @return [Batch::Status] the `status` of this batch launch. def launch(people, method:, params: {} , silent: false) batch_from(people, method: method, params: params, silent: silent) end def search(data, silent: false, params: {}) params = {per_page: DEFAULT_BATCH_BLOCK}.merge(params) launch(data, method: :get, params: params, silent: silent).tap do |status| status.mode = :search entries = status.queue puts "\n" entries.each_with_index do |entry, i| if (i % 10 == 0) percent = i * 100 / entries.length print "Searching: #{percent.round}% (#{i}/#{entries.length} entries)\r" $stdout.flush end unless status.success?(entry) email = nil case when entry.respond_to?(:email) email = entry.email when entry.respond_to?(:to_h) email = entry.to_h["email"] end people_matching = [] email = email.to_s.strip.downcase unless email.empty? people_matching = get(params: params.merge(q: email), silent: silent).select do |person| person.email == email end end case people_matching.length when 1 status.set_person_match(entry, people_matching.first) when 2..Float::INFINITY status.set_people_match(entry, people_matching) end end end end end private def get(params: {}, silent: false) fatal "cannot batch get without api connnection, please provide a valid api connection!" unless people_api = api&.people params = {per_page: DEFAULT_BATCH_BLOCK}.merge(params) return people_api.get_all(params: params, silent: silent) end def batch_from(data, method:, params: {}, silent: false) fatal "Invalid batch method: #{method}." if !self.class.valid_method?(method) return nil if !data || !data.is_a?(Enumerable) fatal "cannot batch #{method} without api connnection, please provide a valid api connection!" unless people_api = api&.people # param q does not make sense here, even for GET method params = {per_page: DEFAULT_BATCH_BLOCK}.merge(params) per_page = params[:per_page] || DEFAULT_BATCH_BLOCK launch_batch(data, method: method, per_page: per_page, people_api: people_api, silent: silent ) end def launch_batch(data, method:, status: nil, job_mode: true, per_page: DEFAULT_BATCH_BLOCK, people_api: api&.people, silent: false) iteration = 1; done = 0 iterations = (data.length.to_f / per_page).ceil status ||= Eco::API::Session::Batch::Status.new(enviro, queue: data, method: method) status.tap do |status| start_time = Time.now start_slice = Time.now; slice = [] pending_for_server_error = data.to_a[0..-1] data.each_slice(per_page) do |slice| msg = "starting batch '#{method}' iteration #{iteration}/#{iterations}," msg += " with #{slice.length} entries of #{data.length} -- #{done} done" msg += " (last: #{str_stats(start_slice, slice.length)}; total: #{str_stats(start_time, done)})" logger.info(msg) unless silent start_slice = Time.now offer_retry_on(Ecoportal::API::Errors::TimeOut) do people_api.batch(job_mode: false) do |batch| slice.each do |person| batch.public_send(method, person) do |response| faltal("Request with no response") unless !!response unless server_error?(response) pending_for_server_error.delete(person) status[person] = response end end end end # end batch end iteration += 1 done += slice.length end # next slice # temporary working around (due to back-end problems with batch/jobs) unless pending_for_server_error.empty? msg = "Going to re-try #{pending_for_server_error.count} due to server errors" logger.info(msg) unless silent launch_batch(pending_for_server_error, status: status, method: method, job_mode: false, per_page: per_page, people_api: people_api, silent: silent ) end end end def server_error?(response) res_status = response.status server_error = !res_status || res_status.server_error? other_error = !server_error && (!res_status.code || res_status.code < 100) no_body = !server_error && !other_error && !response.body server_error || other_error || no_body end def offer_retry_on(error_type, retries_left = 3, &block) begin block.call rescue error_type => e raise unless retries_left > 0 explanation = "Batch TimeOut. You have #{retries_left} retries left." prompt_user(" Do you want to retry (y/N)?", default: "Y", explanation: explanation, timeout: 10) do |response| if response.upcase.start_with?("Y") puts "\nOkay... let's retry!" offer_retry_on(error_type, retries_left - 1, &block) else raise end end end end def str_stats(start, count) now = Time.now secs = (now - start).round(3) if secs > 0.0 per_sec = (count.to_f / secs).round(2) "#{secs}s -> #{per_sec} people/s" else " -- " end end end end end end require_relative 'batch/job' require_relative 'batch/feedback' require_relative 'batch/request_stats' require_relative 'batch/base_policy' require_relative 'batch/policies' require_relative 'batch/status' require_relative 'batch/errors' require_relative 'batch/jobs' require_relative 'batch/jobs_groups'