Sha256: 763065aae04a70af4076720aa16a6a8ce58f6aa9ff91b4b2fb727f865b64dfab
Contents?: true
Size: 671 Bytes
Versions: 6
Compression:
Stored size: 671 Bytes
Contents
# Third-party libraries, loaded in the same order as before.
%w[
  aws-sdk
  active_record
  active_support
  elasticity
  highline/import
  thor
].each { |library| require library }

# Top-level namespace: defines the shared constants, then loads the
# library's own source files.
module Elasticrawl
  # S3 locations
  COMMON_CRAWL_BUCKET = 'aws-publicdatasets'
  COMMON_CRAWL_PATH = 'common-crawl/crawl-data'
  SEGMENTS_PATH = 'segments'
  WARC_PATHS = 'warc.paths.gz'

  # NOTE(review): presumably an upper bound on segments handled at once;
  # confirm against the code that reads it.
  MAX_SEGMENTS = 256

  # Internal files are required only after the constants above exist,
  # matching the original ordering (presumably so they can reference
  # them; confirm). Each entry expands to "elasticrawl/<name>".
  %w[
    version
    config
    error
    cluster
    crawl
    crawl_segment
    job
    combine_job
    parse_job
    job_step
  ].each { |component| require "elasticrawl/#{component}" }
end
Version data entries
6 entries across 6 versions & 1 rubygems