Sha256: 70513f21a61a26a199fed0f0d06d3c51963b8f8ee84d3d6778d77b6ae05df355

Contents?: true

Size: 1.62 KB

Versions: 10

Compression:

Stored size: 1.62 KB

Contents

# Configures the Elastic MapReduce cluster that is launched to run parse and
# combine jobs. The list of EC2 instance types can be found at
# http://aws.amazon.com/ec2/instance-types/#instance-details

# Using spot instances is recommended to reduce costs. However if the spot
# price rises above your bid price the cluster may be terminated. Elasticrawl
# tries to reduce the effect of this by parsing each Commmon Crawl segment
# in a separate job flow step.

# The master node manages the cluster.
master_instance_group:
  instance_type: m1.medium
  use_spot_instances: true
  bid_price: 0.120

# Core nodes run map and reduce tasks and store data using HDFS.
core_instance_group:
  instance_type: m1.medium
  instance_count: 2
  use_spot_instances: true
  bid_price: 0.120

# Task nodes are optional and only run map and reduce tasks.
task_instance_group:
  instance_type: m1.small
  instance_count: 0
  use_spot_instances: true
  bid_price: 0.080

# Array of bootstrap scripts that will be applied when the cluster nodes are
# initialized. The example installs the Ganglia distributed monitoring system.
bootstrap_scripts: #['s3://elasticmapreduce/bootstrap-actions/install-ganglia']

# Specifying an EC2 key pair allows SSH access to the master node. This also
# allows accessing the Hadoop Web UI over an SSH tunnel.
ec2_key_name: 'elasticrawl'

# Availability Zone (AZ) to launch instances in. An AZ in the US-East region is
# recommended since the Common Crawl corpus is stored there. Otherwise inter
# region data transfer charges will apply.
placement: 'us-east-1c'

# The AMI version to use when launching instances.
emr_ami_version: 'latest'

Version data entries

10 entries across 10 versions & 1 rubygems

Version Path
elasticrawl-1.1.8 spec/fixtures/cluster.yml
elasticrawl-1.1.7 spec/fixtures/cluster.yml
elasticrawl-1.1.6 spec/fixtures/cluster.yml
elasticrawl-1.1.5 spec/fixtures/cluster.yml
elasticrawl-1.1.4 spec/fixtures/cluster.yml
elasticrawl-1.1.3 spec/fixtures/cluster.yml
elasticrawl-1.1.2 spec/fixtures/cluster.yml
elasticrawl-1.1.1 spec/fixtures/cluster.yml
elasticrawl-1.1.0 spec/fixtures/cluster.yml
elasticrawl-1.0.0 spec/fixtures/cluster.yml