#!/usr/bin/env ruby require 'chronic' require 'chronic_duration' require 'sinatra/base' require 'erb' require 'rack/fiber_pool' require 'json' require 'flapjack/rack_logger' require 'flapjack/data/contact' require 'flapjack/data/entity_check' require 'flapjack/redis_pool' require 'flapjack/utility' module Flapjack module Gateways class Web < Sinatra::Base rescue_exception = Proc.new do |env, e| if settings.show_exceptions? # ensure the sinatra error page shows properly request = Sinatra::Request.new(env) printer = Sinatra::ShowExceptions.new(proc{ raise e }) s, h, b = printer.call(env) [s, h, b] else @logger.error e.message @logger.error e.backtrace.join("\n") [503, {}, ""] end end use Rack::FiberPool, :size => 25, :rescue_exception => rescue_exception use Rack::MethodOverride class << self def start @redis = Flapjack::RedisPool.new(:config => @redis_config, :size => 2) @logger.info "starting web - class" if accesslog = (@config && @config['access_log']) if not File.directory?(File.dirname(accesslog)) puts "Parent directory for log file #{accesslog} doesn't exist" puts "Exiting!" exit end access_logger = Flapjack::AsyncLogger.new(@config['access_log']) use Flapjack::CommonLogger, access_logger end end end include Flapjack::Utility set :views, settings.root + '/web/views' set :public_folder, settings.root + '/web/public' helpers do def h(text) ERB::Util.h(text) end def u(text) ERB::Util.u(text) end end def redis self.class.instance_variable_get('@redis') end def logger self.class.instance_variable_get('@logger') end get '/' do check_stats entity_stats erb 'index.html'.to_sym end get '/checks_all' do check_stats @adjective = 'all' checks_by_entity = Flapjack::Data::EntityCheck.find_all_by_entity(:redis => redis) @states = checks_by_entity.keys.inject({}) {|result, entity| result[entity] = checks_by_entity[entity].sort.map {|check| [check] + entity_check_state(entity, check) } result } @entities_sorted = checks_by_entity.keys.sort erb 'checks.html'.to_sym end get '/checks_failing' do check_stats @adjective = 'failing' checks_by_entity = Flapjack::Data::EntityCheck.find_all_failing_by_entity(:redis => redis) @states = checks_by_entity.keys.inject({}) {|result, entity| result[entity] = checks_by_entity[entity].sort.map {|check| [check] + entity_check_state(entity, check) } result } @entities_sorted = checks_by_entity.keys.sort erb 'checks.html'.to_sym end get '/self_stats' do self_stats entity_stats check_stats erb 'self_stats.html'.to_sym end get '/self_stats.json' do self_stats entity_stats check_stats { 'events_queued' => @events_queued, 'all_entities' => @count_all_entities, 'failing_entities' => @count_failing_entities, 'all_checks' => @count_all_checks, 'failing_checks' => @count_failing_checks, 'processed_events' => { 'all_time' => { 'total' => @event_counters['all'].to_i, 'ok' => @event_counters['ok'].to_i, 'failure' => @event_counters['failure'].to_i, 'action' => @event_counters['action'].to_i, } }, 'total_keys' => @dbsize, 'uptime' => @uptime_string, 'boottime' => @boot_time, 'current_time' => Time.now, 'executive_instances' => @executive_instances, }.to_json end get '/entities_all' do entity_stats @adjective = 'all' @entities = Flapjack::Data::Entity.find_all_with_checks(:redis => redis) erb 'entities.html'.to_sym end get '/entities_failing' do entity_stats @adjective = 'failing' @entities = Flapjack::Data::Entity.find_all_with_failing_checks(:redis => redis) erb 'entities.html'.to_sym end get '/entity/:entity' do @entity = params[:entity] entity_stats @states = Flapjack::Data::EntityCheck.find_all_for_entity_name(@entity, :redis => redis).sort.map { |check| [check] + entity_check_state(@entity, check) }.sort_by {|parts| parts } erb 'entity.html'.to_sym end get '/check' do @entity = params[:entity] @check = params[:check] entity_check = get_entity_check(@entity, @check) return 404 if entity_check.nil? check_stats last_change = entity_check.last_change @check_state = entity_check.state @check_enabled = entity_check.enabled? @check_last_update = entity_check.last_update @check_last_change = last_change @check_summary = entity_check.summary @check_details = entity_check.details @last_notifications = last_notification_data(entity_check) @scheduled_maintenances = entity_check.maintenances(nil, nil, :scheduled => true) @acknowledgement_id = entity_check.failed? ? entity_check.event_count_at(entity_check.last_change) : nil @current_scheduled_maintenance = entity_check.current_maintenance(:scheduled => true) @current_unscheduled_maintenance = entity_check.current_maintenance(:scheduled => false) @contacts = entity_check.contacts @state_changes = entity_check.historical_states(nil, Time.now.to_i, :order => 'desc', :limit => 20) erb 'check.html'.to_sym end post '/acknowledgements/:entity/:check' do @entity = params[:entity] @check = params[:check] @summary = params[:summary] @acknowledgement_id = params[:acknowledgement_id] dur = ChronicDuration.parse(params[:duration] || '') @duration = (dur.nil? || (dur <= 0)) ? (4 * 60 * 60) : dur return 404 if get_entity_check(@entity, @check).nil? ack = Flapjack::Data::Event.create_acknowledgement( @entity, @check, :summary => (@summary || ''), :acknowledgement_id => @acknowledgement_id, :duration => @duration, :redis => redis) redirect back end # FIXME: there is bound to be a more idiomatic / restful way of doing this # (probably using 'delete' or 'patch') post '/end_unscheduled_maintenance/:entity/:check' do @entity = params[:entity] @check = params[:check] entity_check = get_entity_check(@entity, @check) return 404 if entity_check.nil? entity_check.end_unscheduled_maintenance(Time.now.to_i) redirect back end # create scheduled maintenance post '/scheduled_maintenances/:entity/:check' do start_time = Chronic.parse(params[:start_time]).to_i raise ArgumentError, "start time parsed to zero" unless start_time > 0 duration = ChronicDuration.parse(params[:duration]) summary = params[:summary] entity_check = get_entity_check(params[:entity], params[:check]) return 404 if entity_check.nil? entity_check.create_scheduled_maintenance(start_time, duration, :summary => summary) redirect back end # delete a scheduled maintenance delete '/scheduled_maintenances/:entity/:check' do entity_check = get_entity_check(params[:entity], params[:check]) return 404 if entity_check.nil? entity_check.end_scheduled_maintenance(params[:start_time].to_i) redirect back end # delete a check (actually just disables it) delete '/checks/:entity/:check' do entity_check = get_entity_check(params[:entity], params[:check]) return 404 if entity_check.nil? entity_check.disable! redirect back end get '/contacts' do #self_stats @contacts = Flapjack::Data::Contact.all(:redis => redis) erb 'contacts.html'.to_sym end get "/contacts/:contact" do contact_id = params[:contact] if contact_id @contact = Flapjack::Data::Contact.find_by_id(contact_id, :redis => redis) end unless @contact status 404 return end if @contact.media.has_key?('pagerduty') @pagerduty_credentials = @contact.pagerduty_credentials end # FIXME: intersect with current checks, or push down to Contact.entities @entities_and_checks = @contact.entities(:checks => true).sort_by {|ec| ec[:entity].name } erb 'contact.html'.to_sym end protected # TODO cache constructed erb object to improve performance -- check mtime # to know when to refresh; would need to synchronize accesses to the cache, # to lock out reads while it's being refreshed def render_erb(file, bind) erb = ERB.new(File.read(File.dirname(__FILE__) + '/web/views/' + file)) erb.result(bind) end private def get_entity_check(entity, check) entity_obj = (entity && entity.length > 0) ? Flapjack::Data::Entity.find_by_name(entity, :redis => redis) : nil return if entity_obj.nil? || (check.nil? || check.length == 0) Flapjack::Data::EntityCheck.for_entity(entity_obj, check, :redis => redis) end def entity_check_state(entity_name, check) entity = Flapjack::Data::Entity.find_by_name(entity_name, :redis => redis) return if entity.nil? entity_check = Flapjack::Data::EntityCheck.for_entity(entity, check, :redis => redis) summary = entity_check.summary summary = summary[0..76] + '...' unless (summary.nil? || (summary.length < 81)) latest_notif = {:problem => entity_check.last_notification_for_state(:problem)[:timestamp], :recovery => entity_check.last_notification_for_state(:recovery)[:timestamp], :acknowledgement => entity_check.last_notification_for_state(:acknowledgement)[:timestamp] }.max_by {|n| n[1] || 0} lc = entity_check.last_change last_change = lc ? ChronicDuration.output(Time.now.to_i - lc.to_i, :format => :short, :keep_zero => true, :units => 2) : 'never' lu = entity_check.last_update last_update = lu ? ChronicDuration.output(Time.now.to_i - lu.to_i, :format => :short, :keep_zero => true, :units => 2) : 'never' ln = latest_notif[1] last_notified = ln ? ChronicDuration.output(Time.now.to_i - ln.to_i, :format => :short, :keep_zero => true, :units => 2) + ", #{latest_notif[0]}" : 'never' [(entity_check.state || '-'), (summary || '-'), last_change, last_update, entity_check.in_unscheduled_maintenance?, entity_check.in_scheduled_maintenance?, last_notified ] end def self_stats @fqdn = `/bin/hostname -f`.chomp @pid = Process.pid @instance_id = "#{@fqdn}:#{@pid}" @dbsize = redis.dbsize @executive_instances = redis.keys("executive_instance:*").map {|i| [ i.match(/executive_instance:(.*)/)[1], redis.hget(i, 'boot_time').to_i ] }.sort {|a, b| b[1] <=> a[1]} @event_counters = redis.hgetall('event_counters') @event_counters_instance = redis.hgetall("event_counters:#{@instance_id}") @boot_time = Time.at(redis.hget("executive_instance:#{@instance_id}", 'boot_time').to_i) @uptime = Time.now.to_i - @boot_time.to_i @uptime_string = time_period_in_words(@uptime) @event_rate_all = (@uptime > 0) ? (@event_counters_instance['all'].to_f / @uptime) : 0 @events_queued = redis.llen('events') end def entity_stats @count_all_entities = Flapjack::Data::Entity.find_all_with_checks(:redis => redis).length @count_failing_entities = Flapjack::Data::Entity.find_all_with_failing_checks(:redis => redis).length end def check_stats # FIXME: move this logic to Flapjack::Data::EntityCheck @count_all_checks = Flapjack::Data::EntityCheck.count_all(:redis => redis) @count_failing_checks = Flapjack::Data::EntityCheck.count_all_failing(:redis => redis) end def last_notification_data(entity_check) last_notifications = entity_check.last_notifications_of_each_type [:critical, :warning, :unknown, :recovery, :acknowledgement].inject({}) do |memo, type| if last_notifications[type] && last_notifications[type][:timestamp] t = Time.at(last_notifications[type][:timestamp]) memo[type] = {:time => t.to_s, :relative => relative_time_ago(t) + " ago", :summary => last_notifications[type][:summary]} end memo end end end end end