require 'rbbt/persist'
require 'rbbt/persist/tsv'
require 'rbbt/util/log'
require 'rbbt/util/semaphore'
require 'rbbt/workflow/accessor'

# A Step couples a result location (+path+) with the task that produces it,
# the inputs the task received and the other steps it depends on.
#
# Several helpers used here (+info+, +info_file+, +set_info+, +done?+,
# +dirty?+, +running?+, +updatable?+, +join+, +abort+, +status=+, +message+,
# +Step.info_file+, +Step.pid_file+, +Step.files_dir+) are not defined in this
# file; they are expected to come from the files required at the top and
# bottom of this one.
class Step
  # NOTE: the generated readers for clean_name, path, workflow, inputs,
  # task_name and overriden are replaced by the explicit methods below.
  attr_accessor :clean_name, :path, :task, :workflow, :inputs, :dependencies, :bindings
  attr_accessor :task_name, :overriden
  attr_accessor :pid
  attr_accessor :exec
  attr_accessor :relocated
  attr_accessor :result, :mutex, :seen

  class << self
    attr_accessor :lock_dir

    # Directory used for step info locks. Resolved from
    # +Rbbt.tmp.step_info_locks+ on first use, created if missing, and
    # memoized afterwards.
    def lock_dir
      @lock_dir ||= begin
        dir = Rbbt.tmp.step_info_locks.find
        FileUtils.mkdir_p(dir) unless Open.exists?(dir)
        dir
      end
    end
  end

  # Name of the step without the 32-character lowercase-alphanumeric suffix
  # (preceded by "_") embedded in its path. A value stored under
  # +info[:clean_name]+ takes precedence.
  def clean_name
    @clean_name ||= info[:clean_name] || path.sub(/_[a-z0-9]{32}/, '')
  end

  # Whether this step is overriden. When the flag was never set explicitly it
  # is derived from the dependencies: true if any of them is overriden.
  #
  # @return [Boolean, Object] the explicit flag if set, otherwise a boolean
  def overriden
    return @overriden unless @overriden.nil?
    # No dependencies means nothing can be overriden. This used to return
    # `[]`, which is truthy in Ruby and disagreed with the boolean returned
    # by every other path.
    return false if dependencies.nil?

    dependencies.any? { |dep| dep.overriden }
  end

  # @param path [String, Proc, Object] result location; a String is sanitized
  #   and turned into a Path, a Proc is called to obtain the location
  # @param task [Object, nil] task that produces the result
  # @param inputs [Array, nil] input values, named after +task.inputs+ when
  #   the task exposes them
  # @param dependencies [Array, Object, nil] one step or a list of steps
  # @param bindings [Object, nil] stored as-is
  # @param clean_name [Object, nil] accepted but not used by this constructor
  def initialize(path, task = nil, inputs = nil, dependencies = nil, bindings = nil, clean_name = nil)
    path = Path.setup(Misc.sanitize_filename(path)) if String === path
    path = path.call if Proc === path

    @path = path
    @task = task
    @bindings = bindings
    @dependencies =
      if dependencies.nil?
        []
      elsif Array === dependencies
        dependencies
      else
        [dependencies]
      end
    @mutex = Mutex.new
    @info_mutex = Mutex.new
    @inputs = inputs

    if task && task.respond_to?(:inputs) && task.inputs
      NamedArray.setup(@inputs, task.inputs.collect { |s| s.to_s })
    end

    # The info file records the path the step was created with; a mismatch
    # is flagged as a relocation.
    @relocated = true if Open.exists?(info_file) && (info[:path] != path)
  end

  # Workflow assigned to the step, falling back to the one recorded in info.
  def workflow
    @workflow || info[:workflow]
  end

  # Rebuilds +@inputs+ from +info[:inputs]+.
  #
  # With a task that declares inputs, the values are picked in the task's
  # input order; otherwise the stored hash order is used.
  #
  # @return [Object, nil] the new +@inputs+, or nil when info has no inputs
  def load_inputs_from_info
    info_inputs = info[:inputs]
    return nil unless info_inputs

    if task && task.respond_to?(:inputs) && task.inputs
      IndiferentHash.setup(info_inputs)
      names = task.inputs.collect { |name| name.to_s }
      @inputs = NamedArray.setup(info_inputs.values_at(*names), task.inputs)
    else
      @inputs = NamedArray.setup(info_inputs.values, info_inputs.keys)
    end
  end

  # Input values of the step, loading them from info when none were given.
  #
  # @return [Array] the inputs, or an empty array when none are available
  def inputs
    return @inputs if NamedArray === @inputs

    load_inputs_from_info if @inputs.nil?

    NamedArray.setup(@inputs, task.inputs) if task && task.inputs && !(NamedArray === @inputs)

    @inputs || []
  end

  # Inputs of this step merged with those of every recursive dependency,
  # keyed by field name.
  #
  # When a field is already present with a different value, the conflict is
  # logged and the field is set to nil.
  #
  # @return [Array] merged values set up as a NamedArray over the field names
  def recursive_inputs
    i = {}

    own = inputs
    own.zip(own.fields).each { |v, f| i[f] = v } if NamedArray === own

    rec_dependencies.each do |dep|
      dep_inputs = dep.inputs
      next unless NamedArray === dep_inputs

      dep_inputs.zip(dep_inputs.fields).each do |v, f|
        if i.include?(f) && i[f] != v
          Log.debug "Conflict in #{ f }: #{[i[f].inspect, v.inspect] * " <-> "}"
          i[f] = nil
        else
          i[f] = v
        end
      end
    end

    # Disabled alternative, kept for reference:
    #dependencies.each do |dep|
    #  di = dep.recursive_inputs
    #  next unless NamedArray === di
    #  di.fields.zip(di).each do |k,v|
    #    i[k] = v unless i.include? k
    #  end
    #end

    v = i.values
    NamedArray.setup v, i.keys
    v
  end

  # Name of the task. Without a task it is taken from the second-to-last
  # component of the path.
  def task_name
    @task_name ||= @task.nil? ? @path.split("/")[-2] : @task.name
  end

  # Result location. A Proc stored in +@path+ is resolved (and replaced by
  # the resulting sanitized Path) on first access.
  def path
    if Proc === @path
      @path = Path.setup(Misc.sanitize_filename(@path.call))
    else
      @path
    end
  end

  class << self
    attr_accessor :log_relay_step
  end

  # Makes this step forward its log calls to +step+.
  #
  # The first time it is called on a step it overrides +log+ on that single
  # object (keeping the previous implementation as +original_log+). Steps
  # without a named Task are left untouched.
  #
  # @param step [Step] step that receives the relayed log entries
  # @return [Step] self
  def relay_log(step)
    return self unless Task === self.task && !self.task.name.nil?

    unless respond_to?(:original_log)
      class << self
        attr_accessor :relay_step
        alias original_log log

        def log(status, message = nil)
          self.status = status
          # Command-call form: this appears to invoke the step's `message`
          # method (defined outside this file) with the uncolored text, not
          # the `message` parameter. Kept exactly as written.
          message Log.uncolor message
          relay_step.log([task.name.to_s, status.to_s] * ">", message.nil? ? nil : message ) unless (relay_step.done? or relay_step.error? or relay_step.aborted?)
        end
      end
    end

    @relay_step = step
    self
  end

  # Type of the result: the task's, else the one stored in info, else
  # +:string+. Without a task only info is consulted.
  def result_type
    @result_type ||=
      if @task.nil?
        info[:result_type]
      else
        @task.result_type || info[:result_type] || :string
      end
  end

  # Description of the result: from the task when there is one, otherwise
  # from info.
  def result_description
    @result_description ||=
      if @task.nil?
        info[:result_description]
      else
        @task.result_description
      end
  end

  # Turns a raw value into the final result.
  #
  # * IO values are consumed according to +result_type+ (:array -> chomped
  #   lines, :tsv -> TSV, anything else -> the full content).
  # * When +description+ names a known Entity format the value is set up as
  #   that entity, or, if it is already Annotated, its annotations are filled
  #   from +entity_info+.
  # * Annotations of the result that are still nil are filled with the loaded
  #   result of the dependency whose task name matches the annotation.
  #
  # @param value [Object] raw result
  # @param description [Object, nil] entity format name
  # @param entity_info [Hash, nil] values for the annotations; defaults to
  #   info merged with +info[:inputs]+
  # @return [Object] the prepared result
  def prepare_result(value, description = nil, entity_info = nil)
    res =
      if IO === value
        begin
          content =
            case result_type
            when :array
              array = []
              while line = value.gets
                array << line.chomp
              end
              array
            when :tsv
              begin
                TSV.open(value)
              rescue IOError
                TSV.setup({})
              end
            else
              value.read
            end
          value.join if value.respond_to?(:join)
          content
        rescue Exception
          # Clean up the stream and the step, then propagate the failure
          # unchanged.
          value.abort if value.respond_to?(:abort)
          self.abort
          raise $!
        end
      elsif !defined?(Entity) || description.nil? || !Entity.formats.include?(description)
        value
      elsif Annotated === value && info.empty?
        value
      elsif Annotated === value
        annotations = value.annotations
        entity_info ||= begin
          merged = info.dup
          merged.merge!(info[:inputs]) if info[:inputs]
          merged
        end
        entity_info.each do |k, v|
          # The setter name comes from the key being iterated. This used to
          # interpolate an undefined `h`, which raised NameError.
          value.send("#{k}=", v) if annotations.include?(k)
        end
        value
      else
        entity_info ||= begin
          merged = info.dup
          merged.merge!(info[:inputs]) if info[:inputs]
          merged
        end
        Entity.formats[description].setup(value, entity_info.merge(:format => description))
      end

    if Annotated === res
      dep_hash = nil
      res.annotations.each do |a|
        a = a.to_s
        varname = "@" + a
        next unless res.instance_variable_get(varname).nil?

        # Built lazily; the first dependency found for each task name wins.
        dep_hash ||= begin
          h = {}
          rec_dependencies.each { |dep| h[dep.task_name.to_s] ||= dep }
          h
        end
        dep = dep_hash[a]
        next if dep.nil?

        res.send(a.to_s + "=", dep.load)
      end
    end

    res
  end

  # Forks a child process running +block+ and records its pid under
  # +info[:children_pids]+.
  #
  # @return [Integer] pid of the child
  def child(&block)
    child_pid = Process.fork(&block)
    children_pids = info[:children_pids]
    if children_pids.nil?
      children_pids = [child_pid]
    else
      children_pids << child_pid
    end
    set_info :children_pids, children_pids
    child_pid
  end

  # Returns the result of the step.
  #
  # An in-memory +@result+ (different from the path) is used directly;
  # otherwise the step is joined if not done and the result is read from the
  # path, or produced through +exec+ when the file does not exist. When a
  # result description is available the value goes through +prepare_result+.
  #
  # On IOError with an in-memory result, the result is dropped and the load
  # is retried once from the file; any other IOError propagates.
  def load
    res = begin
      if @result && !(@path == @result)
        res = @result
      else
        join unless done?
        res = @path.exists? ? Persist.load_file(@path, result_type) : exec
      end

      if result_description
        entity_info = info.dup
        entity_info.merge!(info[:inputs]) if info[:inputs]
        res = prepare_result(res, result_description, entity_info)
      end

      res
    rescue IOError
      if @result
        @result = nil
        retry
      end
      raise $!
    end

    res
  end

  # Removes the result at +path+ together with its info file, pid file and
  # files directory. Does nothing (beyond a warning) when the result or its
  # info file are not writable.
  #
  # @param path [String] location of the step result
  def self.clean(path)
    info_file = Step.info_file(path)
    pid_file = Step.pid_file(path)
    files_dir = Step.files_dir(path)

    unless Open.writable?(path) && Open.writable?(info_file)
      Log.warn "Could not clean #{path}: not writable"
      return
    end

    if Open.exists?(path) || Open.exists?(pid_file) || Open.exists?(info_file) || Open.exists?(files_dir)
      # NOTE(review): inside a class method these assign instance variables
      # of the Step class object, not of any step instance. Kept as-is;
      # confirm whether they are needed.
      @result = nil
      @pid = nil

      Misc.insist do
        Open.rm(info_file) if Open.exists?(info_file)
        Open.rm(path) if Open.exists?(path)
        Open.rm_rf(files_dir) if Open.exists?(files_dir)
        Open.rm(pid_file) if Open.exists?(pid_file)
      end
    end
  end

  # Updates the dependencies and cleans this step, but only when it is dirty.
  #
  # @return [Step, nil] self after cleaning, nil when nothing was done
  def update
    return unless dirty?

    dependencies.each { |d| d.update } if dependencies
    clean
  end

  # Cleans the files of this step, aborting it first when it is still
  # running.
  #
  # @return [Step] self
  def clean
    status = []
    status << "dirty" if done? && dirty?
    status << "not running" if !done? && !running?
    status.unshift " " if status.any?
    Log.high "Cleaning step: #{path}#{status * " "}"
    abort if !done? && running?
    Step.clean(path)
    self
  end

  # All dependencies of this step, direct and indirect, without duplicates.
  # Dependencies of a step are listed before the step itself.
  #
  # @param need_run [Boolean] when true, a step that is done and not
  #   updatable contributes no dependencies
  # @param seen [Array] steps already collected by the caller; they are
  #   skipped
  # @return [Array<Step>]
  def rec_dependencies(need_run = false, seen = [])
    # A step result with no info_file means that it was manually
    # placed. In that case, do not consider its dependencies
    remote = defined?(WorkflowRESTClient) && WorkflowRESTClient::RemoteStep === self
    return [] if !remote && !Open.exists?(self.info_file) && Open.exists?(self.path.to_s)

    return [] if dependencies.nil? || dependencies.empty?

    new_dependencies = []
    dependencies.each do |step|
      next if seen.include?(step)
      next if self.done? && need_run && !updatable?

      r = step.rec_dependencies(need_run, new_dependencies)
      new_dependencies.concat r
      new_dependencies << step
    end

    new_dependencies.uniq
  end

  # True when both the result path and the info file are writable.
  def writable?
    Open.writable?(self.path) && Open.writable?(self.info_file)
  end

  # Cleans every dependency recursively, then this step if it has an info
  # file.
  #
  # @return [Step] self
  def recursive_clean
    dependencies.each { |step| step.recursive_clean }
    clean if Open.exists?(self.info_file)
    self
  end

  # Finds the dependency (direct or indirect) whose task is called +name+.
  # Direct dependencies are preferred over indirect ones. The lookup is
  # memoized per name.
  #
  # @param name [String, Symbol] task name
  # @return [Step]
  # @raise [RuntimeError] when no dependency has that task name
  def step(name)
    @steps ||= {}
    @steps[name] ||= begin
      deps = rec_dependencies.select { |step| step.task_name.to_sym == name.to_sym }
      raise "Dependency step not found: #{ name }" if deps.empty?

      direct = deps & self.dependencies
      direct.any? ? direct.first : deps.first
    end
  end
end

require 'rbbt/workflow/step/run'