Sha256: 1b62217e8944bd9815b230caadb3665dd82d70885ef67643795c21e616a8a831

Contents?: true

Size: 1.75 KB

Versions: 29

Compression:

Stored size: 1.75 KB

Contents

#!/usr/bin/env ruby
#
# fastasort: Sorts a FASTA file (in fact it can use any flat file input supported
#            by BIORUBY) while modifying the definition of each record in the
#            process so it is suitable for processing with (for example) pal2nal
#            and PAML.
#
#   Copyright (C) 2008 KATAYAMA Toshiaki <k@bioruby.org> & Pjotr Prins
#
#  This program is free software; you can redistribute it and/or modify
#  it under the terms of the GNU General Public License as published by
#  the Free Software Foundation; either version 2 of the License, or
#  (at your option) any later version.
#
#  This program is distributed in the hope that it will be useful,
#  but WITHOUT ANY WARRANTY; without even the implied warranty of
#  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
#  GNU General Public License for more details.
#
#  $Id: fastasort.rb,v 1.2 2008/05/19 12:22:05 pjotr Exp $
#

require 'bio'

include Bio

table = Hash.new   # table to sort objects
ARGV.each do | fn |
  Bio::FlatFile.auto(fn).each do | item |
    # Some procession of the definition for external programs (just
    # an example):

    # strip JALView extension from definition e.g. .../1-212
    if item.definition =~ /\/\d+-\d+$/
      item.definition = $`
    end
    # substitute slashes:
    definition = item.definition.gsub(/\//,'-')
    # substitute quotes and ampersands:
    definition = item.definition.gsub(/['"&]/,'x')
    # prefix letters if the first position is a number:
    definition = 'seq'+definition if definition =~ /^\d/

    # Now add the data to the sort table
    table[definition] = item.data
  end
end

# Output sorted table
table.sort.each do | definition, data |
  rec = Bio::FastaFormat.new('> '+definition.strip+"\n"+data)
  print rec
end

Version data entries

29 entries across 29 versions & 4 rubygems

Version Path
bio-2.0.5 sample/fastasort.rb
bio-2.0.4 sample/fastasort.rb
bio-2.0.3 sample/fastasort.rb
bio-2.0.2 sample/fastasort.rb
bio-2.0.1 sample/fastasort.rb
bio-2.0.0 sample/fastasort.rb
bio-1.6.0.pre.20181210 sample/fastasort.rb
bio-1.5.2 sample/fastasort.rb
bio-1.5.1 sample/fastasort.rb
bio-1.5.0 sample/fastasort.rb
bioruby-bio-1.2.9.9001 sample/fastasort.rb
bioruby-bio-1.2.9.9501 sample/fastasort.rb
bioruby-bio-1.3.0.5000 sample/fastasort.rb
bioruby-bio-1.3.0.9901 sample/fastasort.rb
bioruby-bio-1.3.0 sample/fastasort.rb
bioruby-bio-1.3.1.5000 sample/fastasort.rb
jandot-bio-1.2.1 sample/fastasort.rb
ngoto-bio-1.2.9.9001 sample/fastasort.rb
ngoto-bio-1.2.9.9501 sample/fastasort.rb
ngoto-bio-1.3.0.5000 sample/fastasort.rb