X-Git-Url: https://git.donarmstrong.com/?a=blobdiff_plain;f=bp_bin%2Fwrite_fasta_files;h=dfeabb20a5555517af240461eb574cb79ed2f125;hb=48bea5c28b89dc5586d0bddb338ccd6ba23aa1f9;hp=debea31cb5c073f3ed6cbbacdb22a3096c7cd201;hpb=14e51cd98e6f898e4b37d9d102922fee25c40ac5;p=biopieces.git diff --git a/bp_bin/write_fasta_files b/bp_bin/write_fasta_files index debea31..dfeabb2 100755 --- a/bp_bin/write_fasta_files +++ b/bp_bin/write_fasta_files @@ -33,30 +33,40 @@ require 'maasha/fasta' require 'pp' casts = [] -casts << {:long=>'key', :short=>'k', :type=>'string', :mandatory=>true, :default=>nil, :allowed=>nil, :disallowed=>nil} -casts << {:long=>'dir', :short=>'d', :type=>'dir!', :mandatory=>true, :default=>nil, :allowed=>nil, :disallowed=>nil} -casts << {:long=>'no_stream', :short=>'x', :type=>'flag', :mandatory=>false, :default=>nil, :allowed=>nil, :disallowed=>nil} +casts << {long: 'key', short: 'k', type: 'string', mandatory: true, default: nil, allowed: nil, disallowed: nil} +casts << {long: 'dir', short: 'd', type: 'dir!', mandatory: true, default: nil, allowed: nil, disallowed: nil} +casts << {long: 'prefix', short: 'p', type: 'string', mandatory: false, default: nil, allowed: nil, disallowed: nil} +casts << {long: 'wrap', short: 'w', type: 'uint', mandatory: false, default: nil, allowed: nil, disallowed: "0"} +casts << {long: 'compress', short: 'Z', type: 'string', mandatory: false, default: nil, allowed: "gzip,bzip,bzip2", disallowed: nil} +casts << {long: 'no_stream', short: 'x', type: 'flag', mandatory: false, default: nil, allowed: nil, disallowed: nil} options = Biopieces.options_parse(ARGV, casts) -key = options[:key].to_sym - -fh_hash = {} +key = options[:key].to_sym +compress = options[:compress] ? options[:compress].to_sym : nil +fh_hash = {} Biopieces.open(options[:stream_in], options[:stream_out]) do |input, output| input.each_record do |record| if record[:SEQ_NAME] and record[:SEQ] and record[key] seq = Seq.new_bp(record) - if fh_hash.has_key? record[key].to_sym + if fh_hash[record[key].to_sym] fasta_io = fh_hash[record[key].to_sym] else - fasta_file = File.join(options[:dir], record[key] + ".fasta") - fasta_io = Fasta.open(fasta_file, "w") + if options[:prefix] + fasta_file = File.join(options[:dir], [options[:prefix], record[key]].join("_") + ".fasta") + else + fasta_file = File.join(options[:dir], record[key] + ".fasta") + end + + fasta_file << ".gz" if compress == :gzip + fasta_file << ".bz2" if compress == :bzip or compress == :bzip2 + fasta_io = Fasta.open(fasta_file, "w", compress: compress) fh_hash[record[key].to_sym] = fasta_io end - fasta_io.puts seq.to_fasta + fasta_io.puts seq.to_fasta(options[:wrap]) end output.puts record unless options[:no_stream]