$options = Maasha::Biopieces::parse_options(
[
{ long => 'data_in', short => 'i', type => 'files!', mandatory => 'no', default => undef, allowed => undef, disallowed => undef },
- { long => 'num', short => 'n', type => 'uint', mandatory => 'no', default => undef, allowed => undef, disallowed => '0' },
+ { long => 'num', short => 'n', type => 'uint', mandatory => 'no', default => undef, allowed => undef, disallowed => 0 },
+ { long => 'quality', short => 'q', type => 'uint', mandatory => 'no', default => 20, allowed => undef, disallowed => undef },
]
);
while ( $entry = Maasha::Fastq::get_entry( $data_in ) )
{
- if ( $record = Maasha::Fastq::fastq2biopiece( $entry ) ) {
+ if ( $record = Maasha::Fastq::fastq2biopiece( $entry ) )
+ {
+ lowercase_low_scores( $record, $options->{ 'quality' } );
+
Maasha::Biopieces::put_record( $record, $out );
}
# >>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>><<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<
+sub lowercase_low_scores
+{
+ # Martin A. Hansen, July 2009.
+
+ # Lowercase residues in sequence that are below a given score threshold.
+
+ # This one would be lovely to have written in C.
+
+ my ( $record, # Biopiece record
+ $quality, # quality threshold
+ ) = @_;
+
+ # Returns nothing.
+
+ my ( @seqs, @scores, $i );
+
+ @seqs = split //, $record->{ 'SEQ' };
+ @scores = split /;/, $record->{ 'SCORES' };
+
+ for ( $i = 0; $i < @scores; $i++ ) {
+ $seqs[ $i ] = lc $seqs[ $i ] if $scores[ $i ] < $quality;
+ }
+
+ $record->{ 'SEQ' } = join "", @seqs;
+ $record->{ 'SCORES' } = join ";", @scores;
+}
+
+
+# >>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>><<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<
+
+
BEGIN
{
Maasha::Biopieces::status_set();