7 class TestSeq < Test::Unit::TestCase
12 # def test_Seq# autoremoves whitespace, newlines, and carriage returns
14 # dna.seq = "A\tT\r\tC\nG "
15 # assert_equal(dna.seq, "ATCG")
18 def test_Seq_is_dna_with_no_sequence_type_returns_false
19 assert(@entry.is_dna? == false)
22 def test_Seq_is_dna_with_dna_sequence_type_returns_true
24 assert(@entry.is_dna? == true)
27 def test_Seq_is_rna_with_no_sequence_type_returns_false
28 assert(@entry.is_rna? == false)
31 def test_Seq_is_rna_with_rna_sequence_type_returns_true
33 assert(@entry.is_rna? == true)
36 def test_Seq_is_protein_with_no_sequence_type_returns_false
37 assert(@entry.is_protein? == false)
40 def test_Seq_is_protein_with_protein_sequence_type_returns_true
41 @entry.type = 'protein'
42 assert_equal(true, @entry.is_protein?)
45 def test_Seq_type_guess_without_sequence_raises
46 assert_raise(SeqError) { @entry.type_guess }
49 def test_Seq_type_guess_with_protein_returns_protein
50 @entry.seq = 'atcatcrFgatcg'
51 assert_equal('protein', @entry.type_guess)
54 def test_Seq_type_guess_with_rna_returns_rna
55 @entry.seq = 'atcatcrUgatcg'
56 assert_equal('rna', @entry.type_guess)
59 def test_Seq_type_guess_with_dna_returns_dna
60 @entry.seq = 'atcatcgatcg'
61 assert_equal('dna', @entry.type_guess)
64 def test_Seq_type_guess_EM_without_sequence_raises
65 assert_raise(SeqError) { @entry.type_guess! }
68 def test_Seq_type_guess_EM_with_protein_returns_protein
69 @entry.seq = 'atcatcrFgatcg'
71 assert_equal('protein', @entry.type)
74 def test_Seq_type_guess_EM_with_rna_returns_rna
75 @entry.seq = 'atcatcrUgatcg'
77 assert_equal('rna', @entry.type)
80 def test_Seq_type_guess_EM_with_dna_returns_dna
81 @entry.seq = 'atcatcgatcg'
83 assert_equal('dna', @entry.type)
86 def test_Seq_length_is_correct
88 assert_equal(4, @entry.length)
91 def test_Seq_indels_is_correct
92 @entry.seq = 'ATCG.-~_'
93 assert_equal(4, @entry.indels)
96 def test_Seq_to_rna_raises_if_no_sequence
98 assert_raise(SeqError) { @entry.to_rna }
101 def test_Seq_to_rna_raises_on_bad_type
104 assert_raise(SeqError) { @entry.to_rna }
107 def test_Seq_to_rna_transcribes_correctly
108 @entry.seq = 'ATCGatcg'
110 assert_equal("AUCGaucg", @entry.to_rna)
113 def test_Seq_to_rna_changes_entry_type_to_rna
114 @entry.seq = 'ATCGatcg'
117 assert_equal("rna", @entry.type)
120 def test_Seq_to_dna_raises_if_no_sequence
122 assert_raise(SeqError) { @entry.to_dna }
125 def test_Seq_to_dna_raises_on_bad_type
128 assert_raise(SeqError) { @entry.to_dna }
131 def test_Seq_to_dna_transcribes_correctly
132 @entry.seq = 'AUCGaucg'
134 assert_equal("ATCGatcg", @entry.to_dna)
137 def test_Seq_to_dna_changes_entry_type_to_dna
138 @entry.seq = 'AUCGaucg'
141 assert_equal("dna", @entry.type)
144 def test_Seq_to_bp_returns_correct_record
145 @entry.seq_name = 'test'
147 assert_equal({:SEQ_NAME=>"test", :SEQ=>"ATCG", :SEQ_LEN=>4}, @entry.to_bp)
150 def test_Seq_to_bp_raises_on_missing_seq_name
152 assert_raise(SeqError) { @entry.to_bp }
155 def test_Seq_to_bp_raises_on_missing_sequence
156 @entry.seq_name = 'test'
157 assert_raise(SeqError) { @entry.to_bp }
160 def test_Seq_to_fasta_returns_correct_entry
161 @entry.seq_name = 'test'
163 assert_equal(">test\nATCG\n", @entry.to_fasta)
166 def test_Seq_to_fasta_wraps_correctly
167 entry = Seq.new("test", "ATCG")
168 assert_equal(">test\nAT\nCG\n", entry.to_fasta(2))
171 def test_Seq_to_fastq_returns_correct_entry
172 @entry.seq_name = 'test'
175 assert_equal("@test\nATCG\n+\nhhhh\n", @entry.to_fastq)
178 def test_Seq_to_key_with_bad_residue_raises
179 entry = Seq.new("test", "AUCG")
180 assert_raise(SeqError) { entry.to_key }
183 def test_Seq_to_key_returns_correctly
184 entry = Seq.new("test", "ATCG")
185 assert_equal(54, entry.to_key)
188 def test_Seq_reverse_returns_correctly
190 assert_equal("GCTA", @entry.reverse)
193 def test_Seq_complement_raises_if_no_sequence
195 assert_raise(SeqError) { @entry.complement }
198 def test_Seq_complement_raises_on_bad_type
200 @entry.type = 'protein'
201 assert_raise(SeqError) { @entry.complement }
204 def test_Seq_complement_for_DNA_is_correct
205 @entry.seq = 'ATCGatcg'
207 assert_equal("TAGCtagc", @entry.complement)
210 def test_Seq_complement_for_RNA_is_correct
211 @entry.seq = 'AUCGaucg'
213 assert_equal("UAGCuagc", @entry.complement)
216 def test_Seq_reverse_complement_for_DNA_is_correct
217 @entry.seq = 'ATCGatcg'
219 assert_equal("cgatCGAT", @entry.reverse_complement)
222 def test_Seq_reverse_complement_for_RNA_is_correct
223 @entry.seq = 'AUCGaucg'
225 assert_equal("cgauCGAU", @entry.reverse_complement)
228 def test_Seq_hamming_distance_returns_correctly
229 seq1 = Seq.new("test1", "ATCG")
230 seq2 = Seq.new("test2", "atgg")
231 assert_equal(1, seq1.hamming_distance(seq2))
234 def test_Seq_generate_with_length_lt_1_raises
235 assert_raise(SeqError) { @entry.generate(-10, "dna") }
236 assert_raise(SeqError) { @entry.generate(0, "dna") }
239 def test_Seq_generate_with_bad_type_raises
240 assert_raise(SeqError) { @entry.generate(10, "foo") }
243 def test_Seq_generate_with_ok_type_dont_raise
244 %w[dna DNA rna RNA protein Protein].each do |type|
245 assert_nothing_raised { @entry.generate(10, type) }
249 def test_Seq_subseq_with_start_lt_0_raises
251 assert_raise(SeqError) { @entry.subseq(-1, 1) }
254 def test_Seq_subseq_with_length_lt_1_raises
256 assert_raise(SeqError) { @entry.subseq(0, 0) }
259 def test_Seq_subseq_with_start_plus_length_gt_seq_raises
261 assert_raise(SeqError) { @entry.subseq(0, 5) }
264 def test_Seq_subseq_returns_correct_sequence
266 assert_equal("AT", @entry.subseq(0, 2).seq)
267 assert_equal("CG", @entry.subseq(2, 2).seq)
270 def test_Seq_subseq_without_len_returns_correct_sequence
272 assert_equal("ATCG", @entry.subseq(0).seq)
273 assert_equal("CG", @entry.subseq(2).seq)
276 def test_Seq_subseq_returns_correct_qual
279 assert_equal("ab", @entry.subseq(0, 2).qual)
280 assert_equal("cd", @entry.subseq(2, 2).qual)
283 def test_Seq_subseq_without_len_returns_correct_qual
286 assert_equal("abcd", @entry.subseq(0).qual)
287 assert_equal("cd", @entry.subseq(2).qual)
290 def test_Seq_subseq_bang_with_start_lt_0_raises
292 assert_raise(SeqError) { @entry.subseq!(-1, 1) }
295 def test_Seq_subseq_bang_with_length_lt_1_raises
297 assert_raise(SeqError) { @entry.subseq!(0, 0) }
300 def test_Seq_subseq_bang_with_start_plus_length_gt_seq_raises
302 assert_raise(SeqError) { @entry.subseq!(0, 5) }
305 def test_Seq_subseq_bang_returns_correct_sequence
308 assert_equal("AT", @entry.seq)
311 assert_equal("CG", @entry.seq)
314 def test_Seq_subseq_bang_without_len_returns_correct_sequence
317 assert_equal("ATCG", @entry.seq)
320 assert_equal("CG", @entry.seq)
323 def test_Seq_subseq_bang_with_pos_and_len_returns_correct_qual
327 assert_equal("ab", @entry.qual)
331 assert_equal("cd", @entry.qual)
334 def test_Seq_subseq_bang_with_pos_returns_correct_qual
338 assert_equal("abcd", @entry.qual)
342 assert_equal("cd", @entry.qual)
345 def test_Seq_subseq_rand_returns_correct_sequence
347 assert_equal("ATCG", @entry.subseq_rand(4).seq)
350 def test_Seq_composition_returns_correctly
351 @entry.seq = "AAAATTTCCG"
352 assert_equal(4, @entry.composition["A"])
353 assert_equal(3, @entry.composition["T"])
354 assert_equal(2, @entry.composition["C"])
355 assert_equal(1, @entry.composition["G"])
356 assert_equal(0, @entry.composition["X"])
359 def test_Seq_homopol_max_returns_0_with_empty_sequence
361 assert_equal(0, @entry.homopol_max)
364 def test_Seq_homopol_max_returns_0_with_nil_sequence
366 assert_equal(0, @entry.homopol_max)
369 def test_Seq_homopol_max_returns_0_when_not_found
370 @entry.seq = "AtTcCcGggGnnNnn"
371 assert_equal(0, @entry.homopol_max(6))
374 def test_Seq_homopol_max_returns_correctly
375 @entry.seq = "AtTcCcGggGnnNnn"
376 assert_equal(5, @entry.homopol_max(3))
379 def test_Seq_hard_mask_returns_correctly
380 @entry.seq = "--AAAANn"
381 assert_equal(33.33, @entry.hard_mask)
384 def test_Seq_soft_mask_returns_correctly
385 @entry.seq = "--AAAa"
386 assert_equal(25.00, @entry.soft_mask)