@@ -22,18 +22,18 @@ def genome_asm_stats(fasta_file, output_handle, telomere_repeat, n_minimum):
22
22
else :
23
23
seqio = SeqIO .parse (fasta_file , "fasta" )
24
24
25
- telomere_stats = {'FORWARD TELOMERES ' : 0 ,
26
- 'REVERSE TELOMERES ' : 0 ,
27
- 'BOTH TELOMERES ' : 0 }
25
+ telomere_stats = {'TELOMERE FWD ' : 0 ,
26
+ 'TELOMERE REV ' : 0 ,
27
+ 'T2T SCAFFOLDS ' : 0 }
28
28
for record in seqio :
29
29
lengths .append (len (record ))
30
30
forward , reverse = findTelomere (record .seq , telomere_repeat , n_minimum )
31
31
if forward :
32
- telomere_stats ['FORWARD TELOMERES ' ] += 1
32
+ telomere_stats ['TELOMERE FWD ' ] += 1
33
33
if reverse :
34
- telomere_stats ['REVERSE TELOMERES ' ] += 1
34
+ telomere_stats ['TELOMERE REV ' ] += 1
35
35
if forward and reverse :
36
- telomere_stats ['BOTH TELOMERES ' ] += 1
36
+ telomere_stats ['T2T SCAFFOLDS ' ] += 1
37
37
38
38
GC += sum (record .seq .count (x ) for x in ["G" , "C" , "g" , "c" , "S" , "s" ])
39
39
@@ -69,7 +69,7 @@ def genome_asm_stats(fasta_file, output_handle, telomere_repeat, n_minimum):
69
69
report += "%15s = %d\n " % ('N90' , n90 )
70
70
report += "%15s = %.2f\n " % ('GC%' , GC )
71
71
for f in sorted (telomere_stats ):
72
- report += "%15s = %.2f \n " % (f , telomere_stats [f ])
72
+ report += "%15s = %d \n " % (f , telomere_stats [f ])
73
73
74
74
print (report )
75
75
if output_handle :
@@ -110,13 +110,13 @@ def findTelomere(seq, monomer, n):
110
110
https://github.com/markhilt/genome_analysis_tools
111
111
"""
112
112
# Look within first and last 200 bp for repeats
113
- start = seq [:100 ].upper ()
114
- end = seq [- 100 :].upper ()
113
+ start = str ( seq [:100 ]) .upper ()
114
+ end = str ( seq [- 100 :]) .upper ()
115
115
116
116
forward , reverse = False , False
117
117
118
118
# Look for the monomer repeat n number of times.
119
- if re .search (monomer * n , start ):
119
+ if re .search (monomer * 2 , start ):
120
120
forward = True
121
121
rev_monomer = revcomp (monomer )
122
122
if re .search (rev_monomer * n , end ):
@@ -138,5 +138,4 @@ def run(parser, args):
138
138
139
139
if args .report :
140
140
output_handle = open (args .report , "w" )
141
-
142
141
genome_asm_stats (args .input , output_handle , args .telomere_monomer , args .telomere_n_repeat )
0 commit comments