Skip to content

Commit 7dcafe4

Browse files
committedDec 15, 2022
support reporting telomere count and T2T contigs
1 parent 56e7cb5 commit 7dcafe4

File tree

1 file changed

+10
-11
lines changed

1 file changed

+10
-11
lines changed
 

‎AAFTF/assess.py

+10-11
Original file line numberDiff line numberDiff line change
@@ -22,18 +22,18 @@ def genome_asm_stats(fasta_file, output_handle, telomere_repeat, n_minimum):
2222
else:
2323
seqio = SeqIO.parse(fasta_file, "fasta")
2424

25-
telomere_stats = {'FORWARD TELOMERES': 0,
26-
'REVERSE TELOMERES': 0,
27-
'BOTH TELOMERES': 0}
25+
telomere_stats = {'TELOMERE FWD': 0,
26+
'TELOMERE REV': 0,
27+
'T2T SCAFFOLDS': 0}
2828
for record in seqio:
2929
lengths.append(len(record))
3030
forward, reverse = findTelomere(record.seq, telomere_repeat, n_minimum)
3131
if forward:
32-
telomere_stats['FORWARD TELOMERES'] += 1
32+
telomere_stats['TELOMERE FWD'] += 1
3333
if reverse:
34-
telomere_stats['REVERSE TELOMERES'] += 1
34+
telomere_stats['TELOMERE REV'] += 1
3535
if forward and reverse:
36-
telomere_stats['BOTH TELOMERES'] += 1
36+
telomere_stats['T2T SCAFFOLDS'] += 1
3737

3838
GC += sum(record.seq.count(x) for x in ["G", "C", "g", "c", "S", "s"])
3939

@@ -69,7 +69,7 @@ def genome_asm_stats(fasta_file, output_handle, telomere_repeat, n_minimum):
6969
report += "%15s = %d\n" % ('N90', n90)
7070
report += "%15s = %.2f\n" % ('GC%', GC)
7171
for f in sorted(telomere_stats):
72-
report += "%15s = %.2f\n" % (f, telomere_stats[f])
72+
report += "%15s = %d\n" % (f, telomere_stats[f])
7373

7474
print(report)
7575
if output_handle:
@@ -110,13 +110,13 @@ def findTelomere(seq, monomer, n):
110110
https://github.com/markhilt/genome_analysis_tools
111111
"""
112112
# Look within first and last 200 bp for repeats
113-
start = seq[:100].upper()
114-
end = seq[-100:].upper()
113+
start = str(seq[:100]).upper()
114+
end = str(seq[-100:]).upper()
115115

116116
forward, reverse = False, False
117117

118118
# Look for the monomer repeat n number of times.
119-
if re.search(monomer*n, start):
119+
if re.search(monomer*2, start):
120120
forward = True
121121
rev_monomer = revcomp(monomer)
122122
if re.search(rev_monomer*n, end):
@@ -138,5 +138,4 @@ def run(parser, args):
138138

139139
if args.report:
140140
output_handle = open(args.report, "w")
141-
142141
genome_asm_stats(args.input, output_handle, args.telomere_monomer, args.telomere_n_repeat)

0 commit comments

Comments
 (0)
Please sign in to comment.