@@ -218,7 +218,7 @@ rule run_wuhan_nextclade:
218
218
f"--output-translations=data/{ database } /nextclade.translation_{{cds}}.upd.fasta"
219
219
),
220
220
output :
221
- info = f"data/{ database } /nextclade_new_raw .tsv" ,
221
+ info = f"data/{ database } /nextclade_new .tsv" ,
222
222
alignment = temp (f"data/{ database } /nextclade.aligned.upd.fasta" ),
223
223
translations = [
224
224
temp (f"data/{ database } /nextclade.translation_{ gene } .upd.fasta" )
@@ -249,7 +249,7 @@ rule run_21L_nextclade:
249
249
dataset = lambda w : f"data/nextclade_data/sars-cov-2-21L.zip" ,
250
250
sequences = f"data/{ database } /nextclade_21L.sequences.fasta" ,
251
251
output :
252
- info = f"data/{ database } /nextclade_21L_new_raw .tsv" ,
252
+ info = f"data/{ database } /nextclade_21L_new .tsv" ,
253
253
threads :
254
254
workflow .cores * 0.5
255
255
benchmark :
@@ -264,47 +264,13 @@ rule run_21L_nextclade:
264
264
"""
265
265
266
266
267
- rule nextclade_tsv_concat_versions :
268
- input :
269
- nextclade = "data/nextclade" ,
270
- tsv = f"data/{ database } /nextclade{{reference}}_new_raw.tsv" ,
271
- dataset = lambda w : f"data/nextclade_data/sars-cov-2{ w .reference .replace ('_' ,'-' )} .zip" ,
272
- output :
273
- tsv = f"data/{ database } /nextclade{{reference}}_new.tsv" ,
274
- benchmark :
275
- f"benchmarks/nextclade_tsv_concat_versions_{ database } {{reference}}.txt"
276
- shell :
277
- """
278
- if [ -s {input.tsv} ]; then
279
- # Get version numbers
280
- nextclade_version="$({input.nextclade:q} --version)"
281
- dataset_version="$(unzip -p {input.dataset} pathogen.json | jq -r '.version.tag')"
282
- timestamp="$(date -u +"%Y-%m-%dT%H:%M:%SZ")"
283
-
284
- # Combine input file with version numbers and write to output
285
- printf "%s\t nextclade_version\t dataset_version\t run_timestamp\n " \
286
- "$(head -n 1 {input.tsv})" \
287
- > {output.tsv}
288
-
289
- tail -n +2 {input.tsv} | \
290
- awk -v v1="$nextclade_version" \
291
- -v v2="$dataset_version" \
292
- -v v3="$timestamp" \
293
- -v OFS='\t ' '{{print $0, v1, v2, v3}}' \
294
- >> {output.tsv}
295
- else
296
- cp {input.tsv} {output.tsv}
297
- fi
298
- """
299
-
300
-
301
267
rule nextclade_info :
302
268
"""
303
269
Generates nextclade info TSV for all sequences (new + old)
304
270
"""
305
271
input :
306
272
old_info = f"data/{ database } /nextclade{{reference}}_old.tsv" ,
307
- new_info = rules . nextclade_tsv_concat_versions . output . tsv ,
273
+ new_info = f"data/ { database } /nextclade{{reference}}_new. tsv" ,
308
274
output :
309
275
nextclade_info = f"data/{ database } /nextclade{{reference}}.tsv" ,
310
276
benchmark :
0 commit comments