Skip to content

Commit 9047aa9

Browse files
committed
Added files from NCBI taxonomy db.
Updated script to get the files.
Signed-off-by: Inti Pedroso <[email protected]>
1 parent 3807203 commit 9047aa9

File tree

8 files changed

+2229433
-12
lines changed

8 files changed

+2229433
-12
lines changed

example/run.sh

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -2,12 +2,12 @@
22

33
# run test of script.
44

5-
my_perl phylostratiphy.pl \
6-
-blast blastp__Aech_v3.8.pep__nr.e10.sw.txt_old \
7-
-tax_folder data/ \
5+
my_perl ../phylostratiphy.pl \
6+
-blast example/blastp__Aech_v3.8.pep__nr.e10.sw.txt_old \
7+
-tax_folder ncbi_tax_data/ \
88
-prot_only \
99
-query_taxon 103372 \
10-
-virus_list tmp.virus.txt \
10+
-virus_list example/virus_list.tx \
1111
-out test_phylostratiphy
1212

1313

example/run2.sh

Lines changed: 8 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -2,13 +2,16 @@
22

33
# run test of script.
44

5+
cd ..
6+
57
perl phylostratiphy.pl \
6-
-blast dysbindin.blast_out.txt \
7-
-tax_folder data/ \
8+
-blast example/dysbindin.blast_out.txt \
9+
-tax_folder ncbi_tax_data/ \
810
-query_taxon 9606 \
9-
-gi_tax_id dysbindin.tax_info.csv \
11+
-gi_tax_id example/dysbindin.tax_info.csv \
1012
-hard 1e-3 \
11-
-virus_list virus_list.txt \
12-
-out test_phylostratiphy
13+
-virus_list example/virus_list.txt \
14+
-out example/test_phylostratiphy
1315

16+
cd example
1417

get_taxonomy_data.sh

Lines changed: 10 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,5 +1,5 @@
11
echo Starting to download NCBI taxonomy db info
2-
out_folder=data
2+
out_folder=ncbi_tax_data
33

44
mkdir $out_folder
55

@@ -9,14 +9,21 @@ cd $out_folder
99
tax_ftp="ftp://ftp.ncbi.nih.gov/pub/taxonomy"
1010
echo Data from FTP folder [ $tax_ftp ]
1111

12-
for file in gi_taxid_prot.dmp.gz gi_taxid_nucl.dmp.gz taxcat.tar.gz taxdump.tar.gz taxdump_readme.txt gi_taxid.readme taxcat_readme.txt
12+
for file in taxdump.tar.gz taxdump_readme.txt
1313
do
1414
wget $tax_ftp/$file
1515
done
16-
16+
1717
echo Uncompressing
1818
ls *.gz | xargs gunzip -v
1919
ls *.tar | perl -ne 'chomp($_); system "tar xvf $_";'
20+
21+
rm citations.dmp delnodes.dmp division.dmp gc.prt gencode.dmp merged.dmp taxdump.tar
22+
23+
echo Files updated on [ `date` ] > files_update_info.txt
24+
25+
cd ..
2026

2127
echo Done
2228

29+

ncbi_tax_data/files_update_info.txt

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1 @@
1+
Files updated on [ Wed 25 Jul 2012 16:18:05 BST ]

0 commit comments

Comments
 (0)