root/galaxy-central/scripts/metagenomics/process_BLAST_db.sh

リビジョン 2, 0.8 KB (コミッタ: hatakeyama, 14 年 前)

import galaxy-central

行番号 
# Download the NCBI "nt" and "wgs" FASTA dumps and turn each one into a
# formatted BLAST database named "<db>.chunk" in the current directory.
#
# Usage: run from the directory that contains convert_title.py, e.g.
#   sh process_BLAST_db.sh
#
# Each download is streamed through convert_title.py (which rewrites the FASTA
# title lines) straight into formatdb, so the uncompressed FASTA is never
# written to disk. The downloaded archive is removed only after formatting
# succeeded.
#
# Only POSIX sh constructs are used, because the interpreter this script is
# launched with is not fixed by the file itself.

# Stop at the first failing command or unset variable instead of carrying on
# with a missing or truncated download.
set -eu

# Without pipefail only formatdb's exit status would count, so a failing
# gunzip or python stage would go unnoticed. Not every sh implements the
# option, so probe for it in a subshell before enabling it.
if (set -o pipefail) 2>/dev/null; then
  set -o pipefail
fi

# Print a message on stderr and abort the script.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

# Check the prerequisites up front: discovering a missing tool only after a
# multi-hour download would waste the whole transfer.
for required_tool in wget gunzip python formatdb; do
  command -v "$required_tool" >/dev/null 2>&1 \
    || die "Required tool not found in PATH: $required_tool"
done
[ -f convert_title.py ] \
  || die "convert_title.py not found in the current directory"

# Fetch one FASTA dump from the NCBI FTP site and format it.
# Arguments: $1 - database name ("nt" or "wgs"); used for the remote file
#                 name (<name>.gz) and the output base name (<name>.chunk).
# Outputs:   progress messages on stdout; formatted database files in the
#            current directory.
# Returns:   does not return on failure (set -e aborts the script), leaving
#            the downloaded archive in place for inspection.
build_blast_db() {
  db_name=$1
  db_archive="${db_name}.gz"

  echo "Getting ${db_name} database from NCBI..."
  # -O pins the local file name: without it wget saves to "<name>.gz.1" when
  # a stale archive from an earlier run exists, and the stale file would be
  # the one that gets formatted below.
  wget -O "$db_archive" \
    "ftp://ftp.ncbi.nlm.nih.gov/blast/db/FASTA/${db_archive}"

  echo "Changing fasta title lines to >ginumber_seqlength..."
  echo "Formatting ${db_name} database to chunks of 2GB each..."
  # formatdb reads the converted FASTA from stdin; -v 2000 sets the volume
  # size that splits the output into the chunks announced above.
  gunzip -c "$db_archive" \
    | python convert_title.py \
    | formatdb -i stdin -p F -n "${db_name}.chunk" -v 2000

  echo "Remove the zip file, keep the formatted files."
  rm -- "$db_archive"
}

echo "This will take several hours to finish due to the size of the databases (about 30GB)..."
build_blast_db nt

build_blast_db wgs

echo "Job finished"
Note: リポジトリブラウザについてのヘルプは TracBrowser を参照してください。