#!/bin/tcsh -efx
# Script to create a relational version of UniProt database.  Should be run on
# hgwdev.
#
# Shell flags: -e aborts on the first failing command, -f skips the startup
# files, -x echoes each command before it is executed.

# Set up working directory
mkdir -p /hive/data/outside/swissprot/111004/build

# Download swissprot. This will take about 90 minutes.
cd /hive/data/outside/swissprot/111004/build
wget ftp://ftp.expasy.org/databases/uniprot/current_release/knowledgebase/complete/uniprot_sprot.dat.gz
wget ftp://ftp.expasy.org/databases/uniprot/current_release/knowledgebase/complete/uniprot_trembl.dat.gz
wget ftp://ftp.expasy.org/databases/uniprot/current_release/knowledgebase/complete/uniprot_sprot_varsplic.fasta.gz

# Turn flat file into relational tab-separated files.  The -dupeOk flag was
# needed this time for spToDb since there were things in swissProt that had
# not been removed from trEMBL.  This step takes about 20 minutes.
# NOTE(review): the command below does not pass -dupeOk even though the
# comment above says it was needed -- confirm which of the two is stale.
zcat *.dat.gz | spToDb stdin ../tabFiles

# Create the database.
hgsql mysql <