Code:
$ wget ftp://ftp.uniprot.org/pub/databases/uniprot/previous_releases/release10.0/uniref/uniref10.0.tar.gz
...
$ tar -zxvf uniref10.0.tar.gz
uniref100.tar
uniref50.tar
uniref90.tar
$ tar -xvf uniref90.tar
README
uniref90.dtd
uniref90.xml.gz
$ gunzip uniref90.xml.gz
Code:
$ head -n 25 uniref90.xml
<?xml version="1.0" encoding="ISO-8859-1" ?>
<UniRef90 xmlns="http://uniprot.org/uniref"
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
xsi:schemaLocation="http://uniprot.org/uniref http://www.uniprot.org/support/docs/uniref.xsd"
releaseDate="2007-03-06" version="10.0">
<entry id="UniRef90_Q3ASY8" updated="2007-03-06">
<name>Cluster: Parallel beta-helix repeat</name>
<property type="member count" value="1"/>
<property type="common taxon" value="Chlorobium chlorochromatii CaD3"/>
<property type="common taxon ID" value="340177"/>
<representativeMember>
<dbReference type="UniProtKB ID" id="Q3ASY8_CHLCH">
<property type="UniProtKB accession" value="Q3ASY8"/>
<property type="UniParc ID" value="UPI00005D5563"/>
<property type="UniRef100 ID" value="UniRef100_Q3ASY8"/>
<property type="UniRef50 ID" value="UniRef50_Q3ASY8"/>
<property type="protein name" value="Parallel beta-helix repeat"/>
<property type="source organism" value="Chlorobium chlorochromatii (strain CaD3)"/>
<property type="NCBI taxonomy" value="340177"/>
<property type="length" value="36805"/>
<property type="isSeed" value="true"/>
</dbReference>
<sequence length="36805" checksum="A7A8EA21B9345FF9">
MKPRFYIEQLEPRILLSGDILSELVPLLSSREASQMQSDYLLEHPEARRVAPLSAVEAAR
ACMVVVQSEAPSLLTEDGLMYPFEVGVGEERSSEANAEPTLAADFSADYTFSKSEWDALE
Code:
$ grep -c "^<entry id" uniref90.xml
2781437
Update: Raised here: http://lists.open-bio.org/pipermail/...er/010909.html
Leave a comment: