File size: 851 Bytes
70b95b8 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 |
#!/usr/bin/python
# coding: utf-8
# Author: LE YUAN
# Date: 2020-06-25
# This python script is to obtain protein sequence by uniprot protein id
from urllib import request
# This function is to obtain the protein sequence according to the protein id from Uniprot API
# https://www.uniprot.org/uniprot/A0A1D8PIP5.fasta
# https://www.uniprot.org/help/api_idmapping
def uniprot_sequence(id) :
url = "https://www.uniprot.org/uniprot/%s.fasta" % id
IdSeq = dict()
try :
data = request.urlopen(url)
respdata = data.read().decode("utf-8").strip()
IdSeq[id] = "".join(respdata.split("\n")[1:])
except :
print(id, "can not find from uniprot!")
IdSeq[id] = None
print(IdSeq[id])
# return IdSeq[id]
def main() :
uniprot_sequence('P49384')
if __name__ == "__main__" :
main()
|