Read Genome

[ ]:
import modelseedpy
from modelseedpy.core.msgenome import MSGenome
from modelseedpy.core.rast_client import RastClient
[ ]:
genome = MS
[2]:
rast = RastClient()
[18]:
genome = MSGenome.from_fasta('GCF_000005845.2.faa', split=' ')
[19]:
print('Number of features:', len(genome.features))
Number of features: 3
[ ]:
for f in genome.features:
    print(f.id, len(f.seq), f.description)
[14]:
rast.annotate_genome(genome)
[14]:
[{'execution_time': 1622756127.36331,
  'tool_name': 'kmer_search',
  'hostname': 'pear',
  'parameters': ['-a',
   '-g',
   200,
   '-m',
   5,
   '-d',
   '/opt/patric-common/data/kmer_metadata_v2',
   '-u',
   'http://pear.mcs.anl.gov:6100/query'],
  'id': '9CCA6D20-C4B3-11EB-A893-36A8BEF382BD'},
 {'parameters': ['annotate_hypothetical_only=1',
   'dataset_name=Release70',
   'kmer_size=8'],
  'hostname': 'pear',
  'tool_name': 'KmerAnnotationByFigfam',
  'id': '9CE3769E-C4B3-11EB-A893-36A8BEF382BD',
  'execution_time': 1622756127.52738},
 {'execute_time': 1622756127.88296,
  'hostname': 'pear',
  'parameters': [],
  'tool_name': 'annotate_proteins_similarity',
  'id': '9D19B7EA-C4B3-11EB-9714-71B3BDF382BD'}]

Equivalent call from the client it self

[15]:
#genome, res = rast.annotate_genome_from_fasta('GCF_000005845.2_ASM584v2_protein.faa', split=' ')
#res
[34]:
feature = genome.features.get_by_id('YP_588478.1')
[36]:
feature.ontology_terms
[36]:
{'RAST': 'DUF1435 domain-containing protein YjjZ [Escherichia coli str. K-12 substr. MG1655]'}
[ ]:
feature.add_ontology_term('')