Added GenBank parser support (genbankIterator wired into entryIteratorFactory and open_uri)

This commit is contained in:
Celine Mercier
2019-03-15 16:06:27 +01:00
parent e8090a44c9
commit 7e20870719
2 changed files with 18 additions and 0 deletions

View File

@ -6,6 +6,7 @@ from obitools3.parsers.fastq import fastqIterator
from obitools3.parsers.tab import tabIterator
from obitools3.parsers.ngsfilter import ngsfilterIterator
from obitools3.parsers.embl import emblIterator
from obitools3.parsers.genbank import genbankIterator
oligore = re.compile(b"^[ACGTRYSWKMBDHVN]+$",re.I)
@ -135,6 +136,15 @@ def entryIteratorFactory(lineiterator,
buffersize=buffersize),
Nuc_Seq,
format)
elif format==b'genbank':
return (genbankIterator(lineiterator,
skip=skip,
only=only,
firstline=first,
buffersize=buffersize),
Nuc_Seq,
format)
raise NotImplementedError('File format iterator not implemented yet')

View File

@ -10,6 +10,7 @@ from obitools3.parsers.fastq import fastqIterator
from obitools3.parsers.tab import tabIterator
from obitools3.parsers.ngsfilter import ngsfilterIterator
from obitools3.parsers.embl import emblIterator
from obitools3.parsers.genbank import genbankIterator
from obitools3.parsers.universal import entryIteratorFactory
from obitools3.writers.fasta import FastaNucWriter
@ -478,6 +479,13 @@ def open_uri(uri,
only=only)
else:
raise NotImplementedError('Output sequence file format not implemented')
elif format==b"genbank":
if input:
iseq = genbankIterator(file,
skip=skip,
only=only)
else:
raise NotImplementedError('Output sequence file format not implemented')
else:
raise NotImplementedError('Sequence file format not implemented')
elif seqtype==b"prot":