Add some docs to fasta module

2008-03-18 17:02:40 +00:00
parent f5c818bff2
commit de2b771e19
1 changed files with 65 additions and 1 deletions
--- a/src/obitools/fasta.py
+++ b/src/obitools/fasta.py
@ -1,3 +1,9 @@
 """
 fasta module provides functions to read and write sequences in fasta format.
 """
 from obitools import bioSeqGenerator,BioSequence,AASequence,NucSequence
 from obitools.align import alignmentReader
 from obitools.utils import universalOpen
@ -9,6 +15,28 @@ def _fastaJoinSeq(seqarray):
    return  ''.join([x.strip() for x in seqarray])
 def _parseFasta(seq,bioseqfactory,tagparser=_fastaTag,joinseq=_fastaJoinSeq):
    '''
    Parse a fasta record.
    @attention: internal purpose function
    @param seq: a sequence object containing all lines corresponding
                to one fasta sequence
    @type seq: C{list} or C{tuple} of C{str}
    @param bioseqfactory: a callable object returning a BioSequence
                          instance.
    @type bioseqfactory: a callable object
    @param tagparser: a compiled regular expression usable
                      to identify key, value couples from 
                      title line.
    @type tagparser: regex instance
    @return: a C{BioSequence} instance   
    @see: L{FastaIterator} 
    '''
    title = seq[0].strip()[1:].split(None,1)
    id=title[0]
    if len(title) == 2:
@ -39,6 +67,17 @@ def fastaIterator(file,bioseqfactory=bioSeqGenerator,tagparser=_fastaTag,joinseq
    @param bioseqfactory: a callable object returning a BioSequence
                          instance.
    @type bioseqfactory: a callable object
    @param tagparser: a compiled regular expression usable
                      to identify key, value couples from 
                      title line.
    @type tagparser: regex instance
    @return: an iterator on C{BioSequence} instance
    @see: L{fastaNucIterator}
    @see: L{fastaAAIterator}
    '''
    file = universalOpen(file,'ru')
@ -59,6 +98,16 @@ def fastaNucIterator(file,tagparser=_fastaTag):
    @param file: a line iterator containing fasta data
    @type file: an iterable object
    @param tagparser: a compiled regular expression usable
                      to identify key, value couples from 
                      title line.
    @type tagparser: regex instance
    @return: an iterator on C{NucSequence} instances
    @see: L{fastaIterator}
    @see: L{fastaAAIterator}
    '''
    return fastaIterator(file, NucSequence,tagparser)
@ -68,8 +117,18 @@ def fastaAAIterator(file,tagparser=_fastaTag):
    Returned sequences by this iterator will be AASequence
    instances
-    @param file: a line iterator containint fasta data
+    @param file: a line iterator containing fasta data
    @type file: an iterable object
    @param tagparser: a compiled regular expression usable
                      to identify key, value couples from 
                      title line.
    @type tagparser: regex instance
    @return: an iterator on C{AASequence} instances
    @see: L{fastaIterator}
    @see: L{fastaNucIterator}
    '''
    return fastaIterator(file, AASequence,tagparser)
@ -82,6 +141,11 @@ def formatFasta(data,gbmode=False):
    @type data: BioSequence instance or an iterable object 
                on BioSequence instances
    @param gbmode: if set to C{True} identifier part of the title
                   line follows the recommendation from NCBI to allow
                   sequence indexing with the blast formatdb command.
    @type gbmode: bool
    @return: a fasta formatted string
    @rtype: str
    '''