o
    Rŀg                     @   sR   d Z ddlmZ ddlmZ ddlmZ dd Zedkr'ddl	m
Z
 e
  d	S d	S )
a   Bio.SeqIO support for the "ace" file format.

You are expected to use this module via the Bio.SeqIO functions.
See also the Bio.Sequencing.Ace module which offers more than just accessing
the contig consensus sequences in an ACE file as SeqRecord objects.
    )Seq)	SeqRecord)Acec                 c   s    t | D ]U}|j}d|v rd|vsJ t|dd}nt|}t||j|jd}g }d}|D ]}|dkr=|d q1||j|  |d7 }q1|t	|jksSJ ||j
d< |V  qdS )a  Return SeqRecord objects from an ACE file.

    This uses the Bio.Sequencing.Ace module to do the hard work.  Note that
    by iterating over the file in a single pass, we are forced to ignore any
    WA, CT, RT or WR footer tags.

    Ace files include the base quality for each position, which are taken
    to be PHRED style scores. Just as if you had read in a FASTQ or QUAL file
    using PHRED scores using Bio.SeqIO, these are stored in the SeqRecord's
    letter_annotations dictionary under the "phred_quality" key.

    >>> from Bio import SeqIO
    >>> with open("Ace/consed_sample.ace") as handle:
    ...     for record in SeqIO.parse(handle, "ace"):
    ...         print("%s %s... %i" % (record.id, record.seq[:10], len(record)))
    ...         print(max(record.letter_annotations["phred_quality"]))
    Contig1 agccccgggc... 1475
    90

    However, ACE files do not include a base quality for any gaps in the
    consensus sequence, and these are represented in Biopython with a quality
    of zero. Using zero is perhaps misleading as there may be very strong
    evidence to support the gap in the consensus. Previous versions of
    Biopython therefore used None instead, but this complicated usage, and
    prevented output of the gapped sequence as FASTQ format.

    >>> from Bio import SeqIO
    >>> with open("Ace/contig1.ace") as handle:
    ...     for record in SeqIO.parse(handle, "ace"):
    ...         print("%s ...%s..." % (record.id, record.seq[85:95]))
    ...         print(record.letter_annotations["phred_quality"][85:95])
    ...         print(max(record.letter_annotations["phred_quality"]))
    Contig1 ...AGAGG-ATGC...
    [57, 57, 54, 57, 57, 0, 57, 72, 72, 72]
    90
    Contig2 ...GAATTACTAT...
    [68, 68, 68, 68, 68, 68, 68, 68, 68, 68]
    90

    *-)idnamer      phred_qualityN)r   parsesequencer   replacer   r   appendqualitylenletter_annotations)source
ace_contigconsensus_seq_strconsensus_seq
seq_recordqualsibase r   C/var/www/html/myenv/lib/python3.10/site-packages/Bio/SeqIO/AceIO.pyAceIterator   s&   )	

r   __main__)run_doctestN)__doc__Bio.Seqr   Bio.SeqRecordr   Bio.Sequencingr   r   __name__
Bio._utilsr   r   r   r   r   <module>   s   P
