Source code for bioconvert.gff32gff2

###########################################################################
# Bioconvert is a project to facilitate the interconversion               #
# of life science data from one format to another.                        #
#                                                                         #
# Copyright © 2018-2022  Institut Pasteur, Paris and CNRS.                #
#                                                                         #
# bioconvert is free software: you can redistribute it and/or modify      #
# it under the terms of the GNU General Public License as published by    #
# the Free Software Foundation, either version 3 of the License, or       #
# (at your option) any later version.                                     #
#                                                                         #
# bioconvert is distributed in the hope that it will be useful,           #
# but WITHOUT ANY WARRANTY; without even the implied warranty of          #
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the           #
# GNU General Public License for more details.                            #
#                                                                         #
# You should have received a copy of the GNU General Public License       #
# along with this program (COPYING file).                                 #
# If not, see <http://www.gnu.org/licenses/>.                             #
#                                                                         #
# Repository: https://github.com/bioconvert/bioconvert                    #
# Documentation: http://bioconvert.readthedocs.io                         #
###########################################################################

"""Convert :term:`GFF3` to :term:`GFF2` format"""
from Bio import SeqIO

from bioconvert import ConvBase, compressor
from bioconvert.core.decorators import requires_nothing
from bioconvert.io.gff3 import Gff3


[docs]class GFF32GFF2(ConvBase): """Convert :term:`GFF2` to :term:`GFF3` Method available is Python-based.""" #: Default value _default_method = "bioconvert" def __init__(self, infile, outfile, *args, **kargs): """.. rubric:: constructor :param str infile: input GFF3 filename :param str outfile: output GFF2 filename """ super(GFF32GFF2, self).__init__(infile, outfile, *args, **kargs)
[docs] @requires_nothing @compressor def _method_bioconvert(self, *args, **kwargs): """This method is a basic mapping of the 9th column of gff2 to gff3. Other methods with smart translations must be created for specific usages. There is no good solution for this translation. """ gff3_reader = Gff3(self.infile) with open(self.outfile, "w") as gff2_writer: for annotation in gff3_reader.read(): # Write the 8 first columns gff2_writer.write( "{}\t{}\t{}\t{}\t{}\t{}\t{}\t{}\t".format( annotation["seqid"], annotation["source"] if "source" in annotation else ".", # optional sourse annotation["type"], # should be verified for ontology matching annotation["start"], annotation["stop"], annotation["score"] if "score" in annotation else ".", # Score annotation["strand"] if "strand" in annotation else ".", # starnd annotation["phase"] if "phase" in annotation else ".", # phase ) ) # Write the 9th column using new standards but without smart translations if len(annotation["attributes"]) > 0: attributes = [] for key, value in annotation["attributes"].items(): if isinstance(value, list): value = ",".join(value) # add the value attributes.append('{} "{}"'.format(key, value)) gff2_writer.write("; ".join(attributes) + "\n") else: gff2_writer.write(".\n")