1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57
|
#
# Copyright (C) 2010-2017 Institute for Computational Biomedicine,
# Weill Medical College of Cornell University
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
""" Contains classes that can parse sequence base information data
stored in the .sbi format. See the Goby3 and variation analysis projects
for details about this file format.
"""
import gzip
import goby.SegmentInformationRecords_pb2
import goby.MessageChunks
def SequenceSegmentInformationGenerator(basename, verbose=False):
""" Generator to parse .ssi files.
"""
if not basename.endswith(".ssi"):
basename+=".ssi"
collection = goby.SegmentInformationRecords_pb2.SegmentInformationCollection()
for ssi_records in goby.MessageChunks.MessageChunksGenerator(
basename, collectionContainer=collection):
for ssi_record in ssi_records.records:
yield ssi_record
def SequenceSegmentInformationStreamGenerator(basename, verbose=False):
""" Generator to parse .ssi files and endlessly generate SegmentInformation records from them, starting again
from the beginning of the file when the end is reached.
"""
if not basename.endswith(".ssi"):
basename+=".ssi"
while True:
collection = goby.SegmentInformationRecords_pb2.SegmentInformationCollection()
for ssi_records in goby.MessageChunks.MessageChunksGenerator(
basename, collectionContainer=collection):
for ssi_record in ssi_records.records:
yield ssi_record
|