1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42
|
#
# Copyright (C) 2010-2017 Institute for Computational Biomedicine,
# Weill Medical College of Cornell University
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
""" Contains classes that can parse sequence base information data
stored in the .sbi format. See the Goby3 and variation analysis projects
for details about this file format.
"""
import gzip
import goby.BaseInformationRecords_pb2
import goby.MessageChunks
def SequenceBaseInformationGenerator(basename, verbose=False):
""" Generator to parse .sbi files.
"""
if not basename.endswith(".sbi"):
basename+=".sbi"
collection = goby.BaseInformationRecords_pb2.BaseInformationCollection()
for sbi_records in goby.MessageChunks.MessageChunksGenerator(
basename, collectionContainer=collection):
for sbi_record in sbi_records.records:
yield sbi_record
|