File: Trinity_util.py

package info (click to toggle)
trinityrnaseq 2.6.6%2Bdfsg-6
  • links: PTS, VCS
  • area: main
  • in suites: buster
  • size: 346,416 kB
  • sloc: perl: 47,542; cpp: 20,209; java: 12,484; python: 2,766; sh: 1,665; makefile: 895; ansic: 90; xml: 83
file content (26 lines) | stat: -rwxr-xr-x 628 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
#!/usr/bin/env python3
# encoding: utf-8

from __future__ import (absolute_import, division,
                        print_function, unicode_literals)

import os, sys, re
import logging

logger = logging.getLogger(__name__)


def get_Trinity_gene_name(transcript_name):
    """
    Extract the gene name from a Trinity transcript identifier.

    The gene name is the transcript identifier with its trailing
    isoform suffix (``_i`` followed by one or more digits) removed, e.g.
    ``TRINITY_DN1000_c115_g5_i1`` -> ``TRINITY_DN1000_c115_g5``.

    Only a suffix anchored at the end of the string is stripped; an
    ``_i<digits>`` occurring earlier in the identifier is left intact.

    :param transcript_name: transcript identifier ending in ``_i<digits>``
    :returns: the identifier with the trailing ``_i<digits>`` removed
    :raises RuntimeError: if the identifier has no trailing ``_i<digits>``
        suffix (the failure is also logged at CRITICAL level)
    """

    # Raw string: "\d" in a plain literal is an invalid escape sequence
    # (DeprecationWarning since 3.6, SyntaxWarning since 3.12).
    (gene_name, count) = re.subn(r"_i\d+$", "", transcript_name)

    # The pattern is end-anchored, so exactly one substitution means the
    # suffix was present; zero means the identifier is not in the
    # expected format.
    if count != 1:
        errmsg = "Error, couldn't extract gene_id from transcript_id: {}".format(transcript_name)
        logger.critical(errmsg)
        raise RuntimeError(errmsg)

    return gene_name