File: Trinity_util.py

package info (click to toggle)
trinityrnaseq 2.15.2%2Bdfsg-2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 468,004 kB
  • sloc: perl: 49,905; cpp: 17,993; java: 12,489; python: 3,282; sh: 1,989; ansic: 985; makefile: 717; xml: 62
file content (26 lines) | stat: -rwxr-xr-x 624 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
#!/usr/bin/python3
# encoding: utf-8

from __future__ import (absolute_import, division,
                        print_function, unicode_literals)

import os, sys, re
import logging

logger = logging.getLogger(__name__)


def get_Trinity_gene_name(transcript_name):
    """
    Extract the gene name from a Trinity transcript identifier.

    The gene name is the transcript identifier with its trailing isoform
    suffix ("_i" followed by one or more digits) removed, e.g.
    "TRINITY_DN1000_c115_g5_i1" -> "TRINITY_DN1000_c115_g5".

    :param transcript_name: Trinity transcript identifier ending in "_i<digits>"
    :return: transcript_name with the trailing "_i<digits>" suffix stripped
    :raises RuntimeError: if transcript_name does not end with such a suffix;
                          the message is also logged at CRITICAL level
    """

    # Raw string: in a plain literal "\d" is an invalid string escape
    # (DeprecationWarning since Python 3.6, SyntaxWarning since 3.12).
    # The pattern is end-anchored, so at most one substitution can occur.
    (gene_name, count) = re.subn(r"_i\d+$", "", transcript_name)
    if count != 1:
        errmsg = "Error, couldn't extract gene_id from transcript_id: {}".format(transcript_name)
        logger.critical(errmsg)
        raise RuntimeError(errmsg)

    return gene_name