File: Trinity_util.py

package info (click to toggle)
trinityrnaseq 2.11.0%2Bdfsg-6
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 417,528 kB
  • sloc: perl: 48,420; cpp: 17,749; java: 12,695; python: 3,124; sh: 1,030; ansic: 983; makefile: 688; xml: 62
file content (26 lines) | stat: -rwxr-xr-x 624 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
#!/usr/bin/python3
# encoding: utf-8

from __future__ import (absolute_import, division,
                        print_function, unicode_literals)

import os, sys, re
import logging

# Module-level logger, named after this module.
logger = logging.getLogger(__name__)


def get_Trinity_gene_name(transcript_name):
    """
    Extract the gene name from a Trinity transcript identifier.

    The gene name is the transcript identifier with its trailing isoform
    suffix (``_i`` followed by one or more digits) removed, e.g.
    ``TRINITY_DN1000_c115_g5_i1`` -> ``TRINITY_DN1000_c115_g5``.

    :param transcript_name: Trinity transcript identifier (string).
    :return: the identifier with the trailing ``_i<digits>`` removed.
    :raises RuntimeError: if the identifier does not end in ``_i<digits>``;
        the failure is also logged at CRITICAL level.
    """

    # Raw string: "\d" inside a normal string literal is an invalid escape
    # sequence (a SyntaxWarning on recent Python versions).
    # NOTE: "$" also matches just before a single trailing newline, so an
    # unstripped line such as "gene_i1\n" is accepted and keeps its newline.
    (gene_name, count) = re.subn(r"_i\d+$", "", transcript_name)

    # The pattern is anchored at the end, so count is either 0 (no isoform
    # suffix present) or 1 (suffix stripped).
    if count != 1:
        errmsg = "Error, couldn't extract gene_id from transcript_id: {}".format(transcript_name)
        logger.critical(errmsg)
        raise RuntimeError(errmsg)

    return gene_name