# -*- coding: utf-8 # This file is part of Cicero TTS. # Cicero TTS: A Small, Fast and Free Text-To-Speech Engine. # Copyright (C) 2003-2008 Nicolas Pitre # Copyright (C) 2003-2008 Stéphane Doyon # # This program is free software; you can redistribute it and/or modify # it under the terms of the GNU General Public License version 2. # See the accompanying COPYING file for more details. # # This program comes with ABSOLUTELY NO WARRANTY. # Text to phoneme engine: reads language rule, applies filters, # does text-to-phonemes and prosody. import sys, re, os, stat import tracing def trace(msg): mod = 'ttp' tracing.trace(mod+': '+msg) import config from profiling import * def expand_char_class(str, class_list): if str is None: return "" while 1: again = 0 for targ, subs in class_list : str, n = targ.subn(subs, str) again = again + n if not again: break return str def read_rules(filename): phonems = {} rules = {} filters = [] char_class = [] pitch_def = {} f = file(filename, "r") filetime = os.fstat(f.fileno())[stat.ST_MTIME] # remove coments, extra blanks, end of line, etc. cleanup = re.compile( r"\s+#.*|(?\s+\"(.*)\"$" ) # a phonetic rule rule = re.compile( r"^\s*((?P\S+)\s+)?" r"\[\[ (?P\S+) \]\]\s+" r"((?P\S+)\s+)?" r"\-\>\s*(?P.*)$" ) # Special char _ means space for convenience in filter and rule # patterns, unless preceeded with \. underline = re.compile(r'(?= preSpaces+n1 if n1: v = inxposes[preSpaces] elif preSpaces: v = inxposes[preSpaces-1] else: v = 0 inxposes[preSpaces:preSpaces+n1] = [v]*n2 return r, n2 for targ, subs in filters: #text = re.sub(targ, repl, text) prestr = '' preSpaces = 0 while text: m = re.search(targ, text) if not m: prestr += text break pre = text[:m.start()] prestr += pre preSpaces += pre.count(' ') r, nSpaces = repl(m, preSpaces) text = text[m.end():] prestr += r preSpaces += nSpaces text = prestr #print '%s -> %s' % (targ.pattern, subs) #print text assert len(inxposes) == text.count(' ') +1 trace('filter output: <%s>' % text) return text, inxposes class PhonetizeError(Exception): pass def phonetize(text, rules, showrules=0): done = "" res = [] while text: try: for left, right, pho,n, ln, rule_line in rules[text[0]]: lm = left.search(done) if not lm: continue match = right.match(text) if not match: continue if showrules: sys.stderr.write('%d: { %s } -- [ %s | %s | %s ]\n' \ % (ln+1, rule_line, lm.group(), text[:n], match.group()[n:])) # keep last 20 chars of "done" context. 20 is arbitrary. done = (done + text[:n])[-20:] text = text[n:] res.extend(pho) break else: # FIXME: provide necessary debugging info, and a config # option to die (so we notice) or continue (for # non-developers). raise PhonetizeError('No rule matched') done = done + text[0] text = text[1:] except KeyError: # FIXME: provide necessary debugging info sys.stderr.write('Char unmatched <%s> %d\n' % (text[0], ord(text[0]))) done = done + text[0] text = text[1:] return res def prosodize(phono, pitch_def): phono = phono[:] durations = [] pitches = [] speed = 0 while phono: phos = [] v = 0 while phono: p = phono.pop(0) phos.append(p) ty = phonems[p][0] if ty == 'V': v += 1 elif ty == 'P': break if ty != 'P': punc = '_' else: punc = p if v == 0: pitchdef = [] else: try: pitchdef = list(pitch_def[punc][v]) except IndexError: pitchdef = list(pitch_def[punc][-1]) pitchdef[1:1] = [None]*(v-len(pitchdef)) for p in phos: if phonems[p][0] == 'V': pitches.append(pitchdef.pop(0)) else: pitches.append(None) durs = [phonems[p][1] for p in phos] for i,d in enumerate(durs): if speed: durs[i] = d * (100 - speed) / 100 speed /= 2 else: break durs.reverse() speed = pitch_def[punc][0][0] for i,d in enumerate(durs): if speed: durs[i] = d * (100 - speed) / 100 speed /= 2 else: break durs.reverse() durations.extend(durs) speed = pitch_def[punc][0][1] return durations, pitches m = ProfMonitor('ttp.load') rules, filters, phonems, pitch_def, filetime = read_rules(config.rulefile) ~m def checkReloadRules(): try: newtime = os.stat(config.rulefile)[stat.ST_MTIME] except OSError: return global rules, filters, phonems, pitch_def, filetime if newtime >filetime: trace('Reloading updated rules file') try: r,f,ph,pi,ft = read_rules(config.rulefile) except: trace('Error in new rule file, keeping old rule set') filetime = newtime # don't retry until it changes again. return else: rules, filters, phonems, pitch_def, filetime = r,f,ph,pi,ft spaces = re.compile(r'\s+') def init_inxposes(str): # Original input length inputLen = len(str) # Note index position in original input where stretches of spaces end. inxposes = [] def repl(m): inxposes.append(m.end()) # keep a flag ("\t") to indicate the presence of multiple spaces return " \t"[:len(m.group())] str = spaces.sub(repl, str) # Last index is a bit special: marks end of text. inxposes.append(inputLen) return str, inxposes def word2filtered(str): str, inxposes = init_inxposes(str) str, inxposes = filter_text(str, filters, inxposes) return str def word2phons(str, showrules=0): checkReloadRules() str, inxposes = init_inxposes(str) str, inxposes = filter_text(str, filters, inxposes) phono = phonetize(str, rules, showrules) return ' '.join(phono) def mkIndexes(phono, durations, inxposes): total_dur = 0 # indexes: list of tuples: time in ms, position in original input. indexes = [(0,0)] for pho,dur in zip(phono, durations): total_dur += dur if pho in ('_', '&', '-'): indexes.append( (total_dur, inxposes.pop(0)) ) # end marker indexes.append( (total_dur, inxposes.pop(0)) ) return indexes def mkMbrola(phono, durations, pitches): out = [] for pho,dur,pitch in zip(phono, durations, pitches): if not dur: continue if phonems[pho][0] == 'P': pho = '_' out.append("%s\t%d\t%s\n" % (pho, dur, pitch or "")) # we insert "_ 1" to avoid a "o-_ Concat : PANIC, check your pitch :-)" # from mbrola in some cases. out.append("_\t1\n#\n") out = "".join(out) return out def phons2mbrola(phono): durations, pitches = prosodize(phono, pitch_def) out = mkMbrola(phono, durations, pitches) return out for f in ('init_inxposes', 'filter_text', 'phonetize', 'prosodize', 'mkIndexes', 'mkMbrola'): globals()[f] = ProfProxy('ttp.'+f, globals()[f]) def process(str, showrules=0): checkReloadRules() # FIXME: we ought to cleanup non-printables somewhere. str, inxposes = init_inxposes(str) str, inxposes = filter_text(str, filters, inxposes) phono = phonetize(str, rules, showrules) #trace(phono) assert len(re.findall('[_&-]', ' '.join(phono))) +1 == len(inxposes) durations, pitches = prosodize(phono, pitch_def) indexes = mkIndexes(phono, durations, inxposes) out = mkMbrola(phono, durations, pitches) return out, indexes if 0 and __name__ == "__main__": # Speak text read from command-line. # Deprecated. See tts_shell.py and app_shell.py. # I'm keeping it as a bare bones example. cmd = config.mbrola_prog_path \ + " -f " + str(config.mbrola_f) \ + " -t " + str(config.mbrola_t) \ + " -e " + config.mbrola_voice \ + " - -.raw | sox -traw -r16000 -c1 -w -s - " + config.snd_dev import os pipe = os.popen(cmd, 'w') while 1: line = sys.stdin.readline() if not line: break out, indexes = process(line) out = out.split('\n') out.insert(0, "_\t50") out.insert(-2, "_\t500") out = '\n'.join(out) print out #print indexes pipe.write(out) pipe.flush()