Statistics
| Branch: | Tag: | Revision:

hlrc / tts_bridge / mary / mary_tts_bridge / MaryTTSBridge.py @ e95c8376

History | View | Annotate | Download (6.089 KB)

1 0c15613f Simon Schulz
#!/usr/bin/python
2
"""
3
This file is part of hlrc
4

5
Copyright(c) sschulz <AT> techfak.uni-bielefeld.de
6
http://opensource.cit-ec.de/projects/hlrc
7

8
This file may be licensed under the terms of the
9
GNU General Public License Version 3 (the ``GPL''),
10
or (at your option) any later version.
11

12
Software distributed under the License is distributed
13
on an ``AS IS'' basis, WITHOUT WARRANTY OF ANY KIND, either
14
express or implied. See the GPL for the specific language
15
governing rights and limitations.
16

17
You should have received a copy of the GPL along with this
18
program. If not, go to http://www.gnu.org/licenses/gpl.html
19
or write to the Free Software Foundation, Inc.,
20
51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
21

22
The development of this software was supported by the
23
Excellence Cluster EXC 277 Cognitive Interaction Technology.
24
The Excellence Cluster EXC 277 is a grant of the Deutsche
25
Forschungsgemeinschaft (DFG) in the context of the German
26
Excellence Initiative.
27
"""
28
29
import logging
30
import rospy
31
from hlrc_server.msg import *
32
import time
33
import sys
34
import actionlib
35
from io import BytesIO
36
import wave
37 e21d7f2c Simon Schulz
import os
38
import pkgutil
39 836f314c Robert Haschke
from .MaryTTSClient import *
40
try:
41
    from io import StringIO
42
except ImportError:
43
    from cStringIO import StringIO
44 0c15613f Simon Schulz
45
46 909e9261 Robert Haschke
class MaryTTSBridge(object):
47
    # _feedback = ttsActionFeedback()
48
    # _result   = ttsActionResult()
49 0c15613f Simon Schulz
50
    def __init__(self, topic, voice="cmu-slt-hsmm", locale="en_GB", tts_host="127.0.0.1", tts_port=59125, loglevel=logging.WARNING):
51 909e9261 Robert Haschke
        """initialise
52
        :param  loglevel: optional log level
53
        """
54
        self.loglevel = loglevel
55
        self.logger = logging.getLogger(__name__)
56
        # create nice and actually usable formatter and add it to the handler
57
        self.config_logger(loglevel)
58
        self.logger.info("starting MaryTTSBridge on topic '"+topic+"'")
59 0c15613f Simon Schulz
60 909e9261 Robert Haschke
        self.tts_client = MaryTTSClient(voice, locale, tts_host, tts_port, loglevel)
61 0c15613f Simon Schulz
62 909e9261 Robert Haschke
        rospy.init_node('MaryTTSBridge', anonymous=True)
63 0c15613f Simon Schulz
64 909e9261 Robert Haschke
        self._action_name = topic
65
        self._as = actionlib.SimpleActionServer(self._action_name, ttsAction, execute_cb = self.execute_cb, auto_start = False)
66
        self._as.start()
67 0c15613f Simon Schulz
68
    def __del__(self):
69 909e9261 Robert Haschke
        """destructor
70
        """
71
        self.logger.debug("destructor of MaryTTSBridge called")
72 0c15613f Simon Schulz
73
    def config_logger(self, level):
74 909e9261 Robert Haschke
        """initialise a nice logger formatting
75
        :param  level: log level
76
        """
77
        formatter = logging.Formatter('%(asctime)s %(name)-30s %(levelname)-8s > %(message)s')
78
        ch = logging.StreamHandler()
79
        #ch.setLevel(level)
80
        ch.setFormatter(formatter)
81
        self.logger.setLevel(level)
82
        self.logger.addHandler(ch)
83 0c15613f Simon Schulz
84
    def create_soundchunk(self, audio_data):
85 909e9261 Robert Haschke
        #extract wave from data
86
        fio = BytesIO(audio_data)
87
        wav = wave.open(fio)
88
89
        s = soundchunk()
90
91
        s.channels = wav.getnchannels()
92
        s.data = audio_data
93
        s.endianess = s.ENDIAN_LITTLE  # guessed?!
94
        s.rate = wav.getframerate()
95
        s.samplecount = wav.getnframes()
96
97
        # sample format:
98
        sample_width = wav.getsampwidth()
99
        if (sample_width == 1):
100
            s.sample_type = s.SAMPLE_U8
101
        elif (sample_width == 2):
102
            s.sample_type = s.SAMPLE_U16
103
        elif (sample_width == 3):
104
            s.sample_type = s.SAMPLE_U24
105
        else:
106
            self.logger.error("ERROR: invalid sample width "+str(sample_width) + " detected")
107
            s = soundchunk()
108
109
        self.logger.info("created soundchunk with "+str(s.samplecount)+" samples")
110
111
        return s
112 0c15613f Simon Schulz
113 836f314c Robert Haschke
    def create_phonemes(self, phoneme_bytes):
114 909e9261 Robert Haschke
        last = 0.0
115
        plist = []
116 0c15613f Simon Schulz
117 909e9261 Robert Haschke
        sio = StringIO(phoneme_bytes.decode('ascii'))
118
        for line in sio:
119
            if (line[0] != '#'):
120
                phoneme_list = line.split(" ")
121 e21d7f2c Simon Schulz
                if (line == '\n'):
122 909e9261 Robert Haschke
                    # ignore empty lines
123 e21d7f2c Simon Schulz
                    continue
124
                elif (len(phoneme_list) != 3):
125
                    print("> could not split line '%s' during phoneme seperation\n" % (line))
126
                else:
127 909e9261 Robert Haschke
                    symbol = phoneme_list[2]
128
                    symbol = symbol.rstrip()
129 e21d7f2c Simon Schulz
130 909e9261 Robert Haschke
                    now = float(phoneme_list[0])
131
                    duration = (now - last)*1000
132
                    last = now
133
                    plist.append(phoneme(symbol, int(duration)))
134 0c15613f Simon Schulz
135 909e9261 Robert Haschke
        self.logger.info("created phonemelist with " + str(len(plist)) + " elements")
136 0c15613f Simon Schulz
137 909e9261 Robert Haschke
        return plist
138 0c15613f Simon Schulz
139
    def create_utterance(self, text, audio_data, phoneme_list):
140 909e9261 Robert Haschke
        u = utterance()
141
        u.text     = text
142
        u.audio    = self.create_soundchunk(audio_data)
143
        u.phonemes = self.create_phonemes(phoneme_list)
144 0c15613f Simon Schulz
145 909e9261 Robert Haschke
        self.logger.info("created utterance for 'phonemelist with '" + u.text + "'")
146
        return u
147 0c15613f Simon Schulz
148 e21d7f2c Simon Schulz
    def get_error_message(self):
149
        data_wav = pkgutil.get_data('mary_tts_bridge', 'data/connection_failed.wav')
150
        data_phonemes = pkgutil.get_data('mary_tts_bridge', 'data/connection_failed.phonemes')
151
        return (data_wav, data_phonemes)
152
153 0c15613f Simon Schulz
    def execute_cb(self, goal):
154 909e9261 Robert Haschke
        self.logger.info("incoming utterance '" + goal.text + "'")
155 0c15613f Simon Schulz
156 909e9261 Robert Haschke
        success = True
157
        result  = ttsResult()
158 0c15613f Simon Schulz
159 909e9261 Robert Haschke
        # incoming msg, ask mary tts for data:
160
        try:
161
            audio     = self.tts_client.generate_audio(goal.text)
162
            phonelist = self.tts_client.generate_phonemes(goal.text)
163 0c15613f Simon Schulz
164 909e9261 Robert Haschke
        except:
165
            self.logger.error("failed to create utterance error = '" + str(sys.exc_info()[1]) + "'")
166
            # try to open error message from file:
167 e21d7f2c Simon Schulz
            success = True
168
            (audio, phonelist) = self.get_error_message()
169 0c15613f Simon Schulz
170 909e9261 Robert Haschke
        if success:
171
            # build soundchunk
172
            result.utterance = self.create_utterance(goal.text, audio, phonelist)
173
            self._as.set_succeeded(result)
174
        else:
175
            self._as.set_aborted(result)
176 0c15613f Simon Schulz
177
    def run(self):
178 909e9261 Robert Haschke
        # run the main loop
179
        rospy.spin()
180 0c15613f Simon Schulz
181 909e9261 Robert Haschke
# test code
182 163a7434 Simon Schulz
def main():
183 0c15613f Simon Schulz
    if (len(sys.argv) != 2):
184 909e9261 Robert Haschke
        print("> usage: "+sys.argv[0]+" <topic>\n\n")
185
        sys.exit(1)
186 0c15613f Simon Schulz
187
    bridge = MaryTTSBridge(topic=sys.argv[1], loglevel=logging.INFO)
188
    bridge.run()
189
190 163a7434 Simon Schulz
if __name__ == "__main__":
191
    main()