/tts_bridge/mary/mary_tts_bridge/MaryTTSClient.py - hlrc - Research for Cognitive Interaction

hlrc / tts_bridge / mary / mary_tts_bridge / MaryTTSClient.py @ 38936fe1

History | View | Annotate | Download (3.549 KB)

       """
       This file is part of hlrc
       Copyright(c) sschulz <AT> techfak.uni-bielefeld.de
       http://opensource.cit-ec.de/projects/hlrc
       This file may be licensed under the terms of the
       GNU General Public License Version 3 (the ``GPL''),
       or (at your option) any later version.
       Software distributed under the License is distributed
       on an ``AS IS'' basis, WITHOUT WARRANTY OF ANY KIND, either
       express or implied. See the GPL for the specific language
       governing rights and limitations.
       You should have received a copy of the GPL along with this
       program. If not, go to http://www.gnu.org/licenses/gpl.html
       or write to the Free Software Foundation, Inc.,
       51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
       The development of this software was supported by the
       Excellence Cluster EXC 277 Cognitive Interaction Technology.
       The Excellence Cluster EXC 277 is a grant of the Deutsche
       Forschungsgemeinschaft (DFG) in the context of the German
       Excellence Initiative.
       """
       import logging
       #try:
       #        import rsb
       #except ImportError:
       #        RSB_SUPPORT = False
       #else:
       #        from MiddlewareRSB import *
       #        RSB_SUPPORT = True
       #from MiddlewareROS import *
       import sys
       try:
               from http.client import HTTPConnection
               from urllib.parse import urlencode
       except ImportError:  # Python 2
               from httplib import HTTPConnection
               from urllib import urlencode
       import wave
       import ctypes
       import wave
       import sys
       class MaryTTSClient:
           """Small HTTP client that posts text to a MaryTTS server's /process endpoint.

           The connection settings (host, port, voice, locale) are stored on the
           instance; every call to :meth:`generate` opens a fresh connection,
           sends one POST request and closes the connection again.
           """

           def __init__(self, voice="cmu-slt-hsmm", locale="en_US", tts_host="127.0.0.1", tts_port=59125, loglevel=logging.WARNING):
               """initialise

               :param  voice: value sent as the VOICE request parameter
               :param  locale: value sent as the LOCALE request parameter
               :param  tts_host: host of the MaryTTS server
               :param  tts_port: port of the MaryTTS server
               :param  loglevel: optional log level
               """
               self.loglevel = loglevel
               self.logger = logging.getLogger(__name__)
               # create nice and actually usable formatter and add it to the handler
               self.config_logger(loglevel)
               self.tts_host = tts_host
               self.tts_port = tts_port
               self.locale = locale
               self.voice = voice
               # lazy %-formatting: works for non-string arguments and costs
               # nothing when INFO is disabled
               self.logger.info(
                   "starting MaryTTSClient (voice=%s, locale=%s, host=%s, port=%s)",
                   voice, locale, tts_host, tts_port,
               )

           def __del__(self):
               """destructor
               """
               # __del__ also runs when __init__ failed (or was bypassed) before
               # the logger attribute was assigned, so do not assume it exists.
               logger = getattr(self, "logger", None)
               if logger is not None:
                   logger.debug("destructor of MaryTTSClient called")

           def config_logger(self, level):
               """initialise a nice logger formatting

               The logger is shared by all instances (it is looked up by module
               name), so the stream handler is only attached when the logger has
               no handler yet; otherwise every new client would duplicate each
               log line.

               :param  level: log level
               """
               self.logger.setLevel(level)
               if self.logger.handlers:
                   return
               formatter = logging.Formatter('%(asctime)s %(name)-30s %(levelname)-8s > %(message)s')
               ch = logging.StreamHandler()
               ch.setFormatter(formatter)
               self.logger.addHandler(ch)

           def generate_audio(self, message):
               """generate audio from text

               :param message: text to synthesize
               :return: raw response body of an OUTPUT_TYPE=AUDIO request
               """
               return self.generate(message, "AUDIO")

           def generate_phonemes(self, message):
               """generate phoneme list from text

               :param message: text to synthesize
               :return: raw response body of an OUTPUT_TYPE=REALISED_DURATIONS request
               """
               return self.generate(message, "REALISED_DURATIONS")

           def _encode_request(self, message, output_type):
               """build the url-encoded form body for a /process request

               :param message: text placed in INPUT_TEXT (declared as RAWMARYXML)
               :param output_type: value of the OUTPUT_TYPE parameter
               :return: url-encoded parameter string
               """
               raw_params = {
                   "INPUT_TEXT": message,
                   "INPUT_TYPE": "RAWMARYXML",
                   "OUTPUT_TYPE": output_type,
                   "LOCALE": self.locale,
                   "AUDIO": "WAVE_FILE",
                   "VOICE": self.voice,
               }
               return urlencode(raw_params)

           def generate(self, message, output_type):
               """generate requested data object from text

               :param message: text to synthesize
               :param output_type: MaryTTS OUTPUT_TYPE to request
               :return: raw body of the server response
               :raises RuntimeError: if the server answers with a status other than 200
               """
               params = self._encode_request(message, output_type)
               headers = {}
               # open connection to mary server
               conn = HTTPConnection(self.tts_host, self.tts_port)
               try:
                   conn.request("POST", "/process", params, headers)
                   response = conn.getresponse()
                   if response.status != 200:
                       self.logger.error(
                           "MaryTTS request failed (%s %s), response headers: %s",
                           response.status, response.reason, response.getheaders(),
                       )
                       raise RuntimeError("{0}: {1}".format(response.status, response.reason))
                   # read the whole body before the connection is closed below
                   return response.read()
               finally:
                   # always release the socket: success, HTTP error or network failure
                   conn.close()
       # Manual smoke test: request the realised durations for a short sentence
       # from a client built with the default settings and print the raw reply.
       if __name__ == "__main__":
           demo_client = MaryTTSClient()
           phoneme_data = demo_client.generate_phonemes("test 1 2 3 4 5 6 7 8 9 10")
           print(phoneme_data)