美文网首页
科大讯飞语音合成ros

科大讯飞语音合成ros

作者: zjh3029 | 来源:发表于2018-03-22 20:25 被阅读0次
    #include <stdio.h>
    #include <string.h>
    #include <stdlib.h>
    #include <unistd.h>
    #include <alsa/asoundlib.h>
    #include "qtts.h"
    #include "msp_cmn.h"
    #include "msp_errors.h"
    
    int makeTextToWav(const char* src_text, const char* params)
    {
        int          ret          = -1;
        const char*  sessionID    = NULL;
        unsigned int audio_len    = 0;
        unsigned int speech_len = 0;
        char* synth_speech = new char[2 * 1024 * 1024];
        int          synth_status = MSP_TTS_FLAG_STILL_HAVE_DATA;
    
        sessionID = QTTSSessionBegin(params, &ret);
        QTTSTextPut(sessionID, src_text, (unsigned int)strlen(src_text), NULL);
        
        unsigned int val;
        int dir=0;
        int size;
        snd_pcm_uframes_t frames;
        snd_pcm_uframes_t periodsize;
        snd_pcm_t *playback_handle;//PCM设备句柄pcm.h
        snd_pcm_hw_params_t *hw_params;//硬件信息和PCM流配置
    
        ret = snd_pcm_open(&playback_handle, "default", SND_PCM_STREAM_PLAYBACK, 0);//1. 打开PCM,最后一个参数为0意味着标准配置
        ret = snd_pcm_hw_params_malloc(&hw_params);//2. 分配snd_pcm_hw_params_t结构体
        ret = snd_pcm_hw_params_any(playback_handle, hw_params);//3. 初始化hw_params
        ret = snd_pcm_hw_params_set_access(playback_handle, hw_params, SND_PCM_ACCESS_RW_INTERLEAVED);//4. 初始化访问权限
        ret = snd_pcm_hw_params_set_format(playback_handle, hw_params, SND_PCM_FORMAT_S16_LE); //5. 初始化采样格式SND_PCM_FORMAT_U8,8位
    
        val = 16000;//6. 设置采样率,如果硬件不支持我们设置的采样率,将使用最接近的 val = 44100,有些录音采样频率固定为8KHz
        ret = snd_pcm_hw_params_set_rate_near(playback_handle, hw_params, &val, &dir);
        ret = snd_pcm_hw_params_set_channels(playback_handle, hw_params, 1);//7. 设置通道数量  1
        frames = 32; /* Set period size to 32 frames. */
        periodsize = frames ;
        ret = snd_pcm_hw_params_set_buffer_size_near(playback_handle, hw_params, &periodsize);
        periodsize /= 2;
        ret = snd_pcm_hw_params_set_period_size_near(playback_handle, hw_params, &periodsize, 0);
        ret = snd_pcm_hw_params(playback_handle, hw_params); //8. 设置hw_params
        snd_pcm_hw_params_get_period_size(hw_params, &frames, &dir);/* Use a buffer large enough to hold one period */
        size = frames * 2; 
    
        while (1)
        {
            const void* data = QTTSAudioGet(sessionID, &audio_len, &synth_status, &ret);
            if (ret) break;
                if (NULL != data)
                {
                    memcpy(synth_speech + speech_len, data, audio_len);
                    speech_len += audio_len;
                }
                if (MSP_TTS_FLAG_DATA_END == synth_status)break;
                usleep(1000); 
        }
        QTTSSessionEnd(sessionID, "Normal");
           
           
            char *buffer;
            buffer = (char *) malloc(size);
            int length_all=0;
            
    while (1)
        {
            memcpy(buffer,synth_speech,size);
            synth_speech+=size;
    
            length_all+=size;
            if (length_all>speech_len){ break;}
            while(ret = snd_pcm_writei(playback_handle, buffer, frames)<0)
            {
                usleep(2000);
                if (ret == -EPIPE)
                {
                      fprintf(stderr, "underrun occurred\n");
                      snd_pcm_prepare(playback_handle);
                }
                else if (ret < 0)
                {
                      fprintf(stderr,"error from writei: %s\n",snd_strerror(ret));
                }
            }
            
        }
        snd_pcm_drain(playback_handle);
        snd_pcm_close(playback_handle);//10. 关闭PCM设备句柄
    
        free(buffer);
        return 0;
    }
    
    int tts(const char* text)
    {
        const char* session_begin_params = "voice_name = xiaowanzi, text_encoding = utf8, sample_rate = 16000, speed = 50, volume = 100, pitch = 50, rdn = 0";
        makeTextToWav(text,session_begin_params);
        
        return 0;
    }
    
    #include <ros/ros.h>
    #include "std_msgs/String.h"
    #include "tts.h"
    /**
     *接受/voice/xf_tts_topic话题的字符串的回调函数
     */
    void TTSCallback(const std_msgs::String::ConstPtr &msg)
    {
        std::string out_result=msg->data.c_str();
        tts(msg->data.c_str());
    }
    
    int main(int argc, char* argv[])
    {
        const char* login_params         = "appid = 5aa8ea00, work_dir = .";//登录参数,appid与msc库绑定,请勿随意改动
        MSPLogin(NULL, NULL, login_params);//第一个参数是用户名,第二个参数是密码,第三个参数是登录参数,用户名和密码可在http://open.voicecloud.cn注册获取
    
        const char* start = "宝宝启动成功了,你知道我在哪里吗?";
        tts(start);
    
        ros::init(argc, argv,"robotts");
        ros::NodeHandle n;
        ros::Subscriber sub = n.subscribe("/voice/recong_topic",3,TTSCallback);
    
        ros::spin();
        MSPLogout(); //退出登录
    
        return 0;
    }
    

    相关文章

      网友评论

          本文标题:科大讯飞语音合成ros

          本文链接:https://www.haomeiwen.com/subject/fdjzqftx.html