最近在做Android语音播报功能(TTS),现总结如下:(ps:demo代码地址:https://github.com/giserlong/TTS_DEMO)
一.Android原生接口
使用Android原生接口TextToSpeech,简单易用,但原生引擎一般不支持中文,需自行下载“讯飞语音+”等中文TTS引擎,并将其设置为系统默认TTS引擎,方可正常播报中文。关键代码如下:
@Override protected void onCreate(Bundle savedInstanceState) { super.onCreate(savedInstanceState); setContentView(R.layout.activity_native); //初始化TTS tts = new TextToSpeech(this, this); //获取控件 speechText = (EditText)findViewById(R.id.speechTextView); speechButton = (Button)findViewById(R.id.speechButton); //为button添加监听 speechButton.setOnClickListener(new OnClickListener(){ @Override public void onClick(View v){ // TODO Auto-generated method stub tts.speak(speechText.getText().toString(), TextToSpeech.QUEUE_FLUSH, null); } }); } @Override public void onInit(int status){ // 判断是否转化成功 if (status == TextToSpeech.SUCCESS){ //tts.getCurrentEngine(); //默认设定语言为中文,原生的android貌似不支持中文。 int result = tts.setLanguage(Locale.CHINA); if (result == TextToSpeech.LANG_MISSING_DATA || result == TextToSpeech.LANG_NOT_SUPPORTED){ tts.setLanguage(Locale.US); Toast.makeText(this,"不支持中文,已自动设置为英文",Toast.LENGTH_SHORT).show(); Log.d("ss",""); }else{ Toast.makeText(this,"已自动设置为中文",Toast.LENGTH_SHORT).show(); Log.d("ss",""); } } }
二.百度离在线融合SDK
注册百度智能云开发者账号后,添加语音合成应用,填写包名等相关信息后,生成key及APPID等信息:
激活SDK需要用到上述关键信息;此外还需下载对应SDK并添加至项目中:引用相关jar包和so库,并将离线语音资源文件(.dat)放入assets目录。
关键代码如下:
package com.yupont.www.myapplication;

import android.content.Context;
import android.os.Environment;

import com.baidu.tts.client.SpeechSynthesizer;
import com.baidu.tts.client.SpeechSynthesizerListener;
import com.baidu.tts.client.TtsMode;

import java.io.Closeable;
import java.io.File;
import java.io.FileOutputStream;
import java.io.InputStream;

/**
 * Singleton helper around the Baidu mixed (online/offline) speech synthesizer:
 * copies the offline model files out of assets, configures and initializes
 * the synthesizer, and exposes speak / pause / stop / resume / release.
 *
 * <p>Author: Mark
 * <br>Created: 2019/5/23
 * <br>Modified: 2019/5/23
 * <br>Version: 1
 */
public class BaiDuSpeechUtil {
    private final String TAG = this.getClass().getSimpleName();

    private SpeechSynthesizer mSpeechSynthesizer;
    private String mSampleDirPath;

    private static final String SAMPLE_DIR_NAME = "baiduTTS";
    private static final int COPY_BUFFER_SIZE = 8192;

    // ---- Files shipped under assets; all must be copied to the device for offline use ----
    private static final String SPEECH_FEMALE_MODEL_NAME = "bd_etts_common_speech_f7_mand_eng_high_am-mix_v3.0.0_20170512.dat";
    private static final String SPEECH_MALE_MODEL_NAME = "bd_etts_common_speech_m15_mand_eng_high_am-mix_v3.0.0_20170505.dat";
    private static final String TEXT_MODEL_NAME = "bd_etts_text.dat";
    private static final String ENGLISH_SPEECH_FEMALE_MODEL_NAME = "bd_etts_speech_female_en.dat";
    private static final String ENGLISH_SPEECH_MALE_MODEL_NAME = "bd_etts_speech_male_en.dat";
    private static final String ENGLISH_TEXT_MODEL_NAME = "bd_etts_text_en.dat";
    // ---- end ----

    // volatile so the unsynchronized first null-check in getInstance() cannot
    // observe a partially published instance.
    private static volatile BaiDuSpeechUtil baiDuSpeechUtil = null;

    /**
     * Returns the shared instance, creating it on first use.
     *
     * @return the process-wide BaiDuSpeechUtil
     */
    public static BaiDuSpeechUtil getInstance() {
        if (baiDuSpeechUtil == null) {
            synchronized (BaiDuSpeechUtil.class) {
                if (baiDuSpeechUtil == null) {
                    baiDuSpeechUtil = new BaiDuSpeechUtil();
                }
            }
        }
        return baiDuSpeechUtil;
    }

    /**
     * Prepares the offline resources (copies the model files out of assets).
     *
     * @param context context used to reach the asset manager
     */
    public void setInitialEnv(Context context) {
        initialEnv(context);
    }

    /**
     * Configures and initializes the synthesizer.
     *
     * @param context                   context handed to the SDK
     * @param speechSynthesizerListener listener receiving synthesis callbacks
     */
    public void setInitialTts(Context context, SpeechSynthesizerListener speechSynthesizerListener) {
        initialTts(context, speechSynthesizerListener);
    }

    /**
     * Returns the directory holding the offline models, computing it on first use.
     * Shared by initialEnv and initialTts so the path is never null, whichever runs first.
     */
    private String resolveSampleDir() {
        if (mSampleDirPath == null) {
            String sdcardPath = Environment.getExternalStorageDirectory().toString();
            mSampleDirPath = sdcardPath + "/" + SAMPLE_DIR_NAME;
        }
        return mSampleDirPath;
    }

    /** Creates the model directory and copies every model file that is not there yet. */
    private void initialEnv(Context context) {
        String dir = resolveSampleDir();
        makeDir(dir);
        copyFromAssetsToSdcard(context, false, SPEECH_FEMALE_MODEL_NAME, dir + "/" + SPEECH_FEMALE_MODEL_NAME);
        copyFromAssetsToSdcard(context, false, SPEECH_MALE_MODEL_NAME, dir + "/" + SPEECH_MALE_MODEL_NAME);
        copyFromAssetsToSdcard(context, false, TEXT_MODEL_NAME, dir + "/" + TEXT_MODEL_NAME);
        copyFromAssetsToSdcard(context, false, "english/" + ENGLISH_SPEECH_FEMALE_MODEL_NAME,
                dir + "/" + ENGLISH_SPEECH_FEMALE_MODEL_NAME);
        copyFromAssetsToSdcard(context, false, "english/" + ENGLISH_SPEECH_MALE_MODEL_NAME,
                dir + "/" + ENGLISH_SPEECH_MALE_MODEL_NAME);
        copyFromAssetsToSdcard(context, false, "english/" + ENGLISH_TEXT_MODEL_NAME,
                dir + "/" + ENGLISH_TEXT_MODEL_NAME);
    }

    /** Creates {@code dirPath} (including parents) when it does not exist. */
    private void makeDir(String dirPath) {
        File file = new File(dirPath);
        if (!file.exists()) {
            file.mkdirs();
        }
    }

    /**
     * Copies one asset to the given destination path. Needed for offline
     * synthesis; the work can be done on a background thread.
     *
     * <p>Failures are reported via printStackTrace and do not propagate
     * (best effort). A partially written destination is deleted so that a
     * later run does not mistake it for a complete file.
     *
     * @param context context used to open the asset
     * @param isCover whether an existing destination file is overwritten
     * @param source  asset path to read
     * @param dest    destination file path
     */
    private void copyFromAssetsToSdcard(Context context, boolean isCover, String source, String dest) {
        File target = new File(dest);
        if (!isCover && target.exists()) {
            return;
        }

        InputStream in = null;
        FileOutputStream out = null;
        boolean copied = false;
        try {
            in = context.getAssets().open(source);
            out = new FileOutputStream(target);
            byte[] buffer = new byte[COPY_BUFFER_SIZE];
            int read;
            while ((read = in.read(buffer)) != -1) {
                out.write(buffer, 0, read);
            }
            out.flush();
            copied = true;
        } catch (Exception e) {
            e.printStackTrace();
        } finally {
            closeQuietly(in);
            // The original closed the input stream a second time here and
            // never closed the output stream.
            closeQuietly(out);
            // Only remove the file when this call created/truncated it.
            if (!copied && out != null) {
                target.delete();
            }
        }
    }

    /** Closes {@code stream} if non-null, printing (not propagating) any failure. */
    private void closeQuietly(Closeable stream) {
        if (stream == null) {
            return;
        }
        try {
            stream.close();
        } catch (Exception e) {
            e.printStackTrace();
        }
    }

    /** Writes an error line tagged with this class name to System.err. */
    private void logError(String message) {
        System.err.println(TAG + ": " + message);
    }

    /**
     * Configures and initializes the synthesizer in MIX mode.
     *
     * <p>Per the original author's note, initialization takes roughly one
     * second, so run it off the UI thread unless speech must start together
     * with the screen.
     */
    private void initialTts(Context context, SpeechSynthesizerListener speechSynthesizerListener) {
        String dir = resolveSampleDir();
        String textModelPath = dir + "/" + TEXT_MODEL_NAME;
        String speechModelPath = dir + "/" + SPEECH_FEMALE_MODEL_NAME;

        mSpeechSynthesizer = SpeechSynthesizer.getInstance();
        mSpeechSynthesizer.setContext(context);
        mSpeechSynthesizer.setSpeechSynthesizerListener(speechSynthesizerListener);
        mSpeechSynthesizer.setApiKey(Config.appKey_baidu, Config.secret_baidu);
        mSpeechSynthesizer.setAppId(Config.appID_baidu);

        // Text and speech model files (used by the offline engine).
        mSpeechSynthesizer.setParam(SpeechSynthesizer.PARAM_TTS_TEXT_MODEL_FILE, textModelPath);
        mSpeechSynthesizer.setParam(SpeechSynthesizer.PARAM_TTS_SPEECH_MODEL_FILE, speechModelPath);

        // No licence-file path is set: per the original notes that is only
        // needed with a temporary licence file; with a formal offline licence
        // enabled in the console the default path is used.

        // Online speaker; per the original notes 0 = standard female,
        // 1 = standard male, 2 = special male, 3 = emotional male (see SDK docs).
        mSpeechSynthesizer.setParam(SpeechSynthesizer.PARAM_SPEAKER, "0");

        // Mix strategy; per the original notes: online synthesis on Wi-Fi,
        // offline synthesis otherwise.
        mSpeechSynthesizer.setParam(SpeechSynthesizer.PARAM_MIX_MODE,
                SpeechSynthesizer.MIX_MODE_HIGH_SPEED_SYNTHESIZE_WIFI);

        // Optional: mSpeechSynthesizer.auth(TtsMode.MIX) can be used during
        // development to verify that the online/offline licence was granted.

        mSpeechSynthesizer.initTts(TtsMode.MIX);

        // The original concatenated the directory twice for the speech model,
        // producing a path that cannot exist.
        // NOTE(review): argument order kept as in the original (text, speech);
        // confirm against the SDK's loadModel signature.
        int result = mSpeechSynthesizer.loadModel(textModelPath, speechModelPath);
        if (result < 0) {
            logError("loadModel failed, error code=" + result);
        }
    }

    /**
     * Speaks the given text.
     *
     * @param content text to synthesize; ignored when null
     */
    public void speakText(String content) {
        if (content == null || mSpeechSynthesizer == null) {
            return;
        }
        try {
            int result = mSpeechSynthesizer.speak(content);
            if (result < 0) {
                logError("speak failed, error code=" + result
                        + "; look up the code in the doc: http://yuyin.baidu.com/docs/tts/122");
            }
        } catch (Exception e) {
            e.printStackTrace();
        }
    }

    /** Pauses playback. */
    public void pauseSpeechSynthesizer() {
        if (mSpeechSynthesizer != null) {
            mSpeechSynthesizer.pause();
        }
    }

    /** Stops playback. */
    public void stopSpeechSynthesizer() {
        if (mSpeechSynthesizer != null) {
            mSpeechSynthesizer.stop();
        }
    }

    /** Resumes playback. */
    public void resumeSpeechSynthesizer() {
        if (mSpeechSynthesizer != null) {
            mSpeechSynthesizer.resume();
        }
    }

    /**
     * Releases the synthesizer. Per the original author's note this must be
     * called when done, otherwise the next screen cannot play normally.
     */
    public void releaseSpeechSynthesizer() {
        if (mSpeechSynthesizer != null) {
            mSpeechSynthesizer.release();
        }
    }

    /** Drops the reference to the synthesizer. */
    public void setSpeechSynthesizerNull() {
        mSpeechSynthesizer = null;
    }

    /** Full teardown: pause, stop, release, then drop the reference. */
    public void endSpeechSynthesizer() {
        pauseSpeechSynthesizer();
        stopSpeechSynthesizer();
        releaseSpeechSynthesizer();
        setSpeechSynthesizerNull();
    }
}
首次使用需联网,SDK会自动下载授权文件;此后离线也可使用。
三.云知声离线SDK
同百度,注册账号后,下载sdk,做好引用与配置
gradle中配置:
// Point the main source set's JNI library directory at the module's libs/ folder.
// NOTE(review): presumably this fragment sits inside the module's android { } block — confirm.
sourceSets {
main {
jniLibs.srcDirs = ['libs']
}
}
关键代码:
package com.yupont.www.myapplication;

import java.io.Closeable;
import java.io.File;
import java.io.FileOutputStream;
import java.io.InputStream;

import android.app.Activity;
import android.content.Context;
import android.os.Bundle;
import android.os.Environment;
import android.util.Log;
import android.view.View;
import android.view.View.OnClickListener;
import android.widget.Button;
import android.widget.EditText;
import android.widget.TextView;
import android.widget.Toast;

import com.unisound.client.SpeechConstants;
import com.unisound.client.SpeechSynthesizer;
import com.unisound.client.SpeechSynthesizerListener;

/**
 * Demo screen for the Unisound offline TTS engine: copies the model files out
 * of assets, initializes a local synthesizer and toggles playback of the
 * entered text with a single button.
 */
public class yzsTTSOfflineActivity extends Activity {

    // Instance state (the original used a static flag, which outlived the
    // activity instance and could disagree with a freshly created player).
    private boolean mIsPlaying = false;

    private EditText mTTSText;
    // Never assigned in this class: the corresponding findViewById calls were
    // disabled by the author. Users of these fields must tolerate null.
    private TextView mTextViewTip;
    private TextView mTextViewStatus;
    private Button mTTSPlayBtn;
    private SpeechSynthesizer mTTSPlayer;

    private final String mModelDir =
            Environment.getExternalStorageDirectory().toString() + "/Yupont/UAV/OfflineTTSModels";
    private final String mFrontendModel = mModelDir + "/frontend_model";
    private final String mBackendModel = mModelDir + "/backend_lzl";

    /**
     * Copies the models, wires the play button (disabled until the engine
     * reports that it is initialized) and starts engine initialization.
     *
     * @param savedInstanceState state bundle handed over by the framework
     */
    @Override
    public void onCreate(Bundle savedInstanceState) {
        super.onCreate(savedInstanceState);
        setContentView(R.layout.activity_yzs_offline_tts);

        // NOTE(review): this copy runs on the calling thread; consider moving
        // it to a background thread if the model files are large.
        copyFilesFassets(this, "OfflineTTSModels", mModelDir);

        mTTSText = (EditText) findViewById(R.id.textViewResult);
        mTTSPlayBtn = (Button) findViewById(R.id.recognizer_btn);
        mTTSPlayBtn.setEnabled(false);
        mTTSPlayBtn.setOnClickListener(new OnClickListener() {
            @Override
            public void onClick(View arg0) {
                TTSPlay();
            }
        });

        // Initialize the local TTS engine.
        initTts();
    }

    /**
     * Recursively copies an assets folder (or a single asset file) to storage.
     * Existing destination files are left untouched. Errors are reported via
     * printStackTrace and do not propagate.
     *
     * @param context context used to reach the asset manager
     * @param oldPath asset path to copy from, e.g. {@code aa}
     * @param newPath destination path, e.g. {@code /bb/cc}
     */
    public void copyFilesFassets(Context context, String oldPath, String newPath) {
        try {
            // Names of the entries directly under oldPath; empty for a plain file.
            String[] children = context.getAssets().list(oldPath);
            if (children != null && children.length > 0) {
                // Directory: make sure the target exists, then recurse.
                new File(newPath).mkdirs();
                for (String child : children) {
                    copyFilesFassets(context, oldPath + "/" + child, newPath + "/" + child);
                }
                return;
            }

            File target = new File(newPath);
            if (target.exists()) {
                return;
            }
            copyAssetFile(context, oldPath, target);
        } catch (Exception e) {
            e.printStackTrace();
        }
    }

    /**
     * Copies one asset to {@code target}; always closes both streams and
     * removes a partially written target so it is re-copied next time.
     */
    private void copyAssetFile(Context context, String assetPath, File target) throws Exception {
        InputStream in = null;
        FileOutputStream out = null;
        boolean copied = false;
        try {
            in = context.getAssets().open(assetPath);
            out = new FileOutputStream(target);
            byte[] buffer = new byte[1024];
            int byteCount;
            while ((byteCount = in.read(buffer)) != -1) {
                out.write(buffer, 0, byteCount);
            }
            out.flush();
            copied = true;
        } finally {
            closeQuietly(in);
            closeQuietly(out);
            if (!copied && out != null) {
                target.delete();
            }
        }
    }

    /** Closes {@code stream} if non-null, printing (not propagating) any failure. */
    private void closeQuietly(Closeable stream) {
        if (stream == null) {
            return;
        }
        try {
            stream.close();
        } catch (Exception e) {
            e.printStackTrace();
        }
    }

    /** Shows a toast when the model file at {@code path} is missing. */
    private void warnIfMissing(String path) {
        if (!new File(path).exists()) {
            toastMessage("文件:" + path + "不存在,请将assets下相关文件拷贝到SD卡指定目录!");
        }
    }

    /**
     * Creates the synthesizer, switches it to local synthesis, sets the
     * frontend/backend model paths, registers the listener and starts
     * initialization. Any exception is printed and otherwise ignored.
     */
    private void initTts() {
        try {
            mTTSPlayer = new SpeechSynthesizer(this, Config.appKey, Config.secret);
            // Use local (offline) synthesis.
            mTTSPlayer.setOption(SpeechConstants.TTS_SERVICE_MODE, SpeechConstants.TTS_SERVICE_MODE_LOCAL);

            warnIfMissing(mFrontendModel);
            warnIfMissing(mBackendModel);

            mTTSPlayer.setOption(SpeechConstants.TTS_KEY_FRONTEND_MODEL_PATH, mFrontendModel);
            mTTSPlayer.setOption(SpeechConstants.TTS_KEY_BACKEND_MODEL_PATH, mBackendModel);

            // NOTE(review): the callbacks below touch views; confirm the SDK
            // delivers them on the main thread.
            mTTSPlayer.setTTSListener(new SpeechSynthesizerListener() {

                @Override
                public void onEvent(int type) {
                    switch (type) {
                        case SpeechConstants.TTS_EVENT_INIT:
                            // Engine initialized: playback may now be requested.
                            log_i("onInitFinish");
                            mTTSPlayBtn.setEnabled(true);
                            break;
                        case SpeechConstants.TTS_EVENT_SYNTHESIZER_START:
                            log_i("beginSynthesizer");
                            break;
                        case SpeechConstants.TTS_EVENT_SYNTHESIZER_END:
                            log_i("endSynthesizer");
                            break;
                        case SpeechConstants.TTS_EVENT_BUFFER_BEGIN:
                            log_i("beginBuffer");
                            break;
                        case SpeechConstants.TTS_EVENT_BUFFER_READY:
                            log_i("bufferReady");
                            break;
                        case SpeechConstants.TTS_EVENT_PLAYING_START:
                            log_i("onPlayBegin");
                            break;
                        case SpeechConstants.TTS_EVENT_PLAYING_END:
                            // Playback finished: switch the button back to "start".
                            log_i("onPlayEnd");
                            setTTSButtonReady();
                            break;
                        case SpeechConstants.TTS_EVENT_PAUSE:
                            log_i("pause");
                            break;
                        case SpeechConstants.TTS_EVENT_RESUME:
                            log_i("resume");
                            break;
                        case SpeechConstants.TTS_EVENT_STOP:
                            log_i("stop");
                            break;
                        case SpeechConstants.TTS_EVENT_RELEASE:
                            log_i("release");
                            break;
                        default:
                            break;
                    }
                }

                @Override
                public void onError(int type, String errorMSG) {
                    // Synthesis error: report it and reset the button.
                    log_i("onError");
                    toastMessage(errorMSG);
                    setTTSButtonReady();
                }
            });

            // Start engine initialization.
            mTTSPlayer.init("");
        } catch (Exception e) {
            e.printStackTrace();
        }
    }

    /** Toggles playback: starts speaking the entered text, or stops if already playing. */
    private void TTSPlay() {
        if (mTTSPlayer == null) {
            // Construction failed in initTts(); nothing to play with.
            return;
        }
        if (mIsPlaying) {
            mTTSPlayer.stop();
            setTTSButtonReady();
        } else {
            mTTSPlayer.playText(mTTSText.getText().toString());
            setTTSButtonStop();
        }
    }

    /** Marks playback as active and shows the "stop" label. */
    private void setTTSButtonStop() {
        mIsPlaying = true;
        mTTSPlayBtn.setText(R.string.stop_tts);
    }

    /** Marks playback as idle and shows the "start" label. */
    private void setTTSButtonReady() {
        mTTSPlayBtn.setText(R.string.start_tts);
        mIsPlaying = false;
    }

    /**
     * Shows a tip text; does nothing while the tip view is not bound.
     *
     * @param tip text to display
     */
    protected void setTipText(String tip) {
        if (mTextViewTip != null) {
            mTextViewTip.setText(tip);
        }
    }

    /**
     * Shows a status text; does nothing while the status view is not bound.
     *
     * @param status status to append in parentheses to the status label
     */
    protected void setStatusText(String status) {
        if (mTextViewStatus != null) {
            mTextViewStatus.setText(getString(R.string.lable_status) + "(" + status + ")");
        }
    }

    @Override
    public void onPause() {
        super.onPause();
        // Stop any ongoing playback when the screen goes to the background.
        if (mTTSPlayer != null) {
            mTTSPlayer.stop();
        }
    }

    private void log_i(String log) {
        Log.i("demo", log);
    }

    @Override
    protected void onDestroy() {
        // Release the offline engine.
        if (mTTSPlayer != null) {
            mTTSPlayer.release(SpeechConstants.TTS_RELEASE_ENGINE, null);
        }
        super.onDestroy();
    }

    private void toastMessage(String message) {
        Toast.makeText(this, message, Toast.LENGTH_SHORT).show();
    }
}