// // TtsNormalViewController.m // SpeechDemo // // Created by bytedance on 2020/9/8. // Copyright © 2020 fengkai.0518. All rights reserved. // #import "TtsNormalViewController.h" #include #import #import "AppDelegate.h" #import "FileUtils.h" #import "SettingsHelper.h" #import "ViewController.h" #import "SensitiveDefines.h" @interface TtsNormalViewController () @property (weak, nonatomic) IBOutlet UITextView *referTextView; @property (weak, nonatomic) IBOutlet UITextView *resultTextView; @property (weak, nonatomic) IBOutlet UITextField *statusTextView; @property (weak, nonatomic) IBOutlet UIButton *engineSwitchButton; @property (weak, nonatomic) IBOutlet UIButton *createConnectionButton; @property (weak, nonatomic) IBOutlet UIButton *startEngineButton; @property (weak, nonatomic) IBOutlet UIButton *stopEngineButton; @property (weak, nonatomic) IBOutlet UIButton *pauseResumeButton; // Device ID: 用于定位线上问题 @property (nonatomic, strong) NSString *deviceID; // Debug Path: 用于存放一些 SDK 相关的文件,比如模型、日志等 @property (strong, nonatomic) NSString *debugPath; // SpeechEngine @property (strong, nonatomic) SpeechEngine *curEngine; // Engine State @property (assign, nonatomic) BOOL engineInited; @property (assign, nonatomic) BOOL connectionCreated; @property (assign, nonatomic) BOOL engineStarted; @property (assign, nonatomic) BOOL engineErrorOccurred; @property (assign, nonatomic) BOOL playerPaused; // Settings @property (strong, nonatomic) Settings *settings; // 一些在线合成的配置 @property (strong, nonatomic) NSString *ttsAppId; @property (strong, nonatomic) NSString *ttsVoiceOnline; @property (strong, nonatomic) NSString *ttsVoiceTypeOnline; // 一些离线合成的配置 @property (strong, nonatomic) NSString *ttsVoiceOffline; @property (strong, nonatomic) NSString *ttsVoiceTypeOffline; // 用于合成的文本 @property (strong, nonatomic) NSString *ttsText; @end @implementation TtsNormalViewController - (void)viewDidLoad { [super viewDidLoad]; self.settings = [[SettingsHelper shareInstance]getSettings:VIEW_TTS]; self.engineSwitchButton.enabled = TRUE; [self decorateTextView:self.referTextView]; [self decorateTextView:self.resultTextView]; [self.referTextView setDelegate:self]; self.referTextView.editable = TRUE; self.engineInited = FALSE; self.connectionCreated = FALSE; self.engineStarted = FALSE; self.engineErrorOccurred = FALSE; self.playerPaused = FALSE; [self.statusTextView setText:@"Waiting for init."]; [ViewController setAppDelegate:(AppDelegate *)[[UIApplication sharedApplication] delegate]]; self.debugPath = NSSearchPathForDirectoriesInDomains(NSDocumentDirectory, NSUserDomainMask, YES).firstObject; NSLog(@"当前调试路径 %@", self.debugPath); [[NSNotificationCenter defaultCenter] addObserver:self selector:@selector(appDidEnterBackground:) name:UIApplicationDidEnterBackgroundNotification object:nil]; } - (void)viewDidDisappear:(BOOL)animated { [super viewDidDisappear:animated]; } - (void)decorateTextView:(UITextView *)textView { textView.layer.cornerRadius = 5.0f; textView.layer.borderWidth = .25f; textView.layer.borderColor = [UIColor grayColor].CGColor; } #pragma mark - Notifications - (void)appDidEnterBackground:(UIApplication *)application; { NSLog(@"app enter background."); [self.curEngine sendDirective:SEDirectiveStopEngine]; } -(void)appWillTerminate:(NSNotification*)note { [[NSNotificationCenter defaultCenter] removeObserver:self name:UIApplicationDidEnterBackgroundNotification object:nil]; } #pragma mark - Config & Init & Uninit Methods -(void)configInitParams { //【必需配置】Engine Name [self.curEngine setStringParam:SE_TTS_ENGINE forKey:SE_PARAMS_KEY_ENGINE_NAME_STRING]; //【必需配置】Work Mode, 可选值如下 // SETtsWorkModeOnline, 只进行在线合成,不需要配置离线合成相关参数; // SETtsWorkModeOffline, 只进行离线合成,不需要配置在线合成相关参数; // SETtsWorkModeAlternate, 先发起在线合成,失败后(网络超时),启动离线合成引擎开始合成; [self.curEngine setIntParam:[self getTtsWorkMode] forKey:SE_PARAMS_KEY_TTS_WORK_MODE_INT]; //【可选配置】Debug & Log [self.curEngine setStringParam:self.debugPath forKey:SE_PARAMS_KEY_DEBUG_PATH_STRING]; [self.curEngine setStringParam:SE_LOG_LEVEL_DEBUG forKey:SE_PARAMS_KEY_LOG_LEVEL_STRING]; //【可选配置】User ID(用以辅助定位线上用户问题) [self.curEngine setStringParam:SDEF_UID forKey:SE_PARAMS_KEY_UID_STRING]; [self.curEngine setStringParam:self.deviceID forKey:SE_PARAMS_KEY_DEVICE_ID_STRING]; //【可选配置】是否将合成出的音频保存到设备上,为 true 时需要正确配置 PARAMS_KEY_TTS_AUDIO_PATH_STRING 才会生效 [self.curEngine setBoolParam:[self.settings getBool:SETTING_TTS_ENABLE_DUMP] forKey:SE_PARAMS_KEY_TTS_ENABLE_DUMP_BOOL]; // TTS 音频文件保存目录,必须在合成之前创建好且 APP 具有访问权限,保存的音频文件名格式为 tts_{reqid}.wav, {reqid} 是本次合成的请求 id // PARAMS_KEY_TTS_ENABLE_DUMP_BOOL 配置为 true 的音频时为【必需配置】,否则为【可选配置】 [self.curEngine setStringParam:self.debugPath forKey:SE_PARAMS_KEY_TTS_AUDIO_PATH_STRING]; //【可选配置】合成出的音频的采样率,默认为 24000 [self.curEngine setIntParam:[self.settings getInt:SETTING_TTS_SAMPLE_RATE] forKey:SE_PARAMS_KEY_TTS_SAMPLE_RATE_INT]; //【可选配置】打断播放时使用多长时间淡出停止,单位:毫秒。默认值 0 表示不淡出 [self.curEngine setIntParam:[self.settings getInt:SETTING_AUDIO_FADEOUT_DURATION] forKey:SE_PARAMS_KEY_AUDIO_FADEOUT_DURATION_INT]; //【可选配置】是否禁止创建播放器对象,不使用 SDK 内置播放器时可开启,默认为 false. 开启后将 SE_PARAMS_KEY_TTS_ENABLE_PLAYER_BOOL 设置为 true 不起作用。 [self.curEngine setBoolParam:[self.settings getBool:SETTING_PREVENT_PLAYER_CREATION] forKey:SE_PARAMS_KEY_PREVENT_PLAYER_CREATION_BOOL]; // ------------------------ 在线合成相关配置 ----------------------- NSString* appid = [self.settings getString:SETTING_APPID]; self.ttsAppId = appid.length > 0 ? appid : SDEF_APPID; //【必需配置】在线合成鉴权相关:Appid [self.curEngine setStringParam:self.ttsAppId forKey:SE_PARAMS_KEY_APP_ID_STRING]; NSString* token = [self.settings getString:SETTING_TOKEN]; NSString* ttsAppToken = token.length > 0 ? token : SDEF_TOKEN; //【必需配置】在线合成鉴权相关:Token [self.curEngine setStringParam:ttsAppToken forKey:SE_PARAMS_KEY_APP_TOKEN_STRING]; //【必需配置】语音合成服务域名 NSString *address = [self.settings getString:SETTING_ADDRESS]; NSString *ttsAddress = address.length > 0 ? address : SDEF_DEFAULT_ADDRESS; [self.curEngine setStringParam:ttsAddress forKey:SE_PARAMS_KEY_TTS_ADDRESS_STRING]; //【必需配置】语音合成服务Uri NSString *uri = [self.settings getString:SETTING_URI]; NSString *ttsUri = uri.length > 0 ? uri : SDEF_TTS_DEFAULT_URI; [self.curEngine setStringParam:ttsUri forKey:SE_PARAMS_KEY_TTS_URI_STRING]; // 【可选配置】是否允许在 websocket 建连失败时自动重连 [self.curEngine setBoolParam:![self.settings getBool:SETTING_DISABLE_WS_RECONNECT] forKey:SE_PARAMS_KEY_ENABLE_WS_RECONNECT_BOOL]; //【可选配置】在线合成下发的 opus-ogg 音频的压缩倍率 [self.curEngine setIntParam:10 forKey:SE_PARAMS_KEY_TTS_COMPRESSION_RATE_INT]; // ------------------------ 离线合成相关配置 ----------------------- if ([self getTtsWorkMode] != SETtsWorkModeOnline && [self getTtsWorkMode] != SETtsWorkModeFile) { NSString* resourcePath = @""; if ([[self.settings getOptionsValue:SETTING_TTS_OFFLINE_RESOURCE_FORMAT] isEqual: @"SingleVoice"]) { resourcePath = [[SpeechResourceManager shareInstance] getModelPath]; } else if ([[self.settings getOptionsValue:SETTING_TTS_OFFLINE_RESOURCE_FORMAT] isEqual: @"MultipleVoice"]) { NSString *model_name = [self.settings getString:SETTING_TTS_MODEL_NAME]; resourcePath = [[SpeechResourceManager shareInstance] getModelPath:model_name]; } NSLog(@"TTS resource root path: %@", resourcePath); //【必需配置】离线合成所需资源存放路径 [self.curEngine setStringParam:resourcePath forKey:SE_PARAMS_KEY_TTS_OFF_RESOURCE_PATH_STRING]; } //【必需配置】离线合成鉴权相关:证书文件存放路径 [self.curEngine setStringParam:self.debugPath forKey:SE_PARAMS_KEY_LICENSE_DIRECTORY_STRING]; NSString* authenticationType = [self getAuthenticationType]; //【必需配置】Authenticate Type [self.curEngine setStringParam:authenticationType forKey:SE_PARAMS_KEY_AUTHENTICATE_TYPE_STRING]; if ([authenticationType isEqualToString:SE_AUTHENTICATE_TYPE_PRE_BIND]) { // 按包名授权,获取到授权的 APP 可以不限次数、不限设备数的使用离线合成 NSString *licenseName = [self.settings getString:SETTING_LICENSE_NAME]; NSString *licenseBusiId = [self.settings getString:SETTING_LICENSE_BUSI_ID]; // 证书名和业务 ID, 离线合成鉴权相关,使用火山提供的证书下发服务时为【必需配置】, 否则为【无需配置】 // 证书名,用于下载按报名授权的证书文件 [self.curEngine setStringParam:licenseName forKey:SE_PARAMS_KEY_LICENSE_NAME_STRING]; // 业务 ID, 用于下载按报名授权的证书文件 [self.curEngine setStringParam:licenseBusiId forKey:SE_PARAMS_KEY_LICENSE_BUSI_ID_STRING]; } else if ([authenticationType isEqualToString:SE_AUTHENTICATE_TYPE_LATE_BIND]) { // 按装机量授权,不限制 APP 的包名和使用次数,但是限制使用离线合成的设备数量 //【必需配置】离线合成鉴权相关:Authenticate Address [self.curEngine setStringParam:SDEF_AUTHENTICATE_ADDRESS forKey:SE_PARAMS_KEY_AUTHENTICATE_ADDRESS_STRING]; //【必需配置】离线合成鉴权相关:Authenticate Uri [self.curEngine setStringParam:SDEF_AUTHENTICATE_URI forKey:SE_PARAMS_KEY_AUTHENTICATE_URI_STRING]; NSString* curBusinessKey = [self.settings getString:SETTING_BUSINESS_KEY]; NSString* curAuthenticateSecret = [self.settings getString:SETTING_AUTHENTICATE_SECRET]; //【必需配置】离线合成鉴权相关:Business Key [self.curEngine setStringParam:curBusinessKey forKey:SE_PARAMS_KEY_BUSINESS_KEY_STRING]; //【必需配置】离线合成鉴权相关:Authenticate Secret [self.curEngine setStringParam:curAuthenticateSecret forKey:SE_PARAMS_KEY_AUTHENTICATE_SECRET_STRING]; } // ------------------------ 在离线切换相关配置 ----------------------- if ([self getTtsWorkMode] == SETtsWorkModeAlternate) { // 断点续播功能在断点处会发生由在线合成音频切换到离线合成音频,为了提升用户体验,SDK 支持 // 淡出地停止播放在线音频然后再淡入地开始播放离线音频,下面两个参数可以控制淡出淡入的长度 //【可选配置】断点续播专用,切换到离线合成时淡入的音频长度,单位:毫秒 [self.curEngine setIntParam:30 forKey:SE_PARAMS_KEY_TTS_FADEIN_DURATION_INT]; //【可选配置】断点续播专用,在线合成停止播放时淡出的音频长度,单位:毫秒 [self.curEngine setIntParam:30 forKey:SE_PARAMS_KEY_TTS_FADEOUT_DURATION_INT]; } } -(void)configStartTtsParams { //【必需配置】TTS 使用场景 [self.curEngine setStringParam:SE_TTS_SCENARIO_TYPE_NORMAL forKey:SE_PARAMS_KEY_TTS_SCENARIO_STRING]; NSString* curText = self.referTextView.text; if (curText.length > 0) { self.ttsText = curText; } else { self.ttsText = @"愿中国青年都摆脱冷气,只是向上走,不必听自暴自弃者流的话。能做事的做事,能发声的发声。有一分热,发一分光。就令萤火一般,也可以在黑暗里发一点光,不必等候炬火。此后如竟没有炬火:我便是唯一的光。"; } //【必需配置】需合成的文本,不可超过 80 字 [self.curEngine setStringParam:self.ttsText forKey:SE_PARAMS_KEY_TTS_TEXT_STRING]; //【可选配置】需合成的文本的类型,支持直接传文本(TTS_TEXT_TYPE_PLAIN)和传 SSML 形式(TTS_TEXT_TYPE_SSML)的文本 [self.curEngine setStringParam:[self getTtsTextType] forKey:SE_PARAMS_KEY_TTS_TEXT_TYPE_STRING]; //【可选配置】用于控制 TTS 音频的语速,支持的配置范围参考火山官网 语音技术/语音合成/离在线语音合成SDK/参数说明 文档 [self.curEngine setDoubleParam:[self.settings getDouble:SETTING_TTS_SPEAK_SPEED] forKey:SE_PARAMS_KEY_TTS_SPEED_RATIO_DOUBLE]; //【可选配置】用于控制 TTS 音频的音量,支持的配置范围参考火山官网 语音技术/语音合成/离在线语音合成SDK/参数说明 文档 [self.curEngine setDoubleParam:[self.settings getDouble:SETTING_TTS_AUDIO_VOLUME] forKey:SE_PARAMS_KEY_TTS_VOLUME_RATIO_DOUBLE]; //【可选配置】用于控制 TTS 音频的音高,支持的配置范围参考火山官网 语音技术/语音合成/离在线语音合成SDK/参数说明 文档 [self.curEngine setDoubleParam:[self.settings getDouble:SETTING_TTS_AUDIO_PITCH] forKey:SE_PARAMS_KEY_TTS_PITCH_RATIO_DOUBLE]; //【可选配置】是否在文本的每句结尾处添加静音段,单位:毫秒,默认为 0ms [self.curEngine setIntParam:[self.settings getInt:SETTING_TTS_SILENCE_DURATION] forKey:SE_PARAMS_KEY_TTS_SILENCE_DURATION_INT]; //【可选配置】是否使用 SDK 内置播放器播放合成出的音频,默认为 true [self.curEngine setBoolParam:![self.settings getBool:SETTING_PREVENT_PLAYER_CREATION] && [self.settings getBool:SETTING_TTS_ENABLE_PLAYER] forKey:SE_PARAMS_KEY_TTS_ENABLE_PLAYER_BOOL]; //【可选配置】是否令 SDK 通过回调返回合成的音频数据,默认不返回。 // 开启后,SDK 会流式返回音频,收到 SETtsAudioData 回调表示当次合成所有的音频已经全部返回 [self.curEngine setIntParam:[self.settings getBool:SETTING_TTS_ENABLE_DATA_CALLBACK] ? SETtsDataCallbackModeAll : SETtsDataCallbackModeNone forKey:SE_PARAMS_KEY_TTS_DATA_CALLBACK_MODE_INT]; // SDK 支持使用传入的 reqid 作为合成的唯一标识 NSString* ttsReqId = [self.settings getString:SETTING_TTS_REQUEST_ID]; if (ttsReqId.length > 0) { NSLog(@"Tts req id: %@", ttsReqId); //【可选配置】唯一标识一次合成的 reqid, 不传则自动生成并伴随 MESSAGE_TYPE_TTS_SYNTHESIS_BEGIN 返回 [self.curEngine setStringParam:ttsReqId forKey:SE_PARAMS_KEY_TTS_REQUEST_ID_STRING]; } // ------------------------ 在线合成相关配置 ----------------------- //【必需配置】语音合成服务所用集群 NSString *cluster = [self.settings getString:SETTING_CLUSTER]; [self.curEngine setStringParam:cluster forKey:SE_PARAMS_KEY_TTS_CLUSTER_STRING]; NSString *voiceOnline = [self.settings getString:SETTING_ONLINE_VOICE]; if (voiceOnline.length <= 0) { voiceOnline = [self.settings getOptionsValue:SETTING_ONLINE_VOICE]; } self.ttsVoiceOnline = voiceOnline; //【必需配置】在线合成使用的发音人代号 [self.curEngine setStringParam:self.ttsVoiceOnline forKey:SE_PARAMS_KEY_TTS_VOICE_ONLINE_STRING]; NSString *voiceTypeOnline = [self.settings getString:SETTING_ONLINE_VOICE_TYPE]; if (voiceTypeOnline.length <= 0) { voiceTypeOnline = [self.settings getOptionsValue:SETTING_ONLINE_VOICE_TYPE]; } self.ttsVoiceTypeOnline = voiceTypeOnline; //【必需配置】在线合成使用的音色代号 [self.curEngine setStringParam:self.ttsVoiceTypeOnline forKey:SE_PARAMS_KEY_TTS_VOICE_TYPE_ONLINE_STRING]; //【可选配置】是否打开在线合成的服务端缓存,默认关闭 [self.curEngine setBoolParam:[self.settings getBool:SETTING_TTS_ENABLE_CACHE] forKey:SE_PARAMS_KEY_TTS_ENABLE_CACHE_BOOL]; //【可选配置】指定在线合成的语种,默认为空,即不指定 [self.curEngine setStringParam:[self.settings getString:SETTING_TTS_ONLINE_LANGUAGE] forKey:SE_PARAMS_KEY_TTS_LANGUAGE_ONLINE_STRING]; //【可选配置】是否启用在线合成的情感预测功能 [self.curEngine setBoolParam:[self.settings getBool:SETTING_TTS_WITH_INTENT] forKey:SE_PARAMS_KEY_TTS_WITH_INTENT_BOOL]; //【可选配置】指定在线合成的情感,例如 happy, sad 等 [self.curEngine setStringParam:[self.settings getString:SETTING_TTS_EMOTION] forKey:SE_PARAMS_KEY_TTS_EMOTION_STRING]; //【可选配置】需要返回详细的播放进度或需要启用断点续播功能时应配置为 1, 否则配置为 0 或不配置 [self.curEngine setIntParam:[self.settings getBool:SETTING_TTS_ENABLE_RESUME_FROM_BREAKPOINT] forKey:SE_PARAMS_KEY_TTS_WITH_FRONTEND_INT]; //【可选配置】使用复刻音色 [self.curEngine setBoolParam:[self.settings getBool:SETTING_TTS_USE_VOICECLONE_VOICE] forKey:SE_PARAMS_KEY_TTS_USE_VOICECLONE_BOOL]; //【可选配置】在开启前述使用复刻音色的开关后,制定复刻音色所用的后端集群 [self.curEngine setStringParam:[self.settings getString:SETTING_TTS_BACKEND_CLUSTER] forKey:SE_PARAMS_KEY_TTS_BACKEND_CLUSTER_STRING]; //【可选配置】在线合成的请求参数,JSON 格式。当服务端新增参数但是 SDK 还未新增对应的配置项时,开发者可自行构造请求参数由此传入 [self.curEngine setStringParam:[self.settings getString:SETTING_TTS_REQUEST_PARAMS] forKey:SE_PARAMS_KEY_TTS_REQ_PARAMS_STRING]; // ------------------------ 离线合成相关配置 ----------------------- NSString *voiceOffline = [self.settings getString:SETTING_OFFLINE_VOICE]; if (voiceOffline.length <= 0) { voiceOffline = [self.settings getOptionsValue:SETTING_OFFLINE_VOICE]; } self.ttsVoiceOffline = voiceOffline; //【必需配置】离线合成使用的发音人代号 [self.curEngine setStringParam:self.ttsVoiceOffline forKey:SE_PARAMS_KEY_TTS_VOICE_OFFLINE_STRING]; NSString *voiceTypeOffline = [self.settings getString:SETTING_OFFLINE_VOICE_TYPE]; if (voiceTypeOffline.length <= 0) { voiceTypeOffline = [self.settings getOptionsValue:SETTING_OFFLINE_VOICE_TYPE]; } self.ttsVoiceTypeOffline = voiceTypeOffline; //【必需配置】离线合成使用的音色代号 [self.curEngine setStringParam:self.ttsVoiceTypeOffline forKey:SE_PARAMS_KEY_TTS_VOICE_TYPE_OFFLINE_STRING]; //【可选配置】是否降低离线合成的 CPU 利用率,默认关闭 // 打开该配置会使离线合成的实时率变大,仅当必要(例如为避免系统主动杀死CPU占用持续过高的进程)时才应开启 [self.curEngine setBoolParam:[self.settings getBool:SETTING_TTS_LIMIT_CPU_USAGE] forKey:SE_PARAMS_KEY_TTS_LIMIT_CPU_USAGE_BOOL]; } - (void)initEngine { NSLog(@"获取设备ID,调试使用"); AppDelegate *appDelegate = [ViewController getAppDelegate]; if (appDelegate == nil) { appDelegate = (AppDelegate *)[[UIApplication sharedApplication] delegate]; } [ViewController setAppDelegate:appDelegate]; self.deviceID = appDelegate.deviceID; NSLog(@"获取设备ID成功: %@", self.deviceID); NSLog(@"创建引擎"); if (self.curEngine == nil) { self.curEngine = [[SpeechEngine alloc] init]; if (![self.curEngine createEngineWithDelegate:self]) { NSLog(@"引擎创建失败."); return; } } NSLog(@"SDK 版本号: %@", [self.curEngine getVersion]); if ([self getTtsWorkMode] == SETtsWorkModeOnline || [self getTtsWorkMode] == SETtsWorkModeFile) { // 当使用纯在线模式时,不需要下载离线合成所需资源 [self initEngineInternal]; } else { [self.statusTextView setText:@"Waiting for loading model."]; // 下载离线合成所需资源需要区分多音色资源和单音色资源,下载这两种资源所调用的方法略有不同 if ([[self.settings getOptionsValue:SETTING_TTS_OFFLINE_RESOURCE_FORMAT] isEqual: @"MultipleVoice"]) { // 多音色资源是指一个资源文件中包含了多个离线音色,这种资源一般是旧版(V2)离线合成所用资源 NSLog(@"当前所用资源类别为多音色资源,开始准备多音色资源"); [self prepareMultipleVoiceResource]; } else if ([[self.settings getOptionsValue:SETTING_TTS_OFFLINE_RESOURCE_FORMAT] isEqual: @"SingleVoice"]) { // 单音色资源是指一个资源文件仅包含一个离线音色,新版(V4 及以上)离线合成用的就是单音色资源 NSLog(@"当前所用资源类别为单音色资源,开始准备单音色资源"); [self prepareSingleVoiceResource]; } } } - (void)prepareMultipleVoiceResource { // 因为多音色资源的一个文件包含了多个音色,导致资源的名字和音色的名字无法一一对应 // 所以下载资源需要显式指定资源名字 NSString *model_name = [self.settings getString:SETTING_TTS_MODEL_NAME]; SpeechResourceManager *speechResourceManager = [SpeechResourceManager shareInstance]; NSLog(@"检查本地是否存在可用模型"); if (![speechResourceManager checkModelExist:model_name]) { NSLog(@"本地没有模型,开始下载"); [self fetchMultipleVoiceResource:model_name]; } else { NSLog(@"模型存在,检查是否需要更新模型"); [speechResourceManager checkModelVersion:model_name completion:^(SEResourceStatus status, BOOL needUpdate, NSData *data) { if (status != kSERSuccess || needUpdate == NO) { NSLog(@"无需更新,直接使用本地已有模型。"); [self initEngineInternal]; } else { NSLog(@"存在更新,开始下载模型"); [self fetchMultipleVoiceResource:model_name]; } }]; } } - (void)fetchMultipleVoiceResource:(NSString*)model_name { NSLog(@"需要下载的模型名为 %@", model_name); SpeechResourceManager *speechResourceManager = [SpeechResourceManager shareInstance]; [speechResourceManager fetchModelByName:model_name completion:^(SEResourceStatus status, NSData* data) { if (status == kSERSuccess) { NSLog(@"下载成功"); [self initEngineInternal]; } else { NSLog(@"下载失败,错误码: %d", status); [self speechEngineInitFailed:kSERDownloadFailed]; } }]; } - (void)prepareSingleVoiceResource { SpeechResourceManager *speechResourceManager = [SpeechResourceManager shareInstance]; NSString* offlineLanguage = [self.settings getString:SETTING_TTS_OFFLINE_LANGUAGE]; if (offlineLanguage.length <= 0) { offlineLanguage = SDEF_TTS_DEFAULT_OFFLINE_LANGUAGE; } NSArray* ttsLanguageArray = @[offlineLanguage]; NSLog(@"需要下载的离线合成语种资源有: %@", ttsLanguageArray); [speechResourceManager setTtsLanguage:ttsLanguageArray]; NSArray* needDownloadVoiceType = (NSArray *)SDEF_TTS_DEFAULT_DOWNLOAD_OFFLINE_VOICES(); NSArray* voiceTypeArray = [self.settings getOptions:SETTING_OFFLINE_VOICE_TYPE].optionsArray; if (voiceTypeArray != nil && voiceTypeArray.count > 0) { needDownloadVoiceType = voiceTypeArray; } NSLog(@"需要下载的离线合成音色资源有: %@", needDownloadVoiceType); [speechResourceManager setTtsVoiceType:needDownloadVoiceType]; NSLog(@"检查本地是否存在可用模型"); if ([speechResourceManager checkModelExist]) { NSLog(@"本地没有模型,开始下载"); [self fetchSingleVoiceResource]; } else { NSLog(@"模型存在,检查是否需要更新模型"); [speechResourceManager checkModelVersion:^(SEResourceStatus status, BOOL needUpdate, NSData *data) { if (status != kSERSuccess || needUpdate == NO) { NSLog(@"无需更新,直接使用本地已有模型。"); [self initEngineInternal]; } else { NSLog(@"存在更新,开始下载模型"); [self fetchSingleVoiceResource]; } }]; } } - (void)fetchSingleVoiceResource { SpeechResourceManager *speechResourceManager = [SpeechResourceManager shareInstance]; [speechResourceManager fetchModel:^(SEResourceStatus status, NSData* data) { if (status == kSERSuccess) { NSLog(@"下载成功"); [self initEngineInternal]; } else { NSLog(@"下载失败,错误码: %d", status); [self speechEngineInitFailed:kSERDownloadFailed]; } }]; } - (void)initEngineInternal { NSLog(@"配置初始化参数"); [self configInitParams]; NSLog(@"引擎初始化"); SEEngineErrorCode ret = [self.curEngine initEngine]; self.engineInited = (ret == SENoError); if (self.engineInited) { NSLog(@"初始化成功"); [self speechEngineInitSucceeded]; } else { NSLog(@"初始化失败,返回值: %d", ret); [self speechEngineInitFailed:ret]; } } - (void)uninitEngine { if (self.curEngine != nil) { NSLog(@"引擎析构"); [self.curEngine destroyEngine]; self.curEngine = nil; NSLog(@"引擎析构完成"); } } #pragma mark - UI Actions - (IBAction)switchEngine:(id)sender { if (self.engineStarted) { [self.statusTextView setText:@"Engine is busy, stop it first!"]; return; } [self clearResult:nil]; self.startEngineButton.enabled = FALSE; self.pauseResumeButton.enabled = FALSE; if (self.engineInited) { self.referTextView.editable = FALSE; [self uninitEngine]; self.engineInited = FALSE; self.connectionCreated = FALSE; [self.statusTextView setText:@"Waiting for init."]; self.engineSwitchButton.enabled = TRUE; [self.engineSwitchButton setTitle:@"Init Engine" forState:UIControlStateNormal]; self.stopEngineButton.enabled = FALSE; self.createConnectionButton.enabled = FALSE; } else { self.referTextView.editable = TRUE; [self initEngine]; } } - (IBAction)createConnection:(id)sender { if (self.connectionCreated) { NSLog(@"Connection is created."); return; } // SEDirectiveCreateConnection 指令,可减小在线合成的端到端播放延时,主要应用在能够提前预知要使用语音合成的情况下,例如语音交互场景 // SEDirectiveCreateConnection 指令是一个同步指令,调用返回之后可以根据返回值判断连接是否建立成功 // 如果不使用 SEDirectiveCreateConnection 指令,建连实际发生在调用 DIRECTIVE_START_ENGINE 后 NSLog(@"触发提前建连"); NSLog(@"Directive: SEDirectiveCreateConnection"); SEEngineErrorCode ret = [self.curEngine sendDirective:SEDirectiveCreateConnection]; if(ret != SENoError) { NSString* error_message = [NSString stringWithFormat:@"在线合成提前建连失败: %d", ret]; NSLog(@"%@", error_message); [self createConnectionFailed:error_message]; } else { NSString* message = [NSString stringWithFormat:@"在线合成提前建连成功: %d", ret]; NSLog(@"%@", message); [self createConnectionSucceeded:message]; } } - (IBAction)startEngineBtnClicked:(id)sender { NSLog(@"Start engine, current status: %d", self.engineStarted); if (!self.engineStarted) { [self clearResult:nil]; self.engineErrorOccurred = FALSE; // Directive:启动引擎前调用SYNC_STOP指令,保证前一次请求结束。 NSLog(@"关闭引擎(同步)"); NSLog(@"Directive: SEDirectiveSyncStopEngine"); SEEngineErrorCode ret = [self.curEngine sendDirective:SEDirectiveSyncStopEngine]; if (ret != SENoError) { NSLog(@"Send directive syncstop failed: %d", ret); } else { [self configStartTtsParams]; NSLog(@"启动引擎."); NSLog(@"Directive: SEDirectiveStartEngine"); SEEngineErrorCode ret = [self.curEngine sendDirective:SEDirectiveStartEngine]; if (SENoError != ret) { NSString* message = [NSString stringWithFormat:@"发送启动引擎指令失败: %d", ret]; [self sendStartEngineDirectiveFailed:message]; } } } } - (IBAction)stopEngineBtnClicked:(id)sender { NSLog(@"关闭引擎"); NSLog(@"Directive: SEDirectiveStopEngine"); [self.curEngine sendDirective:SEDirectiveStopEngine]; } - (void) pausePlayback { NSLog(@"暂停播放"); NSLog(@"Directive: SEDirectivePausePlayer"); SEEngineErrorCode ret = [self.curEngine sendDirective:SEDirectivePausePlayer]; if (ret == SENoError) { self.playerPaused = TRUE; [self.pauseResumeButton setTitle:@"Resume" forState:UIControlStateNormal]; } NSLog(@"Pause playback status: %d", ret); } - (void)resumePlayback { NSLog(@"继续播放"); NSLog(@"Directive: SEDirectiveResumePlayer"); SEEngineErrorCode ret = [self.curEngine sendDirective:SEDirectiveResumePlayer]; if (ret == SENoError) { self.playerPaused = FALSE; [self.pauseResumeButton setTitle:@"Pause" forState:UIControlStateNormal]; } NSLog(@"Resume playback status: %d", ret); } - (IBAction)controlPlayingStatus:(id)sender { NSLog(@"Pause or resume player, current player status: %hhd", self.playerPaused); if (self.playerPaused) { [self resumePlayback]; } else { [self pausePlayback]; } } - (IBAction)clearResult:(id)sender { [self.resultTextView setText:@""]; } #pragma mark - Message Callback - (void)onMessageWithType:(SEMessageType)type andData:(NSData *)data { NSLog(@"Message Type: %d.", type); switch (type) { case SEEngineStart: NSLog(@"Callback: 引擎启动成功: data: %@", data); [self speechEngineStarted]; break; case SEEngineStop: NSLog(@"Callback: 引擎关闭: data: %@", data); [self speechEngineStopped]; break; case SEEngineError: NSLog(@"Callback: 错误信息: %@", data); [self speechEngineError:data]; break; case SETtsSynthesisBegin: NSLog(@"Callback: 合成开始: %@", data); [self speechStartSynthesis:data]; break; case SETtsSynthesisEnd: NSLog(@"Callback: 合成结束: %@", data); [self speechFinishSynthesis:data]; break; case SETtsStartPlaying: NSLog(@"Callback: 播放开始: %@", data); [self speechStartPlaying:data]; break; case SETtsPlaybackProgress: NSLog(@"Callback: 播放进度"); [self updatePlayingProgress:data]; break; case SETtsFinishPlaying: NSLog(@"Callback: 播放结束: %@", data); [self speechFinishPlaying:data]; break; case SETtsAudioData: NSLog(@"Callback: 音频数据,长度 %lu 字节", (unsigned long)data.length); [self speechTtsAudioData:data]; break; default: break; } } - (void)speechEngineInitSucceeded { dispatch_async(dispatch_get_main_queue(), ^{ self.engineSwitchButton.enabled = TRUE; [self.engineSwitchButton setTitle:@"UninitEngine" forState:UIControlStateNormal]; [self.statusTextView setText:@"Ready"]; [self.resultTextView setText:[NSString stringWithFormat:@"DeviceID: %@.", self.deviceID]]; self.referTextView.editable = TRUE; self.startEngineButton.enabled = TRUE; self.createConnectionButton.enabled = [self getTtsWorkMode] != SETtsWorkModeOffline; }); } - (void)speechEngineInitFailed:(int)initStatus { dispatch_async(dispatch_get_main_queue(), ^{ [self uninitEngine]; [self.statusTextView setText:[[NSString alloc] initWithFormat:@"Failed to init engine, %d!", initStatus]]; self.engineSwitchButton.enabled = TRUE; }); } - (void)createConnectionSucceeded:(NSString*)tipText { dispatch_async(dispatch_get_main_queue(), ^{ self.createConnectionButton.enabled = FALSE; [self.resultTextView setText:tipText]; self.connectionCreated = TRUE; }); } - (void)createConnectionFailed:(NSString*)tipText { dispatch_async(dispatch_get_main_queue(), ^{ [self.resultTextView setText:tipText]; self.connectionCreated = FALSE; }); } - (void)sendStartEngineDirectiveFailed:(NSString*)tipText { NSLog(@"%@", tipText); dispatch_async(dispatch_get_main_queue(), ^{ [self.resultTextView setText:tipText]; self.engineStarted = FALSE; }); } - (void)speechEngineStarted { dispatch_async(dispatch_get_main_queue(), ^{ self.referTextView.editable = FALSE; self.engineStarted = true; [self.statusTextView setText:@"Engine Started!"]; [self.resultTextView setText:self.ttsText]; self.startEngineButton.enabled = FALSE; self.stopEngineButton.enabled = TRUE; self.createConnectionButton.enabled = FALSE; }); } - (void)speechEngineStopped { dispatch_async(dispatch_get_main_queue(), ^{ self.referTextView.editable = TRUE; self.engineStarted = FALSE; self.connectionCreated = FALSE; [self.statusTextView setText:@"Engine Stopped!"]; self.startEngineButton.enabled = TRUE; self.stopEngineButton.enabled = FALSE; self.createConnectionButton.enabled = [self getTtsWorkMode] != SETtsWorkModeOffline; [self.pauseResumeButton setTitle:@"Pause" forState:UIControlStateNormal]; self.pauseResumeButton.enabled = FALSE; self.playerPaused = FALSE; }); } - (void)speechEngineError:(NSData *)data { self.engineErrorOccurred = TRUE; dispatch_async(dispatch_get_main_queue(), ^{ [self.resultTextView setTextColor:[UIColor blackColor]]; [self.resultTextView setText:[[NSString alloc] initWithData:data encoding:NSUTF8StringEncoding]]; }); } - (void)speechStartSynthesis:(NSData *)data { } - (void)speechFinishSynthesis:(NSData *)data { } - (void)speechStartPlaying:(NSData *)data { dispatch_async(dispatch_get_main_queue(), ^{ self.pauseResumeButton.enabled = TRUE; }); } - (void)updatePlayingProgress :(NSData *)data { if (data != nil) { NSError *error = nil; id object = [NSJSONSerialization JSONObjectWithData:data options:0 error:&error]; if(error) { NSLog(@"Parse data as json error!"); return ; } if([object isKindOfClass:[NSDictionary class]]) { NSDictionary *results = object; float percentage = [[results valueForKey:@"progress"] floatValue]; NSString *reqid = [results valueForKey:@"reqid"]; NSLog(@"当前播放的文本对应的 reqid: %@,播放进度:%.3f", reqid, percentage); } } } - (void)speechFinishPlaying :(NSData *)data { } - (void)speechTtsAudioData:(NSData *)data { } #pragma mark - Helper - (NSString*)getTtsTextType { switch ([self.settings getOptions:SETTING_TTS_TEXT_TYPE].chooseIdx) { case 0: return SE_TTS_TEXT_TYPE_PLAIN; case 1: return SE_TTS_TEXT_TYPE_SSML; default: break; } return SE_TTS_TEXT_TYPE_PLAIN;; } - (int)getTtsWorkMode { switch ([self.settings getOptions:SETTING_TTS_WORK_MODE].chooseIdx) { case 0: return SETtsWorkModeOnline; case 1: return SETtsWorkModeOffline; case 2: return SETtsWorkModeAlternate; default: break; } return SETtsWorkModeOnline;; } - (NSString*)getAuthenticationType { switch ([self.settings getOptions:SETTING_AUTHENTICATION_TYPE].chooseIdx) { case 0: return SE_AUTHENTICATE_TYPE_PRE_BIND; case 1: return SE_AUTHENTICATE_TYPE_LATE_BIND; default: break; } return SE_AUTHENTICATE_TYPE_PRE_BIND; } - (long)timeDelayFrom:(long)pastTimestamp { return [[NSDate date] timeIntervalSince1970] * 1000 - pastTimestamp; } #pragma mark - UITextViewDelegate - (BOOL)textView:(UITextView *)textView shouldChangeTextInRange:(NSRange)range replacementText:(NSString *)text { if([text isEqualToString:@"\n"]) { [textView resignFirstResponder]; return NO; } return YES; } #pragma mark - Navigation // In a storyboard-based application, you will often want to do a little preparation before navigation - (void)prepareForSegue:(UIStoryboardSegue *)segue sender:(id)sender { // Get the new view controller using [segue destinationViewController]. // Pass the selected object to the new view controller. id nextPage = [segue destinationViewController]; [nextPage setValue:VIEW_TTS forKey:@"viewId"]; } @end