2、新增HttpsPlaybackFromUrl通用HTTPS音频下载播放方法,obtain_story同时支持HTTPS URL和WebSocket两种方式; 3、新增RTC↔HTTPS双向音频切换三标志位状态机(opus_playback_active_/https_playback_active_/https_playback_abort_),HTTPS播放期间静默丢弃RTC PCM包,OnAudioOutput捕获is_opus_frame防止残留Opus帧杂音; 4、新增AbortHttpsPlayback中止方法,使用独立高优先级任务(priority=10)执行DMA flush; 5、协议层新增OnBotMessage回调,Bot下行消息立即中止HTTPS播放;volc_rtc_protocol移除is_binary依赖改为直接前缀检测,新增info前缀和subv跳过逻辑; 6、新增subtitle字幕消息解析,通过bot_前缀区分USER/AI,用户说话时立即中止HTTPS播放; 7、AbortSpeaking新增HTTPS中止信号和DMA缓冲区flush; 8、Kconfig新增STORY_API_URL故事播放API地址配置; Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
152 lines
5.1 KiB
C++
152 lines
5.1 KiB
C++
#include "protocol.h"
|
|
|
|
#include <esp_log.h>
|
|
|
|
#define TAG "Protocol"
|
|
|
|
void Protocol::OnIncomingJson(std::function<void(const cJSON* root)> callback) {
|
|
on_incoming_json_ = callback;
|
|
}
|
|
|
|
void Protocol::OnIncomingAudio(std::function<void(std::vector<uint8_t>&& data)> callback) {
|
|
on_incoming_audio_ = callback;
|
|
}
|
|
|
|
void Protocol::OnAudioChannelOpened(std::function<void()> callback) {
|
|
on_audio_channel_opened_ = callback;
|
|
}
|
|
|
|
void Protocol::OnAudioChannelClosed(std::function<void()> callback) {
|
|
on_audio_channel_closed_ = callback;// 设置音频通道关闭回调
|
|
}
|
|
|
|
void Protocol::OnNetworkError(std::function<void(const std::string& message)> callback) {
|
|
on_network_error_ = callback;
|
|
}
|
|
|
|
void Protocol::OnBotMessage(std::function<void()> callback) {
|
|
on_bot_message_ = callback;
|
|
}
|
|
|
|
void Protocol::SetError(const std::string& message) {
|
|
error_occurred_ = true;
|
|
if (on_network_error_ != nullptr) {
|
|
on_network_error_(message);
|
|
}
|
|
}
|
|
|
|
void Protocol::SendAbortSpeaking(AbortReason reason) {
|
|
std::string message = "{\"session_id\":\"" + session_id_ + "\",\"type\":\"abort\"";
|
|
if (reason == kAbortReasonWakeWordDetected) {
|
|
message += ",\"reason\":\"wake_word_detected\"";
|
|
} else if (reason == kAbortReasonVoiceInterrupt) {
|
|
message += ",\"reason\":\"voice_interrupt\"";
|
|
}
|
|
message += "}";
|
|
SendText(message);
|
|
}
|
|
|
|
// 发送故事请求 【新增】
|
|
void Protocol::SendStoryRequest() {
|
|
std::string json = "{\"session_id\":\"" + session_id_ + "\",\"type\":\"story\"}";// 构建故事请求 json 消息
|
|
ESP_LOGI(TAG, "Sending story request JSON: %s", json.c_str()); // 打印测试
|
|
SendText(json);// 向服务器发送 json消息
|
|
}
|
|
|
|
void Protocol::SendWakeWordDetected(const std::string& wake_word) {
|
|
std::string json = "{\"session_id\":\"" + session_id_ +
|
|
"\",\"type\":\"listen\",\"state\":\"detect\",\"text\":\"" + wake_word + "\"}";
|
|
SendText(json);
|
|
}
|
|
|
|
void Protocol::SendStartListening(ListeningMode mode) {
|
|
std::string message = "{";
|
|
if (!session_id_.empty()) {
|
|
message += "\"session_id\":\"" + session_id_ + "\",";
|
|
}
|
|
message += "\"type\":\"listen\",\"state\":\"start\"";
|
|
if (mode == kListeningModeRealtime) {
|
|
message += ",\"mode\":\"realtime\"";
|
|
} else if (mode == kListeningModeAutoStop) {
|
|
message += ",\"mode\":\"auto\"";
|
|
} else {
|
|
message += ",\"mode\":\"manual\"";
|
|
}
|
|
message += "}";
|
|
ESP_LOGI(TAG, "SendStartListening: mode=%d session_id=%s", (int)mode, session_id_.c_str());
|
|
SendText(message);
|
|
}
|
|
|
|
void Protocol::SendStopListening() {
|
|
std::string message = "{\"session_id\":\"" + session_id_ + "\",\"type\":\"listen\",\"state\":\"stop\"}";
|
|
SendText(message);// 向服务器发送 json消息
|
|
}
|
|
|
|
void Protocol::SendTextMessage(const std::string& text) {
|
|
std::string json = "{\"session_id\":\"" + session_id_ +
|
|
"\",\"type\":\"listen\",\"state\":\"detect\",\"text\":\"" + text + "\"}";
|
|
SendText(json);
|
|
}
|
|
|
|
|
|
void Protocol::SendIotDescriptors(const std::string& descriptors) {
|
|
cJSON* root = cJSON_Parse(descriptors.c_str());
|
|
if (root == nullptr) {
|
|
ESP_LOGE(TAG, "Failed to parse IoT descriptors: %s", descriptors.c_str());
|
|
return;
|
|
}
|
|
|
|
if (!cJSON_IsArray(root)) {
|
|
ESP_LOGE(TAG, "IoT descriptors should be an array");
|
|
cJSON_Delete(root);
|
|
return;
|
|
}
|
|
|
|
int arraySize = cJSON_GetArraySize(root);
|
|
for (int i = 0; i < arraySize; ++i) {
|
|
cJSON* descriptor = cJSON_GetArrayItem(root, i);
|
|
if (descriptor == nullptr) {
|
|
ESP_LOGE(TAG, "Failed to get IoT descriptor at index %d", i);
|
|
continue;
|
|
}
|
|
|
|
cJSON* messageRoot = cJSON_CreateObject();
|
|
cJSON_AddStringToObject(messageRoot, "session_id", session_id_.c_str());
|
|
cJSON_AddStringToObject(messageRoot, "type", "iot");
|
|
cJSON_AddBoolToObject(messageRoot, "update", true);
|
|
|
|
cJSON* descriptorArray = cJSON_CreateArray();
|
|
cJSON_AddItemToArray(descriptorArray, cJSON_Duplicate(descriptor, 1));
|
|
cJSON_AddItemToObject(messageRoot, "descriptors", descriptorArray);
|
|
|
|
char* message = cJSON_PrintUnformatted(messageRoot);
|
|
if (message == nullptr) {
|
|
ESP_LOGE(TAG, "Failed to print JSON message for IoT descriptor at index %d", i);
|
|
cJSON_Delete(messageRoot);
|
|
continue;
|
|
}
|
|
|
|
SendText(std::string(message));
|
|
cJSON_free(message);
|
|
cJSON_Delete(messageRoot);
|
|
}
|
|
|
|
cJSON_Delete(root);
|
|
}
|
|
|
|
void Protocol::SendIotStates(const std::string& states) {
|
|
std::string message = "{\"session_id\":\"" + session_id_ + "\",\"type\":\"iot\",\"update\":true,\"states\":" + states + "}";
|
|
SendText(message);
|
|
}
|
|
|
|
bool Protocol::IsTimeout() const {
|
|
const int kTimeoutSeconds = 120;
|
|
auto now = std::chrono::steady_clock::now();
|
|
auto duration = std::chrono::duration_cast<std::chrono::seconds>(now - last_incoming_time_);
|
|
bool timeout = duration.count() > kTimeoutSeconds;
|
|
if (timeout) {
|
|
ESP_LOGE(TAG, "Channel timeout %lld seconds", duration.count());
|
|
}
|
|
return timeout;
|
|
}
|