From d58fa13356c35c1051eedb458de3607741f88557 Mon Sep 17 00:00:00 2001 From: wangxiangshun Date: Sun, 19 Oct 2025 00:02:11 +0800 Subject: [PATCH] =?UTF-8?q?STT=E6=B5=81=E5=BC=8F=E8=BE=93=E5=85=A5?= =?UTF-8?q?=E4=B8=9A=E5=8A=A1=E9=80=BB=E8=BE=91=E5=A4=84=E7=90=86?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../java/com/vetti/socket/ChatWebSocketHandler.java | 12 ++++++++---- .../ai/whisper/RealtimeTranscriptionMicrophone.java | 4 ++-- 2 files changed, 10 insertions(+), 6 deletions(-) diff --git a/vetti-admin/src/main/java/com/vetti/socket/ChatWebSocketHandler.java b/vetti-admin/src/main/java/com/vetti/socket/ChatWebSocketHandler.java index 477b45d..1477227 100644 --- a/vetti-admin/src/main/java/com/vetti/socket/ChatWebSocketHandler.java +++ b/vetti-admin/src/main/java/com/vetti/socket/ChatWebSocketHandler.java @@ -198,16 +198,16 @@ public class ChatWebSocketHandler { WebSocket webSocket = cacheWebSocket.get(clientId); log.info("获取的socket对象为:{}",webSocket); if(webSocket != null){ - // 1. 启动音频缓冲 - webSocket.send("{\"type\": \"input_audio_buffer.start\"}"); +// 1. 启动音频缓冲 +// webSocket.send("{\"type\": \"input_audio_buffer.start\"}"); log.info("3.1 开始发送数据音频流啦"); // 将音频数据转换为 Base64 编码的字符串 String base64Audio = Base64.getEncoder().encodeToString(bytes); String message = "{ \"type\": \"input_audio_buffer.append\", \"audio\": \"" + base64Audio + "\" }"; webSocket.send(message); // 3. 提交音频并请求转录 - webSocket.send("{\"type\": \"input_audio_buffer.commit\"}"); - webSocket.send("{\"type\": \"response.create\"}"); +// webSocket.send("{\"type\": \"input_audio_buffer.commit\"}"); +// webSocket.send("{\"type\": \"response.create\"}"); } }catch (Exception e){ e.printStackTrace(); @@ -326,6 +326,10 @@ public class ChatWebSocketHandler { config.put("type", "transcription_session.update"); config.put("session", sessionConfig); webSocket.send(config.toString()); + + // 1. 启动音频缓冲 + webSocket.send("{\"type\": \"input_audio_buffer.start\"}"); + //存储客户端webSocket对象,对数据进行隔离处理 cacheWebSocket.put(clientId,webSocket); } diff --git a/vetti-common/src/main/java/com/vetti/common/ai/whisper/RealtimeTranscriptionMicrophone.java b/vetti-common/src/main/java/com/vetti/common/ai/whisper/RealtimeTranscriptionMicrophone.java index 619b96d..d95b76b 100644 --- a/vetti-common/src/main/java/com/vetti/common/ai/whisper/RealtimeTranscriptionMicrophone.java +++ b/vetti-common/src/main/java/com/vetti/common/ai/whisper/RealtimeTranscriptionMicrophone.java @@ -81,8 +81,8 @@ public class RealtimeTranscriptionMicrophone { } // 3. 提交音频并请求转录 - webSocket.send("{\"type\": \"input_audio_buffer.commit\"}"); - webSocket.send("{\"type\": \"response.create\"}"); +// webSocket.send("{\"type\": \"input_audio_buffer.commit\"}"); +// webSocket.send("{\"type\": \"response.create\"}"); } catch (Exception e) { e.printStackTrace(); }