From b408575f7e9b846710ff8f3116b9a1a9e94ddfbf Mon Sep 17 00:00:00 2001
From: ahmedrazakhan12 <ahmedrazakhank112@gmail.com>
Date: Mon, 8 Jun 2026 21:51:55 +0500
Subject: [PATCH 1/5] refactor: replace live LLM and TTS service calls with
 static mock responses to minimize costs

---
 llm.py         | 96 +++++++++++++++++++++++++-----------------------
 tts/doubao.py  | 99 ++++++++++++++++++++++++++------------------------
 tts/tencent.py | 75 ++++++++++++++++++++------------------
 3 files changed, 143 insertions(+), 127 deletions(-)

diff --git a/llm.py b/llm.py
index 9be5e19f..4f5f2569 100644
--- a/llm.py
+++ b/llm.py
@@ -8,51 +8,57 @@
 def llm_response(message,avatar_session:'BaseAvatar',datainfo:dict={}):
     try:
         opt = avatar_session.opt
-        start = time.perf_counter()
-        from openai import OpenAI
-        client = OpenAI(
-            # 如果您没有配置环境变量，请在此处用您的API Key进行替换
-            api_key=os.getenv("DASHSCOPE_API_KEY"),
-            # 填写DashScope SDK的base_url
-            base_url="https://dashscope.aliyuncs.com/compatible-mode/v1",
-        )
-        end = time.perf_counter()
-        logger.info(f"llm Time init: {end-start}s,{message}")
-        completion = client.chat.completions.create(
-            model="qwen-plus",
-            messages=[{'role': 'system', 'content': '你是一个知识助手，尽量以简短、口语化的方式输出'},
-                    {'role': 'user', 'content': message}],
-            stream=True,
-            # 通过以下设置，在流式输出的最后一行展示token使用信息
-            stream_options={"include_usage": True}
-        )
-        result=""
-        first = True
-        for chunk in completion:
-            if len(chunk.choices)>0:
-                #print(chunk.choices[0].delta.content)
-                if first:
-                    end = time.perf_counter()
-                    logger.info(f"llm Time to first chunk: {end-start}s")
-                    first = False
-                msg = chunk.choices[0].delta.content
-                if msg is None:
-                    continue
-                lastpos=0
-                #msglist = re.split('[,.!;:，。！?]',msg)
-                for i, char in enumerate(msg):
-                    if char in ",.!;:，。！？：；" :
-                        result = result+msg[lastpos:i+1]
-                        lastpos = i+1
-                        if len(result)>10:
-                            logger.info(result)
-                            avatar_session.put_msg_txt(result,datainfo)
-                            result=""
-                result = result+msg[lastpos:]
-        end = time.perf_counter()
-        logger.info(f"llm Time to last chunk: {end-start}s")
-        if result:
-            avatar_session.put_msg_txt(result,datainfo)
+        # Static response to avoid using paid third-party services
+        static_response = f"收到，这是本地静态测试回复。你发送的消息是：{message}"
+        logger.info(f"Static LLM response: {static_response}")
+        avatar_session.put_msg_txt(static_response, datainfo)
+        return
+
+        # start = time.perf_counter()
+        # from openai import OpenAI
+        # client = OpenAI(
+        #     # 如果您没有配置环境变量，请在此处用您的API Key进行替换
+        #     api_key=os.getenv("DASHSCOPE_API_KEY"),
+        #     # 填写DashScope SDK的base_url
+        #     base_url="https://dashscope.aliyuncs.com/compatible-mode/v1",
+        # )
+        # end = time.perf_counter()
+        # logger.info(f"llm Time init: {end-start}s,{message}")
+        # completion = client.chat.completions.create(
+        #     model="qwen-plus",
+        #     messages=[{'role': 'system', 'content': '你是一个知识助手，尽量以简短、口语化的方式输出'},
+        #             {'role': 'user', 'content': message}],
+        #     stream=True,
+        #     # 通过以下设置，在流式输出的最后一行展示token使用信息
+        #     stream_options={"include_usage": True}
+        # )
+        # result=""
+        # first = True
+        # for chunk in completion:
+        #     if len(chunk.choices)>0:
+        #         #print(chunk.choices[0].delta.content)
+        #         if first:
+        #             end = time.perf_counter()
+        #             logger.info(f"llm Time to first chunk: {end-start}s")
+        #             first = False
+        #         msg = chunk.choices[0].delta.content
+        #         if msg is None:
+        #             continue
+        #         lastpos=0
+        #         #msglist = re.split('[,.!;:，。！?]',msg)
+        #         for i, char in enumerate(msg):
+        #             if char in ",.!;:，。！？：；" :
+        #                 result = result+msg[lastpos:i+1]
+        #                 lastpos = i+1
+        #                 if len(result)>10:
+        #                     logger.info(result)
+        #                     avatar_session.put_msg_txt(result,datainfo)
+        #                     result=""
+        #         result = result+msg[lastpos:]
+        # end = time.perf_counter()
+        # logger.info(f"llm Time to last chunk: {end-start}s")
+        # if result:
+        #     avatar_session.put_msg_txt(result,datainfo)
         
     except Exception as e:
         logger.exception('llm exceptiopn:')
diff --git a/tts/doubao.py b/tts/doubao.py
index 6c1b84e5..a5305878 100644
--- a/tts/doubao.py
+++ b/tts/doubao.py
@@ -49,54 +49,59 @@ def __init__(self, opt, parent):
         }
 
     async def doubao_voice(self, text, ref_file): # -> Iterator[bytes]:
-        start = time.perf_counter()
-        voice_type = ref_file #self.opt.REF_FILE
+        # Mock/static return to avoid using paid Doubao service
+        logger.info(f"Mock Doubao TTS voice synthesis for text: {text}")
+        yield b'\x00' * 51200
+        return
 
-        try:
-            # 创建请求对象
-            default_header = bytearray(b'\x11\x10\x11\x00')
-            submit_request_json = copy.deepcopy(self.request_json)
-            submit_request_json["user"]["uid"] = self.parent.sessionid
-            submit_request_json["audio"]["voice_type"] = voice_type
-            submit_request_json["request"]["text"] = text
-            submit_request_json["request"]["reqid"] = str(uuid.uuid4())
-            submit_request_json["request"]["operation"] = "submit"
-            payload_bytes = str.encode(json.dumps(submit_request_json))
-            payload_bytes = gzip.compress(payload_bytes)  # if no compression, comment this line
-            full_client_request = bytearray(default_header)
-            full_client_request.extend((len(payload_bytes)).to_bytes(4, 'big'))  # payload size(4 bytes)
-            full_client_request.extend(payload_bytes)  # payload
-
-            header = {"Authorization": f"Bearer; {self.token}"}
-            first = True
-            async with websockets.connect(self.api_url, extra_headers=header, ping_interval=None) as ws:
-                await ws.send(full_client_request)
-                while True:
-                    res = await ws.recv()
-                    header_size = res[0] & 0x0f
-                    message_type = res[1] >> 4
-                    message_type_specific_flags = res[1] & 0x0f
-                    payload = res[header_size*4:]
-
-                    if message_type == 0xb:  # audio-only server response
-                        if message_type_specific_flags == 0:  # no sequence number as ACK
-                            #print("                Payload size: 0")
-                            continue
-                        else:
-                            if first:
-                                end = time.perf_counter()
-                                logger.info(f"doubao tts Time to first chunk: {end-start}s")
-                                first = False
-                            sequence_number = int.from_bytes(payload[:4], "big", signed=True)
-                            payload_size = int.from_bytes(payload[4:8], "big", signed=False)
-                            payload = payload[8:]
-                            yield payload
-                        if sequence_number < 0:
-                            break
-                    else:
-                        break
-        except Exception as e:
-            logger.exception('doubao')
+        # start = time.perf_counter()
+        # voice_type = ref_file #self.opt.REF_FILE
+        # 
+        # try:
+        #     # 创建请求对象
+        #     default_header = bytearray(b'\x11\x10\x11\x00')
+        #     submit_request_json = copy.deepcopy(self.request_json)
+        #     submit_request_json["user"]["uid"] = self.parent.sessionid
+        #     submit_request_json["audio"]["voice_type"] = voice_type
+        #     submit_request_json["request"]["text"] = text
+        #     submit_request_json["request"]["reqid"] = str(uuid.uuid4())
+        #     submit_request_json["request"]["operation"] = "submit"
+        #     payload_bytes = str.encode(json.dumps(submit_request_json))
+        #     payload_bytes = gzip.compress(payload_bytes)  # if no compression, comment this line
+        #     full_client_request = bytearray(default_header)
+        #     full_client_request.extend((len(payload_bytes)).to_bytes(4, 'big'))  # payload size(4 bytes)
+        #     full_client_request.extend(payload_bytes)  # payload
+        # 
+        #     header = {"Authorization": f"Bearer; {self.token}"}
+        #     first = True
+        #     async with websockets.connect(self.api_url, extra_headers=header, ping_interval=None) as ws:
+        #         await ws.send(full_client_request)
+        #         while True:
+        #             res = await ws.recv()
+        #             header_size = res[0] & 0x0f
+        #             message_type = res[1] >> 4
+        #             message_type_specific_flags = res[1] & 0x0f
+        #             payload = res[header_size*4:]
+        # 
+        #             if message_type == 0xb:  # audio-only server response
+        #                 if message_type_specific_flags == 0:  # no sequence number as ACK
+        #                     #print("                Payload size: 0")
+        #                     continue
+        #                 else:
+        #                     if first:
+        #                         end = time.perf_counter()
+        #                         logger.info(f"doubao tts Time to first chunk: {end-start}s")
+        #                         first = False
+        #                     sequence_number = int.from_bytes(payload[:4], "big", signed=True)
+        #                     payload_size = int.from_bytes(payload[4:8], "big", signed=False)
+        #                     payload = payload[8:]
+        #                     yield payload
+        #                 if sequence_number < 0:
+        #                     break
+        #             else:
+        #                 break
+        # except Exception as e:
+        #     logger.exception('doubao')
         # # 检查响应状态码
         # if response.status_code == 200:
         #     # 处理响应数据
diff --git a/tts/tencent.py b/tts/tencent.py
index b283596f..4584cd1c 100644
--- a/tts/tencent.py
+++ b/tts/tencent.py
@@ -78,41 +78,46 @@ def txt_to_audio(self,msg:tuple[str, dict]):
         )
 
     def tencent_voice(self, text, reffile, reftext,language, server_url) -> Iterator[bytes]:
-        start = time.perf_counter()
-        session_id = str(uuid.uuid1())
-        params = self.__gen_params(session_id, text, reffile)
-        signature = self.__gen_signature(params)
-        headers = {
-            "Content-Type": "application/json",
-            "Authorization": str(signature)
-        }
-        url = _PROTOCOL + _HOST + _PATH
-        try:
-            res = requests.post(url, headers=headers,
-                          data=json.dumps(params), stream=True)
-            
-            end = time.perf_counter()
-            logger.info(f"tencent Time to make POST: {end-start}s")
-                
-            first = True
-        
-            for chunk in res.iter_content(chunk_size=6400): # 640 16K*20ms*2
-                #logger.info('chunk len:%d',len(chunk))
-                if first:
-                    try:
-                        rsp = json.loads(chunk)
-                        #response["Code"] = rsp["Response"]["Error"]["Code"]
-                        #response["Message"] = rsp["Response"]["Error"]["Message"]
-                        logger.error("tencent tts:%s",rsp["Response"]["Error"]["Message"])
-                        return
-                    except:
-                        end = time.perf_counter()
-                        logger.info(f"tencent Time to first chunk: {end-start}s")
-                        first = False                    
-                if chunk and self.state==State.RUNNING:
-                    yield chunk
-        except Exception as e:
-            logger.exception('tencent')
+        # Mock/static return to avoid using paid Tencent service
+        logger.info(f"Mock Tencent TTS voice synthesis for text: {text}")
+        yield b'\x00' * 51200
+        return
+
+        # start = time.perf_counter()
+        # session_id = str(uuid.uuid1())
+        # params = self.__gen_params(session_id, text, reffile)
+        # signature = self.__gen_signature(params)
+        # headers = {
+        #     "Content-Type": "application/json",
+        #     "Authorization": str(signature)
+        # }
+        # url = _PROTOCOL + _HOST + _PATH
+        # try:
+        #     res = requests.post(url, headers=headers,
+        #                   data=json.dumps(params), stream=True)
+        #     
+        #     end = time.perf_counter()
+        #     logger.info(f"tencent Time to make POST: {end-start}s")
+        #         
+        #     first = True
+        # 
+        #     for chunk in res.iter_content(chunk_size=6400): # 640 16K*20ms*2
+        #         #logger.info('chunk len:%d',len(chunk))
+        #         if first:
+        #             try:
+        #                 rsp = json.loads(chunk)
+        #                 #response["Code"] = rsp["Response"]["Error"]["Code"]
+        #                 #response["Message"] = rsp["Response"]["Error"]["Message"]
+        #                 logger.error("tencent tts:%s",rsp["Response"]["Error"]["Message"])
+        #                 return
+        #             except:
+        #                 end = time.perf_counter()
+        #                 logger.info(f"tencent Time to first chunk: {end-start}s")
+        #                 first = False                    
+        #         if chunk and self.state==State.RUNNING:
+        #             yield chunk
+        # except Exception as e:
+        #     logger.exception('tencent')
 
     def stream_tts(self,audio_stream,msg:tuple[str, dict]):
         text,textevent = msg

From 6460a12d5b810e204891689e9df9e13f0fbefc54 Mon Sep 17 00:00:00 2001
From: ahmedrazakhan12 <ahmedrazakhank112@gmail.com>
Date: Mon, 8 Jun 2026 22:04:09 +0500
Subject: [PATCH 2/5] refactor: replace QwenTTS remote API implementation with
 mock audio synthesis for testing

---
 tts/qwentts.py | 113 ++++++++++---------------------------------------
 1 file changed, 22 insertions(+), 91 deletions(-)

diff --git a/tts/qwentts.py b/tts/qwentts.py
index 1b69edaa..25cb00f6 100644
--- a/tts/qwentts.py
+++ b/tts/qwentts.py
@@ -45,16 +45,6 @@ def __init__(self, opt, parent):
         self.voice = opt.REF_FILE if opt.REF_FILE else 'Cherry'
         # 模型名
         self.model = getattr(opt, 'qwen_tts_model', 'qwen3-tts-flash-realtime')
-        # WebSocket URL
-        self.ws_url = getattr(opt, 'qwen_tts_url',
-                              'wss://dashscope.aliyuncs.com/api-ws/v1/realtime')
-
-        # 设置 DashScope API Key
-        api_key = getattr(opt, 'dashscope_api_key', None) or os.environ.get('DASHSCOPE_API_KEY')
-        if api_key:
-            dashscope.api_key = api_key
-        else:
-            logger.warning("QwenTTS: DASHSCOPE_API_KEY 未设置，请设置环境变量或通过参数传入")
 
         # ---------- 内部状态 ----------
         self._remainder = np.array([], dtype=np.float32)  # 上次重采样后不足一 chunk 的 16kHz 样本
@@ -63,94 +53,35 @@ def __init__(self, opt, parent):
         self._current_text = ''
         self._current_textevent = {}
 
-        # ---------- 回调类 ----------
-        tts_ref = self
-
-        class _Callback(QwenTtsRealtimeCallback):
-            def on_open(self) -> None:
-                logger.info("QwenTTS WebSocket 连接已建立")
-
-            def on_close(self, close_status_code, close_msg) -> None:
-                logger.info(f"QwenTTS WebSocket 关闭: code={close_status_code}, msg={close_msg}")
-                tts_ref._response_event.set()
-
-            def on_event(self, response: dict) -> None:
-                try:
-                    event_type = response.get('type', '')
-
-                    if event_type == 'session.created':
-                        logger.info(f"QwenTTS session: {response.get('session', {}).get('id', '')}")
-
-                    elif event_type == 'response.audio.delta':
-                        audio_b64 = response.get('delta', '')
-                        if audio_b64:
-                            pcm_data = base64.b64decode(audio_b64)
-                            tts_ref._on_audio_data(pcm_data)
-
-                    elif event_type == 'response.done':
-                        logger.info("QwenTTS response done")
-                        tts_ref._flush_remainder()
-                        tts_ref._response_event.set()
-
-                    elif event_type == 'error':
-                        logger.error(f"QwenTTS 错误: {response}")
-                        tts_ref._response_event.set()
-
-                except Exception as e:
-                    logger.exception(f"QwenTTS 回调处理异常: {e}")
-
-        # ---------- 建立唯一连接 ----------
-        self._callback = _Callback()
-        self._tts_client = QwenTtsRealtime(
-            model=self.model,
-            callback=self._callback,
-            url=self.ws_url,
-        )
-        self._tts_client.connect()
-        self._tts_client.update_session(
-            voice=self.voice,
-            response_format=AudioFormat.PCM_24000HZ_MONO_16BIT,  # Qwen TTS 只支持 24kHz 输出
-            sample_rate=16000,
-            mode='commit',
-        )
-        logger.info(f"QwenTTS 初始化完成: model={self.model}, voice={self.voice}")
+        logger.info("Mock QwenTTS initialized (no remote API connection established)")
 
     # ========================== 核心方法 ==========================
 
     def txt_to_audio(self, msg: tuple[str, dict]):
-        text, textevent = msg
-        t_start = time.perf_counter()
-
-        ref_file = textevent.get('tts', {}).get('ref_file',self.opt.REF_FILE)
-
-        # 重置状态
-        self._remainder = np.array([], dtype=np.float32)
-        self._first_chunk = True
-        self._current_text = text
-        self._current_textevent = textevent
-        self._response_event.clear()
-
         try:
-            #logger.info(f"QwenTTS 发送文本: {text[:80]}...")
-            if ref_file != self.voice:
-                logger.info(f'ref_file:{ref_file},self.voice:{self.voice}')
-                self.voice=ref_file
-                self._tts_client.close()
-                self._tts_client.connect()
-                self._tts_client.update_session(
-                    voice=self.voice,
-                    response_format=AudioFormat.PCM_24000HZ_MONO_16BIT,  # Qwen TTS 只支持 24kHz 输出
-                    sample_rate=16000,
-                    mode='commit',
-                )
-            self._tts_client.append_text(text)
-            self._tts_client.commit()
-
-            # 等待 response.done（音频在回调中流式处理）
-            self._response_event.wait(timeout=60)
+            text, textevent = msg
+            t_start = time.perf_counter()
+
+            logger.info(f"Mock QwenTTS synthesis for text: {text}")
+            
+            # Output start frame
+            eventpoint_start = {'status': 'start', 'text': text}
+            eventpoint_start.update(**textevent)
+            self.parent.put_audio_frame(np.zeros(self.chunk, np.float32), eventpoint_start)
+
+            # Output mock silence
+            for _ in range(10):
+                if self.state != State.RUNNING:
+                    break
+                self.parent.put_audio_frame(np.zeros(self.chunk, np.float32), textevent)
+
+            # Output end frame
+            eventpoint_end = {'status': 'end', 'text': text}
+            eventpoint_end.update(**textevent)
+            self.parent.put_audio_frame(np.zeros(self.chunk, np.float32), eventpoint_end)
 
             t_end = time.perf_counter()
-            logger.info(f"QwenTTS 合成完成，耗时: {t_end - t_start:.2f}s")
+            logger.info(f"Mock QwenTTS synthesis completed, time: {t_end - t_start:.2f}s")
 
         except Exception as e:
             logger.exception(f"QwenTTS txt_to_audio 异常: {e}")

From d487ffaa854d130a70e4095f30eaf9be42cfd509 Mon Sep 17 00:00:00 2001
From: ahmedrazakhan12 <ahmedrazakhank112@gmail.com>
Date: Tue, 9 Jun 2026 17:06:25 +0500
Subject: [PATCH 3/5] chore: translate web UI text to English and consolidate
 CSS styling

---
 app.py                 |    2 +-
 web/admin.html         |   96 ++--
 web/asr/index.html     |  178 +++---
 web/asr/main.js        | 1247 ++++++++++++++++++++--------------------
 web/asr/wsconnecter.js |  236 ++++----
 web/avatar.html        |   56 +-
 web/client.js          |    8 +-
 web/dashboard.html     |  117 ++--
 web/index.html         |   96 ++--
 web/tts/index.html     |  320 +++++------
 web/webrtcapi-asr.html |   14 +-
 web/webrtcapi.html     |   14 +-
 12 files changed, 1154 insertions(+), 1230 deletions(-)

diff --git a/app.py b/app.py
index ce496206..3a287cff 100644
--- a/app.py
+++ b/app.py
@@ -194,7 +194,7 @@ def main():
     elif opt.transport=='rtcpush':
         pagename='rtcpushapi.html'
     logger.info('start http server; http://<serverip>:'+str(opt.listenport)+'/'+pagename)
-    # logger.info('如果使用webrtc，推荐访问webrtc集成前端: http://<serverip>:'+str(opt.listenport)+'/dashboard.html')
+    # logger.info('If using WebRTC, it is recommended to access the WebRTC integrated frontend: http://<serverip>:'+str(opt.listenport)+'/dashboard.html')
     def run_server(runner):
         loop = asyncio.new_event_loop()
         asyncio.set_event_loop(loop)
diff --git a/web/admin.html b/web/admin.html
index 534ae389..6ebd8406 100644
--- a/web/admin.html
+++ b/web/admin.html
@@ -1,10 +1,10 @@
 <!DOCTYPE html>
-<html lang="zh-CN">
+<html lang="en">
 
 <head>
     <meta charset="UTF-8">
     <meta name="viewport" content="width=device-width, initial-scale=1.0">
-    <title>后台管理系统 - LiveTalking</title>
+    <title>Admin Console - LiveTalking</title>
     <link href="https://fonts.googleapis.com/css2?family=Inter:wght@400;500;600;700&display=swap" rel="stylesheet">
     <link href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.0/dist/css/bootstrap.min.css" rel="stylesheet">
     <link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/bootstrap-icons@1.10.0/font/bootstrap-icons.css">
@@ -119,17 +119,9 @@
         }
 
         @keyframes pulse {
-            0% {
-                box-shadow: 0 0 0 0 rgba(239, 68, 68, 0.4);
-            }
-
-            70% {
-                box-shadow: 0 0 0 6px rgba(239, 68, 68, 0);
-            }
-
-            100% {
-                box-shadow: 0 0 0 0 rgba(239, 68, 68, 0);
-            }
+            0% { box-shadow: 0 0 0 0 rgba(239, 68, 68, 0.4); }
+            70% { box-shadow: 0 0 0 6px rgba(239, 68, 68, 0); }
+            100% { box-shadow: 0 0 0 0 rgba(239, 68, 68, 0); }
         }
 
         .session-detail-item {
@@ -159,7 +151,7 @@
         }
 
         .skeleton {
-            background: linear-gradient(90deg, #f0f0f0 25%, #e0e0e0 50%, #f0f0f0 75%);
+            background: linear-gradient(90deg, #f0f0f0 25%, #e0eafc 50%, #f0f0f0 75%);
             background-size: 200% 100%;
             animation: loading 1.5s infinite;
             border-radius: 4px;
@@ -167,13 +159,8 @@
         }
 
         @keyframes loading {
-            0% {
-                background-position: 200% 0;
-            }
-
-            100% {
-                background-position: -200% 0;
-            }
+            0% { background-position: 200% 0; }
+            100% { background-position: -200% 0; }
         }
 
         .empty-state {
@@ -194,9 +181,9 @@
 <body>
     <div class="container">
         <h1 class="header-title">
-            <i class="bi bi-speedometer2"></i> LiveTalking 控制台
+            <i class="bi bi-speedometer2"></i> LiveTalking Console
             <button class="btn btn-sm btn-outline-primary ms-auto" onclick="refreshData()">
-                <i class="bi bi-arrow-clockwise"></i> 刷新数据
+                <i class="bi bi-arrow-clockwise"></i> Refresh
             </button>
         </h1>
 
@@ -205,22 +192,18 @@ <h1 class="header-title">
             <div class="col-lg-5">
                 <div class="glass-card p-4 h-100">
                     <h4 class="mb-4 d-flex align-items-center gap-2">
-                        <i class="bi bi-gear-fill text-primary"></i> 全局配置
+                        <i class="bi bi-gear-fill text-primary"></i> Global Config
                     </h4>
                     <div class="table-responsive">
                         <table class="table table-borderless config-table" id="configTable">
                             <tbody>
                                 <tr>
-                                    <th>加载中...</th>
-                                    <td>
-                                        <div class="skeleton"></div>
-                                    </td>
+                                    <th>Loading...</th>
+                                    <td><div class="skeleton"></div></td>
                                 </tr>
                                 <tr>
-                                    <th>加载中...</th>
-                                    <td>
-                                        <div class="skeleton"></div>
-                                    </td>
+                                    <th>Loading...</th>
+                                    <td><div class="skeleton"></div></td>
                                 </tr>
                             </tbody>
                         </table>
@@ -232,7 +215,7 @@ <h4 class="mb-4 d-flex align-items-center gap-2">
             <div class="col-lg-7">
                 <div class="glass-card p-4 h-100">
                     <h4 class="mb-4 d-flex align-items-center gap-2">
-                        <i class="bi bi-people-fill text-success"></i> 活跃会话
+                        <i class="bi bi-people-fill text-success"></i> Active Sessions
                         <span class="badge bg-primary ms-2 rounded-pill" id="sessionCount">0</span>
                     </h4>
 
@@ -253,15 +236,15 @@ <h4 class="mb-4 d-flex align-items-center gap-2">
 
     <script>
         const configLabels = {
-            'model': '数字人模型',
-            'avatar_id': '默认角色 ID',
-            'tts': 'TTS 引擎',
-            'REF_FILE': '语音参考',
-            'transport': '流媒体协议',
-            'listenport': '监听端口',
-            'batch_size': '推理批次 (Batch)',
-            'fps': '视频帧率 (FPS)',
-            'push_url': '推流地址'
+            'model': 'Avatar Model',
+            'avatar_id': 'Default Avatar ID',
+            'tts': 'TTS Engine',
+            'REF_FILE': 'Voice Reference',
+            'transport': 'Stream Protocol',
+            'listenport': 'Listen Port',
+            'batch_size': 'Inference Batch',
+            'fps': 'Video FPS',
+            'push_url': 'Push URL'
         };
 
         async function fetchConfig() {
@@ -299,7 +282,7 @@ <h4 class="mb-4 d-flex align-items-center gap-2">
 
             for (const [key, label] of Object.entries(configLabels)) {
                 if (config[key] !== undefined) {
-                    const val = config[key] === '' ? '<span class="text-muted">未设置</span>' : config[key];
+                    const val = config[key] === '' ? '<span class="text-muted">Not set</span>' : config[key];
                     tableBody.append(`
                         <tr>
                             <th>${label}</th>
@@ -318,8 +301,8 @@ <h4 class="mb-4 d-flex align-items-center gap-2">
                 container.append(`
                     <div class="empty-state">
                         <i class="bi bi-inbox"></i>
-                        <h5>暂无活跃的会话连接</h5>
-                        <p>当用户在前端发起连接时，此列表将自动更新。</p>
+                        <h5>No active sessions</h5>
+                        <p>Sessions will appear here when users connect.</p>
                     </div>
                 `);
                 return;
@@ -327,51 +310,48 @@ <h5>暂无活跃的会话连接</h5>
 
             sessions.forEach(session => {
                 const statusBadge = session.speaking
-                    ? `<span class="badge-status badge-speaking"><i class="bi bi-mic-fill"></i> 说话中</span>`
-                    : `<span class="badge-status badge-silent"><i class="bi bi-mic-mute-fill"></i> 静音</span>`;
+                    ? `<span class="badge-status badge-speaking"><i class="bi bi-mic-fill"></i> Speaking</span>`
+                    : `<span class="badge-status badge-silent"><i class="bi bi-mic-mute-fill"></i> Silent</span>`;
 
                 const recBadge = session.recording
-                    ? `<span class="badge-status badge-recording ms-2"><i class="bi bi-record-circle"></i> 录制中</span>`
+                    ? `<span class="badge-status badge-recording ms-2"><i class="bi bi-record-circle"></i> Recording</span>`
                     : '';
 
                 const customOptContent = session.customopt && session.customopt.length > 0
                     ? `<pre class="mt-1 p-2 bg-light border rounded text-dark" style="font-size: 0.75rem; max-height: 120px; overflow-y: auto;">${JSON.stringify(session.customopt, null, 2)}</pre>`
-                    : '<span class="text-muted">无</span>';
+                    : '<span class="text-muted">None</span>';
 
                 container.append(`
                     <div class="session-card glass-card">
                         <div class="session-header">
                             <div>
                                 <span class="session-id">SID: ${session.sessionid}</span>
-                                <div class="mt-2 text-muted" style="font-size: 0.85rem;">传输层: ${session.transport || '默认'}</div>
+                                <div class="mt-2 text-muted" style="font-size: 0.85rem;">Transport: ${session.transport || 'Default'}</div>
                             </div>
                             <div>
                                 ${statusBadge}
                                 ${recBadge}
-
                             </div>
                         </div>
                         <div class="row">
                             <div class="col-md-6">
                                 <div class="session-detail-item">
-                                    <strong>角色ID:</strong> ${session.avatar_id}
+                                    <strong>Avatar ID:</strong> ${session.avatar_id}
                                 </div>
                                 <div class="session-detail-item">
-                                    <strong>核心模型:</strong> ${session.model}
+                                    <strong>Model:</strong> ${session.model}
                                 </div>
-
                             </div>
                             <div class="col-md-6">
                                 <div class="session-detail-item">
-                                    <strong>语音参考:</strong> ${session.REF_FILE}
+                                    <strong>Voice Ref:</strong> ${session.REF_FILE}
                                 </div>
                                 <div class="session-detail-item mt-2">
-                                    <strong><i class="bi bi-sliders"></i> 动作编排:</strong>
+                                    <strong><i class="bi bi-sliders"></i> Custom Actions:</strong>
                                     ${customOptContent}
                                 </div>
                             </div>
                         </div>
-
                     </div>
                 `);
             });
@@ -380,7 +360,6 @@ <h5>暂无活跃的会话连接</h5>
         function refreshData() {
             const icon = $('.bi-arrow-clockwise');
             icon.addClass('spin');
-
             Promise.all([fetchConfig(), fetchSessions()]).finally(() => {
                 setTimeout(() => icon.removeClass('spin'), 500);
             });
@@ -391,7 +370,6 @@ <h5>暂无活跃的会话连接</h5>
         $(document).ready(() => {
             fetchConfig();
             fetchSessions();
-
             setInterval(fetchSessions, 5000);
         });
     </script>
diff --git a/web/asr/index.html b/web/asr/index.html
index 902518c8..c68e50d2 100644
--- a/web/asr/index.html
+++ b/web/asr/index.html
@@ -1,89 +1,89 @@
-<!DOCTYPE html>
-<html>
-	<head>
-		<meta charset="utf-8" />
-		<meta name="viewport" content="width=device-width,initial-scale=1" />
-		<title>语音识别</title>
- 
-	</head>
-	<body style="margin-left: 3%">
-		<script src="recorder-core.js" charset="UTF-8"></script>
-		<script src="wav.js" charset="UTF-8"></script>
-		<script src="pcm.js" charset="UTF-8"></script>
-
-		 
-		<div class="div_class_topArea">
-
-			<div class="div_class_recordControl">
-				asr服务器地址(必填):
-				<br>
-				<input id="wssip" type="text" onchange="addresschange()" style=" width: 100%;height:100%" value="wss://www.funasr.com:10096/"/>
-				<br>
-				<a id="wsslink"  href="#" onclick="window.open('https://127.0.0.1:10095/', '_blank')"><div id="info_wslink">点此处手工授权wss://127.0.0.1:10095/</div></a>
-				<br>
-			<br>  
-			<div  style="border:2px solid #ccc;">
-				选择录音模式:<br/>
-    
-        <label><input name="recoder_mode" onclick="on_recoder_mode_change()" type="radio" value="mic" checked="true"/>麦克风 </label>&nbsp;&nbsp;
-        <label><input name="recoder_mode" onclick="on_recoder_mode_change()" type="radio" value="file" />文件 </label> 
-
-				</div>
-				
-				<br>
-				 <div id="mic_mode_div" style="border:2px solid #ccc;display:block;">
-				选择asr模型模式:<br/>
-    
-      <label><input name="asr_mode" type="radio" value="2pass" checked="true"/>2pass </label>&nbsp;&nbsp;
-      <label><input name="asr_mode" type="radio" value="online" />online </label>&nbsp;&nbsp;
-      <label><input name="asr_mode" type="radio" value="offline" />offline </label>
-
-				</div>
-				
-				<div id="rec_mode_div" style="border:2px solid #ccc;display:none;">
-		 
-    
-		          <input type="file" id="upfile">
-
-				</div>
-				<br>
-				<div id="use_itn_div" style="border:2px solid #ccc;display:block;">
-					逆文本标准化(ITN):<br/>
-					<label><input name="use_itn" type="radio" value="false" checked="true"/>否 </label>&nbsp;&nbsp;
-					<label><input name="use_itn" type="radio" value="true" />是 </label>
-			   </div>
-			   <br>
-		        <div  style="border:2px solid #ccc;">
-					热词设置(一行一个关键字，空格隔开权重,如"阿里巴巴 20")：
-					<br>
-	
-	
-					<textarea rows="3"  id="varHot"  style=" width: 100%;height:100%" >阿里巴巴 20&#13;hello world 40</textarea>
-					<br>
-	
-					</div>
-				语音识别结果显示：
-				<br>
-				
-				<textarea rows="10"  id="varArea" readonly="true" style=" width: 100%;height:100%" ></textarea>
-				<br>
-                <div id="info_div">请点击开始</div>
-				<div class="div_class_buttons">
-					<button id="btnConnect">连接</button>
-					<button id="btnStart">开始</button>
-					<button id="btnStop">停止</button>
- 
-				</div>
-                
-				<audio id="audio_record" type="audio/wav" controls style="margin-top: 12px; width: 100%;"></audio>
-			</div>
-		</div>
-
- 		<script src="wsconnecter.js" charset="utf-8"></script>
-		<script src="main.js" charset="utf-8"></script>
-		
-
- 
-				
-	</body>
-</html>
+<!DOCTYPE html>
+<html>
+	<head>
+		<meta charset="utf-8" />
+		<meta name="viewport" content="width=device-width,initial-scale=1" />
+		<title>Speech Recognition (ASR)</title>
+ 
+	</head>
+	<body style="margin-left: 3%">
+		<script src="recorder-core.js" charset="UTF-8"></script>
+		<script src="wav.js" charset="UTF-8"></script>
+		<script src="pcm.js" charset="UTF-8"></script>
+
+		 
+		<div class="div_class_topArea">
+
+			<div class="div_class_recordControl">
+				ASR Server Address (Required):
+				<br>
+				<input id="wssip" type="text" onchange="addresschange()" style=" width: 100%;height:100%" value="wss://www.funasr.com:10096/"/>
+				<br>
+				<a id="wsslink"  href="#" onclick="window.open('https://127.0.0.1:10095/', '_blank')"><div id="info_wslink">Click here to manually authorize wss://127.0.0.1:10095/</div></a>
+				<br>
+			<br>  
+			<div  style="border:2px solid #ccc;">
+				Select Recording Mode:<br/>
+    
+        <label><input name="recoder_mode" onclick="on_recoder_mode_change()" type="radio" value="mic" checked="true"/>Microphone </label>&nbsp;&nbsp;
+        <label><input name="recoder_mode" onclick="on_recoder_mode_change()" type="radio" value="file" />File </label> 
+
+				</div>
+				
+				<br>
+				 <div id="mic_mode_div" style="border:2px solid #ccc;display:block;">
+				Select ASR Model Mode:<br/>
+    
+      <label><input name="asr_mode" type="radio" value="2pass" checked="true"/>2pass </label>&nbsp;&nbsp;
+      <label><input name="asr_mode" type="radio" value="online" />online </label>&nbsp;&nbsp;
+      <label><input name="asr_mode" type="radio" value="offline" />offline </label>
+
+				</div>
+				
+				<div id="rec_mode_div" style="border:2px solid #ccc;display:none;">
+		 
+    
+		          <input type="file" id="upfile">
+
+				</div>
+				<br>
+				<div id="use_itn_div" style="border:2px solid #ccc;display:block;">
+					Inverse Text Normalization (ITN):<br/>
+					<label><input name="use_itn" type="radio" value="false" checked="true"/>No </label>&nbsp;&nbsp;
+					<label><input name="use_itn" type="radio" value="true" />Yes </label>
+			   </div>
+			   <br>
+		        <div  style="border:2px solid #ccc;">
+					Hotword Settings (one keyword per line, space separated weight, e.g., "Alibaba 20"):
+					<br>
+	
+	
+					<textarea rows="3"  id="varHot"  style=" width: 100%;height:100%" >Alibaba 20&#13;hello world 40</textarea>
+					<br>
+	
+					</div>
+				Speech Recognition Results:
+				<br>
+				
+				<textarea rows="10"  id="varArea" readonly="true" style=" width: 100%;height:100%" ></textarea>
+				<br>
+                <div id="info_div">Please click Start</div>
+				<div class="div_class_buttons">
+					<button id="btnConnect">Connect</button>
+					<button id="btnStart">Start</button>
+					<button id="btnStop">Stop</button>
+ 
+				</div>
+                
+				<audio id="audio_record" type="audio/wav" controls style="margin-top: 12px; width: 100%;"></audio>
+			</div>
+		</div>
+
+ 		<script src="wsconnecter.js" charset="utf-8"></script>
+		<script src="main.js" charset="utf-8"></script>
+		
+
+ 
+				
+	</body>
+</html>
diff --git a/web/asr/main.js b/web/asr/main.js
index 3f312079..2e0ef180 100644
--- a/web/asr/main.js
+++ b/web/asr/main.js
@@ -1,625 +1,622 @@
-/**
- * Copyright FunASR (https://github.com/alibaba-damo-academy/FunASR). All Rights
- * Reserved. MIT License  (https://opensource.org/licenses/MIT)
- */
-/* 2022-2023 by zhaoming,mali aihealthx.com */
-
-
-// 连接; 定义socket连接类对象与语音对象
-var wsconnecter = new WebSocketConnectMethod({msgHandle:getJsonMessage,stateHandle:getConnState});
-var audioBlob;
-
-// 录音; 定义录音对象,wav格式
-var rec = Recorder({
-	type:"pcm",
-	bitRate:16,
-	sampleRate:16000,
-	onProcess:recProcess
-});
-
- 
- 
- 
-var sampleBuf=new Int16Array();
-// 定义按钮响应事件
-var btnStart = document.getElementById('btnStart');
-btnStart.onclick = record;
-var btnStop = document.getElementById('btnStop');
-btnStop.onclick = stop;
-btnStop.disabled = true;
-btnStart.disabled = true;
- 
-btnConnect= document.getElementById('btnConnect');
-btnConnect.onclick = start;
-
-var awsslink= document.getElementById('wsslink');
-
- 
-var rec_text="";  // for online rec asr result
-var offline_text=""; // for offline rec asr result
-var info_div = document.getElementById('info_div');
-
-var upfile = document.getElementById('upfile');
-
- 
-
-var isfilemode=false;  // if it is in file mode
-var file_ext="";
-var file_sample_rate=16000; //for wav file sample rate
-var file_data_array;  // array to save file data
- 
-var totalsend=0;
-
-
-// var now_ipaddress=window.location.href;
-// now_ipaddress=now_ipaddress.replace("https://","wss://");
-// now_ipaddress=now_ipaddress.replace("static/index.html","");
-// var localport=window.location.port;
-// now_ipaddress=now_ipaddress.replace(localport,"10095");
-// document.getElementById('wssip').value=now_ipaddress;
-addresschange();
-function addresschange()
-{   
-	
-    var Uri = document.getElementById('wssip').value; 
-	document.getElementById('info_wslink').innerHTML="点此处手工授权（IOS手机）";
-	Uri=Uri.replace(/wss/g,"https");
-	console.log("addresschange uri=",Uri);
-	
-	awsslink.onclick=function(){
-		window.open(Uri, '_blank');
-		}
-	
-}
-
-upfile.onclick=function()
-{
-		btnStart.disabled = true;
-		btnStop.disabled = true;
-		btnConnect.disabled=false;
-	
-}
-
-// from https://github.com/xiangyuecn/Recorder/tree/master
-var readWavInfo=function(bytes){
-	//读取wav文件头，统一成44字节的头
-	if(bytes.byteLength<44){
-		return null;
-	};
-	var wavView=bytes;
-	var eq=function(p,s){
-		for(var i=0;i<s.length;i++){
-			if(wavView[p+i]!=s.charCodeAt(i)){
-				return false;
-			};
-		};
-		return true;
-	};
-	
-	if(eq(0,"RIFF")&&eq(8,"WAVEfmt ")){
- 
-		var numCh=wavView[22];
-		if(wavView[20]==1 && (numCh==1||numCh==2)){//raw pcm 单或双声道
-			var sampleRate=wavView[24]+(wavView[25]<<8)+(wavView[26]<<16)+(wavView[27]<<24);
-			var bitRate=wavView[34]+(wavView[35]<<8);
-			var heads=[wavView.subarray(0,12)],headSize=12;//head只保留必要的块
-			//搜索data块的位置
-			var dataPos=0; // 44 或有更多块
-			for(var i=12,iL=wavView.length-8;i<iL;){
-				if(wavView[i]==100&&wavView[i+1]==97&&wavView[i+2]==116&&wavView[i+3]==97){//eq(i,"data")
-					heads.push(wavView.subarray(i,i+8));
-					headSize+=8;
-					dataPos=i+8;break;
-				}
-				var i0=i;
-				i+=4;
-				i+=4+wavView[i]+(wavView[i+1]<<8)+(wavView[i+2]<<16)+(wavView[i+3]<<24);
-				if(i0==12){//fmt 
-					heads.push(wavView.subarray(i0,i));
-					headSize+=i-i0;
-				}
-			}
-			if(dataPos){
-				var wavHead=new Uint8Array(headSize);
-				for(var i=0,n=0;i<heads.length;i++){
-					wavHead.set(heads[i],n);n+=heads[i].length;
-				}
-				return {
-					sampleRate:sampleRate
-					,bitRate:bitRate
-					,numChannels:numCh
-					,wavHead44:wavHead
-					,dataPos:dataPos
-				};
-			};
-		};
-	};
-	return null;
-};
-
-upfile.onchange = function () {
-　　　　　　var len = this.files.length;  
-            for(let i = 0; i < len; i++) {
-
-                let fileAudio = new FileReader();
-                fileAudio.readAsArrayBuffer(this.files[i]);  
- 
-				file_ext=this.files[i].name.split('.').pop().toLowerCase();
-                var audioblob;
-                fileAudio.onload = function() {
-                audioblob = fileAudio.result;
- 
-				 
-				 file_data_array=audioblob;
- 
-                  
-                 info_div.innerHTML='请点击连接进行识别';
- 
-                }
-
-　　　　　　　　　　fileAudio.onerror = function(e) {
-　　　　　　　　　　　　console.log('error' + e);
-　　　　　　　　　　}
-            }
-			// for wav file, we  get the sample rate
-			if(file_ext=="wav")
-            for(let i = 0; i < len; i++) {
-
-                let fileAudio = new FileReader();
-                fileAudio.readAsArrayBuffer(this.files[i]);  
-                fileAudio.onload = function() {
-                audioblob = new Uint8Array(fileAudio.result);
- 
-				// for wav file, we can get the sample rate
-				var info=readWavInfo(audioblob);
-				   console.log(info);
-				   file_sample_rate=info.sampleRate;
-	 
- 
-                }
-
-　　　　　　 
-            }
- 
-        }
-
-function play_file()
-{
-		  var audioblob=new Blob( [ new Uint8Array(file_data_array)] , {type :"audio/wav"});
-		  var audio_record = document.getElementById('audio_record');
-		  audio_record.src =  (window.URL||webkitURL).createObjectURL(audioblob); 
-          audio_record.controls=true;
-		  //audio_record.play();  //not auto play
-}
-function start_file_send()
-{
-		sampleBuf=new Uint8Array( file_data_array );
- 
-		var chunk_size=960; // for asr chunk_size [5, 10, 5]
- 
-
- 
-		
- 
-		while(sampleBuf.length>=chunk_size){
-			
-		    sendBuf=sampleBuf.slice(0,chunk_size);
-			totalsend=totalsend+sampleBuf.length;
-			sampleBuf=sampleBuf.slice(chunk_size,sampleBuf.length);
-			wsconnecter.wsSend(sendBuf);
- 
-		 
-		}
- 
-		stop();
-
- 
-
-}
- 
-	
-function on_recoder_mode_change()
-{
-            var item = null;
-            var obj = document.getElementsByName("recoder_mode");
-            for (var i = 0; i < obj.length; i++) { //遍历Radio 
-                if (obj[i].checked) {
-                    item = obj[i].value;  
-					break;
-                }
-		    
-
-           }
-		    if(item=="mic")
-			{
-				document.getElementById("mic_mode_div").style.display = 'block';
-				document.getElementById("rec_mode_div").style.display = 'none';
- 
- 
-		        btnStart.disabled = true;
-		        btnStop.disabled = true;
-		        btnConnect.disabled=false;
-				isfilemode=false;
-			}
-			else
-			{
-				document.getElementById("mic_mode_div").style.display = 'none';
-				document.getElementById("rec_mode_div").style.display = 'block';
- 
-		        btnStart.disabled = true;
-		        btnStop.disabled = true;
-		        btnConnect.disabled=true;
-			    isfilemode=true;
-				info_div.innerHTML='请点击选择文件';
-			    
-	 
-			}
-}
-
-
-function getHotwords(){
-	
-	var obj = document.getElementById("varHot");
-
-	if(typeof(obj) == 'undefined' || obj==null || obj.value.length<=0){
-	  return null;
-	}
-	let val = obj.value.toString();
-  
-	console.log("hotwords="+val);
-	let items = val.split(/[(\r\n)\r\n]+/);  //split by \r\n
-	var jsonresult = {};
-	const regexNum = /^[0-9]*$/; // test number
-	for (item of items) {
-  
-		let result = item.split(" ");
-		if(result.length>=2 && regexNum.test(result[result.length-1]))
-		{ 
-			var wordstr="";
-			for(var i=0;i<result.length-1;i++)
-				wordstr=wordstr+result[i]+" ";
-  
-			jsonresult[wordstr.trim()]= parseInt(result[result.length-1]);
-		}
-	}
-	console.log("jsonresult="+JSON.stringify(jsonresult));
-	return  JSON.stringify(jsonresult);
-
-}
-function getAsrMode(){
-
-            var item = null;
-            var obj = document.getElementsByName("asr_mode");
-            for (var i = 0; i < obj.length; i++) { //遍历Radio 
-                if (obj[i].checked) {
-                    item = obj[i].value;  
-					break;
-                }
-		    
-
-           }
-            if(isfilemode)
-			{
-				item= "offline";
-			}
-		   console.log("asr mode"+item);
-		   
-		   return item;
-}
-		   
-function handleWithTimestamp(tmptext,tmptime)
-{
-	console.log( "tmptext: " + tmptext);
-	console.log( "tmptime: " + tmptime);
-    if(tmptime==null || tmptime=="undefined" || tmptext.length<=0)
-	{
-		return tmptext;
-	}
-	tmptext=tmptext.replace(/。|？|，|、|\?|\.|\ /g, ","); // in case there are a lot of "。"
-	var words=tmptext.split(",");  // split to chinese sentence or english words
-	var jsontime=JSON.parse(tmptime); //JSON.parse(tmptime.replace(/\]\]\[\[/g, "],[")); // in case there are a lot segments by VAD
-	var char_index=0; // index for timestamp
-	var text_withtime="";
-	for(var i=0;i<words.length;i++)
-	{   
-	if(words[i]=="undefined"  || words[i].length<=0)
-	{
-		continue;
-	}
-    console.log("words===",words[i]);
-	console.log( "words: " + words[i]+",time="+jsontime[char_index][0]/1000);
-	if (/^[a-zA-Z]+$/.test(words[i]))
-	{   // if it is english
-		text_withtime=text_withtime+jsontime[char_index][0]/1000+":"+words[i]+"\n";
-		char_index=char_index+1;  //for english, timestamp unit is about a word
-	}
-	else{
-        // if it is chinese
-		text_withtime=text_withtime+jsontime[char_index][0]/1000+":"+words[i]+"\n";
-		char_index=char_index+words[i].length; //for chinese, timestamp unit is about a char
-	}
-	}
-	return text_withtime;
-	
-
-}
-
-const sleep = (delay) => new Promise((resolve) => setTimeout(resolve, delay))
-async function is_speaking() {
-	const response = await fetch('/is_speaking', {
-		body: JSON.stringify({
-			sessionid: String(parent.document.getElementById('sessionid').value),
-		}),
-		headers: {
-			'Content-Type': 'application/json'
-		},
-		method: 'POST'
-	  });
-	const data = await response.json();
-	console.log('is_speaking res:',data)
-	return data.data
-}
-
-async function waitSpeakingEnd() {
-	rec.stop() //关闭录音
-	for(let i=0;i<10;i++) {  //等待数字人开始讲话，最长等待10s
-		bspeak = await is_speaking()
-		if(bspeak) {
-			break
-		}
-		await sleep(1000)
-	}
-
-	while(true) {  //等待数字人讲话结束
-		bspeak = await is_speaking()
-		if(!bspeak) {
-			break
-		}
-		await sleep(1000)
-	}
-	await sleep(2000)
-	rec.start() 
-}
-// 语音识别结果; 对jsonMsg数据解析,将识别结果附加到编辑框中
-function getJsonMessage( jsonMsg ) {
-	//console.log(jsonMsg);
-	console.log( "message: " + JSON.parse(jsonMsg.data)['text'] );
-	var rectxt=""+JSON.parse(jsonMsg.data)['text'];
-	var asrmodel=JSON.parse(jsonMsg.data)['mode'];
-	var is_final=JSON.parse(jsonMsg.data)['is_final'];
-	var timestamp=JSON.parse(jsonMsg.data)['timestamp'];
-	if(asrmodel=="2pass-offline" || asrmodel=="offline")
-	{
-		offline_text=offline_text+rectxt.replace(/ +/g,"")+'\n'; //handleWithTimestamp(rectxt,timestamp); //rectxt; //.replace(/ +/g,"");
-		rec_text=offline_text;
-		fetch('/human', {
-            body: JSON.stringify({
-                text: rectxt.replace(/ +/g,""),
-                type: 'chat',
-				sessionid: String(parent.document.getElementById('sessionid').value),
-            }),
-            headers: {
-                'Content-Type': 'application/json'
-            },
-            method: 'POST'
-      	});
-
-		waitSpeakingEnd();
-	}
-	else
-	{
-		rec_text=rec_text+rectxt; //.replace(/ +/g,"");
-	}
-	var varArea=document.getElementById('varArea');
-	
-	varArea.value=rec_text;
-	console.log( "offline_text: " + asrmodel+","+offline_text);
-	console.log( "rec_text: " + rec_text);
-	if (isfilemode==true && is_final==true){
-		console.log("call stop ws!");
-		play_file();
-		wsconnecter.wsStop();
-        
-		info_div.innerHTML="请点击连接";
- 
-		btnStart.disabled = true;
-		btnStop.disabled = true;
-		btnConnect.disabled=false;
-	}
-	
-	 
- 
-}
-
-// 连接状态响应
-function getConnState( connState ) {
-	if ( connState === 0 ) { //on open
- 
- 
-		info_div.innerHTML='连接成功!请点击开始';
-		if (isfilemode==true){
-			info_div.innerHTML='请耐心等待,大文件等待时间更长';
-			start_file_send();
-		}
-		else
-		{
-			btnStart.disabled = false;
-			btnStop.disabled = true;
-			btnConnect.disabled=true;
-		}
-	} else if ( connState === 1 ) {
-		//stop();
-	} else if ( connState === 2 ) {
-		stop();
-		console.log( 'connecttion error' );
-		 
-		alert("连接地址"+document.getElementById('wssip').value+"失败,请检查asr地址和端口。或试试界面上手动授权，再连接。");
-		btnStart.disabled = true;
-		btnStop.disabled = true;
-		btnConnect.disabled=false;
- 
- 
-		info_div.innerHTML='请点击连接';
-	}
-}
-
-function record()
-{
- 
-		 rec.open( function(){
-		 rec.start();
-		 console.log("开始");
-			btnStart.disabled = true;
-			btnStop.disabled = false;
-			btnConnect.disabled=true;
-		 });
- 
-}
-
- 
-
-// 识别启动、停止、清空操作
-function start() {
-	
-	// 清除显示
-	clear();
-	//控件状态更新
- 	console.log("isfilemode"+isfilemode);
-    
-	//启动连接
-	var ret=wsconnecter.wsStart();
-	// 1 is ok, 0 is error
-	if(ret==1){
-		info_div.innerHTML="正在连接asr服务器，请等待...";
-		isRec = true;
-		btnStart.disabled = true;
-		btnStop.disabled = true;
-		btnConnect.disabled=true;
- 
-        return 1;
-	}
-	else
-	{
-		info_div.innerHTML="请点击开始";
-		btnStart.disabled = true;
-		btnStop.disabled = true;
-		btnConnect.disabled=false;
- 
-		return 0;
-	}
-}
-
- 
-function stop() {
-		var chunk_size = new Array( 5, 10, 5 );
-		var request = {
-			"chunk_size": chunk_size,
-			"wav_name":  "h5",
-			"is_speaking":  false,
-			"chunk_interval":10,
-			"mode":getAsrMode(),
-		};
-		console.log(request);
-		if(sampleBuf.length>0){
-		wsconnecter.wsSend(sampleBuf);
-		console.log("sampleBuf.length"+sampleBuf.length);
-		sampleBuf=new Int16Array();
-		}
-	   wsconnecter.wsSend( JSON.stringify(request) );
- 
-	  
-	
-	 
-
- 
-	// 控件状态更新
-	
-	isRec = false;
-    info_div.innerHTML="发送完数据,请等候,正在识别...";
-
-   if(isfilemode==false){
-	    btnStop.disabled = true;
-		btnStart.disabled = true;
-		btnConnect.disabled=true;
-		//wait 3s for asr result
-	  setTimeout(function(){
-		console.log("call stop ws!");
-		wsconnecter.wsStop();
-		btnConnect.disabled=false;
-		info_div.innerHTML="请点击连接";}, 3000 );
- 
- 
-	   
-	rec.stop(function(blob,duration){
-  
-		console.log(blob);
-		var audioBlob = Recorder.pcm2wav(data = {sampleRate:16000, bitRate:16, blob:blob},
-		function(theblob,duration){
-				console.log(theblob);
-		var audio_record = document.getElementById('audio_record');
-		audio_record.src =  (window.URL||webkitURL).createObjectURL(theblob); 
-        audio_record.controls=true;
-		//audio_record.play(); 
-         	
-
-	}   ,function(msg){
-		 console.log(msg);
-	}
-		);
- 
-
- 
-	},function(errMsg){
-		console.log("errMsg: " + errMsg);
-	});
-   }
-    // 停止连接
- 
-    
-
-}
-
-function clear() {
- 
-    var varArea=document.getElementById('varArea');
- 
-	varArea.value="";
-    rec_text="";
-	offline_text="";
- 
-}
-
- 
-function recProcess( buffer, powerLevel, bufferDuration, bufferSampleRate,newBufferIdx,asyncEnd ) {
-	if ( isRec === true ) {
-		var data_48k = buffer[buffer.length-1];  
- 
-		var  array_48k = new Array(data_48k);
-		var data_16k=Recorder.SampleData(array_48k,bufferSampleRate,16000).data;
- 
-		sampleBuf = Int16Array.from([...sampleBuf, ...data_16k]);
-		var chunk_size=960; // for asr chunk_size [5, 10, 5]
-		info_div.innerHTML=""+bufferDuration/1000+"s";
-		while(sampleBuf.length>=chunk_size){
-		    sendBuf=sampleBuf.slice(0,chunk_size);
-			sampleBuf=sampleBuf.slice(chunk_size,sampleBuf.length);
-			wsconnecter.wsSend(sendBuf);
-			
-			
-		 
-		}
-		
- 
-		
-	}
-}
-
-function getUseITN() {
-	var obj = document.getElementsByName("use_itn");
-	for (var i = 0; i < obj.length; i++) {
-		if (obj[i].checked) {
-			return obj[i].value === "true";
-		}
-	}
-	return false;
-}
+/**
+ * Copyright FunASR (https://github.com/alibaba-damo-academy/FunASR). All Rights
+ * Reserved. MIT License  (https://opensource.org/licenses/MIT)
+ */
+/* 2022-2023 by zhaoming,mali aihealthx.com */
+
+
+// Connection; Define socket connection and audio objects
+var wsconnecter = new WebSocketConnectMethod({msgHandle:getJsonMessage,stateHandle:getConnState});
+var audioBlob;
+
+// Recording; Define recording object, wav format
+var rec = Recorder({
+	type:"pcm",
+	bitRate:16,
+	sampleRate:16000,
+	onProcess:recProcess
+});
+
+ 
+ 
+ 
+var sampleBuf=new Int16Array();
+// Wire the Start/Stop/Connect buttons to their handlers; Start and Stop begin disabled.
+var btnStart = document.getElementById('btnStart');
+btnStart.onclick = record;
+var btnStop = document.getElementById('btnStop');
+btnStop.onclick = stop;
+btnStop.disabled = true;
+btnStart.disabled = true;
+// Declared with var so the assignment is not an implicit global (a ReferenceError in strict mode).
+var btnConnect = document.getElementById('btnConnect');
+btnConnect.onclick = start;
+
+var awsslink= document.getElementById('wsslink');
+
+ 
+var rec_text="";  // for online rec asr result
+var offline_text=""; // for offline rec asr result
+var info_div = document.getElementById('info_div');
+
+var upfile = document.getElementById('upfile');
+
+ 
+
+var isfilemode=false;  // if it is in file mode
+var file_ext="";
+var file_sample_rate=16000; //for wav file sample rate
+var file_data_array;  // array to save file data
+ 
+var totalsend=0;
+
+
+// var now_ipaddress=window.location.href;
+// now_ipaddress=now_ipaddress.replace("https://","wss://");
+// now_ipaddress=now_ipaddress.replace("static/index.html","");
+// var localport=window.location.port;
+// now_ipaddress=now_ipaddress.replace(localport,"10095");
+// document.getElementById('wssip').value=now_ipaddress;
+addresschange();
+function addresschange()
+{
+	// Re-point the "manual authorize" link at the HTTP(S) form of the ASR server
+	// address in #wssip. Runs once at script load and on every change of that input.
+	var Uri = document.getElementById('wssip').value.trim();
+	document.getElementById('info_wslink').innerHTML="Click here to manually authorize (iOS)";
+	// Rewrite only the URL scheme: /wss/g also mangled hosts or paths containing "wss".
+	Uri=Uri.replace(/^wss:\/\//i,"https://").replace(/^ws:\/\//i,"http://");
+	console.log("addresschange uri=",Uri);
+	awsslink.onclick=function(){
+		window.open(Uri, '_blank');
+	}
+}
+
+upfile.onclick=function()
+{ // Opening the file picker resets the buttons: Start/Stop disabled, Connect enabled.
+		btnStart.disabled = true;
+		btnStop.disabled = true;
+		btnConnect.disabled=false;
+	
+}
+
+// from https://github.com/xiangyuecn/Recorder/tree/master
+var readWavInfo=function(bytes){
+	// Parse a RIFF/WAVE header from a byte array (indexed per byte, e.g. a Uint8Array); returns null unless it is PCM, 1 or 2 channels, with a "data" chunk.
+	if(bytes.byteLength<44){
+		return null;
+	};
+	var wavView=bytes;
+	var eq=function(p,s){ // true when the bytes starting at offset p equal the char codes of s
+		for(var i=0;i<s.length;i++){
+			if(wavView[p+i]!=s.charCodeAt(i)){
+				return false;
+			};
+		};
+		return true;
+	};
+	// On success returns {sampleRate, bitRate, numChannels, wavHead44, dataPos}; every other path returns null.
+	if(eq(0,"RIFF")&&eq(8,"WAVEfmt ")){
+		// Byte 20 must be 1 (raw PCM, per the check below); byte 22 is the channel count.
+		var numCh=wavView[22];
+		if(wavView[20]==1 && (numCh==1||numCh==2)){//raw pcm single or dual channel
+			var sampleRate=wavView[24]+(wavView[25]<<8)+(wavView[26]<<16)+(wavView[27]<<24); // little-endian 32-bit value at offset 24
+			var bitRate=wavView[34]+(wavView[35]<<8); // little-endian 16-bit value at offset 34 (presumably bits per sample)
+			var heads=[wavView.subarray(0,12)],headSize=12;//head only retains necessary blocks
+			// Walk the chunks after the 12-byte RIFF header until the "data" chunk is found
+			var dataPos=0; // stays 0 (falsy) if no data chunk is found; otherwise offset of the first data byte
+			for(var i=12,iL=wavView.length-8;i<iL;){
+				if(wavView[i]==100&&wavView[i+1]==97&&wavView[i+2]==116&&wavView[i+3]==97){//eq(i,"data")
+					heads.push(wavView.subarray(i,i+8)); // keep the 8-byte data chunk header (id + size)
+					headSize+=8;
+					dataPos=i+8;break;
+				}
+				var i0=i;
+				i+=4; // skip the 4-byte chunk id
+				i+=4+wavView[i]+(wavView[i+1]<<8)+(wavView[i+2]<<16)+(wavView[i+3]<<24); // skip the size field plus the chunk body
+				if(i0==12){//fmt chunk (first chunk after the RIFF header) is kept whole
+					heads.push(wavView.subarray(i0,i));
+					headSize+=i-i0;
+				}
+			}
+			if(dataPos){
+				var wavHead=new Uint8Array(headSize); // RIFF header + fmt chunk + data chunk header, concatenated
+				for(var i=0,n=0;i<heads.length;i++){
+					wavHead.set(heads[i],n);n+=heads[i].length;
+				}
+				return {
+					sampleRate:sampleRate
+					,bitRate:bitRate
+					,numChannels:numCh
+					,wavHead44:wavHead
+					,dataPos:dataPos
+				};
+			};
+		};
+	};
+	return null;
+};
+
+upfile.onchange = function () {
+	// Load the selected audio file(s) for file-mode recognition: the raw bytes go
+	// into file_data_array and, for .wav files, the header sample rate is stored
+	// in file_sample_rate. With several files, whichever load finishes last wins.
+	var files = this.files;
+	var len = files.length;
+	var audioblob;
+
+	for(let i = 0; i < len; i++) {
+		let fileAudio = new FileReader();
+		fileAudio.readAsArrayBuffer(files[i]);
+
+		file_ext=files[i].name.split('.').pop().toLowerCase();
+		fileAudio.onload = function() {
+			audioblob = fileAudio.result;
+			file_data_array=audioblob;
+			info_div.innerHTML='Please click Connect to start recognition';
+		}
+
+		fileAudio.onerror = function(e) {
+			console.log('error' + e);
+		}
+	}
+
+	// for wav file, we get the sample rate (file_ext holds the last file's extension)
+	if(file_ext=="wav") {
+		for(let i = 0; i < len; i++) {
+			let fileAudio = new FileReader();
+			fileAudio.readAsArrayBuffer(files[i]);
+
+			fileAudio.onload = function() {
+				audioblob = new Uint8Array(fileAudio.result);
+				var info=readWavInfo(audioblob);
+				console.log(info);
+				// readWavInfo returns null when it cannot parse the header as PCM
+				// wav; keep the current sample rate instead of throwing on
+				// info.sampleRate.
+				if(info){
+					file_sample_rate=info.sampleRate;
+				}
+			}
+		}
+	}
+
+}
+
+function play_file()
+{ // Wrap the loaded file bytes (file_data_array) in an audio/wav Blob and point the #audio_record player at it.
+		  var audioblob=new Blob( [ new Uint8Array(file_data_array)] , {type :"audio/wav"});
+		  var audio_record = document.getElementById('audio_record');
+		  audio_record.src =  (window.URL||webkitURL).createObjectURL(audioblob); // NOTE(review): this object URL is never revoked
+          audio_record.controls=true;
+		  //audio_record.play();  //not auto play
+}
+function start_file_send()
+{
+		// Stream the loaded file (file_data_array) to the ASR server in fixed-size
+		// chunks, then call stop(), which is expected to flush whatever is left in
+		// sampleBuf and send the end-of-input request.
+		sampleBuf=new Uint8Array( file_data_array );
+		var chunk_size=960; // for asr chunk_size [5, 10, 5]
+		var offset=0;
+		// Walk the buffer by offset: re-slicing the whole remainder after every
+		// chunk copied O(n^2) bytes for large files.
+		while(sampleBuf.length-offset>=chunk_size){
+			var sendBuf=sampleBuf.slice(offset,offset+chunk_size);
+			// Count the bytes actually sent (was adding the remaining buffer length).
+			totalsend=totalsend+sendBuf.length;
+			offset=offset+chunk_size;
+			wsconnecter.wsSend(sendBuf);
+		}
+		// Leave only the unsent tail (shorter than one chunk) in sampleBuf for stop().
+		sampleBuf=sampleBuf.slice(offset);
+		stop();
+}
+ 
+	
+function on_recoder_mode_change()
+{ // Radio handler for "recoder_mode": switches the UI and isfilemode between microphone and file input.
+            var item = null;
+            var obj = document.getElementsByName("recoder_mode");
+            for (var i = 0; i < obj.length; i++) { // Find the checked radio; item stays null if none is checked
+                if (obj[i].checked) {
+                    item = obj[i].value;  
+					break;
+                }
+		    
+
+           }
+		    if(item=="mic")
+			{
+				document.getElementById("mic_mode_div").style.display = 'block';
+				document.getElementById("rec_mode_div").style.display = 'none';
+				// Microphone mode: the user may connect right away.
+ 
+		        btnStart.disabled = true;
+		        btnStop.disabled = true;
+		        btnConnect.disabled=false;
+				isfilemode=false;
+			}
+			else
+			{
+				document.getElementById("mic_mode_div").style.display = 'none';
+				document.getElementById("rec_mode_div").style.display = 'block';
+				// Any other value is treated as file mode: Connect stays disabled here (upfile.onclick re-enables it).
+		        btnStart.disabled = true;
+		        btnStop.disabled = true;
+		        btnConnect.disabled=true;
+			    isfilemode=true;
+				info_div.innerHTML='Please click to select a file';
+			    
+	 
+			}
+}
+
+
+function getHotwords(){
+	// Parse the #varHot textarea ("<word(s)> <weight>" per line) into a JSON
+	// string mapping hotword -> integer weight. Returns null when the textarea is
+	// missing or empty; lines without a trailing integer weight are skipped.
+	var obj = document.getElementById("varHot");
+
+	if(typeof(obj) == 'undefined' || obj==null || obj.value.length<=0){
+	  return null;
+	}
+	let val = obj.value.toString();
+
+	console.log("hotwords="+val);
+	// Split on line breaks only; the old class [(\r\n)\r\n] also split on "(" and ")".
+	let items = val.split(/[\r\n]+/);
+	var jsonresult = {};
+	// Require at least one digit: /^[0-9]*$/ accepted "" and produced a NaN weight.
+	const regexNum = /^[0-9]+$/;
+	for (let item of items) { // let: the bare `item` was an implicit global
+		let result = item.split(" ");
+		if(result.length>=2 && regexNum.test(result[result.length-1]))
+		{
+			// Everything before the last token is the (possibly multi-word) hotword.
+			var wordstr=result.slice(0,-1).join(" ");
+			jsonresult[wordstr.trim()]= parseInt(result[result.length-1],10);
+		}
+	}
+	console.log("jsonresult="+JSON.stringify(jsonresult));
+	return  JSON.stringify(jsonresult);
+}
+function getAsrMode(){
+            // Returns the value of the checked "asr_mode" radio, or "offline" whenever isfilemode is set.
+            var item = null;
+            var obj = document.getElementsByName("asr_mode");
+            for (var i = 0; i < obj.length; i++) { // Find the checked radio; item stays null if none is checked
+                if (obj[i].checked) {
+                    item = obj[i].value;  
+					break;
+                }
+		    
+
+           }
+            if(isfilemode)
+			{
+				item= "offline"; // file mode overrides the radio selection
+			}
+		   console.log("asr mode"+item);
+		   
+		   return item;
+}
+		   
+function handleWithTimestamp(tmptext,tmptime)
+{
+	// Pair each recognized segment with a start time and return the result as
+	// "<time>:<segment>\n" lines. tmptime is a JSON string of arrays whose first
+	// element is divided by 1000 (presumably milliseconds -> seconds). When tmptime
+	// is missing or tmptext is empty, tmptext is returned unchanged.
+	console.log( "tmptext: " + tmptext);
+	console.log( "tmptime: " + tmptime);
+	if(tmptime==null || tmptime=="undefined" || tmptext.length<=0)
+	{
+		return tmptext;
+	}
+	tmptext=tmptext.replace(/。|？|，|、|\?|\.|\ /g, ","); // in case there are a lot of "。"
+	var words=tmptext.split(",");  // split to chinese sentence or english words
+	var jsontime=JSON.parse(tmptime);
+	var char_index=0; // index for timestamp
+	var text_withtime="";
+	for(var i=0;i<words.length;i++)
+	{
+		if(words[i]=="undefined"  || words[i].length<=0)
+		{
+			continue;
+		}
+		// Stop instead of throwing when there are fewer timestamps than text units.
+		if(char_index>=jsontime.length)
+		{
+			break;
+		}
+		console.log("words===",words[i]);
+		console.log( "words: " + words[i]+",time="+jsontime[char_index][0]/1000);
+		text_withtime=text_withtime+jsontime[char_index][0]/1000+":"+words[i]+"\n";
+		// Pure-ASCII-letter words consume one timestamp; anything else (e.g. Chinese) one per character.
+		char_index=char_index+(/^[a-zA-Z]+$/.test(words[i]) ? 1 : words[i].length);
+	}
+	return text_withtime;
+}
+
+// Resolve after `delay` milliseconds.
+const sleep = (delay) => new Promise((resolve) => setTimeout(resolve, delay))
+// POST the parent page's session id to /is_speaking and return the `data` field of the JSON reply.
+async function is_speaking() {
+	const sessionid = String(parent.document.getElementById('sessionid').value);
+	const payload = JSON.stringify({ sessionid: sessionid });
+	const response = await fetch('/is_speaking', {
+		method: 'POST',
+		headers: { 'Content-Type': 'application/json' },
+		body: payload
+	});
+	const data = await response.json();
+	console.log('is_speaking res:',data)
+	return data.data
+}
+
+// Pause recording while the avatar speaks: poll is_speaking() every second until speech
+// starts (at most 10 polls) and then until it ends, wait 2 more seconds, and resume.
+async function waitSpeakingEnd() {
+	rec.stop() // Stop recording
+	try {
+		for(let i=0;i<10;i++) {  // Wait for avatar to start speaking, max 10s
+			if(await is_speaking()) {
+				break
+			}
+			await sleep(1000)
+		}
+		while(await is_speaking()) {  // Wait for avatar to finish speaking
+			await sleep(1000)
+		}
+		await sleep(2000)
+	} finally {
+		// Resume even when polling fails, so the recorder is never left stopped.
+		rec.start()
+	}
+}
+// ASR result; Parse jsonMsg data and append to text area
+// jsonMsg.data is a JSON string with 'text', 'mode' and 'is_final' fields. Offline results
+// ("2pass-offline"/"offline") are also POSTed to /human as a chat message.
+function getJsonMessage( jsonMsg ) {
+	//console.log(jsonMsg);
+	var msg=JSON.parse(jsonMsg.data); // parse once, not once per field
+	console.log( "message: " + msg['text'] );
+	var rectxt=""+msg['text'];
+	var asrmodel=msg['mode'];
+	var is_final=msg['is_final'];
+	if(asrmodel=="2pass-offline" || asrmodel=="offline")
+	{
+		var compact=rectxt.replace(/ +/g,""); // text with runs of spaces removed
+		offline_text=offline_text+compact+'\n';
+		rec_text=offline_text;
+		fetch('/human', {
+			body: JSON.stringify({
+				text: compact,
+				type: 'chat',
+				sessionid: String(parent.document.getElementById('sessionid').value),
+			}),
+			headers: {
+				'Content-Type': 'application/json'
+			},
+			method: 'POST'
+		}).catch(function(err){
+			// Report a failed request instead of leaving an unhandled rejection.
+			console.log(err);
+		});
+		// Same for the recorder pause/resume cycle, which runs in the background.
+		waitSpeakingEnd().catch(function(err){ console.log(err); });
+	}
+	else
+	{
+		rec_text=rec_text+rectxt; //.replace(/ +/g,"");
+	}
+	var varArea=document.getElementById('varArea');
+	varArea.value=rec_text;
+	console.log( "offline_text: " + asrmodel+","+offline_text);
+	console.log( "rec_text: " + rec_text);
+	if (isfilemode==true && is_final==true){
+		console.log("call stop ws!");
+		play_file();
+		wsconnecter.wsStop();
+		info_div.innerHTML="Please click Connect";
+		btnStart.disabled = true;
+		btnStop.disabled = true;
+		btnConnect.disabled=false;
+	}
+}
+
+// Connection status handler
+// connState 0 is the "on open" case, 1 is deliberately ignored, 2 is the error case.
+function getConnState( connState ) {
+	switch ( connState ) {
+		case 0: //on open
+			info_div.innerHTML='Connected successfully! Please click Start';
+			if (isfilemode!=true){
+				btnStart.disabled = false;
+				btnStop.disabled = true;
+				btnConnect.disabled=true;
+				break;
+			}
+			// File mode: start streaming the file right away.
+			info_div.innerHTML='Please wait patiently, larger files take longer';
+			start_file_send();
+			break;
+		case 1:
+			//stop();
+			break;
+		case 2:
+			// Error case: run stop(), warn the user, and re-enable only the Connect button.
+			stop();
+			console.log( 'connecttion error' );
+			alert("Connection to " + document.getElementById('wssip').value + " failed. Please check the ASR address and port, or try manually authorizing first.");
+			btnStart.disabled = true;
+			btnStop.disabled = true;
+			btnConnect.disabled=false;
+			info_div.innerHTML='Please click Connect';
+			break;
+	}
+}
+
+// Open the recorder and, once it is open, start capturing and switch the buttons to the recording state.
+function record()
+{
+	var onOpened = function(){
+		rec.start();
+		console.log("Start");
+		btnStart.disabled = true;
+		btnStop.disabled = false;
+		btnConnect.disabled=true;
+	};
+	rec.open( onOpened );
+}
+
+ 
+
+// Recognition start, stop, clear operations
+// Clear the transcript and open the ASR websocket.
+// Returns 1 when wsconnecter.wsStart() returned 1, otherwise 0.
+function start() {
+	// Clear display
+	clear();
+	// Control state update
+	console.log("isfilemode"+isfilemode);
+	// Start connection
+	var ret=wsconnecter.wsStart();
+	// 1 is ok, 0 is error
+	if(ret==1){
+		info_div.innerHTML="Connecting to ASR server, please wait...";
+		isRec = true;
+		btnStart.disabled = true;
+		btnStop.disabled = true;
+		btnConnect.disabled=true;
+		return 1;
+	}
+	else
+	{
+		// Only Connect is enabled in this state, so point the user at it
+		// (the old text said "Please click Start" while Start was disabled).
+		info_div.innerHTML="Please click Connect";
+		btnStart.disabled = true;
+		btnStop.disabled = true;
+		btnConnect.disabled=false;
+		return 0;
+	}
+}
+
+ 
+// Finish a recognition session: flush buffered audio, send the end-of-speech request,
+// and (outside file mode) close the socket after 3 s and expose the recording for playback.
+// Reads the globals sampleBuf, isfilemode, rec and wsconnecter; returns nothing.
+function stop() {
+
+	// End-of-speech request for the server: is_speaking is false.
+	var chunk_size = new Array( 5, 10, 5 );
+	var request = {
+		"chunk_size": chunk_size,
+		"wav_name":  "h5",
+		"is_speaking":  false,
+		"chunk_interval":10,
+		"mode":getAsrMode(),
+	};
+	console.log(request);
+
+	// Send whatever audio is still buffered before announcing the end of speech.
+	if(sampleBuf.length>0){
+		wsconnecter.wsSend(sampleBuf);
+		console.log("sampleBuf.length"+sampleBuf.length);
+		sampleBuf=new Int16Array();
+	}
+	wsconnecter.wsSend( JSON.stringify(request) );
+
+	// Control state update
+	isRec = false;
+	info_div.innerHTML="Data sent, please wait, recognizing...";
+
+	if(isfilemode==false){
+		btnStop.disabled = true;
+		btnStart.disabled = true;
+		btnConnect.disabled=true;
+
+		//wait 3s for asr result
+		setTimeout(function(){
+			console.log("call stop ws!");
+			wsconnecter.wsStop();
+			btnConnect.disabled=false;
+			info_div.innerHTML="Please click Connect";
+		}, 3000 );
+
+		// Stop the recorder and hand the captured blob to Recorder.pcm2wav.
+		rec.stop(function(blob,duration){
+			console.log(blob);
+
+			// Pass the options object directly: the old `data = {...}` argument
+			// assigned to an undeclared global (a ReferenceError in strict mode).
+			// The return value of pcm2wav was never used, so it is no longer stored.
+			Recorder.pcm2wav({sampleRate:16000, bitRate:16, blob:blob},
+				function(theblob,duration){
+					console.log(theblob);
+					// Offer the converted blob for playback via the 'audio_record' element.
+					var audio_record = document.getElementById('audio_record');
+					audio_record.src =  (window.URL||webkitURL).createObjectURL(theblob);
+					audio_record.controls=true;
+					//audio_record.play();
+				},
+				function(msg){
+					console.log(msg);
+				}
+			);
+
+		},function(errMsg){
+			console.log("errMsg: " + errMsg);
+		});
+
+	}
+
+}
+
+// Reset the transcript: empty the 'varArea' text area and both text buffers.
+function clear() {
+
+	document.getElementById('varArea').value="";
+
+	// Both accumulated-text globals start over together (rec_text is assigned first).
+	offline_text = rec_text = "";
+
+}
+
+ 
+// While isRec is true: resample the last element of `buffer` to 16000 Hz, append it to sampleBuf,
+// and send every complete 960-sample chunk over the websocket. Presumably the Recorder process callback.
+function recProcess( buffer, powerLevel, bufferDuration, bufferSampleRate,newBufferIdx,asyncEnd ) {
+	if ( isRec !== true ) {
+		return;
+	}
+	var data_48k = buffer[buffer.length-1];
+	var array_48k = new Array(data_48k);
+	var data_16k=Recorder.SampleData(array_48k,bufferSampleRate,16000).data;
+	// Append with typed-array copies instead of spreading both buffers into a temporary Array.
+	var merged = new Int16Array(sampleBuf.length + data_16k.length);
+	merged.set(sampleBuf, 0);
+	merged.set(data_16k, sampleBuf.length);
+	sampleBuf = merged;
+	var chunk_size=960; // for asr chunk_size [5, 10, 5]
+	info_div.innerHTML=""+bufferDuration/1000+"s";
+	while(sampleBuf.length>=chunk_size){
+		// sendBuf is declared locally; it used to leak as an implicit global.
+		var sendBuf=sampleBuf.slice(0,chunk_size);
+		sampleBuf=sampleBuf.slice(chunk_size,sampleBuf.length);
+		wsconnecter.wsSend(sendBuf);
+	}
+}
+
+// Return true only when the checked "use_itn" radio button has the value "true".
+// Returns false when no radio in the group is checked.
+function getUseITN() {
+	var radios = document.getElementsByName("use_itn");
+	var checked = Array.from(radios).find(function(radio){
+		return radio.checked;
+	});
+	return checked !== undefined && checked.value === "true";
+}
diff --git a/web/asr/wsconnecter.js b/web/asr/wsconnecter.js
index db140efc..7e2ee995 100644
--- a/web/asr/wsconnecter.js
+++ b/web/asr/wsconnecter.js
@@ -1,119 +1,119 @@
-/**
- * Copyright FunASR (https://github.com/alibaba-damo-academy/FunASR). All Rights
- * Reserved. MIT License  (https://opensource.org/licenses/MIT)
- */
-/* 2021-2023 by zhaoming,mali aihealthx.com */
-
-function WebSocketConnectMethod( config ) { //定义socket连接方法类
-
-	
-	var speechSokt;
-	var connKeeperID;
-	
-	var msgHandle = config.msgHandle;
-	var stateHandle = config.stateHandle;
-			  
-	this.wsStart = function () {
-		var Uri = document.getElementById('wssip').value; //"wss://111.205.137.58:5821/wss/" //设置wss asr online接口地址 如 wss://X.X.X.X:port/wss/
-		if(Uri.match(/wss:\S*|ws:\S*/))
-		{
-			console.log("Uri"+Uri);
-		}
-		else
-		{
-			alert("请检查wss地址正确性");
-			return 0;
-		}
- 
-		if ( 'WebSocket' in window ) {
-			speechSokt = new WebSocket( Uri ); // 定义socket连接对象
-			speechSokt.onopen = function(e){onOpen(e);}; // 定义响应函数
-			speechSokt.onclose = function(e){
-			    console.log("onclose ws!");
-			    //speechSokt.close();
-				onClose(e);
-				};
-			speechSokt.onmessage = function(e){onMessage(e);};
-			speechSokt.onerror = function(e){onError(e);};
-			return 1;
-		}
-		else {
-			alert('当前浏览器不支持 WebSocket');
-			return 0;
-		}
-	};
-	
-	// 定义停止与发送函数
-	this.wsStop = function () {
-		if(speechSokt != undefined) {
-			console.log("stop ws!");
-			speechSokt.close();
-		}
-	};
-	
-	this.wsSend = function ( oneData ) {
- 
-		if(speechSokt == undefined) return;
-		if ( speechSokt.readyState === 1 ) { // 0:CONNECTING, 1:OPEN, 2:CLOSING, 3:CLOSED
- 
-			speechSokt.send( oneData );
- 
-			
-		}
-	};
-	
-	// SOCEKT连接中的消息与状态响应
-	function onOpen( e ) {
-		// 发送json
-		var chunk_size = new Array( 5, 10, 5 );
-		var request = {
-			"chunk_size": chunk_size,
-			"wav_name":  "h5",
-			"is_speaking":  true,
-			"chunk_interval":10,
-			"itn":getUseITN(),
-			"mode":getAsrMode(),
-			
-		};
-		if(isfilemode)
-		{
-			request.wav_format=file_ext;
-			if(file_ext=="wav")
-			{
-				request.wav_format="PCM";
-				request.audio_fs=file_sample_rate;
-			}
-		}
-		
-		var hotwords=getHotwords();
- 
-		if(hotwords!=null  )
-		{
-			request.hotwords=hotwords;
-		}
-		console.log(JSON.stringify(request));
-		speechSokt.send(JSON.stringify(request));
-		console.log("连接成功");
-		stateHandle(0);
- 
-	}
-	
-	function onClose( e ) {
-		stateHandle(1);
-	}
-	
-	function onMessage( e ) {
- 
-		msgHandle( e );
-	}
-	
-	function onError( e ) {
- 
-		info_div.innerHTML="连接"+e;
-		console.log(e);
-		stateHandle(2);
-		
-	}
-    
- 
+/**
+ * Copyright FunASR (https://github.com/alibaba-damo-academy/FunASR). All Rights
+ * Reserved. MIT License  (https://opensource.org/licenses/MIT)
+ */
+/* 2021-2023 by zhaoming,mali aihealthx.com */
+
+function WebSocketConnectMethod( config ) { // Define socket connection method class
+	// config.msgHandle receives every websocket message event; config.stateHandle
+	// receives 0 after the socket opens, 1 when it closes and 2 on error.
+	var speechSokt;
+
+	var msgHandle = config.msgHandle;
+	var stateHandle = config.stateHandle;
+
+	// Open the websocket to the address typed into the 'wssip' input.
+	// Returns 1 when a socket was created, 0 when the address or browser is unusable.
+	this.wsStart = function () {
+		var Uri = document.getElementById('wssip').value; //"wss://111.205.137.58:5821/wss/" // Set wss asr online interface address e.g. wss://X.X.X.X:port/wss/
+		if(Uri.match(/wss:\S*|ws:\S*/))
+		{
+			console.log("Uri"+Uri);
+		}
+		else
+		{
+			alert("Please check that the WSS address is correct");
+			return 0;
+		}
+
+		if ( 'WebSocket' in window ) {
+			try {
+				speechSokt = new WebSocket( Uri ); // Define socket connection object
+			} catch (err) {
+				// The constructor throws on a malformed URL; report it like any other bad address.
+				console.log(err);
+				alert("Please check that the WSS address is correct");
+				return 0;
+			}
+			speechSokt.onopen = function(e){onOpen(e);}; // Define handler functions
+			speechSokt.onclose = function(e){
+				console.log("onclose ws!");
+				//speechSokt.close();
+				onClose(e);
+			};
+			speechSokt.onmessage = function(e){onMessage(e);};
+			speechSokt.onerror = function(e){onError(e);};
+			return 1;
+		}
+		else {
+			alert('WebSocket is not supported by this browser');
+			return 0;
+		}
+	};
+
+	// Define stop and send functions
+	this.wsStop = function () {
+		if(speechSokt != undefined) {
+			console.log("stop ws!");
+			speechSokt.close();
+		}
+	};
+
+	// Send oneData only while the socket is open; otherwise the data is silently dropped.
+	this.wsSend = function ( oneData ) {
+		if(speechSokt == undefined) return;
+		if ( speechSokt.readyState === 1 ) { // 0:CONNECTING, 1:OPEN, 2:CLOSING, 3:CLOSED
+			speechSokt.send( oneData );
+		}
+	};
+
+	// Message and status handlers for socket connection
+	function onOpen( e ) {
+		// Send JSON
+		var chunk_size = new Array( 5, 10, 5 );
+		var request = {
+			"chunk_size": chunk_size,
+			"wav_name":  "h5",
+			"is_speaking":  true,
+			"chunk_interval":10,
+			"itn":getUseITN(),
+			"mode":getAsrMode(),
+		};
+		if(isfilemode)
+		{
+			request.wav_format=file_ext;
+			if(file_ext=="wav")
+			{
+				request.wav_format="PCM";
+				request.audio_fs=file_sample_rate;
+			}
+		}
+
+		var hotwords=getHotwords();
+		if(hotwords!=null  )
+		{
+			request.hotwords=hotwords;
+		}
+		console.log(JSON.stringify(request));
+		speechSokt.send(JSON.stringify(request));
+		console.log("Connection successful");
+		stateHandle(0);
+	}
+
+	function onClose( e ) {
+		stateHandle(1);
+	}
+
+	function onMessage( e ) {
+		msgHandle( e );
+	}
+
+	function onError( e ) {
+		info_div.innerHTML="Connection " + e;
+		console.log(e);
+		stateHandle(2);
+
+	}
+
+
+ }
\ No newline at end of file
diff --git a/web/avatar.html b/web/avatar.html
index 0932bb6d..4ea3be3b 100644
--- a/web/avatar.html
+++ b/web/avatar.html
@@ -1,9 +1,9 @@
 <!DOCTYPE html>
-<html lang="zh-CN">
+<html lang="en">
 <head>
     <meta charset="UTF-8">
     <meta name="viewport" content="width=device-width, initial-scale=1.0">
-    <title>Avatar 生成 - LiveTalking</title>
+    <title>Avatar Creator - LiveTalking</title>
     <link href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.0/dist/css/bootstrap.min.css" rel="stylesheet">
     <link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/bootstrap-icons@1.10.0/font/bootstrap-icons.css">
     <style>
@@ -128,23 +128,23 @@
     <div class="container-fluid px-4">
         <a class="navbar-brand" href="#">
             <i class="bi bi-person-bounding-box me-2"></i>
-            LiveTalking Avatar 生成系统
+            LiveTalking Avatar Creator
         </a>
     </div>
 </nav>
 
 <div class="container">
     <div class="row">
-        <!-- 提交任务表单 -->
+        <!-- Task Form -->
         <div class="col-lg-5">
             <div class="glass-card">
                 <div class="card-header">
-                    <i class="bi bi-plus-circle-fill"></i> 创建新生成任务
+                    <i class="bi bi-plus-circle-fill"></i> Create New Task
                 </div>
                 <div class="card-body">
                     <form id="taskForm">
                         <div class="mb-3">
-                            <label class="form-label">算法模型</label>
+                            <label class="form-label">Model</label>
                             <select class="form-select" name="model" id="modelSelect" required>
                                 <option value="wav2lip">Wav2Lip</option>
                                 <option value="musetalk">MuseTalk</option>
@@ -152,22 +152,22 @@
                         </div>
                         <div class="mb-3">
                             <label class="form-label">Avatar ID</label>
-                            <input type="text" class="form-control" name="avatar_id" placeholder="如: wav2lip256_test" required>
+                            <input type="text" class="form-control" name="avatar_id" placeholder="e.g. my_avatar_001" required>
                         </div>
                         <div class="mb-3">
-                            <label class="form-label">视频文件</label>
+                            <label class="form-label">Video File</label>
                             <input type="file" class="form-control" name="video_file" accept="video/*" required>
                         </div>
 
                         <div class="mb-3">
                             <a class="text-decoration-none" data-bs-toggle="collapse" href="#advancedParams" role="button">
-                                <i class="bi bi-gear me-1"></i> 高级参数 (可选)
+                                <i class="bi bi-gear me-1"></i> Advanced (Optional)
                             </a>
                             <div class="collapse mt-2" id="advancedParams">
                                 <div class="param-group">
                                     <div class="row">
                                         <div class="col-6 mb-2">
-                                            <label class="form-label small">图像大小</label>
+                                            <label class="form-label small">Image Size</label>
                                             <input type="number" class="form-control form-control-sm" name="img_size" id="imgSizeInput" value="256">
                                         </div>
                                         <div class="col-6 mb-2">
@@ -177,11 +177,11 @@
                                     </div>
                                     <div class="row">
                                         <div class="col-6 mb-2">
-                                            <label class="form-label small">Pads (上下左右)</label>
+                                            <label class="form-label small">Pads (top bottom left right)</label>
                                             <input type="text" class="form-control form-control-sm" name="pads" value="0 10 0 0" placeholder="0 10 0 0">
                                         </div>
                                         <div class="col-6 mb-2">
-                                            <label class="form-label small">人脸检测批大小</label>
+                                            <label class="form-label small">Face Detect Batch Size</label>
                                             <input type="number" class="form-control form-control-sm" name="face_det_batch_size" value="4">
                                         </div>
                                     </div>
@@ -190,26 +190,26 @@
                         </div>
 
                         <button type="submit" class="btn btn-submit w-100 mt-2" id="submitBtn">
-                            <i class="bi bi-cloud-arrow-up-fill me-2"></i>提交生成任务
+                            <i class="bi bi-cloud-arrow-up-fill me-2"></i>Submit Task
                         </button>
                     </form>
                 </div>
             </div>
         </div>
 
-        <!-- 任务列表 -->
+        <!-- Task List -->
         <div class="col-lg-7">
             <div class="glass-card">
                 <div class="card-header">
-                    <i class="bi bi-list-task"></i> 任务列表
+                    <i class="bi bi-list-task"></i> Task List
                     <span class="refresh-spinner" id="refreshInfo">
-                        <i class="bi bi-arrow-repeat spin"></i> 自动更新中...
+                        <i class="bi bi-arrow-repeat spin"></i> Auto refreshing...
                     </span>
                 </div>
                 <div class="card-body" id="taskList" style="max-height: 600px; overflow-y: auto;">
                     <div class="text-center py-5 text-muted">
                         <div class="spinner-border spinner-border-sm me-2"></div>
-                        正在加载任务列表...
+                        Loading tasks...
                     </div>
                 </div>
             </div>
@@ -223,11 +223,10 @@
     const submitBtn = document.getElementById('submitBtn');
     const taskList = document.getElementById('taskList');
 
-    // 提交任务
     taskForm.addEventListener('submit', async (e) => {
         e.preventDefault();
         submitBtn.disabled = true;
-        submitBtn.innerHTML = '<span class="spinner-border spinner-border-sm me-2"></span>正在上传并创建任务...';
+        submitBtn.innerHTML = '<span class="spinner-border spinner-border-sm me-2"></span>Uploading & creating task...';
 
         const formData = new FormData(taskForm);
 
@@ -239,21 +238,20 @@
             const result = await response.json();
 
             if (result.code === 0) {
-                alert('任务提交成功! Task ID: ' + result.data.task_id);
+                alert('Task created! Task ID: ' + result.data.task_id);
                 refreshTasks();
             } else {
-                alert('提交失败: ' + result.msg);
+                alert('Failed: ' + result.msg);
             }
         } catch (error) {
             console.error('Error:', error);
-            alert('提交发生网络错误');
+            alert('Network error');
         } finally {
             submitBtn.disabled = false;
-            submitBtn.innerHTML = '<i class="bi bi-cloud-arrow-up-fill me-2"></i>提交生成任务';
+            submitBtn.innerHTML = '<i class="bi bi-cloud-arrow-up-fill me-2"></i>Submit Task';
         }
     });
 
-    // 刷新任务列表
     async function refreshTasks() {
         try {
             const response = await fetch('/api/avatar/tasks');
@@ -269,7 +267,7 @@
 
     function renderTasks(tasks) {
         if (!tasks || tasks.length === 0) {
-            taskList.innerHTML = '<div class="text-center py-5 text-muted">暂无任务</div>';
+            taskList.innerHTML = '<div class="text-center py-5 text-muted">No tasks yet</div>';
             return;
         }
 
@@ -309,7 +307,7 @@
                     <div class="d-flex justify-content-end mt-2">
                         ${isPending ? `
                         <button class="btn btn-sm btn-outline-danger" onclick="deleteTask('${task.task_id}')">
-                            <i class="bi bi-trash"></i> 取消任务
+                            <i class="bi bi-trash"></i> Cancel
                         </button>` : ''}
                     </div>
                 </div>
@@ -319,7 +317,7 @@
     }
 
     async function deleteTask(taskId) {
-        if (!confirm('确定要取消此 Pending 任务吗?')) return;
+        if (!confirm('Cancel this pending task?')) return;
 
         try {
             const response = await fetch(`/api/avatar/task/${taskId}`, {
@@ -332,14 +330,12 @@
                 alert(result.msg);
             }
         } catch (error) {
-            alert('删除请求失败');
+            alert('Delete request failed');
         }
     }
 
-    // 初始加载及自动定时刷新
     refreshTasks();
     setInterval(refreshTasks, 3000);
-
 </script>
 
 </body>
diff --git a/web/client.js b/web/client.js
index 8a511131..b8132b57 100644
--- a/web/client.js
+++ b/web/client.js
@@ -77,7 +77,7 @@ function stop() {
 }
 
 window.onunload = function(event) {
-    // 在这里执行你想要的操作
+    // Perform operations here
     setTimeout(() => {
         pc.close();
     }, 500);
@@ -88,10 +88,10 @@ window.onbeforeunload = function (e) {
                 pc.close();
             }, 500);
         e = e || window.event
-        // 兼容IE8和Firefox 4之前的版本
+        // Compatibility for older browser versions
         if (e) {
-          e.returnValue = '关闭提示'
+          e.returnValue = 'Are you sure you want to leave?'
         }
         // Chrome, Safari, Firefox 4+, Opera 12+ , IE 9+
-        return '关闭提示'
+        return 'Are you sure you want to leave?'
       }
\ No newline at end of file
diff --git a/web/dashboard.html b/web/dashboard.html
index 66a35f1a..e443a5b0 100644
--- a/web/dashboard.html
+++ b/web/dashboard.html
@@ -1,9 +1,9 @@
 <!DOCTYPE html>
-<html lang="zh-CN">
+<html lang="en">
 <head>
     <meta charset="UTF-8">
     <meta name="viewport" content="width=device-width, initial-scale=1.0">
-    <title>livetalking数字人交互平台</title>
+    <title>LiveTalking Interactive Platform</title>
     <link href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.0/dist/css/bootstrap.min.css" rel="stylesheet">
     <link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/bootstrap-icons@1.10.0/font/bootstrap-icons.css">
     <style>
@@ -281,18 +281,18 @@
     <div class="dashboard-container">
         <div class="row">
             <div class="col-12">
-                <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
+                <h1 class="text-center mb-4">LiveTalking Interactive Platform</h1>
             </div>
         </div>
 
         <div class="row">
-            <!-- 视频区域 -->
+            <!-- Video Area -->
             <div class="col-lg-8">
                 <div class="card">
                     <div class="card-header d-flex justify-content-between align-items-center">
                         <div>
                             <span class="status-indicator status-disconnected" id="connection-status"></span>
-                            <span id="status-text">未连接</span>
+                            <span id="status-text">Disconnected</span>
                         </div>
                     </div>
                     <div class="card-body p-0">
@@ -300,7 +300,7 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                             <video id="video" autoplay playsinline></video>
                             <div class="recording-indicator" id="recording-indicator">
                                 <div class="blink"></div>
-                                <span>录制中</span>
+                                <span>Recording</span>
                             </div>
                         </div>
                         
@@ -308,19 +308,19 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                             <div class="row">
                                 <div class="col-md-6 mb-3">
                                     <button class="btn btn-primary w-100" id="start">
-                                        <i class="bi bi-play-fill"></i> 开始连接
+                                        <i class="bi bi-play-fill"></i> Start Connection
                                     </button>
                                     <button class="btn btn-danger w-100" id="stop" style="display: none;">
-                                        <i class="bi bi-stop-fill"></i> 停止连接
+                                        <i class="bi bi-stop-fill"></i> Stop Connection
                                     </button>
                                 </div>
                                 <div class="col-md-6 mb-3">
                                     <div class="d-flex">
                                         <button class="btn btn-outline-primary flex-grow-1 me-2" id="btn_start_record">
-                                            <i class="bi bi-record-fill"></i> 开始录制
+                                            <i class="bi bi-record-fill"></i> Start Recording
                                         </button>
                                         <button class="btn btn-outline-danger flex-grow-1" id="btn_stop_record" disabled>
-                                            <i class="bi bi-stop-fill"></i> 停止录制
+                                            <i class="bi bi-stop-fill"></i> Stop Recording
                                         </button>
                                     </div>
                                 </div>
@@ -329,7 +329,7 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                             <div class="row">
                                 <div class="col-12">
                                     <div class="video-size-control">
-                                        <label for="video-size-slider" class="form-label">视频大小调节: <span id="video-size-value">100%</span></label>
+                                        <label for="video-size-slider" class="form-label">Adjust Video Size: <span id="video-size-value">100%</span></label>
                                         <input type="range" class="form-range" id="video-size-slider" min="50" max="150" value="100">
                                     </div>
                                 </div>
@@ -340,7 +340,7 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                                     <div class="col-md-12">
                                         <div class="form-check form-switch mb-3">
                                             <input class="form-check-input" type="checkbox" id="use-stun">
-                                            <label class="form-check-label" for="use-stun">使用STUN服务器</label>
+                                            <label class="form-check-label" for="use-stun">Use STUN Server</label>
                                         </div>
                                     </div>
                                 </div>
@@ -350,54 +350,54 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                 </div>
             </div>
 
-            <!-- 右侧交互 -->
+            <!-- Interaction Column -->
             <div class="col-lg-4">
                 <div class="card">
                     <div class="card-header">
                         <ul class="nav nav-tabs card-header-tabs" id="interaction-tabs" role="tablist">
                             <li class="nav-item" role="presentation">
-                                <button class="nav-link active" id="chat-tab" data-bs-toggle="tab" data-bs-target="#chat" type="button" role="tab" aria-controls="chat" aria-selected="true">对话模式</button>
+                                <button class="nav-link active" id="chat-tab" data-bs-toggle="tab" data-bs-target="#chat" type="button" role="tab" aria-controls="chat" aria-selected="true">Chat Mode</button>
                             </li>
                             <li class="nav-item" role="presentation">
-                                <button class="nav-link" id="tts-tab" data-bs-toggle="tab" data-bs-target="#tts" type="button" role="tab" aria-controls="tts" aria-selected="false">朗读模式</button>
+                                <button class="nav-link" id="tts-tab" data-bs-toggle="tab" data-bs-target="#tts" type="button" role="tab" aria-controls="tts" aria-selected="false">TTS Mode</button>
                             </li>
                         </ul>
                     </div>
                     <div class="card-body">
                         <div class="tab-content" id="interaction-tabs-content">
-                            <!-- 对话模式 -->
+                            <!-- Chat Mode -->
                             <div class="tab-pane fade show active" id="chat" role="tabpanel" aria-labelledby="chat-tab">
                                 <div class="asr-container mb-3" id="chat-messages">
                                     <div class="asr-text system-message">
-                                        系统: 欢迎使用livetalking，请点击"开始连接"按钮开始对话。
+                                        System: Welcome to LiveTalking. Click "Start Connection" to begin.
                                     </div>
                                 </div>
                                 
                                 <form id="chat-form">
                                     <div class="input-group mb-3">
-                                        <textarea class="form-control" id="chat-message" rows="3" placeholder="输入您想对数字人说的话..."></textarea>
+                                        <textarea class="form-control" id="chat-message" rows="3" placeholder="Type what you want to say to the avatar..."></textarea>
                                         <button class="btn btn-primary" type="submit">
-                                            <i class="bi bi-send"></i> 发送
+                                            <i class="bi bi-send"></i> Send
                                         </button>
                                     </div>
                                 </form>
                                 
-                                <!-- 按住说话按钮 -->
+                                <!-- Hold to Talk Button -->
                                 <div class="voice-record-btn" id="voice-record-btn">
                                     <i class="bi bi-mic-fill"></i>
                                 </div>
-                                <div class="voice-record-label">按住说话，松开发送</div>
+                                <div class="voice-record-label">Hold to talk, release to send</div>
                             </div>
                             
-                            <!-- 朗读模式 -->
+                            <!-- TTS Mode -->
                             <div class="tab-pane fade" id="tts" role="tabpanel" aria-labelledby="tts-tab">
                                 <form id="echo-form">
                                     <div class="mb-3">
-                                        <label for="message" class="form-label">输入要朗读的文本</label>
-                                        <textarea class="form-control" id="message" rows="6" placeholder="输入您想让数字人朗读的文字..."></textarea>
+                                        <label for="message" class="form-label">Enter text to read aloud</label>
+                                        <textarea class="form-control" id="message" rows="6" placeholder="Type what you want the avatar to read aloud..."></textarea>
                                     </div>
                                     <button type="submit" class="btn btn-primary w-100">
-                                        <i class="bi bi-volume-up"></i> 朗读文本
+                                        <i class="bi bi-volume-up"></i> Read Aloud
                                     </button>
                                 </form>
                             </div>
@@ -412,7 +412,7 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
         </div>
     </div>
 
-    <!-- 隐藏的会话ID -->
+    <!-- Hidden session ID -->
     <input type="hidden" id="sessionid" value="0">
 
 
@@ -436,25 +436,25 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                 switch(status) {
                     case 'connected':
                         statusIndicator.addClass('status-connected');
-                        statusText.text('已连接');
+                        statusText.text('Connected');
                         break;
                     case 'connecting':
                         statusIndicator.addClass('status-connecting');
-                        statusText.text('连接中...');
+                        statusText.text('Connecting...');
                         break;
                     case 'disconnected':
                     default:
                         statusIndicator.addClass('status-disconnected');
-                        statusText.text('未连接');
+                        statusText.text('Disconnected');
                         break;
                 }
             }
 
-            // 添加聊天消息
+            // Add Chat Message
             function addChatMessage(message, type = 'user') {
                 const messagesContainer = $('#chat-messages');
                 const messageClass = type === 'user' ? 'user-message' : 'system-message';
-                const sender = type === 'user' ? '您' : '数字人';
+                const sender = type === 'user' ? 'You' : 'Avatar';
                 
                 const messageElement = $(`
                     <div class="asr-text ${messageClass}">
@@ -466,24 +466,24 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                 messagesContainer.scrollTop(messagesContainer[0].scrollHeight);
             }
 
-            // 开始/停止按钮
+            // Start/Stop buttons
             $('#start').click(function() {
                 updateConnectionStatus('connecting');
                 start();
                 $(this).hide();
                 $('#stop').show();
                 
-                // 添加定时器检查视频流是否已加载
+                // Poll periodically to check whether the video stream has loaded
                 let connectionCheckTimer = setInterval(function() {
                     const video = document.getElementById('video');
-                    // 检查视频是否有数据
+                    // Check if video has data
                     if (video.readyState >= 3 && video.videoWidth > 0) {
                         updateConnectionStatus('connected');
                         clearInterval(connectionCheckTimer);
                     }
-                }, 2000); // 每2秒检查一次
+                }, 2000); // Check every 2s
                 
-                // 60秒后如果还是连接中状态，就停止检查
+                // Stop checking after 60s if still connecting
                 setTimeout(function() {
                     if (connectionCheckTimer) {
                         clearInterval(connectionCheckTimer);
@@ -498,7 +498,7 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                 updateConnectionStatus('disconnected');
             });
 
-            // 录制功能
+            // Recording functions
             $('#btn_start_record').click(function() {
                 console.log('Starting recording...');
                 fetch('/record', {
@@ -570,10 +570,10 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                 });
                 
                 $('#message').val('');
-                addChatMessage(`已发送朗读请求: "${message}"`, 'system');
+                addChatMessage(`Sent reading request: "${message}"`, 'system');
             });
 
-            // 聊天模式表单提交
+            // Chat form submit
             $('#chat-form').on('submit', function(e) {
                 e.preventDefault();
                 var message = $('#chat-message').val();
@@ -598,20 +598,20 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                 $('#chat-message').val('');
             });
 
-            // 按住说话功能
+            // Hold-to-talk voice recording
             let mediaRecorder;
             let audioChunks = [];
             let isRecording = false;
             let recognition;
             
-            // 检查浏览器是否支持语音识别
+            // Check speech recognition support
             const isSpeechRecognitionSupported = 'webkitSpeechRecognition' in window || 'SpeechRecognition' in window;
             
             if (isSpeechRecognitionSupported) {
                 recognition = new (window.SpeechRecognition || window.webkitSpeechRecognition)();
                 recognition.continuous = true;
                 recognition.interimResults = true;
-                recognition.lang = 'zh-CN';
+                recognition.lang = 'en-US';
                 
                 recognition.onresult = function(event) {
                     let interimTranscript = '';
@@ -632,11 +632,11 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                 };
                 
                 recognition.onerror = function(event) {
-                    console.error('语音识别错误:', event.error);
+                    console.error('Speech recognition error:', event.error);
                 };
             }
             
-            // 按住说话按钮事件
+            // Hold to talk events
             $('#voice-record-btn').on('mousedown touchstart', function(e) {
                 e.preventDefault();
                 startRecording();
@@ -646,7 +646,7 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                 }
             });
             
-            // 开始录音
+            // Start recording
             function startRecording() {
                 if (isRecording) return;
                 
@@ -672,34 +672,34 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                         }
                     })
                     .catch(function(error) {
-                        console.error('无法访问麦克风:', error);
-                        alert('无法访问麦克风，请检查浏览器权限设置。');
+                        console.error('Cannot access microphone:', error);
+                        alert('Cannot access microphone, please check browser permission settings.');
                     });
             }
 
+            // Stop recording
             function stopRecording() {
                 if (!isRecording) return;
                 
                 mediaRecorder.stop();
                 isRecording = false;
                 
-                // 停止所有音轨
+                // Stop all tracks
                 mediaRecorder.stream.getTracks().forEach(track => track.stop());
                 
-                // 视觉反馈恢复
+                // Visual feedback reset
                 $('#voice-record-btn').removeClass('recording-pulse');
                 $('#voice-record-btn').css('background-color', '');
                 
-                // 停止语音识别
+                // Stop recognition
                 if (recognition) {
                     recognition.stop();
                 }
                 
-                // 获取识别的文本并发送
+                // Get recognized text and send
                 setTimeout(function() {
                     const recognizedText = $('#chat-message').val().trim();
                     if (recognizedText) {
-                        // 发送识别的文本
                         fetch('/human', {
                             body: JSON.stringify({
                                 text: recognizedText,
@@ -719,7 +719,7 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                 }, 500); 
             }
 
-            // WebRTC 相关功能
+            // WebRTC related functions
             if (typeof window.onWebRTCConnected === 'function') {
                 const originalOnConnected = window.onWebRTCConnected;
                 window.onWebRTCConnected = function() {
@@ -732,7 +732,7 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                 };
             }
 
-            // 当连接断开时更新状态
+            // Update status on disconnect
             if (typeof window.onWebRTCDisconnected === 'function') {
                 const originalOnDisconnected = window.onWebRTCDisconnected;
                 window.onWebRTCDisconnected = function() {
@@ -745,11 +745,10 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                 };
             }
 
-            // SRS WebRTC播放功能
-            var sdk = null; // 全局处理器，用于在重新发布时进行清理
+            // SRS WebRTC playback (sdk is kept as a global handle so a previous session can be closed before replaying)
+            var sdk = null;
 
             function startPlay() {
-                // 关闭之前的连接
                 if (sdk) {
                     sdk.close();
                 }
@@ -761,10 +760,10 @@ <h1 class="text-center mb-4">livetalking数字人交互平台</h1>
                 var url = "http://" + host + ":1985/rtc/v1/whep/?app=live&stream=livestream";
                 
                 sdk.play(url).then(function(session) {
-                    console.log('WebRTC播放已启动，会话ID:', session.sessionid);
+                    console.log('WebRTC playback started, Session ID:', session.sessionid);
                 }).catch(function(reason) {
                     sdk.close();
-                    console.error('WebRTC播放失败:', reason);
+                    console.error('WebRTC playback failed:', reason);
                 });
             }
         });
diff --git a/web/index.html b/web/index.html
index 79c91ea8..adf58aad 100644
--- a/web/index.html
+++ b/web/index.html
@@ -1,9 +1,9 @@
 <!DOCTYPE html>
-<html lang="zh-CN">
+<html lang="en">
 <head>
     <meta charset="UTF-8">
     <meta name="viewport" content="width=device-width, initial-scale=1.0">
-    <title>LiveTalking - 数字人实时驱动</title>
+    <title>LiveTalking - Real-time Digital Human</title>
     <link href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.0/dist/css/bootstrap.min.css" rel="stylesheet">
     <link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/bootstrap-icons@1.10.0/font/bootstrap-icons.css">
     <style>
@@ -69,7 +69,6 @@
         .quick-link { text-decoration: none; }
         .quick-link .glass-card { transition: transform 0.3s, box-shadow 0.3s; cursor: pointer; }
         .quick-link:hover .glass-card { transform: translateY(-3px); box-shadow: 0 12px 28px rgba(0,0,0,0.1); }
-        pre { background: #1e293b; color: #e2e8f0; padding: 12px; border-radius: 8px; font-size: 0.8rem; max-height: 120px; overflow-y: auto; }
         label { font-weight: 500; font-size: 0.9rem; color: #64748b; margin-bottom: 4px; }
         .param-hint { font-size: 0.75rem; color: #94a3b8; }
         ::placeholder { color: #9ca3af !important; opacity: 1; }
@@ -81,9 +80,8 @@
 <nav class="navbar navbar-dark" style="background: linear-gradient(135deg, #4361ee, #3f37c9); box-shadow: 0 2px 10px rgba(0,0,0,0.1);">
     <div class="container-fluid px-4">
         <span class="navbar-brand"><i class="bi bi-camera-video-fill me-2"></i>LiveTalking</span>
-        <a href="/index-en.html" class="text-white-50 small text-decoration-none me-2">English</a>
         <div class="d-flex gap-2">
-            <span class="session-badge disconnected" id="statusBadge"><span class="status-dot off"></span>未连接</span>
+            <span class="session-badge disconnected" id="statusBadge"><span class="status-dot off"></span>Disconnected</span>
             <span class="text-white-50 small" id="sessionIdDisplay">SID: -</span>
         </div>
     </div>
@@ -96,8 +94,8 @@
             <a href="/avatar.html" class="quick-link" target="_blank">
                 <div class="glass-card p-3 text-center">
                     <i class="bi bi-person-bounding-box fs-2" style="color: #4361ee;"></i>
-                    <div class="fw-bold mt-2">Avatar 生成</div>
-                    <div class="small text-muted">创建数字人形象</div>
+                    <div class="fw-bold mt-2">Avatar Creator</div>
+                    <div class="small text-muted">Generate digital human avatars</div>
                 </div>
             </a>
         </div>
@@ -105,8 +103,8 @@
             <a href="/admin.html" class="quick-link" target="_blank">
                 <div class="glass-card p-3 text-center">
                     <i class="bi bi-speedometer2 fs-2" style="color: #4361ee;"></i>
-                    <div class="fw-bold mt-2">管理后台</div>
-                    <div class="small text-muted">监控会话与配置</div>
+                    <div class="fw-bold mt-2">Admin Console</div>
+                    <div class="small text-muted">Monitor sessions &amp; config</div>
                 </div>
             </a>
         </div>
@@ -114,8 +112,8 @@
             <a href="/tts/index.html" class="quick-link" target="_blank">
                 <div class="glass-card p-3 text-center">
                     <i class="bi bi-soundwave fs-2" style="color: #4361ee;"></i>
-                    <div class="fw-bold mt-2">TTS 语音管理</div>
-                    <div class="small text-muted">语音列表 · 克隆 · 合成</div>
+                    <div class="fw-bold mt-2">TTS Voice Manager</div>
+                    <div class="small text-muted">Voices · Clone · Synthesize</div>
                 </div>
             </a>
         </div>
@@ -126,7 +124,7 @@
         <div class="col-lg-7">
             <!-- 1. WebRTC Connection -->
             <div class="glass-card">
-                <div class="card-header"><i class="bi bi-broadcast"></i> WebRTC 连接</div>
+                <div class="card-header"><i class="bi bi-broadcast"></i> WebRTC Connection</div>
                 <div class="card-body">
                     <div class="row g-2 align-items-end mb-3">
                         <div class="col-md-4">
@@ -134,17 +132,17 @@
                             <input type="text" class="form-control form-control-sm" id="offerAvatar" placeholder="wav2lip256_avatar1">
                         </div>
                         <div class="col-md-4">
-                            <label class="form-label">参考音频</label>
+                            <label class="form-label">Ref Audio</label>
                             <input type="text" class="form-control form-control-sm" id="offerRefAudio" placeholder="zh-CN-YunxiaNeural">
                         </div>
                         <div class="col-md-4">
-                            <label class="form-label">参考音频文本</label>
-                            <input type="text" class="form-control form-control-sm" id="offerRefText" placeholder="参考文本（可选）">
+                            <label class="form-label">Ref Text</label>
+                            <input type="text" class="form-control form-control-sm" id="offerRefText" placeholder="Reference text (optional)">
                         </div>
                     </div>
                     <div class="d-flex gap-2">
-                        <button class="btn-primary-custom" id="btnStart" onclick="start()"><i class="bi bi-play-fill"></i> 开始连接</button>
-                        <button class="btn-danger-custom" id="btnStop" onclick="stop()" style="display:none;"><i class="bi bi-stop-fill"></i> 断开连接</button>
+                        <button class="btn-primary-custom" id="btnStart" onclick="start()"><i class="bi bi-play-fill"></i> Connect</button>
+                        <button class="btn-danger-custom" id="btnStop" onclick="stop()" style="display:none;"><i class="bi bi-stop-fill"></i> Disconnect</button>
                     </div>
                     <div class="mt-3">
                         <video id="video" autoplay playsinline muted controls></video>
@@ -158,58 +156,58 @@
         <div class="col-lg-5">
             <!-- 2. Text Driver -->
             <div class="glass-card">
-                <div class="card-header"><i class="bi bi-chat-text-fill"></i> 文本驱动 (POST /human)</div>
+                <div class="card-header"><i class="bi bi-chat-text-fill"></i> Text Driver (POST /human)</div>
                 <div class="card-body">
                     <div class="mb-2">
-                        <label class="form-label">输入文本 <span class="param-hint">(type: echo/chat)</span></label>
-                        <textarea class="form-control form-control-sm" id="txtMessage" rows="2" placeholder="输入要播报的文本...">你好，欢迎使用LiveTalking</textarea>
+                        <label class="form-label">Text <span class="param-hint">(type: echo/chat)</span></label>
+                        <textarea class="form-control form-control-sm" id="txtMessage" rows="2" placeholder="Enter text to speak...">Hello, welcome to LiveTalking</textarea>
                     </div>
                     <div class="d-flex gap-2 align-items-end">
                         <select class="form-select form-select-sm" style="width:120px;" id="txtType">
-                            <option value="echo">Echo 复读</option>
+                            <option value="echo">Echo</option>
                             <option value="chat">Chat LLM</option>
                         </select>
                         <div class="form-check form-switch">
                             <input class="form-check-input" type="checkbox" id="txtInterrupt" checked>
-                            <label class="form-check-label small">打断</label>
+                            <label class="form-check-label small">Interrupt</label>
                         </div>
-                        <button class="btn-primary-custom btn-sm ms-auto" onclick="sendText()"><i class="bi bi-send"></i> 发送</button>
-                        <button class="btn-outline-custom btn-sm" onclick="interrupt()"><i class="bi bi-stop-circle"></i> 打断</button>
+                        <button class="btn-primary-custom btn-sm ms-auto" onclick="sendText()"><i class="bi bi-send"></i> Send</button>
+                        <button class="btn-outline-custom btn-sm" onclick="interrupt()"><i class="bi bi-stop-circle"></i> Interrupt</button>
                     </div>
                 </div>
             </div>
 
-            <!-- 3. Audio Upload -->
+            <!-- 3. Audio Driver -->
             <div class="glass-card">
-                <div class="card-header"><i class="bi bi-mic-fill"></i> 音频驱动 (POST /humanaudio)</div>
+                <div class="card-header"><i class="bi bi-mic-fill"></i> Audio Driver (POST /humanaudio)</div>
                 <div class="card-body">
                     <input type="file" class="form-control form-control-sm mb-2" id="audioFile" accept="audio/*">
-                    <button class="btn-primary-custom btn-sm" onclick="uploadAudio()"><i class="bi bi-upload"></i> 上传并播放</button>
+                    <button class="btn-primary-custom btn-sm" onclick="uploadAudio()"><i class="bi bi-upload"></i> Upload &amp; Play</button>
                 </div>
             </div>
 
             <!-- 4. Recording -->
             <div class="glass-card">
-                <div class="card-header"><i class="bi bi-record-circle"></i> 录制控制 (POST /record)</div>
+                <div class="card-header"><i class="bi bi-record-circle"></i> Recording (POST /record)</div>
                 <div class="card-body">
                     <div class="d-flex gap-2">
-                        <button class="btn-outline-custom btn-sm" id="btnRecToggle" onclick="toggleRecord()"><i class="bi bi-record-circle"></i> 开始录制</button>
-                        <button class="btn-outline-custom btn-sm" id="btnDownload" onclick="downloadRecord()" disabled><i class="bi bi-download"></i> 下载录像</button>
+                        <button class="btn-outline-custom btn-sm" id="btnRecToggle" onclick="toggleRecord()"><i class="bi bi-record-circle"></i> Start Recording</button>
+                        <button class="btn-outline-custom btn-sm" id="btnDownload" onclick="downloadRecord()" disabled><i class="bi bi-download"></i> Download Video</button>
                     </div>
                 </div>
             </div>
 
             <!-- 5. Custom State -->
             <div class="glass-card">
-                <div class="card-header"><i class="bi bi-sliders"></i> 动作编排 (POST /set_audiotype)</div>
+                <div class="card-header"><i class="bi bi-sliders"></i> Custom State (POST /set_audiotype)</div>
                 <div class="card-body">
                     <div class="row g-2 align-items-end">
                         <div class="col-6">
-                            <label class="form-label">Audiotype 索引</label>
+                            <label class="form-label">Audiotype Index</label>
                             <input type="number" class="form-control form-control-sm" id="audiotypeVal" value="2" min="2">
                         </div>
                         <div class="col-6">
-                            <button class="btn-primary-custom btn-sm w-100" onclick="setAudiotype()"><i class="bi bi-arrow-right-circle"></i> 切换状态</button>
+                            <button class="btn-primary-custom btn-sm w-100" onclick="setAudiotype()"><i class="bi bi-arrow-right-circle"></i> Switch State</button>
                         </div>
                     </div>
                 </div>
@@ -227,10 +225,10 @@
     const badge = document.getElementById('statusBadge');
     if (connected) {
         badge.className = 'session-badge connected';
-        badge.innerHTML = '<span class="status-dot on"></span>已连接';
+        badge.innerHTML = '<span class="status-dot on"></span>Connected';
     } else {
         badge.className = 'session-badge disconnected';
-        badge.innerHTML = '<span class="status-dot off"></span>未连接';
+        badge.innerHTML = '<span class="status-dot off"></span>Disconnected';
     }
 }
 
@@ -239,7 +237,7 @@
     document.getElementById('sessionIdDisplay').textContent = 'SID: ' + (sid || '-');
 }
 
-// ─── WebRTC ────────────────────────────────────────────────
+// --- WebRTC ---
 function negotiate() {
     pc.addTransceiver('video', { direction: 'recvonly' });
     pc.addTransceiver('audio', { direction: 'recvonly' });
@@ -296,12 +294,12 @@
     document.getElementById('audio').srcObject = null;
 }
 
-// ─── Text ──────────────────────────────────────────────────
+// --- Text ---
 function sendText() {
     const text = document.getElementById('txtMessage').value;
     const type = document.getElementById('txtType').value;
     const interrupt = document.getElementById('txtInterrupt').checked;
-    if (!text || !sessionid) return alert('请先连接 WebRTC');
+    if (!text || !sessionid) return alert('Please connect WebRTC first');
 
     fetch('/human', {
         method: 'POST',
@@ -313,10 +311,10 @@
     });
 }
 
-// ─── Audio Upload ──────────────────────────────────────────
+// --- Audio Upload ---
 function uploadAudio() {
     const file = document.getElementById('audioFile').files[0];
-    if (!file || !sessionid) return alert('请先连接 WebRTC 并选择音频文件');
+    if (!file || !sessionid) return alert('Please connect WebRTC and select an audio file');
 
     const formData = new FormData();
     formData.append('file', file);
@@ -326,7 +324,7 @@
         .then(r => r.json()).then(d => console.log('humanaudio:', d));
 }
 
-// ─── Interrupt ─────────────────────────────────────────────
+// --- Interrupt ---
 function interrupt() {
     if (!sessionid) return;
     fetch('/interrupt_talk', {
@@ -336,9 +334,9 @@
     }).then(r => r.json()).then(d => console.log('interrupt:', d));
 }
 
-// ─── Speaking Status ───────────────────────────────────────
+// --- Speaking Status ---
 function checkSpeaking() {
-    if (!sessionid) return alert('请先连接 WebRTC');
+    if (!sessionid) return alert('Please connect WebRTC first');
     fetch('/is_speaking', {
         method: 'POST',
         headers: { 'Content-Type': 'application/json' },
@@ -346,10 +344,10 @@
     }).then(r => r.json()).then(d => alert('Speaking: ' + JSON.stringify(d.data)));
 }
 
-// ─── Recording ─────────────────────────────────────────────
+// --- Recording ---
 let recording = false;
 function toggleRecord() {
-    if (!sessionid) return alert('请先连接 WebRTC');
+    if (!sessionid) return alert('Please connect WebRTC first');
     const btn = document.getElementById('btnRecToggle');
     const type = recording ? 'end_record' : 'start_record';
     fetch('/record', {
@@ -361,11 +359,11 @@
         recording = !recording;
         if (recording) {
             btn.className = 'btn-danger-custom btn-sm';
-            btn.innerHTML = '<i class="bi bi-stop-circle"></i> 停止录制';
+            btn.innerHTML = '<i class="bi bi-stop-circle"></i> Stop Recording';
             document.getElementById('btnDownload').disabled = true;
         } else {
             btn.className = 'btn-outline-custom btn-sm';
-            btn.innerHTML = '<i class="bi bi-record-circle"></i> 开始录制';
+            btn.innerHTML = '<i class="bi bi-record-circle"></i> Start Recording';
             document.getElementById('btnDownload').disabled = false;
         }
     });
@@ -375,9 +373,9 @@
     window.open('/record/' + sessionid, '_blank');
 }
 
-// ─── Audiotype ─────────────────────────────────────────────
+// --- Audiotype ---
 function setAudiotype() {
-    if (!sessionid) return alert('请先连接 WebRTC');
+    if (!sessionid) return alert('Please connect WebRTC first');
     const val = parseInt(document.getElementById('audiotypeVal').value) || 0;
     fetch('/set_audiotype', {
         method: 'POST',
diff --git a/web/tts/index.html b/web/tts/index.html
index c79d5c2c..b8d673ee 100644
--- a/web/tts/index.html
+++ b/web/tts/index.html
@@ -1,10 +1,10 @@
 <!DOCTYPE html>
-<html lang="zh-CN">
+<html lang="en">
 
 <head>
     <meta charset="UTF-8">
     <meta name="viewport" content="width=device-width, initial-scale=1.0">
-    <title>TTS 语音管理 - LiveTalking</title>
+    <title>TTS Voice Manager - LiveTalking</title>
     <link href="https://fonts.googleapis.com/css2?family=Inter:wght@400;500;600;700&display=swap" rel="stylesheet">
     <link href="https://cdn.jsdelivr.net/npm/bootstrap@5.3.0/dist/css/bootstrap.min.css" rel="stylesheet">
     <link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/bootstrap-icons@1.10.0/font/bootstrap-icons.css">
@@ -31,13 +31,11 @@
             padding-bottom: 40px;
         }
 
-        /* Navbar */
         .navbar-custom {
             background: linear-gradient(135deg, #4361ee, #3f37c9);
             box-shadow: 0 2px 10px rgba(0, 0, 0, 0.1);
         }
 
-        /* Glass Card */
         .glass-card {
             background: var(--card-bg);
             backdrop-filter: blur(12px);
@@ -66,7 +64,6 @@
             padding: 20px;
         }
 
-        /* Buttons */
         .btn-primary-custom {
             background: linear-gradient(135deg, #4361ee, #3f37c9);
             border: none;
@@ -131,7 +128,6 @@
             box-shadow: 0 4px 14px rgba(239, 68, 68, 0.3);
         }
 
-        /* Form */
         label {
             font-weight: 500;
             font-size: 0.9rem;
@@ -149,7 +145,6 @@
             opacity: 1;
         }
 
-        /* Voice List */
         .voice-table {
             width: 100%;
             font-size: 0.9rem;
@@ -202,14 +197,12 @@
             border: 1px solid rgba(0, 0, 0, 0.06);
         }
 
-        /* Audio Player */
         .audio-preview {
             width: 100%;
             margin-top: 12px;
             border-radius: 8px;
         }
 
-        /* Loading Spinner */
         .spinner-overlay {
             display: none;
             position: fixed;
@@ -235,7 +228,6 @@
             box-shadow: 0 20px 40px rgba(0, 0, 0, 0.15);
         }
 
-        /* Toast */
         .toast-container {
             position: fixed;
             top: 20px;
@@ -277,7 +269,6 @@
             }
         }
 
-        /* Server status indicator */
         .server-status {
             display: inline-flex;
             align-items: center;
@@ -300,7 +291,6 @@
             background: #ef4444;
         }
 
-        /* Waveform animation */
         .playing-indicator {
             display: none;
             align-items: center;
@@ -362,7 +352,7 @@
     <div class="spinner-overlay" id="spinnerOverlay">
         <div class="spinner-box">
             <div class="spinner-border text-primary mb-2" role="status"></div>
-            <div class="fw-bold" id="spinnerText">处理中...</div>
+            <div class="fw-bold" id="spinnerText">Processing...</div>
         </div>
     </div>
 
@@ -372,14 +362,13 @@
     <!-- Navbar -->
     <nav class="navbar navbar-dark navbar-custom">
         <div class="container-fluid px-4">
-            <span class="navbar-brand"><i class="bi bi-soundwave me-2"></i>TTS 语音管理</span>
+            <span class="navbar-brand"><i class="bi bi-soundwave me-2"></i>TTS Voice Manager</span>
             <div class="d-flex align-items-center gap-3">
-                <a href="/tts/index-en.html" class="text-white-50 small text-decoration-none">English</a>
                 <span class="server-status text-white-50">
                     <span class="status-dot off" id="serverDot"></span>
-                    <span id="serverStatusText">未连接</span>
+                    <span id="serverStatusText">Disconnected</span>
                 </span>
-                <a href="/index.html" class="text-white-50 small text-decoration-none"><i class="bi bi-house"></i> 主页</a>
+                <a href="/index.html" class="text-white-50 small text-decoration-none"><i class="bi bi-house"></i> Home</a>
             </div>
         </div>
     </nav>
@@ -388,21 +377,21 @@
 
         <!-- Server Configuration -->
         <div class="glass-card">
-            <div class="card-header"><i class="bi bi-gear-fill"></i> 服务器配置</div>
+            <div class="card-header"><i class="bi bi-gear-fill"></i> Server Configuration</div>
             <div class="card-body">
                 <div class="row g-3 align-items-end">
                     <div class="col-md-9">
-                        <label class="form-label">TTS 服务器地址</label>
+                        <label class="form-label">TTS Server URL</label>
                         <input type="text" class="form-control" id="serverUrl"
                         placeholder="http://localhost:8091"
                         value="http://localhost:8091">
-                        <div class="param-hint mt-1">vLLM Omni 服务的 base URL（例如 http://your-server:8091）</div>
+                        <div class="param-hint mt-1">Base URL of the vLLM Omni service (e.g. http://your-server:8091)</div>
                     </div>
                     <div class="col-md-3 d-flex gap-2">
                         <button class="btn-primary-custom flex-grow-1" onclick="checkServer()">
-                            <i class="bi bi-plug"></i> 连接测试
+                            <i class="bi bi-plug"></i> Test Connection
                         </button>
-                        <button class="btn-outline-custom" onclick="saveConfig()" title="保存配置">
+                        <button class="btn-outline-custom" onclick="saveConfig()" title="Save config">
                             <i class="bi bi-floppy"></i>
                         </button>
                     </div>
@@ -416,11 +405,11 @@
                 <!-- Voice List -->
                 <div class="glass-card">
                     <div class="card-header d-flex justify-content-between align-items-center">
-                        <span><i class="bi bi-people-fill"></i> 语音列表</span>
+                        <span><i class="bi bi-people-fill"></i> Voice List</span>
                         <div class="d-flex gap-2 align-items-center">
-                            <span class="badge bg-light text-muted" id="voiceCount">0 个语音</span>
+                            <span class="badge bg-light text-muted" id="voiceCount">0 voices</span>
                             <button class="btn-outline-custom btn-sm" onclick="refreshVoices()">
-                                <i class="bi bi-arrow-clockwise"></i> 刷新
+                                <i class="bi bi-arrow-clockwise"></i> Refresh
                             </button>
                         </div>
                     </div>
@@ -428,7 +417,7 @@
                         <div class="voice-list-container" id="voiceListContainer">
                             <div class="text-center text-muted py-5">
                                 <i class="bi bi-info-circle fs-3 d-block mb-2"></i>
-                                请先连接服务器，然后点击"刷新"获取语音列表
+                                Connect to the server first, then click "Refresh" to load the voice list
                             </div>
                         </div>
                     </div>
@@ -436,44 +425,44 @@
 
                 <!-- Upload / Clone Voice -->
                 <div class="glass-card">
-                    <div class="card-header"><i class="bi bi-cloud-upload-fill"></i> 上传克隆语音</div>
+                    <div class="card-header"><i class="bi bi-cloud-upload-fill"></i> Upload Clone Voice</div>
                     <div class="card-body">
                         <form id="cloneForm" onsubmit="return false;">
                             <input type="hidden" id="cloneConsent">
                             <div class="row g-3">
                                 <div class="col-md-6">
-                                    <label class="form-label">音频样本 <span class="text-danger">*</span></label>
+                                    <label class="form-label">Audio Sample <span class="text-danger">*</span></label>
                                     <div class="input-group input-group-sm">
                                         <input type="file" class="form-control form-control-sm" id="cloneAudioFile"
                                         accept="audio/*" onchange="onAudioFileChange()">
                                         <button class="btn btn-outline-custom btn-sm" type="button" id="btnTranscribe" disabled
-                                        onclick="transcribeAudio()" title="自动识别音频文本">
-                                            <i class="bi bi-mic"></i> 识别
+                                        onclick="transcribeAudio()" title="Auto-transcribe audio">
+                                            <i class="bi bi-mic"></i> Transcribe
                                         </button>
                                     </div>
-                                    <div class="param-hint mt-1">支持 wav, mp3, flac, ogg, aac, webm, mp4（最大 10MB）</div>
+                                    <div class="param-hint mt-1">Supports wav, mp3, flac, ogg, aac, webm, mp4 (max 10MB)</div>
                                 </div>
                                 <div class="col-md-6">
-                                    <label class="form-label">语音名称 <span class="text-danger">*</span></label>
+                                    <label class="form-label">Voice Name <span class="text-danger">*</span></label>
                                     <input type="text" class="form-control form-control-sm" id="cloneName"
-                                    placeholder="例如：my_custom_voice">
-                                    <div class="param-hint mt-1">唯一名称，用于后续合成时选择</div>
+                                    placeholder="e.g. my_custom_voice">
+                                    <div class="param-hint mt-1">Unique name used to select this voice later</div>
                                 </div>
                                 <div class="col-12">
-                                    <label class="form-label">参考文本 <span class="text-danger">*</span></label>
+                                    <label class="form-label">Reference Text <span class="text-danger">*</span></label>
                                     <textarea class="form-control form-control-sm" id="cloneRefText" rows="2"
-                                    placeholder="音频样本的准确转录文本，点击音频旁的"识别"按钮自动生成"></textarea>
-                                    <div class="param-hint mt-1">提供准确的转录文本可启用更高质量的上下文克隆</div>
+                                    placeholder="Exact transcript of the audio sample; click the Transcribe button next to the audio file to auto-generate it"></textarea>
+                                    <div class="param-hint mt-1">Providing an accurate transcript enables higher-quality in-context cloning</div>
                                 </div>
                                 <div class="col-12">
-                                    <label class="form-label">说话人描述</label>
+                                    <label class="form-label">Speaker Description</label>
                                     <input type="text" class="form-control form-control-sm" id="cloneDescription"
-                                    placeholder="例如：温暖的女声旁白、沉稳的男中音（可选）">
-                                    <div class="param-hint mt-1">自由格式的语音特征描述</div>
+                                    placeholder="e.g. warm female narrator, deep male baritone (optional)">
+                                    <div class="param-hint mt-1">Free-form description of voice characteristics</div>
                                 </div>
                                 <div class="col-12">
                                     <button type="button" class="btn-primary-custom" onclick="uploadVoice()" id="btnUpload">
-                                        <i class="bi bi-cloud-upload"></i> 上传克隆
+                                        <i class="bi bi-cloud-upload"></i> Upload Clone
                                     </button>
                                 </div>
                             </div>
@@ -485,24 +474,24 @@
             <!-- Right Column: Speech Synthesis -->
             <div class="col-lg-5">
                 <div class="glass-card">
-                    <div class="card-header"><i class="bi bi-chat-text-fill"></i> 语音合成测试</div>
+                    <div class="card-header"><i class="bi bi-chat-text-fill"></i> Speech Synthesis Test</div>
                     <div class="card-body">
                         <div class="mb-3">
-                            <label class="form-label">选择语音 <span class="text-danger">*</span></label>
+                            <label class="form-label">Select Voice <span class="text-danger">*</span></label>
                             <select class="form-select form-select-sm" id="synthVoice">
-                                <option value="">-- 请先刷新语音列表 --</option>
+                                <option value="">-- Refresh voice list first --</option>
                             </select>
                         </div>
 
                         <div class="mb-3">
-                            <label class="form-label">合成文本 <span class="text-danger">*</span></label>
+                            <label class="form-label">Text to Synthesize <span class="text-danger">*</span></label>
                             <textarea class="form-control form-control-sm" id="synthText" rows="3"
-                        placeholder="输入要合成语音的文本...">你好，欢迎使用LiveTalking数字人实时驱动系统。</textarea>
+                        placeholder="Enter text to synthesize...">Hello, welcome to the LiveTalking real-time digital human system.</textarea>
                     </div>
 
                     <div class="row g-2 mb-3">
                         <div class="col-md-6">
-                            <label class="form-label">语速</label>
+                            <label class="form-label">Speed</label>
                             <div class="input-group input-group-sm">
                                 <input type="range" class="form-range" id="synthSpeed" min="0.25" max="4.0" step="0.05" value="1.0"
                                 oninput="document.getElementById('synthSpeedVal').textContent=this.value">
@@ -510,26 +499,26 @@
                             </div>
                         </div>
                         <div class="col-md-6">
-                            <label class="form-label">语言</label>
+                            <label class="form-label">Language</label>
                             <select class="form-select form-select-sm" id="synthLanguage">
-                                <option value="Auto">自动检测</option>
-                                <option value="Chinese">中文</option>
+                                <option value="Auto">Auto Detect</option>
+                                <option value="Chinese">Chinese</option>
                                 <option value="English">English</option>
-                                <option value="Japanese">日本語</option>
-                                <option value="Korean">한국어</option>
-                                <option value="German">Deutsch</option>
-                                <option value="French">Français</option>
-                                <option value="Russian">Русский</option>
-                                <option value="Portuguese">Português</option>
-                                <option value="Spanish">Español</option>
-                                <option value="Italian">Italiano</option>
+                                <option value="Japanese">Japanese</option>
+                                <option value="Korean">Korean</option>
+                                <option value="German">German</option>
+                                <option value="French">French</option>
+                                <option value="Russian">Russian</option>
+                                <option value="Portuguese">Portuguese</option>
+                                <option value="Spanish">Spanish</option>
+                                <option value="Italian">Italian</option>
                             </select>
                         </div>
                     </div>
 
                     <div class="row g-2 mb-3">
                         <div class="col-md-6">
-                            <label class="form-label">输出格式</label>
+                            <label class="form-label">Output Format</label>
                             <select class="form-select form-select-sm" id="synthFormat">
                                 <option value="wav">WAV</option>
                                 <option value="mp3">MP3</option>
@@ -540,35 +529,35 @@
                             </select>
                         </div>
                         <div class="col-md-6">
-                            <label class="form-label">任务类型</label>
+                            <label class="form-label">Task Type</label>
                             <select class="form-select form-select-sm" id="synthTaskType">
                                 <option value="CustomVoice">CustomVoice</option>
                                 <option value="VoiceDesign">VoiceDesign</option>
-                                <option value="Base">Base（需克隆语音）</option>
+                                <option value="Base">Base (requires cloned voice)</option>
                             </select>
                         </div>
                     </div>
 
                     <div class="mb-3">
-                        <label class="form-label">语音指令 <span class="param-hint">(可选)</span></label>
+                        <label class="form-label">Voice Instructions <span class="param-hint">(optional)</span></label>
                         <input type="text" class="form-control form-control-sm" id="synthInstructions"
-                        placeholder="例如：用愉快的语气、放慢语速、带有疑问的语气">
-                        <div class="param-hint mt-1">描述语音风格、情感或说话方式</div>
+                        placeholder="e.g. Speak in a cheerful tone, slow down, sound questioning">
+                        <div class="param-hint mt-1">Describe the voice style, emotion, or delivery</div>
                     </div>
 
                     <div class="d-flex gap-2">
                         <button class="btn-primary-custom flex-grow-1" onclick="synthesize()" id="btnSynthesize">
-                            <i class="bi bi-play-fill"></i> 合成语音
+                            <i class="bi bi-play-fill"></i> Synthesize
                         </button>
                         <button class="btn-outline-custom" onclick="downloadAudio()" id="btnDownload" disabled>
-                            <i class="bi bi-download"></i> 下载
+                            <i class="bi bi-download"></i> Download
                         </button>
                     </div>
 
                     <!-- Audio Preview -->
                     <div id="audioPreviewSection" style="display:none; margin-top:16px;">
                         <div class="d-flex align-items-center gap-2 mb-2">
-                            <span class="fw-bold small">合成结果</span>
+                            <span class="fw-bold small">Synthesis Result</span>
                             <div class="playing-indicator" id="playingIndicator">
                                 <div class="wave-bar"></div>
                                 <div class="wave-bar"></div>
@@ -581,36 +570,36 @@
                     </div>
                 </div>
             </div>
-        </div>
 
-        <!-- Advanced: Ref Audio Settings -->
-        <div class="glass-card" id="refAudioCard" style="display:none;">
-            <div class="card-header"><i class="bi bi-sliders"></i> 高级：参考音频设置 (Base 模式)</div>
-            <div class="card-body">
-                <div class="row g-3">
-                    <div class="col-md-4">
-                        <label class="form-label">参考音频 URL</label>
-                        <input type="text" class="form-control form-control-sm" id="refAudioUrl"
-                        placeholder="http://... 或 data:audio/wav;base64,...">
-                        <div class="param-hint mt-1">远程 URL 或 base64 data URL</div>
-                    </div>
-                    <div class="col-md-4">
-                        <label class="form-label">参考文本</label>
-                        <input type="text" class="form-control form-control-sm" id="refText"
-                        placeholder="参考音频的转录文本">
-                    </div>
-                    <div class="col-md-4 d-flex align-items-end">
-                        <div class="form-check form-switch">
-                            <input class="form-check-input" type="checkbox" id="xVectorOnly">
-                            <label class="form-check-label small">仅使用 X-Vector 模式 <span class="param-hint">(更快，质量略低)</span></label>
+            <!-- Advanced: Ref Audio Settings -->
+            <div class="glass-card" id="refAudioCard" style="display:none;">
+                <div class="card-header"><i class="bi bi-sliders"></i> Advanced: Reference Audio Settings (Base Mode)</div>
+                <div class="card-body">
+                    <div class="row g-3">
+                        <div class="col-md-4">
+                            <label class="form-label">Reference Audio URL</label>
+                            <input type="text" class="form-control form-control-sm" id="refAudioUrl"
+                            placeholder="http://... or data:audio/wav;base64,...">
+                            <div class="param-hint mt-1">Remote URL or base64 data URL</div>
+                        </div>
+                        <div class="col-md-4">
+                            <label class="form-label">Reference Text</label>
+                            <input type="text" class="form-control form-control-sm" id="refText"
+                            placeholder="Transcript of reference audio">
+                        </div>
+                        <div class="col-md-4 d-flex align-items-end">
+                            <div class="form-check form-switch">
+                                <input class="form-check-input" type="checkbox" id="xVectorOnly">
+                                <label class="form-check-label small">X-Vector Only Mode <span class="param-hint">(faster, slightly lower quality)</span></label>
+                            </div>
                         </div>
                     </div>
                 </div>
             </div>
         </div>
-    </div>
 
-        <!-- Hidden audio blob store -->
+        </div>
+
         <script>
             // ==================== State ====================
             let audioBlob = null;
@@ -622,7 +611,7 @@
                 return document.getElementById('serverUrl').value.replace(/\/+$/, '');
             }
 
-            function showSpinner(text = '处理中...') {
+            function showSpinner(text = 'Processing...') {
                 document.getElementById('spinnerText').textContent = text;
                 document.getElementById('spinnerOverlay').classList.add('show');
             }
@@ -649,10 +638,10 @@
                 const text = document.getElementById('serverStatusText');
                 if (connected) {
                     dot.className = 'status-dot on';
-                    text.textContent = '已连接';
+                    text.textContent = 'Connected';
                 } else {
                     dot.className = 'status-dot off';
-                    text.textContent = '未连接';
+                    text.textContent = 'Disconnected';
                 }
             }
 
@@ -662,7 +651,7 @@
                     serverUrl: document.getElementById('serverUrl').value,
                 };
                 localStorage.setItem('tts_config', JSON.stringify(config));
-                showToast('<i class="bi bi-check-circle me-1"></i>配置已保存到本地', 'success');
+                showToast('<i class="bi bi-check-circle me-1"></i>Configuration saved locally', 'success');
             }
 
             function loadConfig() {
@@ -679,11 +668,11 @@
             async function checkServer() {
                 const baseUrl = getBaseUrl();
                 if (!baseUrl) {
-                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>请输入服务器地址', 'error');
+                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>Please enter server URL', 'error');
                     return;
                 }
 
-                showSpinner('正在连接服务器...');
+                showSpinner('Connecting to server...');
                 setServerStatus(false);
 
                 try {
@@ -700,14 +689,14 @@
                         setServerStatus(true);
                         const presetCount = data.voices?.filter(v => !(data.uploaded_voices || []).map(u => u.name).includes(v)).length || 0;
                         const uploadCount = data.uploaded_voices?.length || 0;
-                        showToast(`<i class="bi bi-check-circle me-1"></i>连接成功！发现 ${presetCount} 个预设语音，${uploadCount} 个已上传语音`, 'success');
+                        showToast(`<i class="bi bi-check-circle me-1"></i>Connected! Found ${presetCount} preset and ${uploadCount} uploaded voices`, 'success');
                     } else {
                         const errText = await resp.text();
-                        showToast(`<i class="bi bi-x-circle me-1"></i>服务器返回错误: ${resp.status} ${resp.statusText}`, 'error');
+                        showToast(`<i class="bi bi-x-circle me-1"></i>Server error: ${resp.status} ${resp.statusText}`, 'error');
                         console.error('Server check failed:', resp.status, errText);
                     }
                 } catch (e) {
-                    showToast(`<i class="bi bi-x-circle me-1"></i>无法连接到服务器: ${e.message}`, 'error');
+                    showToast(`<i class="bi bi-x-circle me-1"></i>Cannot connect: ${e.message}`, 'error');
                     console.error('Connection error:', e);
                 } finally {
                     hideSpinner();
@@ -718,11 +707,11 @@
             async function refreshVoices() {
                 const baseUrl = getBaseUrl();
                 if (!baseUrl) {
-                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>请先配置服务器地址', 'error');
+                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>Please configure server URL first', 'error');
                     return;
                 }
 
-                showSpinner('正在获取语音列表...');
+                showSpinner('Fetching voice list...');
 
                 try {
                     const resp = await fetch(`${baseUrl}/v1/audio/voices`);
@@ -740,9 +729,9 @@
                     const uploadedNames = (data.uploaded_voices || []).map(v => v.name);
                     const presetCount = (data.voices || []).filter(v => !uploadedNames.includes(v)).length;
                     const total = presetCount + (data.uploaded_voices?.length || 0);
-                    showToast(`<i class="bi bi-check-circle me-1"></i>已刷新，共 ${total} 个语音`, 'success');
+                    showToast(`<i class="bi bi-check-circle me-1"></i>Refreshed, ${total} voices total`, 'success');
                 } catch (e) {
-                    showToast(`<i class="bi bi-x-circle me-1"></i>获取失败: ${e.message}`, 'error');
+                    showToast(`<i class="bi bi-x-circle me-1"></i>Failed: ${e.message}`, 'error');
                     console.error('Refresh voices error:', e);
                 } finally {
                     hideSpinner();
@@ -758,13 +747,13 @@
                 const presetVoices = (data.voices || []).filter(v => !uploadedNames.has(v));
                 const total = presetVoices.length + uploadedVoices.length;
 
-                countEl.textContent = `${total} 个语音`;
+                countEl.textContent = `${total} voice${total !== 1 ? 's' : ''}`;
 
                 if (total === 0) {
                     container.innerHTML = `
                             <div class="text-center text-muted py-5">
                                 <i class="bi bi-inbox fs-3 d-block mb-2"></i>
-                                暂无语音，请上传克隆语音
+                                No voices yet, upload a clone voice to get started
                             </div>`;
                     return;
                 }
@@ -773,46 +762,44 @@
                         <table class="voice-table table table-borderless mb-0">
                             <thead>
                                 <tr>
-                                    <th>名称</th>
-                                    <th>类型</th>
-                                    <th>描述 / 参考文本</th>
-                                    <th>操作</th>
+                                    <th>Name</th>
+                                    <th>Type</th>
+                                    <th>Description / Ref Text</th>
+                                    <th>Actions</th>
                                 </tr>
                             </thead>
                             <tbody>`;
 
-                // Preset voices
                 for (const v of presetVoices) {
                     html += `
                                 <tr>
                                     <td><strong>${escapeHtml(v)}</strong></td>
-                                    <td><span class="badge-preset">预设</span></td>
+                                    <td><span class="badge-preset">Preset</span></td>
                                     <td><span class="text-muted small">—</span></td>
                                     <td>
-                                        <button class="btn btn-sm btn-outline-custom py-0 px-2" onclick="selectVoice('${escapeHtml(v)}')" title="选用此语音">
+                                        <button class="btn btn-sm btn-outline-custom py-0 px-2" onclick="selectVoice('${escapeHtml(v)}')" title="Use this voice">
                                             <i class="bi bi-check2"></i>
                                         </button>
                                     </td>
                                 </tr>`;
                 }
 
-                // Uploaded voices
                 for (const v of uploadedVoices) {
                     const desc = v.speaker_description || v.ref_text || '—';
-                    const created = v.created_at ? new Date(v.created_at * 1000).toLocaleDateString('zh-CN') : '';
+                    const created = v.created_at ? new Date(v.created_at * 1000).toLocaleDateString('en-US') : '';
                     html += `
                                 <tr>
                                     <td><strong>${escapeHtml(v.name)}</strong></td>
-                                    <td><span class="badge-uploaded">已上传</span></td>
+                                    <td><span class="badge-uploaded">Uploaded</span></td>
                                     <td>
                                         <span class="small">${escapeHtml(desc)}</span>
                                         ${created ? `<br><span class="param-hint">${created}</span>` : ''}
                                     </td>
                                     <td>
-                                        <button class="btn btn-sm btn-outline-custom py-0 px-2" onclick="selectVoice('${escapeHtml(v.name)}')" title="选用此语音">
+                                        <button class="btn btn-sm btn-outline-custom py-0 px-2" onclick="selectVoice('${escapeHtml(v.name)}')" title="Use this voice">
                                             <i class="bi bi-check2"></i>
                                         </button>
-                                        <button class="btn btn-sm text-danger py-0 px-1" onclick="deleteVoice('${escapeHtml(v.name)}')" title="删除此语音">
+                                        <button class="btn btn-sm text-danger py-0 px-1" onclick="deleteVoice('${escapeHtml(v.name)}')" title="Delete this voice">
                                             <i class="bi bi-trash3"></i>
                                         </button>
                                     </td>
@@ -825,7 +812,7 @@
 
             function populateVoiceSelect(data) {
                 const select = document.getElementById('synthVoice');
-                select.innerHTML = '<option value="">-- 请选择语音 --</option>';
+                select.innerHTML = '<option value="">-- Select a voice --</option>';
 
                 const uploadedVoices = data.uploaded_voices || [];
                 const uploadedNames = new Set(uploadedVoices.map(v => v.name));
@@ -833,7 +820,7 @@
 
                 if (presetVoices.length > 0) {
                     const optgroup = document.createElement('optgroup');
-                    optgroup.label = '预设语音';
+                    optgroup.label = 'Preset Voices';
                     for (const v of presetVoices) {
                         const opt = document.createElement('option');
                         opt.value = v;
@@ -845,7 +832,7 @@
 
                 if (uploadedVoices.length > 0) {
                     const optgroup = document.createElement('optgroup');
-                    optgroup.label = '已上传语音';
+                    optgroup.label = 'Uploaded Voices';
                     for (const v of uploadedVoices) {
                         const opt = document.createElement('option');
                         opt.value = v.name;
@@ -858,35 +845,32 @@
 
             function selectVoice(name) {
                 document.getElementById('synthVoice').value = name;
-                // Scroll to synth card
                 document.getElementById('synthText').focus();
-                showToast(`<i class="bi bi-check-circle me-1"></i>已选用语音: ${name}`, 'info');
+                showToast(`<i class="bi bi-check-circle me-1"></i>Selected voice: ${name}`, 'info');
             }
 
             async function deleteVoice(name) {
-                if (!confirm(`确定要删除语音 "${name}" 吗？此操作不可撤销。`)) return;
+                if (!confirm(`Are you sure you want to delete voice "${name}"? This cannot be undone.`)) return;
 
                 const baseUrl = getBaseUrl();
-                showSpinner('正在删除语音...');
+                showSpinner('Deleting voice...');
 
                 try {
-                    // Try DELETE method on the voice endpoint
                     const resp = await fetch(`${baseUrl}/v1/audio/voices/${encodeURIComponent(name)}`, {
                         method: 'DELETE',
                     });
 
                     if (resp.ok) {
-                        showToast(`<i class="bi bi-check-circle me-1"></i>语音 "${name}" 已删除`, 'success');
+                        showToast(`<i class="bi bi-check-circle me-1"></i>Voice "${name}" deleted`, 'success');
                         await refreshVoices();
                     } else if (resp.status === 404 || resp.status === 405) {
-                        // Some implementations might not support DELETE, try alternative
-                        showToast(`<i class="bi bi-info-circle me-1"></i>服务器不支持删除操作，请手动管理`, 'info');
+                        showToast(`<i class="bi bi-info-circle me-1"></i>Server does not support delete, please manage manually`, 'info');
                     } else {
                         const errText = await resp.text();
                         throw new Error(`${resp.status}: ${errText}`);
                     }
                 } catch (e) {
-                    showToast(`<i class="bi bi-x-circle me-1"></i>删除失败: ${e.message}`, 'error');
+                    showToast(`<i class="bi bi-x-circle me-1"></i>Delete failed: ${e.message}`, 'error');
                 } finally {
                     hideSpinner();
                 }
@@ -908,22 +892,22 @@
                 const btnTranscribe = document.getElementById('btnTranscribe');
 
                 if (!fileInput.files || fileInput.files.length === 0) {
-                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>请先选择音频文件', 'error');
+                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>Please select an audio file first', 'error');
                     return;
                 }
 
                 // Check for browser SpeechRecognition support
                 const SpeechRecognition = window.SpeechRecognition || window.webkitSpeechRecognition;
                 if (!SpeechRecognition) {
-                    showToast('<i class="bi bi-x-circle me-1"></i>当前浏览器不支持语音识别，请使用 Chrome 或 Edge', 'error');
+                    showToast('<i class="bi bi-x-circle me-1"></i>Speech recognition not supported in this browser, please use Chrome or Edge', 'error');
                     return;
                 }
 
                 btnTranscribe.disabled = true;
-                showSpinner('正在通过浏览器语音识别...\n请确保麦克风已开启，将播放音频进行识别');
+                showSpinner('Transcribing via browser speech recognition...\nPlease ensure microphone is enabled, audio will play for recognition');
 
                 const recognition = new SpeechRecognition();
-                recognition.lang = 'zh-CN';
+                recognition.lang = 'en-US';
                 recognition.interimResults = true;
                 recognition.continuous = true;
                 recognition.maxAlternatives = 1;
@@ -952,12 +936,10 @@
                 recognition.onerror = (event) => {
                     if (event.error === 'no-speech' || event.error === 'aborted') return;
                     console.error('Speech recognition error:', event.error);
-                    // Don't show toast for transient errors during playback
                 };
 
                 recognition.onend = () => {
                     if (!audio.ended && !audio.paused) {
-                        // Recognition ended but audio still playing, restart
                         try {
                             if (recognitionStarted) recognition.start();
                         } catch (e) { /* ignore */ }
@@ -969,9 +951,9 @@
                     URL.revokeObjectURL(audio.src);
                     document.getElementById('cloneRefText').value = finalTranscript.trim();
                     if (finalTranscript.trim()) {
-                        showToast('<i class="bi bi-check-circle me-1"></i>语音识别完成，请核对转录文本', 'success');
+                        showToast('<i class="bi bi-check-circle me-1"></i>Transcription complete, please verify the text', 'success');
                     } else {
-                        showToast('<i class="bi bi-info-circle me-1"></i>未识别到语音内容，请检查麦克风或手动输入文本', 'info');
+                        showToast('<i class="bi bi-info-circle me-1"></i>No speech detected, please check microphone or enter text manually', 'info');
                     }
                     btnTranscribe.disabled = false;
                     hideSpinner();
@@ -980,7 +962,7 @@
                 audio.onerror = () => {
                     try { recognition.stop(); } catch (e) { /* ignore */ }
                     URL.revokeObjectURL(audio.src);
-                    showToast('<i class="bi bi-x-circle me-1"></i>音频播放失败', 'error');
+                    showToast('<i class="bi bi-x-circle me-1"></i>Audio playback failed', 'error');
                     btnTranscribe.disabled = false;
                     hideSpinner();
                 };
@@ -988,15 +970,14 @@
                 try {
                     recognition.start();
                     recognitionStarted = true;
-                    // Small delay to let recognition initialize before playback
                     setTimeout(() => audio.play().catch(e => {
                         try { recognition.stop(); } catch (e2) { /* ignore */ }
-                        showToast('<i class="bi bi-x-circle me-1"></i>音频播放失败: ' + e.message, 'error');
+                        showToast('<i class="bi bi-x-circle me-1"></i>Audio playback failed: ' + e.message, 'error');
                         btnTranscribe.disabled = false;
                         hideSpinner();
                     }), 300);
                 } catch (e) {
-                    showToast('<i class="bi bi-x-circle me-1"></i>启动语音识别失败: ' + e.message, 'error');
+                    showToast('<i class="bi bi-x-circle me-1"></i>Failed to start speech recognition: ' + e.message, 'error');
                     btnTranscribe.disabled = false;
                     hideSpinner();
                 }
@@ -1012,22 +993,22 @@
                 const btnUpload = document.getElementById('btnUpload');
 
                 if (!fileInput.files || fileInput.files.length === 0) {
-                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>请选择音频文件', 'error');
+                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>Please select an audio file', 'error');
                     return;
                 }
                 if (!nameInput.value.trim()) {
-                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>请输入语音名称', 'error');
+                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>Please enter a voice name', 'error');
                     return;
                 }
                 if (!refTextInput.value.trim()) {
-                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>请填写参考文本（可点击音频旁的"识别"按钮自动生成）', 'error');
+                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>Please fill in reference text (click the Transcribe button to auto-generate)', 'error');
                     return;
                 }
 
                 const file = fileInput.files[0];
-                const maxSize = 10 * 1024 * 1024; // 10MB
+                const maxSize = 10 * 1024 * 1024;
                 if (file.size > maxSize) {
-                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>音频文件不能超过 10MB', 'error');
+                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>Audio file must not exceed 10MB', 'error');
                     return;
                 }
 
@@ -1037,7 +1018,7 @@
                 }
 
                 btnUpload.disabled = true;
-                showSpinner('正在上传克隆语音...');
+                showSpinner('Uploading clone voice...');
 
                 try {
                     const formData = new FormData();
@@ -1052,14 +1033,11 @@
                     const resp = await fetch(`${baseUrl}/v1/audio/voices`, {
                         method: 'POST',
                         body: formData,
-                        // Don't set Content-Type header — the browser will set it with the boundary
                     });
 
                     if (resp.ok) {
-                        const result = await resp.json().catch(() => ({}));
-                        showToast(`<i class="bi bi-check-circle me-1"></i>语音 "${nameInput.value.trim()}" 上传成功！`, 'success');
+                        showToast(`<i class="bi bi-check-circle me-1"></i>Voice "${nameInput.value.trim()}" uploaded successfully!`, 'success');
 
-                        // Clear form
                         fileInput.value = '';
                         nameInput.value = '';
                         consentInput.value = generateConsentId();
@@ -1067,7 +1045,6 @@
                         descInput.value = '';
                         document.getElementById('btnTranscribe').disabled = true;
 
-                        // Refresh voice list
                         await refreshVoices();
                     } else {
                         const errText = await resp.text();
@@ -1079,7 +1056,7 @@
                         throw new Error(errMsg);
                     }
                 } catch (e) {
-                    showToast(`<i class="bi bi-x-circle me-1"></i>上传失败: ${e.message}`, 'error');
+                    showToast(`<i class="bi bi-x-circle me-1"></i>Upload failed: ${e.message}`, 'error');
                     console.error('Upload error:', e);
                 } finally {
                     btnUpload.disabled = false;
@@ -1100,18 +1077,17 @@
                 const btnSynthesize = document.getElementById('btnSynthesize');
 
                 if (!voice) {
-                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>请先选择语音', 'error');
+                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>Please select a voice', 'error');
                     return;
                 }
                 if (!text) {
-                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>请输入合成文本', 'error');
+                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>Please enter text to synthesize', 'error');
                     return;
                 }
 
                 btnSynthesize.disabled = true;
-                showSpinner('正在合成语音...');
+                showSpinner('Synthesizing speech...');
 
-                // Clean up previous audio
                 if (audioUrl) {
                     URL.revokeObjectURL(audioUrl);
                     audioUrl = null;
@@ -1120,7 +1096,7 @@
 
                 try {
                     const body = {
-                        input: text,                        
+                        input: text,
                         voice: voice,
                         response_format: format,
                         speed: speed,
@@ -1132,7 +1108,6 @@
                         body.instructions = instructions;
                     }
 
-                    // Add ref_audio params for Base task type
                     if (taskType === 'Base') {
                         const refAudioUrl = document.getElementById('refAudioUrl').value.trim();
                         const refText = document.getElementById('refText').value.trim();
@@ -1161,31 +1136,26 @@
                         throw new Error(errMsg);
                     }
 
-                    // Get audio blob from response
                     audioBlob = await resp.blob();
 
-                    // Create preview URL
                     const mimeType = getMimeType(format);
                     audioUrl = URL.createObjectURL(new Blob([audioBlob], { type: mimeType }));
 
-                    // Show audio player
                     const previewSection = document.getElementById('audioPreviewSection');
                     const audioEl = document.getElementById('audioPreview');
                     previewSection.style.display = 'block';
                     audioEl.src = audioUrl;
                     audioEl.load();
 
-                    // Enable download button
                     document.getElementById('btnDownload').disabled = false;
 
-                    // Show playing indicator when audio plays
                     audioEl.onplay = () => document.getElementById('playingIndicator').classList.add('active');
                     audioEl.onpause = () => document.getElementById('playingIndicator').classList.remove('active');
                     audioEl.onended = () => document.getElementById('playingIndicator').classList.remove('active');
 
-                    showToast(`<i class="bi bi-check-circle me-1"></i>语音合成成功！`, 'success');
+                    showToast(`<i class="bi bi-check-circle me-1"></i>Speech synthesized successfully!`, 'success');
                 } catch (e) {
-                    showToast(`<i class="bi bi-x-circle me-1"></i>合成失败: ${e.message}`, 'error');
+                    showToast(`<i class="bi bi-x-circle me-1"></i>Synthesis failed: ${e.message}`, 'error');
                     console.error('Synthesis error:', e);
                 } finally {
                     btnSynthesize.disabled = false;
@@ -1195,7 +1165,7 @@
 
             function downloadAudio() {
                 if (!audioBlob) {
-                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>请先合成语音', 'error');
+                    showToast('<i class="bi bi-exclamation-triangle me-1"></i>Please synthesize speech first', 'error');
                     return;
                 }
 
@@ -1226,32 +1196,18 @@
                 return map[format] || 'audio/wav';
             }
 
-            function escapeHtml(str) {
-                if (!str) return '';
-                const div = document.createElement('div');
-                div.textContent = str;
-                return div.innerHTML;
-            }
-
             // ==================== Event Listeners ====================
-            // Show/hide ref audio card based on task type
             document.getElementById('synthTaskType').addEventListener('change', function() {
                 const refCard = document.getElementById('refAudioCard');
-                if (this.value === 'Base') {
-                    refCard.style.display = 'block';
-                } else {
-                    refCard.style.display = 'none';
-                }
+                refCard.style.display = this.value === 'Base' ? 'block' : 'none';
             });
 
-            // Enter key triggers synthesis
             document.getElementById('synthText').addEventListener('keydown', function(e) {
                 if (e.ctrlKey && e.key === 'Enter') {
                     synthesize();
                 }
             });
 
-            // Enter key in server URL triggers check
             document.getElementById('serverUrl').addEventListener('keydown', function(e) {
                 if (e.key === 'Enter') {
                     checkServer();
diff --git a/web/webrtcapi-asr.html b/web/webrtcapi-asr.html
index be43844a..da6af02e 100644
--- a/web/webrtcapi-asr.html
+++ b/web/webrtcapi-asr.html
@@ -99,7 +99,7 @@ <h2>Media</h2>
 	  });
 
     $('#btn_start_record').click(function() {
-        // 开始录制
+        // Start recording
         console.log('Starting recording...');
         fetch('/record', {
             body: JSON.stringify({
@@ -124,7 +124,7 @@ <h2>Media</h2>
     });
 
     $('#btn_stop_record').click(function() {
-        // 结束录制
+        // Stop recording
         console.log('Stopping recording...');
         fetch('/record', {
             body: JSON.stringify({
@@ -149,7 +149,7 @@ <h2>Media</h2>
     });
 
     // $('#btn_download').click(function() {
-    //     // 下载视频文件
+    //     // Download video file
     //     console.log('Downloading video...');
     //     fetch('/record_lasted.mp4', {
     //         method: 'GET'
@@ -160,17 +160,17 @@ <h2>Media</h2>
     //             throw new Error('Failed to download the video.');
     //         }
     //     }).then(function(blob) {
-    //         // 创建一个 Blob 对象
+    //         // Create a Blob object
     //         const url = window.URL.createObjectURL(blob);
-    //         // 创建一个隐藏的可下载链接
+    //         // Create a hidden downloadable link
     //         const a = document.createElement('a');
     //         a.style.display = 'none';
     //         a.href = url;
     //         a.download = 'record_lasted.mp4';
     //         document.body.appendChild(a);
-    //         // 触发下载
+    //         // Trigger download
     //         a.click();
-    //         // 清理
+    //         // Cleanup
     //         window.URL.revokeObjectURL(url);
     //         document.body.removeChild(a);
     //         console.log('Video downloaded successfully.');
diff --git a/web/webrtcapi.html b/web/webrtcapi.html
index b847d207..833609ab 100644
--- a/web/webrtcapi.html
+++ b/web/webrtcapi.html
@@ -97,7 +97,7 @@ <h2>Media</h2>
 	  });
 
     $('#btn_start_record').click(function() {
-        // 开始录制
+        // Start recording
         console.log('Starting recording...');
         fetch('/record', {
             body: JSON.stringify({
@@ -123,7 +123,7 @@ <h2>Media</h2>
     });
 
     $('#btn_stop_record').click(function() {
-        // 结束录制
+        // Stop recording
         console.log('Stopping recording...');
         fetch('/record', {
             body: JSON.stringify({
@@ -149,7 +149,7 @@ <h2>Media</h2>
     });
 
     // $('#btn_download').click(function() {
-    //     // 下载视频文件
+    //     // Download video file
     //     console.log('Downloading video...');
     //     fetch('/record_lasted.mp4', {
     //         method: 'GET'
@@ -160,17 +160,17 @@ <h2>Media</h2>
     //             throw new Error('Failed to download the video.');
     //         }
     //     }).then(function(blob) {
-    //         // 创建一个 Blob 对象
+    //         // Create a Blob object
     //         const url = window.URL.createObjectURL(blob);
-    //         // 创建一个隐藏的可下载链接
+    //         // Create a hidden downloadable link
     //         const a = document.createElement('a');
     //         a.style.display = 'none';
     //         a.href = url;
     //         a.download = 'record_lasted.mp4';
     //         document.body.appendChild(a);
-    //         // 触发下载
+    //         // Trigger download
     //         a.click();
-    //         // 清理
+    //         // Cleanup
     //         window.URL.revokeObjectURL(url);
     //         document.body.removeChild(a);
     //         console.log('Video downloaded successfully.');

From 7c1db791e4b3e1103ffb94d10ffba98437bd3eec Mon Sep 17 00:00:00 2001
From: ahmedrazakhan12 <ahmedrazakhank112@gmail.com>
Date: Tue, 9 Jun 2026 17:06:46 +0500
Subject: [PATCH 4/5] chore: translate README.md to English and remove
 redundant README-EN.md

---
 README-EN.md | 217 ---------------------------------------------------
 README.md    | 213 +++++++++++++++++++++++++-------------------------
 2 files changed, 105 insertions(+), 325 deletions(-)
 delete mode 100644 README-EN.md

diff --git a/README-EN.md b/README-EN.md
deleted file mode 100644
index 508192a6..00000000
--- a/README-EN.md
+++ /dev/null
@@ -1,217 +0,0 @@
-<p align="center">
-    <img src="./assets/LiveTalking-logo.png" align="middle" width="600"/>
-</p>
-
-English | [中文版](./README.md)
-
-<p align="center">
-    <a href="./LICENSE"><img src="https://img.shields.io/badge/license-Apache%202-dfd.svg"></a>
-    <a href="https://github.com/lipku/LiveTalking/releases"><img src="https://img.shields.io/github/v/release/lipku/LiveTalking?color=ffa"></a>
-    <a href=""><img src="https://img.shields.io/badge/python-3.10+-aff.svg"></a>
-    <a href=""><img src="https://img.shields.io/badge/os-linux%2C%20win%2C%20mac-pink.svg"></a>
-    <a href="https://github.com/lipku/LiveTalking/graphs/contributors"><img src="https://img.shields.io/github/contributors/lipku/LiveTalking?color=c4f042&style=flat-square"></a>
-</p>
-<p align="center">
-<a href="https://trendshift.io/repositories/12565" target="_blank"><img src="https://trendshift.io/api/badge/repositories/12565" alt="lipku%2FLiveTalking | Trendshift" style="width: 250px; height: 55px;" width="250" height="55"/></a>
-</p>
-
-A real-time interactive streaming digital human engine enabling synchronized audio-video conversation, widely adopted in commercial applications.
-
-**Demos**: [wav2lip](https://youtu.be/-ss0H8qLr7E) | [ernerf](https://www.bilibili.com/video/BV1G1421z73r/) | [musetalk](https://youtu.be/vzUMruoZlxc/)
-
-Domestic Mirror: <https://gitee.com/lipku/LiveTalking>
-
----
-
-## Features
-1. Supports multiple digital human models: ernerf, musetalk, wav2lip, Ultralight-Digital-Human
-2. Supports voice cloning
-3. Supports interrupting the digital human while speaking
-4. Supports full-body video stitching
-5. Supports WebRTC, RTMP, and virtual camera output
-6. Supports action choreography: plays custom videos when not speaking
-7. Supports multi-concurrency
-8. Supports custom digital human avatars
-9. Provides frontend API integration
-
----
-
-## Usage Scenarios
-
-LiveTalking leverages real-time streaming digital human technology to drive virtual avatars via text or voice, combined with LLM for intelligent conversation. Suitable for the following scenarios:
-
-| Scenario | Description |
-|----------|-------------|
-| **Virtual Streamer / Live Commerce** | 24/7 unmanned live streaming with LLM-generated sales scripts and action choreography for natural performance |
-| **AI Digital Human Customer Service** | Integrate enterprise knowledge bases for real-time voice Q&A with interruption support |
-| **Online Education / Training** | Digital teacher分身 for course recording, or API-driven digital instructor for real-time lectures |
-| **Intelligent Voice Assistant** | Pair with smart speakers or apps, calling the `/human` API to drive digital human voice interactions |
-| **Large Screen Presentation** | Digital human presenter for exhibition halls, event venues, and other content narration scenarios |
-| **Batch Short Video Creation** | Submit scripts in batch via API to generate digital human videos without real-person filming, using `/human` + `/record` APIs |
-
-**Core Flow**: User input (text/audio) → LLM response (optional) → TTS speech synthesis → Real-time lip-sync → Audio/video streaming output
-
----
-
-## 1. Installation
-
-Tested on Ubuntu 24.04, Python 3.12, PyTorch 2.9.1, CUDA 13.0.
-
-### 1.1 Install Dependencies
-
-```bash
-git clone https://github.com/lipku/LiveTalking.git 
-conda create -n livetalking python=3.12
-conda activate livetalking
-# If CUDA version is not 13.0 (check via nvidia-smi), install the corresponding PyTorch version(https://pytorch.org/get-started/previous-versions)
-pip install torch==2.9.1 torchvision==0.24.1 torchaudio==2.9.1 --index-url https://download.pytorch.org/whl/cu130
-cd LiveTalking
-pip install -r requirements.txt
-```
-
-Installation FAQ: <https://doc.livetalking.ai/en/docs/faq/>
-
-Linux CUDA environment setup: <https://zhuanlan.zhihu.com/p/674972886>
-
----
-
-## 2. Quick Start
-
-### 2.1 Download Models
-
-| Source | Link |
-|--------|------|
-| Quark Cloud | <https://pan.quark.cn/s/83a750323ef0> |
-| Google Drive | <https://drive.google.com/drive/folders/1FOC_MD6wdogyyX_7V1d4NDIO7P9NlSAJ?usp=sharing> |
-
-1. Copy `wav2lip256.pth` to the project's `models/` directory and rename it to `wav2lip.pth`
-2. Extract `wav2lip256_avatar1.tar.gz` and copy the entire extracted folder to `data/avatars/`
-
-### 2.2 Start the Server
-
-```bash
-python app.py --transport webrtc --model wav2lip --avatar_id wav2lip256_avatar1
-```
-
-> **Note**: The server must open ports TCP:8010, UDP:1-65536
-
-### 2.3 Client Access
-
-| Method | Description |
-|--------|-------------|
-| Browser | Open `http://serverip:8010/index.html`, click "Start Connection" to play the digital human video, then enter text and submit |
-| API | See [API Docs](docs/api.md) for HTTP-based integration |
-| Desktop App | Download: <https://pan.quark.cn/s/d7192d8ac19b> |
-
-### 2.4 Web Pages
-
-| Page | URL | Description |
-|------|-----|-------------|
-| Home | `/index.html` | WebRTC connection + text/audio driver + recording control |
-| Avatar Creator | `/avatar.html` | Upload video to auto-generate digital human avatars |
-| Admin Console | `/admin.html` | Real-time session monitoring & global configuration |
-
-<img src="./assets/index.jpg" align="middle"/>
-
-### 2.5 Quick Experience
-
-Create an instance with a cloud image to run instantly:
-
-- [UCloud Image](https://www.compshare.cn/images/4458094e-a43d-45fe-9b57-de79253befe4?referral_code=3XW3852OBmnD089hMMrtuU&ytag=GPU_GitHub_livetalking)
-
-### 2.6 Documentation
-<https://doc.livetalking.ai/en>
-
----
-
-## 3. Architecture
-
-### Dataflow Diagram
-
-<img src="./assets/dataflow.png" align="middle" />
-
-### Layer Overview
-
-**API Layer**
-- `/human`: Accepts text, supporting echo (direct playback) and chat (LLM conversation) modes
-- `/humanaudio`: Accepts audio files for direct playback
-- Each connection is assigned a unique `sessionid`, supporting multi-user concurrency
-
-**Logic Layer**
-- **LLM Engine**: Integrates with models like Qwen to generate conversational responses
-- **TTS Engine**: Modular design supporting EdgeTTS, GPT-SoVITS, CosyVoice, Tencent Cloud, and more
-- **Feature Extraction**: Synchronously extracts acoustic features (e.g., Mel spectrograms) for lip-sync inference
-
-**Rendering Layer**
-- **Model Inference**: Uses deep learning models (Wav2Lip, MuseTalk, etc.) to generate lip-sync frames from audio features
-- **Post-Processing**: Smoothly overlays the generated mouth region back onto the original high-definition video
-
-**Streaming Layer**
-- **WebRTC**: Low-latency browser-based streaming
-- **RTMP**: Standard live streaming protocol, supports pushing to platforms like Bilibili/YouTube
-- **Virtual Camera**: Outputs as a system camera device
-
-**Plugin System**
-- Decentralized registration mechanism based on [registry.py](registry.py), allowing developers to extend TTS, Avatar, and Output modules
-
----
-
-## 4. API Documentation
-
-| Document | Description |
-|----------|-------------|
-| [docs/api.md](docs/api.md) | General API — WebRTC, text/audio driver, recording, action choreography |
-| [docs/avatar_api.md](docs/avatar_api.md) | Avatar Generation API — create tasks, query progress, delete tasks |
-| [docs/admin_api.md](docs/admin_api.md) | Admin API — global config, session monitoring, force stop |
-
----
-
-## 5. Docker
-
-Available images:
-- **AutoDL**: <https://www.codewithgpu.com/i/lipku/livetalking/base> — [Tutorial](https://doc.livetalking.ai/en/docs/autodl/)
-- **UCloud**: <https://www.compshare.cn/images/4458094e-a43d-45fe-9b57-de79253befe4?referral_code=3XW3852OBmnD089hMMrtuU&ytag=GPU_GitHub_livetalking> — Supports opening any port, no additional SRS deployment required — [Tutorial](https://doc.livetalking.ai/en/docs/ucloud/)
-
-> AutoDL cannot open UDP ports, so you need to deploy SRS or TURN relay service separately.
-
----
-
-## 6. Performance
-
-- Each video stream compression consumes CPU; higher resolution means greater CPU usage. Each lip-sync inference consumes GPU
-- Concurrent sessions when not speaking depend on CPU; concurrent speaking sessions depend on GPU
-- In backend logs: `inferfps` = GPU inference frame rate, `finalfps` = final streaming frame rate. Both must be >= 25 for real-time performance
-
-### Real-Time Inference Performance
-
-| Model | GPU | FPS |
-|:------|:----|:----|
-| wav2lip256 | RTX 3060 | 60 |
-| wav2lip256 | RTX 3080Ti | 120 |
-| musetalk | RTX 3080Ti | 42 |
-| musetalk | RTX 3090 | 45 |
-| musetalk | RTX 4090 | 72 |
-
-- wav2lip256: RTX 3060 or higher recommended
-- musetalk: RTX 3080Ti or higher recommended
-
----
-
-## 7. Statement
-
-Videos developed based on this project and published on platforms such as Bilibili, WeChat Channels, and Douyin must include the LiveTalking watermark and logo.
-
----
-
-If this project is helpful to you, please give it a Star. Contributors interested in improving this project are also welcome.
-
-| Community | Link |
-|-----------|------|
-| Knowledge Planet | <https://t.zsxq.com/7NMyO> |
-| WeChat | wxwubug (mention for group invite) |
-| Telegram | <https://t.me/livetalking> |
-| Discord | <https://discord.gg/n5jSPCT3Uf> |
-| Email | lipku@foxmail.com |
-| WeChat Official | 数字人技术 |
-
-<img src="./assets/qrcode-wechat.jpg" align="middle" />
diff --git a/README.md b/README.md
index fa37432d..508192a6 100644
--- a/README.md
+++ b/README.md
@@ -2,8 +2,7 @@
     <img src="./assets/LiveTalking-logo.png" align="middle" width="600"/>
 </p>
 
-中文版 ｜ [English](./README-EN.md)
-
+English
 
 <p align="center">
     <a href="./LICENSE"><img src="https://img.shields.io/badge/license-Apache%202-dfd.svg"></a>
@@ -16,205 +15,203 @@
 <a href="https://trendshift.io/repositories/12565" target="_blank"><img src="https://trendshift.io/api/badge/repositories/12565" alt="lipku%2FLiveTalking | Trendshift" style="width: 250px; height: 55px;" width="250" height="55"/></a>
 </p>
 
-实时交互流式数字人引擎，实现音视频同步对话，已在业内获得广泛商用
+A real-time interactive streaming digital human engine enabling synchronized audio-video conversation, widely adopted in commercial applications.
 
-**效果演示**: [wav2lip](https://www.bilibili.com/video/BV1scwBeyELA/) | [ernerf](https://www.bilibili.com/video/BV1G1421z73r/) | [musetalk](https://www.bilibili.com/video/BV1bUwezvEnG/)
+**Demos**: [wav2lip](https://youtu.be/-ss0H8qLr7E) | [ernerf](https://www.bilibili.com/video/BV1G1421z73r/) | [musetalk](https://youtu.be/vzUMruoZlxc/)
 
-国内镜像: <https://gitee.com/lipku/LiveTalking>
+Mirror for users in mainland China: <https://gitee.com/lipku/LiveTalking>
 
 ---
 
 ## Features
-1. 支持多种数字人模型: ernerf、musetalk、wav2lip、Ultralight-Digital-Human
-2. 支持声音克隆
-3. 支持数字人说话被打断
-4. 支持全身视频拼接
-5. 支持 WebRTC、RTMP、虚拟摄像头输出
-6. 支持动作编排：不说话时播放自定义视频
-7. 支持多并发
-8. 支持自定义数字人形象
-9. 提供前端API接口对接
+1. Supports multiple digital human models: ernerf, musetalk, wav2lip, Ultralight-Digital-Human
+2. Supports voice cloning
+3. Supports interrupting the digital human while speaking
+4. Supports full-body video stitching
+5. Supports WebRTC, RTMP, and virtual camera output
+6. Supports action choreography: plays custom videos when not speaking
+7. Supports multiple concurrent sessions
+8. Supports custom digital human avatars
+9. Provides frontend API integration
 
 ---
 
-## 使用场景
+## Usage Scenarios
 
-LiveTalking 基于实时流式数字人技术，通过文本或语音驱动虚拟形象说话，结合 LLM 实现智能对话。适用于以下场景：
+LiveTalking leverages real-time streaming digital human technology to drive virtual avatars via text or voice, combined with LLM for intelligent conversation. Suitable for the following scenarios:
 
-| 场景 | 说明 |
-|------|------|
-| **虚拟主播/直播带货** | 24 小时无人直播，通过 LLM 自动生成带货话术，配合动作编排实现自然表现 |
-| **AI 数字人客服** | 接入企业知识库，用户语音提问，数字人实时回答，支持打断重说 |
-| **在线教育/培训** | 教师数字分身录制课程，或通过 API 驱动数字人讲师实时授课 |
-| **智能语音助手** | 结合智能音箱或 APP，调用 `/human` 接口驱动数字人进行语音对话交互 |
-| **大屏讲解** | 数字人讲解员在展厅大屏、活动现场等场景进行内容讲解和互动 |
-| **短视频批量制作** | 通过 API 批量提交文案生成数字人出镜视频，无需真人拍摄，调用 `/human` + `/record` 接口 |
+| Scenario | Description |
+|----------|-------------|
+| **Virtual Streamer / Live Commerce** | 24/7 unmanned live streaming with LLM-generated sales scripts and action choreography for natural performance |
+| **AI Digital Human Customer Service** | Integrate enterprise knowledge bases for real-time voice Q&A with interruption support |
+| **Online Education / Training** | Digital avatars of teachers for course recording, or an API-driven digital instructor for real-time lectures |
+| **Intelligent Voice Assistant** | Pair with smart speakers or apps, calling the `/human` API to drive digital human voice interactions |
+| **Large Screen Presentation** | Digital human presenter for exhibition halls, event venues, and other content narration scenarios |
+| **Batch Short Video Creation** | Submit scripts in batch via API to generate digital human videos without real-person filming, using `/human` + `/record` APIs |
 
-**核心流程**：用户输入文字/音频 → LLM 生成回复（可选）→ TTS 合成语音 → 数字人实时口型同步 → 音视频推流输出
+**Core Flow**: User input (text/audio) → LLM response (optional) → TTS speech synthesis → Real-time lip-sync → Audio/video streaming output
 
 ---
 
-## 1. 安装
+## 1. Installation
 
-已在 Ubuntu 22.04、Python 3.12、PyTorch 2.9.1、CUDA 13.0 测试通过。
+Tested on Ubuntu 24.04, Python 3.12, PyTorch 2.9.1, CUDA 13.0.
 
-### 1.1 安装依赖
+### 1.1 Install Dependencies
 
 ```bash
 git clone https://github.com/lipku/LiveTalking.git 
 conda create -n livetalking python=3.12
 conda activate livetalking
-# 如果 CUDA 版本不为 13.0 (运行 nvidia-smi 确认)，请根据 PyTorch 官网(https://pytorch.org/get-started/previous-versions)安装对应版本
+# If your CUDA version is not 13.0 (check with nvidia-smi), install the matching PyTorch build (see https://pytorch.org/get-started/previous-versions)
 pip install torch==2.9.1 torchvision==0.24.1 torchaudio==2.9.1 --index-url https://download.pytorch.org/whl/cu130
 cd LiveTalking
 pip install -r requirements.txt
 ```
 
-安装常见问题：[FAQ](https://doc.livetalking.ai/docs/faq/)
+Installation FAQ: <https://doc.livetalking.ai/en/docs/faq/>
 
-Linux CUDA 环境搭建参考: <https://zhuanlan.zhihu.com/p/674972886>
+Linux CUDA environment setup: <https://zhuanlan.zhihu.com/p/674972886>
 
 ---
 
-## 2. 快速开始
+## 2. Quick Start
 
-### 2.1 下载模型
+### 2.1 Download Models
 
-| 网盘 | 地址 |
-|------|------|
-| 夸克云盘 | <https://pan.quark.cn/s/83a750323ef0> |
+| Source | Link |
+|--------|------|
+| Quark Cloud | <https://pan.quark.cn/s/83a750323ef0> |
 | Google Drive | <https://drive.google.com/drive/folders/1FOC_MD6wdogyyX_7V1d4NDIO7P9NlSAJ?usp=sharing> |
 
-1. 将 `wav2lip256.pth` 拷贝到项目的 `models/` 目录下，重命名为 `wav2lip.pth`
-2. 将 `wav2lip256_avatar1.tar.gz` 解压后整个文件夹拷贝到 `data/avatars/` 目录下
+1. Copy `wav2lip256.pth` to the project's `models/` directory and rename it to `wav2lip.pth`
+2. Extract `wav2lip256_avatar1.tar.gz` and copy the entire extracted folder to `data/avatars/`
 
-### 2.2 启动服务
+### 2.2 Start the Server
 
 ```bash
 python app.py --transport webrtc --model wav2lip --avatar_id wav2lip256_avatar1
 ```
 
+> **Note**: The server must open ports TCP:8010 and UDP:1-65535
 
->  **注意**: 服务端需开放端口 TCP:8010, UDP:1-65536  
-
-
-### 2.3 客户端接入
+### 2.3 Client Access
 
-| 方式 | 说明 |
-|------|------|
-| 浏览器 | 打开 `http://serverip:8010/index.html`，点击"开始连接"播放数字人视频，在文本框输入文字提交即可 |
-| API 调用 | 参考 [API 文档](docs/api.md) 通过 HTTP 接口驱动 |
-| 桌面客户端 | 下载地址: <https://pan.quark.cn/s/d7192d8ac19b> |
+| Method | Description |
+|--------|-------------|
+| Browser | Open `http://serverip:8010/index.html`, click "Start Connection" to play the digital human video, then enter text and submit |
+| API | See [API Docs](docs/api.md) for HTTP-based integration |
+| Desktop App | Download: <https://pan.quark.cn/s/d7192d8ac19b> |
 
-### 2.4 Web 页面
+### 2.4 Web Pages
 
-| 页面 | 地址 | 说明 |
-|------|------|------|
-| 首页 | `/index.html` | WebRTC 连接 + 文本/音频驱动 + 录制控制 |
-| Avatar 生成 | `/avatar.html` | 上传视频自动生成数字人形象 |
-| 管理后台 | `/admin.html` | 实时监控会话状态与全局配置 |
+| Page | URL | Description |
+|------|-----|-------------|
+| Home | `/index.html` | WebRTC connection + text/audio driver + recording control |
+| Avatar Creator | `/avatar.html` | Upload video to auto-generate digital human avatars |
+| Admin Console | `/admin.html` | Real-time session monitoring & global configuration |
 
 <img src="./assets/index.jpg" align="middle"/>
 
-### 2.5 快速体验
+### 2.5 Quick Experience
 
-使用在线镜像创建实例即可运行:
+Create an instance with a cloud image to run instantly:
 
-- [UCloud 镜像](https://www.compshare.cn/images/4458094e-a43d-45fe-9b57-de79253befe4?referral_code=3XW3852OBmnD089hMMrtuU&ytag=GPU_GitHub_livetalking)
+- [UCloud Image](https://www.compshare.cn/images/4458094e-a43d-45fe-9b57-de79253befe4?referral_code=3XW3852OBmnD089hMMrtuU&ytag=GPU_GitHub_livetalking)
+
+### 2.6 Documentation
+<https://doc.livetalking.ai/en>
 
-### 2.6 使用说明
-<https://doc.livetalking.ai>
 ---
 
-## 3. 系统架构
+## 3. Architecture
 
-### 数据流图
+### Dataflow Diagram
 
 <img src="./assets/dataflow.png" align="middle" />
 
+### Layer Overview
 
-### 各层说明
-
-**API 层**
-- `/human`: 接收文本，支持 echo（直接复读）和 chat（LLM 对话）模式
-- `/humanaudio`: 接收音频文件直接播放
-- 每个连接分配唯一 `sessionid`，支持多用户并发
+**API Layer**
+- `/human`: Accepts text, supporting echo (direct playback) and chat (LLM conversation) modes
+- `/humanaudio`: Accepts audio files for direct playback
+- Each connection is assigned a unique `sessionid`, supporting multi-user concurrency
 
-**逻辑层**
-- **LLM 引擎**: 对接 Qwen 等大模型生成对话回复
-- **TTS 引擎**: 模块化设计，支持 EdgeTTS、GPT-SoVITS、CosyVoice、腾讯云等多种方案
-- **特征提取**: 同步提取音频的声学特征（如 Mel 频谱），用于口型推理
+**Logic Layer**
+- **LLM Engine**: Integrates with models like Qwen to generate conversational responses
+- **TTS Engine**: Modular design supporting EdgeTTS, GPT-SoVITS, CosyVoice, Tencent Cloud, and more
+- **Feature Extraction**: Synchronously extracts acoustic features (e.g., Mel spectrograms) for lip-sync inference
 
-**渲染层**
-- **模型推理**: 使用深度学习模型 (Wav2Lip, MuseTalk 等) 根据音频特征生成口型画面
-- **后处理**: 将生成的口型区域平滑贴回原始高清视频
+**Rendering Layer**
+- **Model Inference**: Uses deep learning models (Wav2Lip, MuseTalk, etc.) to generate lip-sync frames from audio features
+- **Post-Processing**: Smoothly overlays the generated mouth region back onto the original high-definition video
 
-**推流层**
-- **WebRTC**: 低延迟浏览器端推流
-- **RTMP**: 标准直播协议，支持推流到 B站/YouTube 等平台
-- **虚拟摄像头**: 输出为系统摄像头设备
+**Streaming Layer**
+- **WebRTC**: Low-latency browser-based streaming
+- **RTMP**: Standard live streaming protocol, supports pushing to platforms like Bilibili/YouTube
+- **Virtual Camera**: Outputs as a system camera device
 
-**插件系统**
-- 基于 [registry.py](registry.py) 的去中心化注册机制，开发者可自行扩展 TTS、Avatar、Output 模块
+**Plugin System**
+- Decentralized registration mechanism based on [registry.py](registry.py), allowing developers to extend TTS, Avatar, and Output modules
 
 ---
 
-## 4. API 接口
+## 4. API Documentation
 
-| 文档 | 说明 |
-|------|------|
-| [docs/api.md](docs/api.md) | 通用业务 API — WebRTC、文本/音频驱动、录制、动作编排 |
-| [docs/avatar_api.md](docs/avatar_api.md) | Avatar 生成 API — 创建任务、查询进度、删除任务 |
-| [docs/admin_api.md](docs/admin_api.md) | Admin 管理 API — 全局配置、会话监控、强制停止 |
+| Document | Description |
+|----------|-------------|
+| [docs/api.md](docs/api.md) | General API — WebRTC, text/audio input, recording, action choreography |
+| [docs/avatar_api.md](docs/avatar_api.md) | Avatar Generation API — create tasks, query progress, delete tasks |
+| [docs/admin_api.md](docs/admin_api.md) | Admin API — global config, session monitoring, force stop |
 
 ---
 
-## 5. Docker 运行
+## 5. Docker
 
-镜像说明:
-- **AutoDL**: <https://www.codewithgpu.com/i/lipku/livetalking/base> — [教程](https://doc.livetalking.ai/docs/autodl/)
-- **UCloud**: <https://www.compshare.cn/images/4458094e-a43d-45fe-9b57-de79253befe4?referral_code=3XW3852OBmnD089hMMrtuU&ytag=GPU_GitHub_livetalking> — 支持开放任意端口，无需额外部署 SRS — [教程](https://doc.livetalking.ai/docs/ucloud/)
+Available images:
+- **AutoDL**: <https://www.codewithgpu.com/i/lipku/livetalking/base> — [Tutorial](https://doc.livetalking.ai/en/docs/autodl/)
+- **UCloud**: <https://www.compshare.cn/images/4458094e-a43d-45fe-9b57-de79253befe4?referral_code=3XW3852OBmnD089hMMrtuU&ytag=GPU_GitHub_livetalking> — Supports opening any port, no additional SRS deployment required — [Tutorial](https://doc.livetalking.ai/en/docs/ucloud/)
 
-> AutoDL 由于不能开放 UDP 端口，需自行部署 SRS 或 TURN 转发服务。
+> AutoDL cannot open UDP ports, so you need to deploy an SRS or TURN relay service yourself.
 
 ---
 
-## 6. 性能指标
+## 6. Performance
 
-- 每路视频压缩消耗 CPU，分辨率越高 CPU 消耗越大；每路口型推理消耗 GPU
-- 不说话时并发数取决于 CPU，同时说话并发数取决于 GPU
-- 后端日志 `inferfps` = GPU 推理帧率, `finalfps` = 最终推流帧率，两者均需 >=25 才算实时
+- Video compression consumes CPU for every stream, and higher resolutions consume more; lip-sync inference consumes GPU for every stream
+- The number of concurrent idle (non-speaking) sessions is limited by CPU; the number of sessions speaking at the same time is limited by GPU
+- In backend logs: `inferfps` = GPU inference frame rate, `finalfps` = final streaming frame rate. Both must be >= 25 for real-time performance
 
-### 实时推理性能
+### Real-Time Inference Performance
 
-| 模型 | 显卡 | FPS |
-|:------|:------|:----|
+| Model | GPU | FPS |
+|:------|:----|:----|
 | wav2lip256 | RTX 3060 | 60 |
 | wav2lip256 | RTX 3080Ti | 120 |
 | musetalk | RTX 3080Ti | 42 |
 | musetalk | RTX 3090 | 45 |
 | musetalk | RTX 4090 | 72 |
 
-- wav2lip256 推荐 RTX 3060 及以上
-- musetalk 推荐 RTX 3080Ti 及以上
+- wav2lip256: RTX 3060 or higher recommended
+- musetalk: RTX 3080Ti or higher recommended
 
 ---
 
-## 7. 声明
+## 7. Statement
 
-基于本项目开发并发布在B站、视频号、抖音等平台上的视频需带上 LiveTalking 水印和标识。
+Videos created with this project and published on platforms such as Bilibili, WeChat Channels, and Douyin must include the LiveTalking watermark and logo.
 
 ---
 
-如果本项目对你有帮助，帮忙点个 Star。也欢迎感兴趣的朋友一起来完善该项目。
+If this project is helpful to you, please give it a Star. Contributors interested in improving this project are also welcome.
 
-| 社区 | 链接 |
-|------|------|
-| 知识星球 | <https://t.zsxq.com/7NMyO> |
-| 微信 | wxwubug (加群请备注) |
+| Community | Link |
+|-----------|------|
+| Knowledge Planet | <https://t.zsxq.com/7NMyO> |
+| WeChat | wxwubug (include a note when requesting to join the group) |
 | Telegram | <https://t.me/livetalking> |
 | Discord | <https://discord.gg/n5jSPCT3Uf> |
 | Email | lipku@foxmail.com |
-| 微信公众号 | 数字人技术 |
+| WeChat Official Account | 数字人技术 |
 
 <img src="./assets/qrcode-wechat.jpg" align="middle" />

From f28870a7be792cd83bc46af828b32d05ab83b45e Mon Sep 17 00:00:00 2001
From: Ali Nasir <alinasir77@gmail.com>
Date: Wed, 10 Jun 2026 15:06:11 +0500
Subject: [PATCH 5/5] added .pem files in gitignore

---
 .gitignore | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/.gitignore b/.gitignore
index 2a83f0af..efc032af 100644
--- a/.gitignore
+++ b/.gitignore
@@ -19,3 +19,5 @@ workspace/log_ngp.txt
 models/
 *.log
 dist
+*.pem
+*.sh