Commit d2daeb1

benny-dou <60535774+benny-dou@users.noreply.github.com>
2025-07-11 16:51:10
refactor(asr): rename some files [skip ci]
1 parent 13b7b71
src/asr/ali_asr.py → src/asr/ali.py
File renamed without changes
src/asr/tecent_asr.py → src/asr/tecent.py
@@ -75,7 +75,7 @@ async def tencent_single_asr(path: str | Path, engine: str, voice_format: str) -
     """Tencent Single Sentence ASR.
 
     一句话识别
-    https://cloud.tencent.com/document/product/1093/52097
+    https://cloud.tencent.com/document/product/1093/35646
     """
     async with await anyio.open_file(path, "rb") as f:
         content = await f.read()
src/asr/voice_recognition.py
@@ -10,12 +10,12 @@ from pyrogram.client import Client
 from pyrogram.enums import ParseMode
 from pyrogram.types import Message
 
-from asr.ali_asr import ali_asr
+from asr.ali import ali_asr
 from asr.cloudflare import cloudflare_asr
 from asr.deepgram import deepgram_asr
 from asr.gemini import gemini_asr
 from asr.groq import groq_asr
-from asr.tecent_asr import tencent_async_asr, tencent_flash_asr, tencent_single_asr
+from asr.tecent import tencent_async_asr, tencent_flash_asr, tencent_single_asr
 from asr.utils import get_asr_method
 from config import CAPTION_LENGTH, PREFIX, TEXT_LENGTH
 from messages.parser import parse_msg
src/config.py
@@ -266,11 +266,11 @@ class ASR:
     CLOUDFLARE_MODEL = os.getenv("ASR_CLOUDFLARE_MODEL", "@cf/openai/whisper-large-v3-turbo")
     CLOUDFLARE_KEYS = os.getenv("ASR_CLOUDFLARE_KEYS", "")  # comma separated keys for load balance. e.g. "AccountID:API_TOKEN, AccountID:API_TOKEN, ..."
     GEMINI_CHUNK_SECONDS = float(os.getenv("ASR_GEMINI_CHUNK_SECONDS", "900"))  # split long audio file into chunks
-    GEMINI_OVERLAP_SECONDS = float(os.getenv("ASR_GEMINI_OVERLAP_SECONDS", "10"))  # overlap seconds between chunks
+    GEMINI_OVERLAP_SECONDS = float(os.getenv("ASR_GEMINI_OVERLAP_SECONDS", "5"))  # overlap seconds between chunks
     GROQ_PROXY = os.getenv("ASR_GROQ_PROXY", None)  # Ban CN & HK IP
     GROQ_MAX_BYTES = int(os.getenv("ASR_GROQ_MAX_BYTES", "26214400"))  # 25MB (max file bytes for single file)
     GROQ_CHUNK_SECONDS = float(os.getenv("ASR_GROQ_CHUNK_SECONDS", "1800"))  # split long audio file into chunks
-    GROQ_OVERLAP_SECONDS = float(os.getenv("ASR_GROQ_OVERLAP_SECONDS", "10"))  # overlap seconds between chunks
+    GROQ_OVERLAP_SECONDS = float(os.getenv("ASR_GROQ_OVERLAP_SECONDS", "5"))  # overlap seconds between chunks
     GROQ_KEYS = os.getenv("ASR_GROQ_KEYS", "")  # comma separated keys for load balance.
     GROQ_MODELS = os.getenv("ASR_GROQ_MODELS", "whisper-large-v3")  # comma separated model names.