Commit d2daeb1
Changed files (4)
src/asr/ali_asr.py → src/asr/ali.py
File renamed without changes
src/asr/tecent_asr.py → src/asr/tecent.py
@@ -75,7 +75,7 @@ async def tencent_single_asr(path: str | Path, engine: str, voice_format: str) -
"""Tencent Single Sentence ASR.
一句话识别
- https://cloud.tencent.com/document/product/1093/52097
+ https://cloud.tencent.com/document/product/1093/35646
"""
async with await anyio.open_file(path, "rb") as f:
content = await f.read()
src/asr/voice_recognition.py
@@ -10,12 +10,12 @@ from pyrogram.client import Client
from pyrogram.enums import ParseMode
from pyrogram.types import Message
-from asr.ali_asr import ali_asr
+from asr.ali import ali_asr
from asr.cloudflare import cloudflare_asr
from asr.deepgram import deepgram_asr
from asr.gemini import gemini_asr
from asr.groq import groq_asr
-from asr.tecent_asr import tencent_async_asr, tencent_flash_asr, tencent_single_asr
+from asr.tecent import tencent_async_asr, tencent_flash_asr, tencent_single_asr
from asr.utils import get_asr_method
from config import CAPTION_LENGTH, PREFIX, TEXT_LENGTH
from messages.parser import parse_msg
src/config.py
@@ -266,11 +266,11 @@ class ASR:
CLOUDFLARE_MODEL = os.getenv("ASR_CLOUDFLARE_MODEL", "@cf/openai/whisper-large-v3-turbo")
CLOUDFLARE_KEYS = os.getenv("ASR_CLOUDFLARE_KEYS", "") # comma separated keys for load balance. e.g. "AccountID:API_TOKEN, AccountID:API_TOKEN, ..."
GEMINI_CHUNK_SECONDS = float(os.getenv("ASR_GEMINI_CHUNK_SECONDS", "900")) # split long audio file into chunks
- GEMINI_OVERLAP_SECONDS = float(os.getenv("ASR_GEMINI_OVERLAP_SECONDS", "10")) # overlap seconds between chunks
+ GEMINI_OVERLAP_SECONDS = float(os.getenv("ASR_GEMINI_OVERLAP_SECONDS", "5")) # overlap seconds between chunks
GROQ_PROXY = os.getenv("ASR_GROQ_PROXY", None) # Ban CN & HK IP
GROQ_MAX_BYTES = int(os.getenv("ASR_GROQ_MAX_BYTES", "26214400")) # 25MB (max file bytes for single file)
GROQ_CHUNK_SECONDS = float(os.getenv("ASR_GROQ_CHUNK_SECONDS", "1800")) # split long audio file into chunks
- GROQ_OVERLAP_SECONDS = float(os.getenv("ASR_GROQ_OVERLAP_SECONDS", "10")) # overlap seconds between chunks
+ GROQ_OVERLAP_SECONDS = float(os.getenv("ASR_GROQ_OVERLAP_SECONDS", "5")) # overlap seconds between chunks
GROQ_KEYS = os.getenv("ASR_GROQ_KEYS", "") # comma separated keys for load balance.
GROQ_MODELS = os.getenv("ASR_GROQ_MODELS", "whisper-large-v3") # comma separated model names.