File size: 1,383 Bytes
dbf2148
 
 
 
 
 
6fd0088
 
 
 
 
 
 
 
 
dbf2148
 
76d9735
aeca306
dbf2148
8a29960
aeca306
dbf2148
 
 
 
 
 
 
 
 
 
 
6fd0088
dbf2148
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
import os
from dotenv import load_dotenv

# Load variables from a local .env file (if one is found) into the process
# environment before the Settings class body below reads them. With
# python-dotenv's default arguments, variables that are already set in the
# environment are not overridden.
load_dotenv()

class Settings:
    """Static application configuration, evaluated once at import time.

    Every value is a class attribute. ``GROQ_API_KEY`` is read from the
    process environment; all other values are hard-coded constants. When no
    usable API key is found, a warning is printed to stdout while the class
    body executes and ``GROQ_API_KEY`` is ``None``.
    """

    # Prefer environment variables (e.g. for Hugging Face deployments).
    # Values are stripped because pasted secrets often carry stray spaces or a
    # trailing newline; a blank value is treated as missing so that the
    # X_GROQ_API_KEY fallback and the warning below still apply.
    GROQ_API_KEY = (
        (os.getenv("GROQ_API_KEY") or "").strip()
        or (os.getenv("X_GROQ_API_KEY") or "").strip()
        or None
    )

    # Check the API key: warn (without raising) so the module still imports
    # when the key is not configured.
    if not GROQ_API_KEY:
        print("❌ CẢNH BÁO: Không tìm thấy GROQ_API_KEY")
        print("💡 Trên Hugging Face Spaces, hãy thêm biến môi trường:")
        print("   - Tên: GROQ_API_KEY")
        print("   - Value: gsk_xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx")

    # Multilingual model settings: one embedding/LLM pair for Vietnamese and
    # one general multilingual pair. Both pairs currently name the same LLM.
    VIETNAMESE_EMBEDDING_MODEL = 'keepitreal/vietnamese-sbert'
    VIETNAMESE_LLM_MODEL = "llama-3.1-8b-instant"

    MULTILINGUAL_EMBEDDING_MODEL = 'sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2'
    MULTILINGUAL_LLM_MODEL = "llama-3.1-8b-instant"

    # Speech-to-text model identifier.
    WHISPER_MODEL = "whisper-large-v3-turbo"

    # TTS settings
    # NOTE(review): unit of MAX_CHUNK_LENGTH (characters vs. tokens) is not
    # visible here - confirm against the code that consumes it.
    MAX_CHUNK_LENGTH = 200
    # Each supported language code currently maps to itself.
    SUPPORTED_LANGUAGES = {
        'vi': 'vi', 'en': 'en', 'fr': 'fr', 'es': 'es',
        'de': 'de', 'ja': 'ja', 'ko': 'ko', 'zh': 'zh'
    }

    # RAG settings
    # NOTE(review): confirm EMBEDDING_DIMENSION matches the output size of
    # whichever embedding model above is actually used to build the index.
    EMBEDDING_DIMENSION = 384
    TOP_K_RESULTS = 3

    # SpeechBrain VAD settings
    # NOTE(review): durations are presumably seconds and SAMPLE_RATE
    # presumably Hz - confirm against the VAD code that reads them.
    VAD_MODEL = "speechbrain/vad-crdnn-libriparty"
    VAD_THRESHOLD = 0.5
    VAD_MIN_SILENCE_DURATION = 0.5
    VAD_SPEECH_PAD_DURATION = 0.1
    SAMPLE_RATE = 16000

# Shared module-level instance. Settings defines no __init__ and only class
# attributes, so this instance simply exposes those class-level values.
settings = Settings()