File size: 930 Bytes
5fc69e4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
import os

# Hugging Face Spaces serve URL. The Space is configured as public, so its
# address can be used directly. The HF_SERVE_URL environment variable, when
# set, replaces the default below.
HF_SERVE_URL: str = os.environ.get(
    "HF_SERVE_URL", "https://m97j-PersonaChatEngine.hf.space"
)

# Request timeout, in seconds. Read from the HF_TIMEOUT environment variable
# (default "25") and converted to float at import time.
HF_TIMEOUT: float = float(os.environ.get("HF_TIMEOUT", "25"))

# RAG is always used: this is a fixed setting, not a toggle.
RAG_ENABLED: bool = True

# ์ƒ์„ฑ ํŒŒ๋ผ๋ฏธํ„ฐ ๊ธฐ๋ณธ๊ฐ’ (์š”์ฒญ๋งˆ๋‹ค override ๊ฐ€๋Šฅ)
GENERATION_CONFIG = {
    "max_new_tokens": int(os.getenv("GEN_MAX_NEW_TOKENS", "220")),
    "temperature": float(os.getenv("GEN_TEMPERATURE", "0.7")),
    "top_p": float(os.getenv("GEN_TOP_P", "0.9")),
    "repetition_penalty": float(os.getenv("GEN_REPETITION_PENALTY", "1.1")),
    "do_sample": True
}

'''
# ๋ชจ๋ธ ์ •๋ณด (์ถ”ํ›„ ํ™•์žฅ ๊ฐ€๋Šฅ)
MODEL_INFO = {
    "base_model": "meta-llama/Meta-Llama-3-8B",
    "adapter": "m97j/PersonaAdapter-v1",
    "serve_mode": "hf_spaces",  # ๋˜๋Š” "local", "api"
}

'''