import logging
from logging.handlers import RotatingFileHandler
from pathlib import Path

from dotenv import load_dotenv
from langchain_huggingface import HuggingFaceEmbeddings
from langchain_openai import ChatOpenAI
from pydantic_settings import BaseSettings, SettingsConfigDict

# Initialize environment
load_dotenv()


# --- Settings (simple, in-file) ---
class Settings(BaseSettings):
    model_config = SettingsConfigDict(env_file=".env", env_file_encoding="utf-8", extra="ignore")

    OPENAI_API_KEY: str
    OPENAI_BASE_URL: str | None = None

    # LlamaParse configuration for advanced PDF parsing
    LLAMA_CLOUD_API_KEY: str | None = None
    LLAMA_PREMIUM_MODE: bool = False  # Set to True for GPT-4o parsing (costs more)

    # pydantic-settings reads these from the environment on its own, so plain
    # literal defaults replace the redundant os.getenv() calls.
    LOG_LEVEL: str = "INFO"
    DATA_DIR: str = ""
    LOG_DIR: str = ""


settings = Settings()
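
# A hedged sketch of the .env file this Settings class reads; every value
# below is a placeholder, not a real credential or path:
#
#   OPENAI_API_KEY=sk-...
#   OPENAI_BASE_URL=https://api.openai.com/v1   # optional, e.g. for a proxy
#   LLAMA_CLOUD_API_KEY=llx-...                 # optional, enables LlamaParse
#   LLAMA_PREMIUM_MODE=false
#   LOG_LEVEL=INFO
#   DATA_DIR=                                   # blank -> <project_root>/data
#   LOG_DIR=                                    # blank -> <project_root>/logs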
# --- File Path Configuration (Cross-platform compatible) ---
PROJECT_ROOT = Path(__file__).parent.parent.absolute()
DATA_DIR = Path(settings.DATA_DIR or (PROJECT_ROOT / "data"))
NEW_DATA = DATA_DIR / "new_data"
PROCESSED_DATA = DATA_DIR / "processed_data"
CHUNKS_PATH = DATA_DIR / "chunks.pkl"
VECTOR_STORE_DIR = DATA_DIR / "vector_store"

for directory in (DATA_DIR, NEW_DATA, PROCESSED_DATA, VECTOR_STORE_DIR):
    directory.mkdir(parents=True, exist_ok=True)
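
# Resulting layout under the defaults above (a sketch; the roles in the
# trailing comments are inferred from the directory names):
#
#   data/
#   ├── new_data/        # incoming documents awaiting processing
#   ├── processed_data/  # documents after ingestion
#   ├── chunks.pkl       # pickled document chunks
#   └── vector_store/    # persisted embedding index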
# Setup logging
LOG_DIR = Path(settings.LOG_DIR or (PROJECT_ROOT / "logs"))
LOG_DIR.mkdir(parents=True, exist_ok=True)
LOG_FILE = LOG_DIR / "app.log"

# Configure application logger (avoid duplicate handlers)
LOG_LEVEL = settings.LOG_LEVEL.upper()
logger = logging.getLogger("AgenticMedicalRAG")  # centralized logger
logger.setLevel(LOG_LEVEL)
logger.propagate = False

if not logger.handlers:
    formatter = logging.Formatter(
        fmt="%(asctime)s - %(name)s - %(levelname)s - %(message)s"
    )
    file_handler = RotatingFileHandler(
        LOG_FILE,
        maxBytes=1_000_000,  # rotate after ~1 MB
        backupCount=3,
        encoding="utf-8",
    )
    file_handler.setFormatter(formatter)
    stream_handler = logging.StreamHandler()
    stream_handler.setFormatter(formatter)
    logger.addHandler(file_handler)
    logger.addHandler(stream_handler)
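
# A minimal sketch of how other modules can share this configured logger;
# logging.getLogger() returns the same named instance everywhere:
#
#   import logging
#   logger = logging.getLogger("AgenticMedicalRAG")
#   logger.info("Processed %d documents", count)  # 'count' is illustrative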
# --- LLM Configuration with lazy loading ---
_llm = None


def get_llm():
    """Get the LLM, lazily initialized on first call for faster startup."""
    global _llm
    if _llm is None:
        logger.info("Initializing LLM (first time)...")
        openai_key = settings.OPENAI_API_KEY
        if not openai_key:
            logger.error("OPENAI_API_KEY not found in environment variables")
            raise ValueError(
                "OpenAI API key is required. Please set the OPENAI_API_KEY "
                "environment variable."
            )
        try:
            _llm = ChatOpenAI(
                model="gpt-4o",
                api_key=openai_key,
                base_url=settings.OPENAI_BASE_URL,
                temperature=0.0,
                max_tokens=2048,
                request_timeout=30,  # generous timeout for stability
                max_retries=2,
                streaming=True,
            )
            logger.info("LLM initialized successfully")
        except Exception as e:
            logger.error(f"Failed to initialize LLM: {e}")
            raise
    return _llm


def create_llm():
    """Backward-compatible alias for get_llm()."""
    return get_llm()


# Lazy loading - only initialize when actually needed
LLM = None  # Will be loaded on first use
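
# A minimal usage sketch (the import path "config" is an assumption about
# this file's name; .invoke() is LangChain's standard Runnable interface):
#
#   from config import get_llm
#
#   llm = get_llm()  # first call builds the client; later calls reuse it
#   reply = llm.invoke("List common drug interactions of warfarin.")
#   print(reply.content)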
# --- Embedding Model Configuration with lazy loading ---
_embedding_model = None


def get_embedding_model():
    """Get the embedding model, lazily loaded on first call for faster startup."""
    global _embedding_model
    if _embedding_model is None:
        logger.info("Loading embedding model (first time)...")
        try:
            _embedding_model = HuggingFaceEmbeddings(
                model_name="abhinand/MedEmbed-base-v0.1",
                model_kwargs={"device": "cpu"},
                encode_kwargs={"normalize_embeddings": True},
            )
            logger.info("Embedding model loaded successfully")
        except Exception as e:
            logger.error(f"Failed to load embedding model: {e}")
            # Chain the original exception so the root cause is preserved
            raise ValueError("Failed to load embedding model") from e
    return _embedding_model


# For backward compatibility
def create_embedding_model():
    """Backward-compatible alias for get_embedding_model()."""
    return get_embedding_model()


# Lazy loading - only load when actually needed
EMBEDDING_MODEL = None  # Will be loaded on first use
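
# A minimal usage sketch; embed_query()/embed_documents() are the standard
# LangChain embeddings interface:
#
#   embeddings = get_embedding_model()
#   vec = embeddings.embed_query("first-line treatment for hypertension")
#   # vec is a plain list of floats, L2-normalized per encode_kwargs above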
# Configuration validation
def validate_config():
    """Validate all required configuration values."""
    required_env_vars = ["OPENAI_API_KEY"]
    missing_vars = [var for var in required_env_vars if not getattr(settings, var, None)]
    if missing_vars:
        raise ValueError(f"Missing required environment variables: {missing_vars}")
    logger.info("Configuration validation completed")


# Run validation on import
try:
    validate_config()
except Exception as e:
    logger.error(f"Configuration validation failed: {e}")
    raise  # bare raise preserves the original traceback