# Corrected RAG System Configuration
# This config works with the corrected code implementation

# API endpoints and credentials, keyed by provider name.
# The '${VAR}' values are placeholders named after environment variables.
# NOTE(review): nothing in this file performs the substitution - confirm that
# the config loader expands them; otherwise the literal text is used as the key.
apis:
  siliconflow:
    api_key: '${SILICONFLOW_API_KEY}'
    base_url: 'https://api.siliconflow.com/v1'
  groq:
    api_key: '${GROQ_API_KEY}'
    base_url: 'https://api.groq.com/openai/v1'
    
# Model identifiers, grouped by the provider that serves them.
models:
  # Served through SiliconFlow
  embedding_model: 'Qwen/Qwen3-Embedding-8B'
  reranker_model: 'Qwen/Qwen3-Reranker-8B'

  # Served through Groq (OpenAI-compatible API)
  llm_model: 'openai/gpt-oss-120b'  # primary model
  alternative_models:
    - 'openai/gpt-oss-20b'  # faster, less capable
    - 'qwen/qwen3-32b'  # good balance
    
# Core retrieval-augmented generation (RAG) pipeline parameters.
rag_system:
  # Chunking
  # NOTE(review): the unit of chunk_size / chunk_overlap (characters vs.
  # tokens) is not stated in this file - confirm against the text splitter.
  chunk_size: 512
  chunk_overlap: 50
  max_context_chunks: 5

  # Retrieval
  similarity_threshold: 0.7
  rerank_top_k: 20
  final_top_k: 5

  # Generation
  temperature: 0.1
  max_tokens: 4096

  # Performance
  # NOTE(review): batch_size and max_retries are also set under `performance`,
  # and caching is also toggled by `cache.enabled` - confirm which keys the
  # code actually reads and keep the copies in sync.
  batch_size: 32
  max_retries: 3
  enable_caching: true

# Text splitting and language settings.
text_processing:
  # Separator strings used for text splitting. Double quotes are required so
  # that "\n" is parsed as a newline character; the last entry is the empty
  # string.
  separators:
    - "\n\n"
    - "\n"
    - " "
    - ""

  # Language and character encoding
  language: 'korean'
  encoding: 'utf-8'

# Vector store settings (only relevant when a vector store is used).
vector_store:
  provider: 'qdrant'
  collection_name: 'manufacturing_docs'
  # NOTE(review): presumably this must equal the dimensionality of the vectors
  # produced by models.embedding_model. Qwen3-Embedding-8B natively emits
  # 4096-dimensional vectors, so 1024 is only correct if the embedding request
  # asks for a reduced output size - confirm before creating the collection.
  vector_size: 1024
  distance_metric: 'cosine'

  # Qdrant connection, given as environment-variable placeholders
  qdrant_url: '${QDRANT_URL}'
  qdrant_api_key: '${QDRANT_API_KEY}'

# Document ingestion settings: accepted file types, size limit and extraction.
document_processing:
  # File extensions accepted for ingestion (leading dot included)
  supported_formats:
    - '.pdf'
    - '.xlsx'
    - '.xls'
    - '.txt'
    - '.md'
    - '.png'
    - '.jpg'
    - '.jpeg'

  # Upper bound on the size of a single file, in megabytes
  max_file_size_mb: 100

  # Extraction toggles
  extract_images: true
  extract_tables: true
  ocr_enabled: true

  # OCR
  # NOTE(review): 'kor+eng' looks like a Tesseract-style language list
  # (Korean plus English) - confirm against the OCR engine in use.
  ocr_language: 'kor+eng'
  ocr_confidence_threshold: 0.6

# Logging: verbosity, record layout and log-file settings.
logging:
  level: 'INFO'
  # Record layout using %(name)s-style placeholders.
  # NOTE(review): presumably consumed by Python's logging.Formatter - confirm.
  format: '%(asctime)s - %(name)s - %(levelname)s - %(message)s'

  # File output
  # NOTE(review): max_file_size_mb / backup_count look like rotation settings;
  # confirm that the logging setup applies them.
  file_logging: true
  log_file: 'logs/rag_system.log'
  max_file_size_mb: 10
  backup_count: 5

# Performance Configuration: rate limits, timeouts, retries and concurrency.
performance:
  # Rate limiting (requests per minute, per provider)
  siliconflow_requests_per_minute: 60
  groq_requests_per_minute: 30

  # API timeout. This setting exists under two spellings. Both are kept so
  # that whichever one the code reads still resolves, and both now carry the
  # same value (raised to 60 for large documents) so they can no longer
  # disagree. Previously api_timeout_seconds was left at 30.
  # NOTE(review): confirm which key the code reads and drop the other.
  api_timeout: 60
  api_timeout_seconds: 60

  # Retries
  # NOTE(review): the unit of retry_delay is not stated here (presumably
  # seconds) - confirm against the retry logic.
  max_retries: 3
  retry_delay: 5

  # Batching and concurrency
  batch_size: 32  # Consider reducing this for large documents
  max_workers: 4
  

# Cache settings.
cache:
  enabled: true
  # Backend selection; options: memory, redis, file
  type: 'memory'
  # Entry lifetime in seconds
  ttl_seconds: 3600
  # NOTE(review): unit of max_size (entries vs. bytes) is not stated - confirm.
  max_size: 1000

# Evaluation settings: which metrics to compute and where results go.
evaluation:
  metrics:
    - 'accuracy'
    - 'relevance'
    - 'coherence'
  # NOTE(review): how the threshold is applied to the metrics is not stated
  # in this file - confirm against the evaluation code.
  threshold: 0.8
  save_results: true
  results_dir: 'evaluation_results'

# Development / debugging switches; all are turned off in this file.
debug:
  verbose_logging: false
  save_intermediate_results: false
  profiling_enabled: false