rag_korean_manufacturing_docs / src /evaluation_config.yaml
A7m0d's picture
Upload folder using huggingface_hub
7dfe46c verified
# Evaluation Settings
evaluation:
threshold: 0.8
verbose_mode: true
max_retries: 3
timeout_seconds: 30
# Dataset Settings
dataset:
input_column: "input"
output_column: "expected_output"
context_column: null
# Logging Configuration
logging:
level: "INFO"
max_file_size_mb: 10
backup_count: 5
# Output Settings
output:
results_dir: "results"
logs_dir: "logs"
save_detailed_results: true
# Metrics Configuration
metrics:
answer_relevancy:
enabled: true
threshold: 0.8
verbose_mode: true
contextual_precision:
enabled: false
threshold: 0.8
# RAG System Configuration
rag_system:
embedding_model: "qwen3-embedding"
reranker_model: "qwen3-reranker"
llm_model: "openai/gpt-oss-120b" # Groq model
vector_store: "qdrant"
chunk_size: 512
chunk_overlap: 50
max_context_chunks: 5
similarity_threshold: 0.7
rerank_top_k: 20
final_top_k: 5
# API Configuration
apis:
groq_api_key: "${GROQ_API_KEY}"
siliconflow_api_key: "${SILICONFLOW_API_KEY}"
qdrant_url: "${QDRANT_URL}"
qdrant_api_key: "${QDRANT_API_KEY}"
# Document Processing Configuration
document_processing:
pdf_engine: "pymupdf"
excel_engine: "openpyxl"
ocr_engine: "tesseract"
image_processing: true
table_extraction: true
max_file_size_mb: 100
# Storage Configuration
storage:
qdrant_collection: "manufacturing_docs"
metadata_db_path: "./data/metadata.db"
file_storage_path: "./data/documents"
enable_compression: true