# ------------------------------------------------------------------ # RAG CBT QUESTION-ANSWERING SYSTEM CONFIGURATION # ------------------------------------------------------------------ project: name: "cbt-rag-system" category: "psychology" doc_limit: null # Load all pages from the book processing: # Embedding model used for both vector db and evaluator similarity embedding_model: "jinaai/jina-embeddings-v2-small-en" # Options: sentence, recursive, semantic, fixed technique: "recursive" # Jina supports 8192 tokens (~32k chars), using 1000 chars for better context chunk_size: 1000 chunk_overlap: 100 vector_db: base_index_name: "cbt-book" dimension: 512 # Jina outputs 512 dimensions metric: "cosine" batch_size: 50 # Reduced batch size for CPU processing retrieval: # Options: hybrid, semantic, bm25 mode: "hybrid" # Options: cross-encoder, rrf rerank_strategy: "cross-encoder" use_mmr: true top_k: 10 final_k: 5 generation: temperature: 0. max_new_tokens: 512 # The model used to Judge the others (OpenRouter) judge_model: "stepfun/step-3.5-flash:free" # List of contestants in the tournament models: - "Llama-3-8B" - "Mistral-7B" - "Qwen-2.5" - "DeepSeek-V3" - "TinyAya"