-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathkeys.json.template
More file actions
41 lines (29 loc) · 1.39 KB
/
keys.json.template
File metadata and controls
41 lines (29 loc) · 1.39 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
{
"_comment": "Configuration template for testing the RAG system",
"_instructions": "Copy this file to 'keys.json' and fill in your actual credentials",
"AZURE_OPENAI_ENDPOINT": "https://your-endpoint.openai.azure.com",
"AZURE_OPENAI_API_KEY": "your-azure-openai-api-key-here",
"AZURE_OPENAI_API_VERSION": "2024-02-01",
"QDRANT_URL": "https://your-cluster-id.region.gcp.cloud.qdrant.io",
"QDRANT_API_KEY": "your-qdrant-api-key-here",
"QDRANT_COLLECTION": "knowledge_embeddings",
"CHUNK_STRATEGY": "SEMANTIC",
"_chunk_strategy_options": "FIXED, OVERLAP, SENTENCE, PARAGRAPH, SEMANTIC, HYBRID, DOC_STRUCTURE, SLIDING_WINDOW",
"EMBED_MODEL": "EMB_3_LARGE",
"_embed_model_options": "ADA_002, EMB_3_SMALL, EMB_3_LARGE",
"LLM_MODEL": "gpt-4o",
"_llm_model_options": "gpt-4o, gpt-4, gpt-4-turbo, gpt-3.5-turbo",
"LLM_MAX_TOKENS": 1000,
"LLM_TEMPERATURE": 0.7,
"RAG_TOP_K": 10,
"_rag_top_k_range": "8-20",
"RAG_RERANK_METHOD": "MMR",
"_rag_rerank_options": "MMR, CROSS_ENCODER, LLM_RERANK",
"RAG_FINAL_CHUNKS": 5,
"_rag_final_chunks_range": "3-7",
"RAG_CONTEXT_MAX_TOKENS": 1500,
"_rag_context_max_tokens_range": "1000-1500",
"RAG_SYSTEM_PROMPT": "You are a retrieval-augmented assistant. Use only the provided context. Cite sources. If unsure, say you don't know.",
"RAG_MMR_DIVERSITY_THRESHOLD": 0.7,
"_rag_mmr_diversity_range": "0.5-0.9"
}