-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy path.env.example
More file actions
65 lines (47 loc) · 1.46 KB
/
.env.example
File metadata and controls
65 lines (47 loc) · 1.46 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
# Copy this file to .env and customize for your setup
# === Network ===
# Where workers are located (for local docker-compose)
WORKER_URLS=http://worker1:5000,http://worker2:5000
# For Docker Swarm, use the service name instead
# WORKER_SERVICE=llm_worker
# WORKER_PORT=5000
# Router listen address
HOST=0.0.0.0
PORT=5000
# === Timeouts (seconds) ===
# How long to wait for worker health check
HEALTH_TIMEOUT=2
# How long to wait for inference response
REQUEST_TIMEOUT=30
# How many times to retry if a worker fails
MAX_RETRIES=2
# === Model ===
# HuggingFace model to use
# Light models: distilgpt2, distilbert-base-uncased
# Medium: gpt2, gpt-neo-125M
# Large: gpt-neo-2.7B (requires >4GB RAM)
MODEL_NAME=distilgpt2
# Max tokens to generate
MAX_LENGTH=100
# Temperature controls randomness (0=deterministic, 1=more random)
TEMPERATURE=0.7
# Use sampling (True) or greedy (False) for generation
DO_SAMPLE=True
# === DPR Models (for retrieval) ===
# DPR question encoder for encoding queries
DPR_QUESTION_ENCODER=facebook/dpr-question_encoder-single-nq-base
# DPR context encoder for encoding corpus passages
DPR_CONTEXT_ENCODER=facebook/dpr-ctx_encoder-single-nq-base
# PDF corpus directory
PDF_DIR=pdf_corpus
# Data directory for persisting embeddings
DATA_DIR=data
# Batch size for encoding
ENCODE_BATCH=32
# === System ===
# Enable debug mode (True/False)
DEBUG=False
# Logging level: DEBUG, INFO, WARNING, ERROR
LOG_LEVEL=INFO
# Where to save log files
LOGS_DIR=logs