-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathconfig.py
More file actions
18 lines (16 loc) · 923 Bytes
/
config.py
File metadata and controls
18 lines (16 loc) · 923 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
# --- Ollama configuration ---

# Name of the model to use (for example "llama2", "mistral", or "gemma3:1b").
OLLAMA_MODEL: str = "gemma3:4b"

# Address of the Ollama server; this value is the default Ollama URL.
OLLAMA_BASE_URL: str = "http://localhost:11434"

# Enables thinking mode when the selected model supports it.
OLLAMA_THINK_MODE: bool = False

# Context window size.
OLLAMA_CONTEXT: int = 4096

# Keep the model loaded for this many minutes.
# NOTE(review): Ollama's API treats a bare numeric keep_alive as seconds —
# confirm the code that consumes this value converts it to minutes.
OLLAMA_KEEP_ALIVE: int = 30
# --- File paths ---

# Prompt template; contains an {INPUT} placeholder.
PROMPT_FILE: str = "prompt.txt"

# Input file, one item per line.
INPUT_FILE: str = "input.txt"

# Results file, written in JSONL format.
OUTPUT_FILE: str = "output.jsonl"

# Log file for errors.
ERROR_FILE: str = "errors.log"
# --- Performance settings ---
#
# Benchmark results with 3 workers:
#   gemma3:1b -> 2.65 items/s (100% efficiency)
#   gemma3:4b -> 0.85 items/s (3x slower but more accurate)

# Number of parallel workers; 3 is the worker count used in the benchmarks above.
PARALLEL_WORKERS: int = 3

# Maximum number of seconds allowed per request (not currently enforced).
REQUEST_TIMEOUT: int = 120