# .env.example
# Example environment variable settings; replace placeholder values before use.
# Database Configuration
# Host, port, database name and credentials for the database connection.
# NOTE(review): port 5432 and user "postgres" suggest PostgreSQL - confirm.
# DB_PASSWORD is a placeholder and must be replaced with the real password.
DB_HOST=localhost
DB_PORT=5432
DB_NAME=memory_db
DB_USER=postgres
DB_PASSWORD=your_secure_password_here
# API Keys
# Both values are truncated placeholders ("sk-...", "sk-ant-..."); replace
# them with real keys. Never commit real keys to version control.
OPENAI_API_KEY=sk-...
ANTHROPIC_API_KEY=sk-ant-...
# Application Settings
# Comments are kept on their own lines: some env-file loaders only recognise
# full-line comments and would read trailing "# ..." text as part of the value.
# ENVIRONMENT: one of development, staging, production
ENVIRONMENT=development
DEBUG=true
LOG_LEVEL=INFO
# Model Settings
# USE_GPU: true/false flag.
# CUDA_VISIBLE_DEVICES: index of the GPU device(s) exposed to CUDA.
# TRANSFORMERS_CACHE: directory path for the model cache.
# NOTE(review): presumably the Hugging Face Transformers cache - confirm.
USE_GPU=true
CUDA_VISIBLE_DEVICES=0
TRANSFORMERS_CACHE=/app/models/cache
# Security
# Both values are placeholders. As the SECRET_KEY placeholder text says, it
# must be changed before running in production; replace API_KEY as well.
SECRET_KEY=your-secret-key-here-change-in-production
API_KEY=your-api-key-here
# Redis (for task queue)
# Host, port and database index of the Redis instance.
# REDIS_PASSWORD is empty in this example.
# NOTE(review): presumably an empty value means no authentication - confirm.
REDIS_HOST=localhost
REDIS_PORT=6379
REDIS_DB=0
REDIS_PASSWORD=
# Monitoring
# ENABLE_METRICS: true/false flag.
# METRICS_PORT: port number for metrics.
# NOTE(review): presumably the port the metrics endpoint listens on - confirm.
ENABLE_METRICS=true
METRICS_PORT=9090
# Memory Management Configuration
# MEMORY_APPROACH: Choose between 'external_llm' (Approach 1) or 'slm' (Approach 2)
# - external_llm: Context partitioning with compression/summarization for external LLMs
# - slm: Dual-model system with Small Language Model for memory management
# NOTE(review): USE_SLM is a separate flag in this file; confirm whether it
# must also be set to true when MEMORY_APPROACH=slm.
MEMORY_APPROACH=external_llm
# Primary LLM Configuration (used for reasoning and responses)
# Comments are kept on their own lines: some env-file loaders only recognise
# full-line comments and would read trailing "# ..." text as part of the value.
# PRIMARY_LLM_PROVIDER: openai or anthropic
PRIMARY_LLM_PROVIDER=openai
# PRIMARY_LLM_MODEL: gpt-4o, gpt-4o-mini, gpt-4-turbo, claude-3-sonnet, etc.
PRIMARY_LLM_MODEL=gpt-4o-mini
# SLM Configuration (optional, used when MEMORY_APPROACH=slm)
# Comments are kept on their own lines: some env-file loaders only recognise
# full-line comments and would read trailing "# ..." text as part of the value.
# USE_SLM: enable/disable Small Language Model for memory management
USE_SLM=false
# SLM_MODEL_NAME: gemma-3-4b, microsoft/phi-2, etc.
SLM_MODEL_NAME=microsoft/phi-2
# USE_LORA_FINETUNING: enable/disable LoRA fine-tuning for SLM
USE_LORA_FINETUNING=false
# Feature Flags
# true/false toggles; all three are enabled in this example.
# NOTE(review): ENABLE_COMPRESSION and ENABLE_SUMMARIZATION presumably relate
# to the 'external_llm' memory approach described in this file - confirm.
ENABLE_AUTO_TRAINING=true
ENABLE_COMPRESSION=true
ENABLE_SUMMARIZATION=true