-
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathfly.toml
More file actions
65 lines (51 loc) · 1.31 KB
/
fly.toml
File metadata and controls
65 lines (51 loc) · 1.31 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
# Fly.io application name and primary region for this deployment.
app = 'driftos-core'
primary_region = 'lhr'
# Empty build section: no build options are configured in this file.
[build]
# Environment variables passed to the application. Every value is a string,
# including numbers and booleans; the application is expected to parse them.
[env]
NODE_ENV = 'production'
# PORT must stay in sync with http_service.internal_port (both 3000).
PORT = '3000'
# '::' is the IPv6 wildcard address.
# NOTE(review): presumably required so the app is reachable over the private
# (Flycast) network - confirm before changing.
HOST = '::'
LOG_LEVEL = 'info'
# API: routes are mounted under API_PREFIX/API_VERSION. The health check path
# in [[http_service.checks]] ('/api/v1/health') appears to be built from these;
# update it if either value changes.
API_PREFIX = '/api'
API_VERSION = 'v1'
# Rate limiting: intentionally not configured here; all rate limiting is
# handled by the gateway.
# CORS: comma-separated list of allowed browser origins (the demo and the
# playground frontends).
CORS_ORIGIN = 'https://driftos-demo.fly.dev,https://playground.driftos.dev'
CORS_CREDENTIALS = 'true'
# Monitoring
METRICS_ENABLED = 'true'
METRICS_PATH = '/metrics'
# Swagger
# NOTE(review): API docs are enabled while NODE_ENV is 'production';
# presumably acceptable because the service is internal-only - confirm.
SWAGGER_ENABLED = 'true'
SWAGGER_PATH = '/documentation'
# LLM: default provider and model.
LLM_PROVIDER = 'groq'
LLM_MODEL = 'llama-3.1-8b-instant'
# NOTE(review): unit is not stated here; presumably milliseconds - confirm.
LLM_TIMEOUT = '5000'
# Operation-specific LLM models. Drift routing and fact extraction use a
# different model from chat and demo, which use the same model as LLM_MODEL.
DRIFT_ROUTING_MODEL = 'openai/gpt-oss-20b'
FACT_EXTRACTION_MODEL = 'openai/gpt-oss-20b'
CHAT_MODEL = 'llama-3.1-8b-instant'
DEMO_MODEL = 'llama-3.1-8b-instant'
# Drift
DRIFT_MAX_BRANCHES_CONTEXT = '10'
# Embeddings (local)
EMBEDDING_MODEL = 'Xenova/all-MiniLM-L6-v2'
# Internal-only via Flycast (no public IPs)
# HTTP service for the app. internal_port must match PORT in [env].
[http_service]
internal_port = 3000
# HTTP-to-HTTPS redirection is turned off.
# NOTE(review): presumably because traffic arrives over the private Flycast
# network rather than the public edge - confirm before exposing publicly.
force_https = false
# Machines are never stopped automatically, and at least one is kept running.
auto_stop_machines = 'off'
auto_start_machines = true
min_machines_running = 1
# Health check: GET /api/v1/health every 30s with a 10s timeout, starting
# after a 30s grace period. The path mirrors API_PREFIX and API_VERSION in [env].
[[http_service.checks]]
grace_period = '30s'
interval = '30s'
method = 'GET'
timeout = '10s'
path = '/api/v1/health'
# Machine size: one shared CPU with 1 GB of memory.
[[vm]]
memory = '1gb'
cpu_kind = 'shared'
cpus = 1