# conf.yml
---
# Top-level settings.
version: 1
threads: 3

# File paths. Names without a directory are relative paths.
# NOTE(review): error_log and upgrade_sock are named "load_balancer" while
# pid_file is named "burgonet" - confirm the mismatch is intended.
pid_file: /tmp/burgonet.pid
upgrade_sock: /tmp/load_balancer.sock
error_log: /tmp/load_balancer_err.log
log_config_file: log4rs.yml
db_filepath: database.redb

# Host/port pairs, listed in port order. Every host is 127.0.0.1.
admin_host: 127.0.0.1
admin_port: 6189

chat_host: 127.0.0.1
chat_port: 6190

host: 127.0.0.1
port: 6191

prometheus_host: 127.0.0.1
prometheus_port: 6192

echo_host: 127.0.0.1
echo_port: 6193
# HTTP header names used for trust-header authentication.
# NOTE(review): presumably the value of any of these headers is accepted as
# the caller's identity; that is only safe when an upstream proxy strips
# client-supplied copies - confirm against the deployment.
trust_header_authentication:
- 'Tailscale-User-Login'
- 'Cf-Access-Authenticated-User-Email'
- 'X-Forwarded-Email'
# Route table: each list item is one mapping keyed by `location`.
models:
# Echo route; proxy_pass targets 127.0.0.1:6193, the echo_host/echo_port
# pair declared at the top level of this file.
# NOTE(review): this local route carries $DEEPSEEK_API_KEY while the other
# 127.0.0.1 routes use "NA" - confirm the key is really meant to be sent here.
- location: "/echo"
  model_name: "echo"
  parser: "echo"
  proxy_pass: "http://127.0.0.1:6193/echo"
  api_key: "$DEEPSEEK_API_KEY"
  pii_protection_url: "http://127.0.0.1:8001/check-pii-base64"
# Ollama route on 127.0.0.1:11434.
# disabled_groups and blacklist_words are single comma-separated strings,
# not YAML lists.
- location: "/ollama/gemma2/2b/"
  model_name: "gemma2:2b-instruct-q6_K"
  parser: "ollama"
  proxy_pass: "http://127.0.0.1:11434/api/chat"
  api_key: "NA"
  disabled_groups: "mammals, birds"
  blacklist_words: "confidential, mycorp"
  pii_protection_url: "http://127.0.0.1:8001/check-pii-base64"
# Same upstream and filters as the /ollama/gemma2/2b/ route, plus quotas.
- location: "/quotas/test"
  model_name: "gemma2:2b-instruct-q6_K"
  parser: "ollama"
  proxy_pass: "http://127.0.0.1:11434/api/chat"
  api_key: "NA"
  disabled_groups: "mammals, birds"
  blacklist_words: "confidential, mycorp"
  pii_protection_url: "http://127.0.0.1:8001/check-pii-base64"
  # Each quota item maps a limit kind to per-period values.
  # NOTE(review): nesting reconstructed as a list of single-key mappings;
  # verify against the gateway's config schema.
  quotas:
  - max_tokens:
      minute: 50000
      hour: 60000
      day: 1000000
      # NOTE(review): the weekly value is lower than the hourly and daily
      # values, so those larger limits can never be reached - confirm this
      # is deliberate for the quota test.
      week: 10000
  - max_requests:
      second: 1
      minute: 15
# llama.cpp route; upstream host is "m1" rather than 127.0.0.1.
# NOTE(review): this entry uses `provider` where the other entries in this
# list use `parser`, and it sets no api_key - confirm both are intended.
- location: "/llamacpp/"
  model_name: "phi4-GGUF-Q4_K"
  provider: "llamacpp"
  proxy_pass: "http://m1:8081/completion"
# OpenAI chat-completions route; api_key is written as the placeholder
# $OPENAI_API_KEY rather than a literal secret.
- location: "/api.openai.com/v1/chat/completions"
  model_name: "openai"
  parser: "openai"
  proxy_pass: "https://api.openai.com/v1/chat/completions"
  api_key: "$OPENAI_API_KEY"
# DeepSeek chat-completions route; api_key is written as the placeholder
# $DEEPSEEK_API_KEY rather than a literal secret.
- location: "/api.deepseek.com/chat/completions"
  model_name: "deepseek-chat"
  parser: "deepseek"
  proxy_pass: "https://api.deepseek.com/chat/completions"
  api_key: "$DEEPSEEK_API_KEY"
# NOTE(review): `location` is identical to the route whose model_name is
# "openai" earlier in this list, so the two entries compete for the same
# path. This entry also has no `parser`, a proxy_pass without a request path,
# and a literal placeholder key - it looks like a leftover template; confirm
# whether it should be removed or given its own location.
- location: "/api.openai.com/v1/chat/completions"
  model_name: "gpt4o"
  proxy_pass: "https://api.openai.com"
  api_key: "YOUR_API_KEY"
# Azure OpenAI template route. YOUR_RESOURCE_NAME, YOUR_DEPLOYMENT_ID-id and
# YOUR_API_KEY are placeholders that must be replaced before use.
# No `parser` is set on this entry.
- location: "/openai.azure.com/v1/chat/completions"
  model_name: "azuregpt4"
  proxy_pass: "https://YOUR_RESOURCE_NAME.openai.azure.com/openai/deployments/YOUR_DEPLOYMENT_ID-id/completions?api-version=2024-10-21"
  api_key: "YOUR_API_KEY"
# Gemini generateContent route.
# NOTE(review): $GEMINI_API_KEY appears both in the proxy_pass query string
# and in api_key. A key carried in the URL can end up in access logs; confirm
# which of the two the gateway actually needs and drop the other.
- location: "/gemini"
  model_name: "gemini-1.5-flash"
  parser: "gemini"
  proxy_pass: "https://generativelanguage.googleapis.com/v1beta/models/gemini-1.5-flash:generateContent?key=$GEMINI_API_KEY"
  api_key: "$GEMINI_API_KEY"