-
Notifications
You must be signed in to change notification settings - Fork 12
Expand file tree
/
Copy pathconfig-e176.yaml
More file actions
35 lines (32 loc) · 1.05 KB
/
config-e176.yaml
File metadata and controls
35 lines (32 loc) · 1.05 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
# In production, this file is automatically generated by the `ansible` playbook.
# Configuration with structured sections and default values
# Web Search Configuration
# Settings for the external web-search backend. All keys below are nested
# under `web_search`; without the indentation they would parse as unrelated
# top-level keys and `web_search` itself would be null.
web_search:
  # No key is set in this default file.
  # NOTE(review): presumably injected per deployment - confirm.
  api_key: null
  # Brave Search web-search endpoint.
  api_path: "https://api.search.brave.com/res/v1/web/search"
  # NOTE(review): presumably the number of results requested per query - confirm.
  count: 3
  # Language and country codes for the search.
  # NOTE(review): presumably forwarded to the search API as-is - confirm.
  lang: "en"
  country: "us"
  # NOTE(review): presumably a request timeout in seconds - confirm units.
  timeout: 20.0
  # Throttling knobs for outgoing search calls.
  # NOTE(review): `rps` presumably means requests per second - confirm.
  max_concurrent_requests: 20
  rps: 20
# Rate Limiting Configuration
# All keys below are nested under `rate_limiting`; without the indentation
# they would parse as unrelated top-level keys and `rate_limiting` itself
# would be null.
# NOTE(review): a null limit presumably means "no limit for that window" -
# confirm against the consumer.
rate_limiting:
  # Per-user request limits by time window.
  user_rate_limit: null  # "For-good" limit, i.e. not tied to a time window
  user_rate_limit_minute: 100
  user_rate_limit_hour: 1000
  user_rate_limit_day: 10000
  # Web-search limits by time window.
  web_search_rate_limit_minute: null
  web_search_rate_limit_hour: null
  web_search_rate_limit_day: 500
  web_search_rate_limit: null  # "For-good" limit, i.e. not tied to a time window
  # Concurrent-request limit per model, keyed by model identifier.
  model_concurrent_rate_limit:
    meta-llama/Llama-3.2-1B-Instruct: 45
    meta-llama/Llama-3.2-3B-Instruct: 50
    meta-llama/Llama-3.1-8B-Instruct: 30
    cognitivecomputations/Dolphin3.0-Llama3.1-8B: 30
    deepseek-ai/DeepSeek-R1-Distill-Qwen-14B: 5
    hugging-quants/Meta-Llama-3.1-70B-Instruct-AWQ-INT4: 5
    openai/gpt-oss-20b: 50
    google/gemma-3-27b-it: 50
    # NOTE(review): presumably the fallback for models not listed above;
    # placement inside this map is inferred from ordering - confirm.
    default: 50