-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy path.env.example
More file actions
53 lines (43 loc) · 1.25 KB
/
.env.example
File metadata and controls
53 lines (43 loc) · 1.25 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
# Environment Variables Template for Production Speech-to-Speech System
# Copy this file to .env and fill in your actual values
# Every value below is a placeholder or a sample default. Comments are kept on
# their own lines because dotenv parsers differ in how they treat trailing
# "# ..." text after a value.
# HuggingFace Authentication (REQUIRED)
# Replace the placeholder with your own Hugging Face access token.
HF_TOKEN=your_huggingface_token_here
# GitHub Configuration (optional)
# Placeholders only; which features read these is not visible in this file.
GITHUB_TOKEN=your_github_token_here
GITHUB_USERNAME=your_username
GITHUB_EMAIL=your_email@example.com
# CUDA and GPU Configuration
# CUDA_VISIBLE_DEVICES: comma-separated GPU indices exposed to CUDA programs;
# "0" exposes only the first device.
CUDA_VISIBLE_DEVICES=0
# PYTORCH_CUDA_ALLOC_CONF: PyTorch caching-allocator options. max_split_size_mb
# stops the allocator from splitting blocks larger than this size (in MB),
# which can reduce fragmentation.
PYTORCH_CUDA_ALLOC_CONF=max_split_size_mb:512
# TOKENIZERS_PARALLELISM: "false" turns off the Hugging Face tokenizers
# library's internal thread parallelism.
TOKENIZERS_PARALLELISM=false
# System Optimization
# Thread caps for OpenMP and Intel MKL respectively. The sample value 8 is not
# derived from anything in this file; adjust to the host's CPU core count.
OMP_NUM_THREADS=8
MKL_NUM_THREADS=8
# Model Configuration
# NOTE(review): these are application-specific settings; units and exact
# semantics are not shown here. MODEL_LOAD_TIMEOUT is presumably seconds,
# MAX_MODEL_LEN presumably tokens, and GPU_MEMORY_UTILIZATION presumably a
# 0-1 fraction of GPU memory - TODO confirm against the code that reads them.
MODEL_CACHE_DIR=./model_cache
MODEL_LOAD_TIMEOUT=300
MAX_MODEL_LEN=2048
GPU_MEMORY_UTILIZATION=0.8
# Server Configuration
# NOTE(review): if SERVER_HOST is used as the bind address, 0.0.0.0 means
# "listen on all IPv4 interfaces"; use 127.0.0.1 for local-only access.
# Each port value below is distinct. The HTTP / WebSocket / health / metrics
# roles are inferred from the variable names - verify against the server code.
SERVER_HOST=0.0.0.0
SERVER_HTTP_PORT=8000
SERVER_WS_PORT=8765
SERVER_HEALTH_PORT=8005
SERVER_METRICS_PORT=8766
# Performance Tuning
# NOTE(review): units are not stated in this file. SAMPLE_RATE is presumably
# Hz, LATENCY_TARGET presumably milliseconds, CHUNK_SIZE presumably audio
# samples per chunk - TODO confirm. How MEMORY_FRACTION (0.9) relates to
# GPU_MEMORY_UTILIZATION (0.8) above is also not visible here.
CHUNK_SIZE=512
SAMPLE_RATE=16000
LATENCY_TARGET=300
MEMORY_FRACTION=0.9
# Optimization Flags
# Boolean switches, all enabled in this template. Presumably they toggle the
# feature named in each variable; accepted spellings (true/false, 1/0) depend
# on the application's parser - TODO confirm.
ENABLE_TORCH_COMPILE=true
ENABLE_FLASH_ATTENTION=true
ENABLE_QUANTIZATION=true
ENABLE_KV_CACHE=true
# Logging Configuration
# LOG_FILE is a relative path; presumably resolved against the process's
# working directory, and the ./logs directory may need to exist beforehand.
LOG_LEVEL=INFO
LOG_FILE=./logs/voxtral_streaming.log
# Security Note:
# Never commit the actual .env file with real tokens to version control
# Always use placeholder values in documentation and setup files
# Keep your actual tokens secure and private