1+ # AgentaFlow SRO Community Edition - Environment Configuration
2+ # Copy this file to .env and update with your actual values
3+
4+ # =============================================================================
5+ # GENERAL SETTINGS
6+ # =============================================================================
7+
8+ # Application environment (development, staging, production)
9+ APP_ENV = development
10+
11+ # Log level (debug, info, warn, error)
12+ LOG_LEVEL = info
13+
14+ # Application port
15+ PORT = 8080
16+
17+ # =============================================================================
18+ # KUBERNETES CONFIGURATION
19+ # =============================================================================
20+
21+ # Kubernetes cluster configuration
22+ KUBECONFIG_PATH = ~/.kube/config
23+ K8S_NAMESPACE = agentaflow-monitoring
24+ K8S_SERVICE_ACCOUNT = agentaflow-scheduler
25+
26+ # Kubernetes GPU scheduler settings
27+ K8S_GPU_SCHEDULER_ENABLED = true
28+ K8S_GPU_SCHEDULER_STRATEGY = least-utilized
29+ K8S_GPU_RESOURCE_NAME = nvidia.com/gpu
30+
31+ # =============================================================================
32+ # GPU ORCHESTRATION
33+ # =============================================================================
34+
35+ # GPU monitoring intervals (seconds)
36+ GPU_METRICS_INTERVAL = 5
37+ GPU_HEALTH_CHECK_INTERVAL = 30
38+
39+ # GPU scheduling configuration
40+ GPU_SCHEDULER_STRATEGY = least-utilized
41+ GPU_MAX_UTILIZATION_THRESHOLD = 90
42+ GPU_MIN_UTILIZATION_THRESHOLD = 10
43+
44+ # GPU resource limits
45+ GPU_MEMORY_LIMIT_MB = 16384
46+ GPU_TEMPERATURE_THRESHOLD = 85
47+ GPU_POWER_LIMIT_WATTS = 300
48+
49+ # =============================================================================
50+ # MODEL SERVING OPTIMIZATION
51+ # =============================================================================
52+
53+ # Batch processing configuration
54+ BATCH_MAX_SIZE = 32
55+ BATCH_MAX_WAIT_TIME_MS = 100
56+
57+ # Caching configuration
58+ CACHE_TTL_MINUTES = 5
59+ CACHE_MAX_SIZE_MB = 1024
60+ CACHE_ENABLED = true
61+
62+ # Load balancing
63+ LOAD_BALANCER_STRATEGY = round-robin
64+
65+ # =============================================================================
66+ # OBSERVABILITY & MONITORING
67+ # =============================================================================
68+
69+ # Prometheus configuration
70+ PROMETHEUS_ENABLED = true
71+ PROMETHEUS_PORT = 9090
72+ PROMETHEUS_METRICS_PATH = /metrics
73+ PROMETHEUS_SCRAPE_INTERVAL = 15s
74+
75+ # Grafana configuration (the admin password below is a sample default - change it before any real deployment)
76+ GRAFANA_ENABLED = true
77+ GRAFANA_PORT = 3000
78+ GRAFANA_ADMIN_USER = admin
79+ GRAFANA_ADMIN_PASSWORD = agentaflow123
80+
81+ # Metrics collection
82+ METRICS_BUFFER_SIZE = 10000
83+ METRICS_RETENTION_HOURS = 24
84+ METRICS_EXPORT_INTERVAL_SECONDS = 15
85+
86+ # =============================================================================
87+ # COST TRACKING
88+ # =============================================================================
89+
90+ # GPU cost configuration (USD per hour)
91+ COST_GPU_A100 = 3.06
92+ COST_GPU_V100 = 3.06
93+ COST_GPU_T4 = 0.526
94+ COST_GPU_RTX = 1.00
95+ COST_GPU_GENERIC = 1.50
96+
97+ # Cost calculation settings
98+ COST_TRACKING_ENABLED = true
99+ COST_CURRENCY = USD
100+ COST_UTILIZATION_MIN_FACTOR = 0.1
101+ COST_UTILIZATION_MAX_FACTOR = 1.0
102+
103+ # =============================================================================
104+ # CLOUD PROVIDER INTEGRATION
105+ # =============================================================================
106+
107+ # AWS Configuration (for cost tracking and resource management)
108+ AWS_REGION = us-west-2
109+ AWS_ACCESS_KEY_ID = your_aws_access_key
110+ AWS_SECRET_ACCESS_KEY = your_aws_secret_key
111+
112+ # Google Cloud Platform
113+ GCP_PROJECT_ID = your_gcp_project
114+ GCP_SERVICE_ACCOUNT_KEY_PATH = path/to/service-account.json
115+
116+ # Azure
117+ AZURE_SUBSCRIPTION_ID = your_azure_subscription
118+ AZURE_CLIENT_ID = your_azure_client_id
119+ AZURE_CLIENT_SECRET = your_azure_client_secret
120+ AZURE_TENANT_ID = your_azure_tenant_id
121+
122+ # =============================================================================
123+ # DATABASE (if using persistent storage)
124+ # =============================================================================
125+
126+ # Database configuration (optional - for persistent metrics storage)
127+ DB_ENABLED = false
128+ DB_TYPE = postgres
129+ DB_HOST = localhost
130+ DB_PORT = 5432
131+ DB_NAME = agentaflow
132+ DB_USER = agentaflow_user
133+ DB_PASSWORD = your_db_password
134+ DB_SSL_MODE = disable
135+
136+ # =============================================================================
137+ # SECURITY
138+ # =============================================================================
139+
140+ # API authentication
141+ API_KEY = your_secure_api_key
142+ JWT_SECRET = your_jwt_secret_key
143+ AUTH_ENABLED = false
144+
145+ # TLS configuration
146+ TLS_ENABLED = false
147+ TLS_CERT_PATH = path/to/cert.pem
148+ TLS_KEY_PATH = path/to/key.pem
149+
150+ # =============================================================================
151+ # ALERTS & NOTIFICATIONS
152+ # =============================================================================
153+
154+ # Alert thresholds
155+ ALERT_GPU_HIGH_UTILIZATION = 90
156+ ALERT_GPU_HIGH_TEMPERATURE = 80
157+ ALERT_GPU_HIGH_MEMORY = 85
158+ ALERT_WORKLOAD_QUEUE_SIZE = 100
159+
160+ # Notification endpoints (optional)
161+ SLACK_WEBHOOK_URL = https://hooks.slack.com/services/YOUR/SLACK/WEBHOOK
162+ EMAIL_SMTP_HOST = smtp.gmail.com
163+ EMAIL_SMTP_PORT = 587
165+ EMAIL_PASSWORD = your_email_password
166+
167+ # =============================================================================
168+ # DEBUGGING & DEVELOPMENT
169+ # =============================================================================
170+
171+ # Debug settings
172+ DEBUG_ENABLED = false
173+ PROFILING_ENABLED = false
174+ TRACE_ENABLED = false
175+
176+ # Performance monitoring
177+ PERFORMANCE_MONITORING = true
178+ SLOW_QUERY_THRESHOLD_MS = 1000
179+
180+ # =============================================================================
181+ # EXPERIMENTAL FEATURES
182+ # =============================================================================
183+
184+ # Feature flags
185+ FEATURE_AUTO_SCALING = false
186+ FEATURE_PREDICTIVE_SCHEDULING = false
187+ FEATURE_MULTI_TENANT = false
188+ FEATURE_ADVANCED_ANALYTICS = true
189+
190+ # Experimental GPU features
191+ EXPERIMENTAL_MULTI_GPU_WORKLOADS = false
192+ EXPERIMENTAL_GPU_SHARING = false
192+ EXPERIMENTAL_GPU_SHARING = false