Skip to content

Commit 2b1fe5d

Browse files
committed
perf: true SSE streaming pass-through and reduced lock contention
Replace buffered collect-then-respond streaming with channel-backed incremental SSE forwarding for both OpenAI and Responses API endpoints. Reduce write lock hold times by performing token refresh and file I/O outside the lock. Increase default concurrency (1→10) and reduce minimum request interval (500ms→50ms).
1 parent e224f65 commit 2b1fe5d

File tree

2 files changed

+773
-549
lines changed

2 files changed

+773
-549
lines changed

src/config.rs

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -206,10 +206,10 @@ pub struct CloudCodeConfig {
206206
/// Maximum retry attempts for failed requests (default: 5)
207207
#[serde(default = "default_max_retries")]
208208
pub max_retries: u32,
209-
/// Maximum concurrent requests to Cloud Code API (default: 1)
209+
/// Maximum concurrent requests to Cloud Code API (default: 10)
210210
#[serde(default = "default_max_concurrent")]
211211
pub max_concurrent_requests: usize,
212-
/// Minimum interval between requests in milliseconds (default: 500)
212+
/// Minimum interval between requests in milliseconds (default: 50)
213213
#[serde(default = "default_min_request_interval")]
214214
pub min_request_interval_ms: u64,
215215
}
@@ -223,11 +223,11 @@ fn default_max_retries() -> u32 {
223223
}
224224

225225
fn default_max_concurrent() -> usize {
226-
1
226+
10
227227
}
228228

229229
fn default_min_request_interval() -> u64 {
230-
500
230+
50
231231
}
232232

233233
impl Default for CloudCodeConfig {

0 commit comments

Comments
 (0)