Skip to content

Commit e863cc6

Browse files
authored
Add Language Model Rate Limiting Plugin snippets and documentation (#315)
1 parent 38e11d9 commit e863cc6

File tree

4 files changed

+42
-1
lines changed

4 files changed

+42
-1
lines changed

CHANGELOG.md

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -15,6 +15,8 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
1515
- Code lens: Support for JSONC files
1616
- Snippets: Added `devproxy-plugin-language-model-failure` - LanguageModelFailurePlugin instance
1717
- Snippets: Added `devproxy-plugin-language-model-failure-config` - LanguageModelFailurePlugin config section
18+
- Snippets: Added `devproxy-plugin-language-model-rate-limiting` - LanguageModelRateLimitingPlugin instance
19+
- Snippets: Added `devproxy-plugin-language-model-rate-limiting-config` - LanguageModelRateLimitingPlugin config section
1820

1921
### Changed:
2022

README.md

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -140,6 +140,8 @@ See [Dev Proxy MCP Server](https://github.com/dev-proxy-tools/mcp) for more info
140140
| `devproxy-plugin-latency-config` | LatencyPlugin config section |
141141
| `devproxy-plugin-language-model-failure` | LanguageModelFailurePlugin instance |
142142
| `devproxy-plugin-language-model-failure-config` | LanguageModelFailurePlugin config section |
143+
| `devproxy-plugin-language-model-rate-limiting` | LanguageModelRateLimitingPlugin instance |
144+
| `devproxy-plugin-language-model-rate-limiting-config` | LanguageModelRateLimitingPlugin config section |
143145
| `devproxy-plugin-minimal-csom-permissions` | MinimalCsomPermissionsPlugin instance |
144146
| `devproxy-plugin-minimal-csom-permissions-config` | MinimalCsomPermissionsPlugin config section |
145147
| `devproxy-plugin-minimal-permissions` | MinimalPermissionsPlugin instance |

src/constants.ts

Lines changed: 12 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -118,6 +118,13 @@ export const pluginSnippets: PluginSnippets = {
118118
required: true,
119119
}
120120
},
121+
LanguageModelRateLimitingPlugin: {
122+
instance: 'devproxy-plugin-language-model-rate-limiting',
123+
config: {
124+
name: 'devproxy-plugin-language-model-rate-limiting-config',
125+
required: true,
126+
}
127+
},
121128
LatencyPlugin: {
122129
instance: 'devproxy-plugin-latency',
123130
config: {
@@ -301,6 +308,10 @@ export const pluginDocs: PluginDocs = {
301308
name: 'Language Model Failure Plugin',
302309
url: 'https://learn.microsoft.com/microsoft-cloud/dev/dev-proxy/technical-reference/languagemodelfailureplugin',
303310
},
311+
LanguageModelRateLimitingPlugin: {
312+
name: 'Language Model Rate Limiting Plugin',
313+
url: 'https://learn.microsoft.com/microsoft-cloud/dev/dev-proxy/technical-reference/languagemodelratelimitingplugin',
314+
},
304315
LatencyPlugin: {
305316
name: 'Latency Plugin',
306317
url: 'https://learn.microsoft.com/microsoft-cloud/dev/dev-proxy/technical-reference/latencyplugin',
@@ -381,4 +392,4 @@ export const pluginDocs: PluginDocs = {
381392
name: 'Plain Text Reporter',
382393
url: 'https://learn.microsoft.com/microsoft-cloud/dev/dev-proxy/technical-reference/plaintextreporter',
383394
}
384-
};
395+
};

src/snippets.json

Lines changed: 26 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -733,6 +733,32 @@
733733
],
734734
"description": "LanguageModelFailurePlugin config section"
735735
},
736+
"LanguageModelRateLimitingPlugin": {
737+
"prefix": "devproxy-plugin-language-model-rate-limiting",
738+
"body": [
739+
"{",
740+
"\t\"name\": \"LanguageModelRateLimitingPlugin\",",
741+
"\t\"enabled\": true,",
742+
"\t\"pluginPath\": \"~appFolder/plugins/DevProxy.Plugins.dll\",",
743+
"\t\"configSection\": \"languageModelRateLimitingPlugin\"",
744+
"}"
745+
],
746+
"description": "LanguageModelRateLimitingPlugin instance"
747+
},
748+
"LanguageModelRateLimitingPluginConfig": {
749+
"prefix": "devproxy-plugin-language-model-rate-limiting-config",
750+
"body": [
751+
"\"languageModelRateLimitingPlugin\": {",
752+
"\t\"\\$schema\": \"https://raw.githubusercontent.com/dotnet/dev-proxy/main/schemas/v1.0.0/languagemodelratelimitingplugin.schema.json\",",
753+
"\t\"promptTokenLimit\": 5000,",
754+
"\t\"completionTokenLimit\": 5000,",
755+
"\t\"resetTimeWindowSeconds\": 60,",
756+
"\t\"whenLimitExceeded\": \"Throttle\",",
757+
"\t\"headerRetryAfter\": \"retry-after\"",
758+
"}"
759+
],
760+
"description": "LanguageModelRateLimitingPlugin config section"
761+
},
736762
"MinimalCsomPermissionsPlugin": {
737763
"prefix": "devproxy-plugin-minimal-csom-permissions",
738764
"body": [

0 commit comments

Comments
 (0)