Skip to content

Commit 523a3e3

Browse files
author
BitsAdmin
committed
Merge branch 'feat/reasoning-effort' into 'integration_2025-10-30_1075115650562'
feat: [development task] ark runtime (1783385) See merge request iaasng/volcengine-java-sdk!720
2 parents f9f4c74 + 3eb8636 commit 523a3e3

File tree

6 files changed

+152
-3
lines changed

6 files changed

+152
-3
lines changed

volcengine-java-sdk-ark-runtime/src/main/java/com/volcengine/ark/runtime/model/responses/common/ResponsesCaching.java

Lines changed: 26 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -6,6 +6,10 @@ public class ResponsesCaching {
66
@JsonProperty("type")
77
private String type;
88

9+
10+
@JsonProperty("prefix")
11+
private Boolean prefix;
12+
913
public String getType() {
1014
return type;
1115
}
@@ -14,11 +18,23 @@ public void setType(String type) {
1418
this.type = type;
1519
}
1620

21+
public Boolean getPrefix() {
22+
return prefix;
23+
}
24+
25+
public void setPrefix(Boolean prefix) {
26+
this.prefix = prefix;
27+
}
28+
1729
@Override
1830
public String toString() {
19-
return "ResponsesCaching{" +
20-
"type='" + type + '\'' +
21-
'}';
31+
StringBuilder sb = new StringBuilder("ResponsesCaching{");
32+
sb.append("type='").append(type).append('\'');
33+
if (prefix != null) {
34+
sb.append(", prefix=").append(prefix);
35+
}
36+
sb.append('}');
37+
return sb.toString();
2238
}
2339

2440
public static Builder builder() {
@@ -27,15 +43,22 @@ public static Builder builder() {
2743

2844
public static class Builder {
2945
private String type;
46+
private Boolean prefix;
3047

3148
public Builder type(String type) {
3249
this.type = type;
3350
return this;
3451
}
3552

53+
public Builder prefix(Boolean prefix) {
54+
this.prefix = prefix;
55+
return this;
56+
}
57+
3658
public ResponsesCaching build() {
3759
ResponsesCaching responsesCaching = new ResponsesCaching();
3860
responsesCaching.setType(type);
61+
responsesCaching.setPrefix(prefix);
3962
return responsesCaching;
4063
}
4164
}
Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,45 @@
1+
package com.volcengine.ark.runtime.model.responses.common;
2+
3+
import com.fasterxml.jackson.annotation.JsonProperty;
4+
5+
public class ResponsesReasoning {
6+
7+
@JsonProperty("effort")
8+
private String effort;
9+
10+
public String getEffort() {
11+
return effort;
12+
}
13+
14+
public void setEffort(String effort) {
15+
this.effort = effort;
16+
}
17+
18+
19+
20+
@Override
21+
public String toString() {
22+
return "ResponseReasoning{" +
23+
"effort='" + effort + '\'' +
24+
'}';
25+
}
26+
27+
public static Builder builder() {
28+
return new Builder();
29+
}
30+
31+
public static class Builder {
32+
private String effort;
33+
34+
public Builder effort(String effort) {
35+
this.effort = effort;
36+
return this;
37+
}
38+
39+
public ResponsesReasoning build() {
40+
ResponsesReasoning responsesReasoning = new ResponsesReasoning();
41+
responsesReasoning.setEffort(effort);
42+
return responsesReasoning;
43+
}
44+
}
45+
}

volcengine-java-sdk-ark-runtime/src/main/java/com/volcengine/ark/runtime/model/responses/request/CreateResponsesRequest.java

Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,7 @@
22

33
import com.fasterxml.jackson.annotation.JsonProperty;
44
import com.volcengine.ark.runtime.model.responses.common.ResponsesCaching;
5+
import com.volcengine.ark.runtime.model.responses.common.ResponsesReasoning;
56
import com.volcengine.ark.runtime.model.responses.common.ResponsesText;
67
import com.volcengine.ark.runtime.model.responses.common.ResponsesThinking;
78
import com.volcengine.ark.runtime.model.responses.tool.ResponsesTool;
@@ -25,6 +26,9 @@ public class CreateResponsesRequest {
2526
@JsonProperty("thinking")
2627
private ResponsesThinking thinking;
2728

29+
@JsonProperty("reasoning")
30+
private ResponsesReasoning reasoning;
31+
2832
@JsonProperty("service_tier")
2933
private String serviceTier;
3034

@@ -107,6 +111,14 @@ public void setThinking(ResponsesThinking thinking) {
107111
this.thinking = thinking;
108112
}
109113

114+
public ResponsesReasoning getReasoning() {
115+
return reasoning;
116+
}
117+
118+
public void setReasoning(ResponsesReasoning reasoning) {
119+
this.reasoning = reasoning;
120+
}
121+
110122
public String getServiceTier() {
111123
return serviceTier;
112124
}
@@ -227,6 +239,7 @@ public String toString() {
227239
", maxOutputTokens=" + maxOutputTokens +
228240
", previousResponseId='" + previousResponseId + '\'' +
229241
", thinking=" + thinking +
242+
", reasoning=" + reasoning +
230243
", serviceTier='" + serviceTier + '\'' +
231244
", store=" + store +
232245
", stream=" + stream +
@@ -254,6 +267,7 @@ public static class Builder {
254267
private Long maxOutputTokens;
255268
private String previousResponseId;
256269
private ResponsesThinking thinking;
270+
private ResponsesReasoning reasoning;
257271
private String serviceTier;
258272
private Boolean store;
259273
private Boolean stream;
@@ -294,6 +308,11 @@ public Builder thinking(ResponsesThinking thinking) {
294308
return this;
295309
}
296310

311+
public Builder reasoning(ResponsesReasoning reasoning) {
312+
this.reasoning = reasoning;
313+
return this;
314+
}
315+
297316
public Builder serviceTier(String serviceTier) {
298317
this.serviceTier = serviceTier;
299318
return this;
@@ -371,6 +390,7 @@ public CreateResponsesRequest build() {
371390
responsesRequest.setMaxOutputTokens(maxOutputTokens);
372391
responsesRequest.setPreviousResponseId(previousResponseId);
373392
responsesRequest.setThinking(thinking);
393+
responsesRequest.setReasoning(reasoning);
374394
responsesRequest.setServiceTier(serviceTier);
375395
responsesRequest.setStore(store);
376396
responsesRequest.setStream(stream);

volcengine-java-sdk-ark-runtime/src/main/java/com/volcengine/ark/runtime/model/responses/response/ResponseObject.java

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,7 @@
22

33
import com.fasterxml.jackson.annotation.JsonProperty;
44
import com.volcengine.ark.runtime.model.responses.common.Error;
5+
import com.volcengine.ark.runtime.model.responses.common.ResponsesReasoning;
56
import com.volcengine.ark.runtime.model.responses.item.BaseItem;
67
import com.volcengine.ark.runtime.model.responses.usage.IncompleteDetails;
78
import com.volcengine.ark.runtime.model.responses.usage.Usage;
@@ -45,6 +46,9 @@ public class ResponseObject {
4546
@JsonProperty("thinking")
4647
private ResponsesThinking thinking;
4748

49+
@JsonProperty("reasoning")
50+
private ResponsesReasoning reasoning;
51+
4852
@JsonProperty("service_tier")
4953
private String serviceTier;
5054

@@ -167,6 +171,14 @@ public void setThinking(ResponsesThinking thinking) {
167171
this.thinking = thinking;
168172
}
169173

174+
public ResponsesReasoning getReasoning() {
175+
return reasoning;
176+
}
177+
178+
public void setReasoning(ResponsesReasoning reasoning) {
179+
this.reasoning = reasoning;
180+
}
181+
170182
public String getServiceTier() {
171183
return serviceTier;
172184
}
@@ -292,6 +304,7 @@ public String toString() {
292304
", output=" + output +
293305
", previousResponseId='" + previousResponseId + '\'' +
294306
", thinking=" + thinking +
307+
", reasoning=" + reasoning +
295308
", serviceTier='" + serviceTier + '\'' +
296309
", status='" + status + '\'' +
297310
", temperature=" + temperature +

volcengine-java-sdk-ark-runtime/src/main/java/com/volcengine/ark/runtime/model/responses/usage/InputTokensDetails.java

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -15,4 +15,11 @@ public Long getCachedTokens() {
1515
public void setCachedTokens(Long cachedTokens) {
1616
this.cachedTokens = cachedTokens;
1717
}
18+
19+
@Override
20+
public String toString() {
21+
return "InputTokensDetails{" +
22+
"cachedTokens=" + cachedTokens +
23+
'}';
24+
}
1825
}

volcengine-java-sdk-ark-runtime/test/java/com/volcengine/ark/runtime/CreateResponseExample.java

Lines changed: 41 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,7 @@
11
package com.volcengine.ark.runtime;
22

33
import com.fasterxml.jackson.databind.ObjectMapper;
4+
import com.volcengine.ark.runtime.model.responses.common.ResponsesCaching;
45
import com.volcengine.ark.runtime.model.responses.common.ResponsesThinking;
56
import com.volcengine.ark.runtime.model.responses.constant.ResponsesConstants;
67
import com.volcengine.ark.runtime.model.responses.content.*;
@@ -293,6 +294,46 @@ public static void main(String[] args) {
293294
System.err.println("Create Response 6 Error " + e.getMessage());
294295
}
295296

297+
System.out.println("\n----- [Request with Caching] Request 7-----");
298+
String longPrompt = "你是豆包,你必须用4个字回答我的问题";
299+
for (int i = 0; i < 1000; i++) {
300+
longPrompt += "你是豆包,你必须用4个字回答我的问题";
301+
}
302+
CreateResponsesRequest request7 = CreateResponsesRequest.builder()
303+
.model(modelName)
304+
.stream(false)
305+
.caching(ResponsesCaching.builder().type(ResponsesConstants.CACHE_TYPE_ENABLED).prefix(true).build())
306+
.input(ResponsesInput.builder().stringValue(longPrompt).build())
307+
.thinking(ResponsesThinking.builder().type(ResponsesConstants.THINKING_TYPE_DISABLED).build())
308+
.build();
309+
310+
String cacheResponseId = null;
311+
312+
try {
313+
ResponseObject cachePrefix = service.createResponse(request7);
314+
System.out.println("=== cache prefix response ===");
315+
printResponseObject(cachePrefix);
316+
cacheResponseId = cachePrefix.getId();
317+
} catch (Exception e) {
318+
System.err.println("Create Response 7 Error " + e.getMessage());
319+
}
320+
321+
CreateResponsesRequest cachedRequest = CreateResponsesRequest.builder()
322+
.model(modelName)
323+
.stream(false)
324+
.previousResponseId(cacheResponseId)
325+
.input(ResponsesInput.builder().stringValue("你好").build())
326+
.thinking(ResponsesThinking.builder().type(ResponsesConstants.THINKING_TYPE_DISABLED).build())
327+
.build();
328+
329+
try {
330+
ResponseObject cacheHitResponse = service.createResponse(cachedRequest);
331+
System.out.println("=== cache hit response ===");
332+
printResponseObject(cacheHitResponse);
333+
} catch (Exception e) {
334+
System.err.println("Create Cached Response Error " + e.getMessage());
335+
}
336+
296337
service.shutdownExecutor();
297338
}
298339

0 commit comments

Comments
 (0)