Skip to content

Commit 50b76fe

Browse files
author
AWS
committed
AWSDeadlineCloud Update: Added fields to track cumulative task retry attempts for steps and jobs
1 parent ee90ee6 commit 50b76fe

File tree

2 files changed: 39 additions and 3 deletions.
Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
{
2+
"type": "feature",
3+
"category": "AWSDeadlineCloud",
4+
"contributor": "",
5+
"description": "Added fields to track cumulative task retry attempts for steps and jobs"
6+
}

services/deadline/src/main/resources/codegen-resources/service-2.json

Lines changed: 33 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -2286,11 +2286,11 @@
22862286
"members":{
22872287
"name":{
22882288
"shape":"AcceleratorName",
2289-
"documentation":"<p>The name of the chip used by the GPU accelerator.</p> <p>If you specify <code>l4</code> as the name of the accelerator, you must specify <code>latest</code> or <code>grid:r550</code> as the runtime.</p> <p>The available GPU accelerators are:</p> <ul> <li> <p> <code>t4</code> - NVIDIA T4 Tensor Core GPU</p> </li> <li> <p> <code>a10g</code> - NVIDIA A10G Tensor Core GPU</p> </li> <li> <p> <code>l4</code> - NVIDIA L4 Tensor Core GPU</p> </li> <li> <p> <code>l40s</code> - NVIDIA L40S Tensor Core GPU</p> </li> </ul>"
2289+
"documentation":"<p>The name of the chip used by the GPU accelerator.</p> <p>If you specify <code>l4</code> as the name of the accelerator, you must specify <code>latest</code> or <code>grid:r570</code> as the runtime.</p> <p>The available GPU accelerators are:</p> <ul> <li> <p> <code>t4</code> - NVIDIA T4 Tensor Core GPU</p> </li> <li> <p> <code>a10g</code> - NVIDIA A10G Tensor Core GPU</p> </li> <li> <p> <code>l4</code> - NVIDIA L4 Tensor Core GPU</p> </li> <li> <p> <code>l40s</code> - NVIDIA L40S Tensor Core GPU</p> </li> </ul>"
22902290
},
22912291
"runtime":{
22922292
"shape":"AcceleratorRuntime",
2293-
"documentation":"<p>Specifies the runtime driver to use for the GPU accelerator. You must use the same runtime for all GPUs. </p> <p>You can choose from the following runtimes:</p> <ul> <li> <p> <code>latest</code> - Use the latest runtime available for the chip. If you specify <code>latest</code> and a new version of the runtime is released, the new version of the runtime is used.</p> </li> <li> <p> <code>grid:r550</code> - <a href=\"https://docs.nvidia.com/vgpu/17.0/index.html\">NVIDIA vGPU software 17</a> </p> </li> <li> <p> <code>grid:r535</code> - <a href=\"https://docs.nvidia.com/vgpu/16.0/index.html\">NVIDIA vGPU software 16</a> </p> </li> </ul> <p>If you don't specify a runtime, Deadline Cloud uses <code>latest</code> as the default. However, if you have multiple accelerators and specify <code>latest</code> for some and leave others blank, Deadline Cloud raises an exception.</p>"
2293+
"documentation":"<p>Specifies the runtime driver to use for the GPU accelerator. You must use the same runtime for all GPUs. </p> <p>You can choose from the following runtimes:</p> <ul> <li> <p> <code>latest</code> - Use the latest runtime available for the chip. If you specify <code>latest</code> and a new version of the runtime is released, the new version of the runtime is used.</p> </li> <li> <p> <code>grid:r570</code> - <a href=\"https://docs.nvidia.com/vgpu/18.0/index.html\">NVIDIA vGPU software 18</a> </p> </li> <li> <p> <code>grid:r535</code> - <a href=\"https://docs.nvidia.com/vgpu/16.0/index.html\">NVIDIA vGPU software 16</a> </p> </li> </ul> <p>If you don't specify a runtime, Deadline Cloud uses <code>latest</code> as the default. However, if you have multiple accelerators and specify <code>latest</code> for some and leave others blank, Deadline Cloud raises an exception.</p>"
22942294
}
22952295
},
22962296
"documentation":"<p>Describes a specific GPU accelerator required for an Amazon Elastic Compute Cloud worker host.</p>"
@@ -5458,7 +5458,7 @@
54585458
},
54595459
"status":{
54605460
"shape":"FleetStatus",
5461-
"documentation":"<p>The Auto Scaling status of the fleet.</p>"
5461+
"documentation":"<p>The status of the fleet.</p>"
54625462
},
54635463
"autoScalingStatus":{
54645464
"shape":"AutoScalingStatus",
@@ -5633,6 +5633,10 @@
56335633
"shape":"TaskRunStatusCounts",
56345634
"documentation":"<p>The number of tasks running on the job.</p>"
56355635
},
5636+
"taskFailureRetryCount":{
5637+
"shape":"TaskFailureRetryCount",
5638+
"documentation":"<p>The total number of times tasks from the job failed and were retried.</p>"
5639+
},
56365640
"storageProfileId":{
56375641
"shape":"StorageProfileId",
56385642
"documentation":"<p>The storage profile ID associated with the job.</p>"
@@ -6506,6 +6510,10 @@
65066510
"shape":"TaskRunStatusCounts",
65076511
"documentation":"<p>The number of tasks running on the job.</p>"
65086512
},
6513+
"taskFailureRetryCount":{
6514+
"shape":"TaskFailureRetryCount",
6515+
"documentation":"<p>The total number of times tasks from the step failed and were retried.</p>"
6516+
},
65096517
"targetTaskRunStatus":{
65106518
"shape":"StepTargetTaskRunStatus",
65116519
"documentation":"<p>The task status with which the job started.</p>"
@@ -7410,6 +7418,10 @@
74107418
"shape":"TaskRunStatusCounts",
74117419
"documentation":"<p>The number of tasks running on the job.</p>"
74127420
},
7421+
"taskFailureRetryCount":{
7422+
"shape":"TaskFailureRetryCount",
7423+
"documentation":"<p>The total number of times tasks from the job failed and were retried.</p>"
7424+
},
74137425
"priority":{
74147426
"shape":"JobPriority",
74157427
"documentation":"<p>The job priority.</p>"
@@ -7525,6 +7537,10 @@
75257537
"shape":"TaskRunStatusCounts",
75267538
"documentation":"<p>The number of tasks running on the job.</p>"
75277539
},
7540+
"taskFailureRetryCount":{
7541+
"shape":"TaskFailureRetryCount",
7542+
"documentation":"<p>The total number of times tasks from the job failed and were retried.</p>"
7543+
},
75287544
"maxFailedTasksCount":{
75297545
"shape":"MaxFailedTasksCount",
75307546
"documentation":"<p>The number of task failures before the job stops running and is marked as <code>FAILED</code>.</p>"
@@ -11190,6 +11206,10 @@
1119011206
"shape":"TaskRunStatusCounts",
1119111207
"documentation":"<p>The number of tasks running on the job.</p>"
1119211208
},
11209+
"taskFailureRetryCount":{
11210+
"shape":"TaskFailureRetryCount",
11211+
"documentation":"<p>The total number of times tasks from the step failed and were retried.</p>"
11212+
},
1119311213
"createdAt":{
1119411214
"shape":"CreatedAt",
1119511215
"documentation":"<p>The date and time the resource was created.</p>"
@@ -11249,6 +11269,10 @@
1124911269
"shape":"TaskRunStatusCounts",
1125011270
"documentation":"<p>The number of tasks running on the job.</p>"
1125111271
},
11272+
"taskFailureRetryCount":{
11273+
"shape":"TaskFailureRetryCount",
11274+
"documentation":"<p>The total number of times tasks from the step failed and were retried.</p>"
11275+
},
1125211276
"targetTaskRunStatus":{
1125311277
"shape":"StepTargetTaskRunStatus",
1125411278
"documentation":"<p>The task status to start with on the job.</p>"
@@ -11434,6 +11458,12 @@
1143411458
"key":{"shape":"String"},
1143511459
"value":{"shape":"String"}
1143611460
},
11461+
"TaskFailureRetryCount":{
11462+
"type":"integer",
11463+
"box":true,
11464+
"max":2147483647,
11465+
"min":0
11466+
},
1143711467
"TaskId":{
1143811468
"type":"string",
1143911469
"pattern":"task-[0-9a-f]{32}-(0|([1-9][0-9]{0,9}))"

0 commit comments

Comments
 (0)