Skip to content

Commit 8927416

Browse files
Merge pull request #53 from oracle-quickstart/ray-cleanout
Cleaning distributed inference with ray related artifacts.
2 parents: 12ecc07 + 600d0dd; commit: 8927416

File tree

2 files changed

+2
-63
lines changed

2 files changed

+2
-63
lines changed

docs/api_documentation/README.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,7 @@
1010
| -------------------------------------------- | ------- | -------- | --------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
1111
| recipe_id | string | Yes | One of the following: `llm_inference_nvidia`, `lora_finetune_nvidia`, or `mlcommons_lora_finetune_nvidia` |
1212
| deployment_name | string | Yes | Any deployment name to identify the deployment details easily. Must be unique from other recipe deployments. |
13-
| recipe_mode | string | Yes | One of the following: `service`, `job`, `update`, `shared_node_pool` or `raycluster`. Enter `service` for inference recipe deployments, `job` for fine-tuning recipe deployments, `update` for updating existing deployments (currently only supported for MIG), `shared_node_pool` for creating a shared node pool, and `raycluster` when doing multinode inference deployments. |
13+
| recipe_mode | string | Yes | One of the following: `service`, `job`, `update`, or `shared_node_pool`. Enter `service` for inference recipe deployments, `job` for fine-tuning recipe deployments, `update` for updating existing deployments (currently only supported for MIG), and `shared_node_pool` for creating a shared node pool. |
1414
| recipe_node_labels | object | No | Additional labels to apply to a node pool in the form `{"label": "value"}` |
1515
| service_endpoint_domain | string | No | Required for inference recipe deployments. Inference endpoint will point to this domain. |
1616
| recipe_max_pods_per_node | int | No | Allows a node to schedule more pods than the Kubernetes default of 31. Required for certain MIG configurations, which can slice up to 56 times. |

docs/custom_blueprints/blueprint_json_schema.json

Lines changed: 1 addition & 62 deletions
Original file line number | Diff line number | Diff line change
@@ -43,8 +43,7 @@
4343
"service",
4444
"job",
4545
"update",
46-
"shared_node_pool",
47-
"raycluster"
46+
"shared_node_pool"
4847
]
4948
},
5049
"recipe_replica_count": {
@@ -411,66 +410,6 @@
411410
},
412411
"skip_quota_validation": {
413412
"type": "boolean"
414-
},
415-
"recipe_raycluster_params": {
416-
"type": "object",
417-
"properties": {
418-
"head_node_num_cpus": {
419-
"type": "integer"
420-
},
421-
"head_node_num_gpus": {
422-
"type": "integer"
423-
},
424-
"head_node_cpu_mem_in_gbs": {
425-
"type": "integer"
426-
},
427-
"num_worker_nodes": {
428-
"type": "integer"
429-
},
430-
"worker_node_num_cpus": {
431-
"type": "integer"
432-
},
433-
"worker_node_num_gpus": {
434-
"type": "integer"
435-
},
436-
"worker_node_cpu_mem_in_gbs": {
437-
"type": "integer"
438-
},
439-
"model_path_in_container": {
440-
"type": "string"
441-
},
442-
"redis_port": {
443-
"type": "integer"
444-
},
445-
"dashboard_port": {
446-
"type": "integer"
447-
},
448-
"metrics_export_port": {
449-
"type": "integer"
450-
},
451-
"rayclient_server_port": {
452-
"type": "integer"
453-
},
454-
"worker_image_uri": {
455-
"type": "string"
456-
},
457-
"head_image_uri": {
458-
"type": "string"
459-
},
460-
"rayjob_image_uri": {
461-
"type": "string"
462-
}
463-
},
464-
"additionalProperties": false,
465-
"required": [
466-
"head_node_num_cpus",
467-
"head_node_num_gpus",
468-
"head_node_cpu_mem_in_gbs",
469-
"num_worker_nodes",
470-
"worker_node_num_cpus",
471-
"worker_node_num_gpus",
472-
"worker_node_cpu_mem_in_gbs"
473-
]
474413
}
475414
},
476415
"required": ["recipe_mode", "deployment_name"],

0 commit comments

Comments
 (0)