forked from red-hat-data-services/vllm-cpu
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathdocker-bake.hcl
More file actions
123 lines (97 loc) · 2.84 KB
/
docker-bake.hcl
File metadata and controls
123 lines (97 loc) · 2.84 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
# ---------------------------------------------------------------------------
# Build inputs. Each variable can be overridden from the environment.
# ---------------------------------------------------------------------------

# Image repository that receives the per-build (non-release) tags.
variable "REPOSITORY" {
  default = "quay.io/vllm/automation-vllm"
}

# When true, each target additionally tags its image into the matching
# quay.io/vllm/vllm-<accelerator> repository.
variable "RELEASE_IMAGE" {
  default = false
}

# GITHUB_* variables are set as env vars in github actions.
# They are declared without a default on purpose.
variable "GITHUB_SHA" {}
variable "GITHUB_REPOSITORY" {}
variable "GITHUB_RUN_ID" {}

# Version string used for the version tags; declared without a default.
variable "VLLM_VERSION" {}

# Python version forwarded to the Dockerfiles as a build argument.
variable "PYTHON_VERSION" {
  default = "3.12"
}

# ROCm version forwarded to the ROCm Dockerfile as a build argument.
variable "ROCM_VERSION" {
  # This can be overridden by the prepare-payload action
  default = "6.4.3"
}
# Intentionally empty: populated by gha docker/metadata-action.
# "_common" inherits from it.
target "docker-metadata-action" {}
# Shared base target: every image target in this file inherits from it.
# It contributes the build context, the base-image/Python build arguments,
# the target platform and the source-tracking labels, on top of whatever
# "docker-metadata-action" provides.
target "_common" {
  inherits = ["docker-metadata-action"]
  context  = "."

  args = {
    BASE_UBI_IMAGE_TAG = "9.6-1760515502"
    # Read the PYTHON_VERSION variable instead of repeating its default, so an
    # override of the variable also reaches targets that do not redefine this
    # argument themselves.
    PYTHON_VERSION = "${PYTHON_VERSION}"
  }

  platforms = [
    "linux/amd64",
  ]

  labels = {
    # Link the image back to the repository and commit it was built from.
    "org.opencontainers.image.source" = "https://github.com/${GITHUB_REPOSITORY}"
    "vcs-ref"                         = "${GITHUB_SHA}"
    "vcs-type"                        = "git"
  }
}
# Targets built when bake is invoked without an explicit target name.
# The "cpu" target defined in this file is not part of this group.
group "default" {
  targets = ["cuda", "rocm", "tpu"]
}
# CUDA image: built from Dockerfile.ubi on top of the shared "_common" target.
target "cuda" {
  inherits   = ["_common"]
  dockerfile = "Dockerfile.ubi"

  args = {
    PYTHON_VERSION = "${PYTHON_VERSION}"
    CUDA_MAJOR     = "12"
    CUDA_MINOR     = "9"
  }

  # Conditional entries evaluate to "" when they do not apply; bake ignores
  # empty tag entries.
  tags = [
    # vllm_version might contain local version specifiers (+) which are not valid tags.
    # The tag is skipped when VLLM_VERSION is empty, because "<repository>:"
    # is not a valid image reference and would abort the build.
    # NOTE(review): this tag carries no accelerator prefix, so it is the same
    # reference the other image targets in this file produce - confirm that
    # targets built together are not meant to overwrite each other.
    VLLM_VERSION != "" ? "${REPOSITORY}:${replace(VLLM_VERSION, "+", "_")}" : "",
    "${REPOSITORY}:cuda-${GITHUB_SHA}",
    "${REPOSITORY}:cuda-${GITHUB_RUN_ID}",
    # Release builds are additionally tagged into the dedicated CUDA repository.
    RELEASE_IMAGE ? "quay.io/vllm/vllm-cuda:${replace(VLLM_VERSION, "+", "_")}" : "",
  ]
}
# ROCm image: built from Dockerfile.rocm.ubi on top of the shared "_common" target.
target "rocm" {
  inherits   = ["_common"]
  dockerfile = "Dockerfile.rocm.ubi"

  args = {
    PYTHON_VERSION = "${PYTHON_VERSION}"
    ROCM_VERSION   = "${ROCM_VERSION}"
  }

  # Conditional entries evaluate to "" when they do not apply; bake ignores
  # empty tag entries.
  tags = [
    # vllm_version might contain local version specifiers (+) which are not valid tags.
    # The tag is skipped when VLLM_VERSION is empty, because "<repository>:"
    # is not a valid image reference and would abort the build.
    # NOTE(review): this tag carries no accelerator prefix, so it is the same
    # reference the other image targets in this file produce - confirm that
    # targets built together are not meant to overwrite each other.
    VLLM_VERSION != "" ? "${REPOSITORY}:${replace(VLLM_VERSION, "+", "_")}" : "",
    "${REPOSITORY}:rocm-${GITHUB_SHA}",
    "${REPOSITORY}:rocm-${GITHUB_RUN_ID}",
    # Release builds are additionally tagged into the dedicated ROCm repository.
    RELEASE_IMAGE ? "quay.io/vllm/vllm-rocm:${replace(VLLM_VERSION, "+", "_")}" : "",
  ]
}
# CPU image: built from Dockerfile.cpu.ubi on top of the shared "_common" target.
target "cpu" {
  inherits   = ["_common"]
  dockerfile = "Dockerfile.cpu.ubi"

  args = {
    PYTHON_VERSION = "${PYTHON_VERSION}"
  }

  # Conditional entries evaluate to "" when they do not apply; bake ignores
  # empty tag entries.
  tags = [
    # vllm_version might contain local version specifiers (+) which are not valid tags.
    # The tag is skipped when VLLM_VERSION is empty, because "<repository>:"
    # is not a valid image reference and would abort the build.
    # NOTE(review): this tag carries no accelerator prefix, so it is the same
    # reference the other image targets in this file produce - confirm that
    # targets built together are not meant to overwrite each other.
    VLLM_VERSION != "" ? "${REPOSITORY}:${replace(VLLM_VERSION, "+", "_")}" : "",
    "${REPOSITORY}:cpu-${GITHUB_SHA}",
    "${REPOSITORY}:cpu-${GITHUB_RUN_ID}",
    # Release builds are additionally tagged into the dedicated CPU repository.
    # TODO: repository does not exist yet
    RELEASE_IMAGE ? "quay.io/vllm/vllm-cpu:${replace(VLLM_VERSION, "+", "_")}" : "",
  ]
}
# TPU image: built from Dockerfile.tpu.ubi on top of the shared "_common" target.
target "tpu" {
  inherits   = ["_common"]
  dockerfile = "Dockerfile.tpu.ubi"

  args = {
    PYTHON_VERSION = "${PYTHON_VERSION}"
  }

  # Conditional entries evaluate to "" when they do not apply; bake ignores
  # empty tag entries.
  tags = [
    # vllm_version might contain local version specifiers (+) which are not valid tags.
    # The tag is skipped when VLLM_VERSION is empty, because "<repository>:"
    # is not a valid image reference and would abort the build.
    # NOTE(review): this tag carries no accelerator prefix, so it is the same
    # reference the other image targets in this file produce - confirm that
    # targets built together are not meant to overwrite each other.
    VLLM_VERSION != "" ? "${REPOSITORY}:${replace(VLLM_VERSION, "+", "_")}" : "",
    "${REPOSITORY}:tpu-${GITHUB_SHA}",
    "${REPOSITORY}:tpu-${GITHUB_RUN_ID}",
    # Release builds are additionally tagged into the dedicated TPU repository.
    RELEASE_IMAGE ? "quay.io/vllm/vllm-tpu:${replace(VLLM_VERSION, "+", "_")}" : "",
  ]
}