File tree Expand file tree Collapse file tree 1 file changed +6
-4
lines changed
Expand file tree Collapse file tree 1 file changed +6
-4
lines changed Original file line number Diff line number Diff line change 2626HTTP_OK = 200
2727
2828# Docker image size limits
29- # Lambda container image max is 10GB, leave room for base image + dependencies
30- DOCKER_IMAGE_MAX_SIZE_BYTES = 10 * 1024 * 1024 * 1024 # 10GB
31- BASE_IMAGE_OVERHEAD_BYTES = 2 * 1024 * 1024 * 1024 # ~2GB for base image + deps
32- MAX_MODEL_SIZE_IN_IMAGE = DOCKER_IMAGE_MAX_SIZE_BYTES - BASE_IMAGE_OVERHEAD_BYTES # ~8GB
29+ # Lambda container image max is 10GB uncompressed
30+ # Base image (Python runtime, Ollama, dependencies) is ~5GB
31+ # This leaves ~5GB for the model in the Docker image
32+ DOCKER_IMAGE_MAX_SIZE_BYTES = 10 * 1024 * 1024 * 1024 # 10GB Lambda limit
33+ BASE_IMAGE_OVERHEAD_BYTES = 5 * 1024 * 1024 * 1024 # ~5GB for base image + deps
34+ MAX_MODEL_SIZE_IN_IMAGE = DOCKER_IMAGE_MAX_SIZE_BYTES - BASE_IMAGE_OVERHEAD_BYTES # ~5GB for model
3335
3436# Split metadata filename
3537SPLIT_METADATA_FILE = "split_metadata.json"
You can’t perform that action at this time.
0 commit comments