|
# documentation: https://docs.argilla.io/latest/
# slogan: Argilla is a collaboration tool for AI engineers and domain experts who need to build high-quality datasets for their projects.
# tags: workflow, orchestration, data-pipeline, python, argilla, ai, elasticsearch, datasets, data, machine-learning, data-science, nlp
# logo: svgs/argilla.png
# port: 6900
| 6 | + |
| 7 | +version: "3" |
| 8 | + |
services:
  # Argilla server. Its healthcheck probes http://localhost:6900/api/_status.
  argilla:
    image: "argilla/argilla-server:v2.2.0"
    restart: always
    environment:
      # Declared without a value, so it is taken from the deploying environment.
      - SERVICE_FQDN_ARGILLA_6900
      - ARGILLA_HOME_PATH=/var/lib/argilla
      - ARGILLA_ELASTICSEARCH=http://elasticsearch:9200
      # The database name falls back to "argilla", the same default the postgres
      # service uses for POSTGRES_DB, so the URL never ends in an empty name.
      - ARGILLA_DATABASE_URL=postgresql+asyncpg://${SERVICE_USER_POSTGRES}:${SERVICE_PASSWORD_POSTGRES}@postgres:5432/${POSTGRES_DB:-argilla}
      - ARGILLA_REDIS_URL=redis://redis:6379/0
      # Values are left unquoted on purpose: in list syntax, KEY="value" makes
      # the double quotes part of the value handed to the container.
      - ARGILLA_AUTH_SECRET_KEY=${SERVICE_PASSWORD_AUTHSECRET}
      - ARGILLA_ENABLE_TELEMETRY=0
      - HF_HUB_DISABLE_TELEMETRY=1
      - REINDEX_DATASETS=1
      - DEFAULT_USER_ENABLED=true
      - USERNAME=${ARGILLA_USERNAME:-argilla}
      - PASSWORD=${SERVICE_PASSWORD_ARGILLA}
      - API_KEY=${SERVICE_PASSWORD_APIKEY}
      - DEFAULT_USER_PASSWORD=${SERVICE_PASSWORD_ARGILLA}
      - DEFAULT_USER_API_KEY=${SERVICE_PASSWORD_APIKEY}
    # Start only after every backing service reports healthy.
    depends_on:
      elasticsearch:
        condition: service_healthy
      redis:
        condition: service_healthy
      postgres:
        condition: service_healthy
    volumes:
      - "argilla_data:/var/lib/argilla"
    healthcheck:
      test:
        - CMD-SHELL
        - 'python -c "import requests as r;r.get(\"http://localhost:6900/api/_status\").raise_for_status()"'
      interval: 10s
      timeout: 10s
      retries: 5

  # Background worker: same image and settings as the server, but runs
  # `python -m argilla_server worker` instead of the image's default command.
  worker:
    image: "argilla/argilla-server:v2.2.0"
    restart: always
    environment:
      - ARGILLA_HOME_PATH=/var/lib/argilla
      - ARGILLA_ELASTICSEARCH=http://elasticsearch:9200
      # Keep identical to the server's URL (including the "argilla" fallback).
      - ARGILLA_DATABASE_URL=postgresql+asyncpg://${SERVICE_USER_POSTGRES}:${SERVICE_PASSWORD_POSTGRES}@postgres:5432/${POSTGRES_DB:-argilla}
      - ARGILLA_REDIS_URL=redis://redis:6379/0
      # Unquoted for the same reason as on the server: list-syntax quotes
      # would become part of the value.
      - ARGILLA_AUTH_SECRET_KEY=${SERVICE_PASSWORD_AUTHSECRET}
      - ARGILLA_ENABLE_TELEMETRY=0
      - HF_HUB_DISABLE_TELEMETRY=1
      - REINDEX_DATASETS=1
      - DEFAULT_USER_ENABLED=true
      - USERNAME=${ARGILLA_USERNAME:-argilla}
      - PASSWORD=${SERVICE_PASSWORD_ARGILLA}
      - API_KEY=${SERVICE_PASSWORD_APIKEY}
      - DEFAULT_USER_PASSWORD=${SERVICE_PASSWORD_ARGILLA}
      - DEFAULT_USER_API_KEY=${SERVICE_PASSWORD_APIKEY}
      - BACKGROUND_NUM_WORKERS=${BACKGROUND_NUM_WORKERS:-1}
    depends_on:
      elasticsearch:
        condition: service_healthy
      redis:
        condition: service_healthy
      postgres:
        condition: service_healthy
    volumes:
      - "argilla_data:/var/lib/argilla"
    # `$$` escapes Compose interpolation so the shell inside the container
    # expands BACKGROUND_NUM_WORKERS (set in `environment` above) at start-up.
    command: "sh -c 'python -m argilla_server worker --num-workers $${BACKGROUND_NUM_WORKERS}'"
    healthcheck:
      # NOTE(review): `pwd` only proves a shell can run in the container; it
      # does not verify that the worker process itself is alive.
      test:
        - CMD-SHELL
        - pwd
      interval: 10s
      timeout: 10s
      retries: 5

  # PostgreSQL database referenced by ARGILLA_DATABASE_URL.
  postgres:
    image: "postgres:14"
    restart: always
    environment:
      - POSTGRES_USER=${SERVICE_USER_POSTGRES}
      - POSTGRES_PASSWORD=${SERVICE_PASSWORD_POSTGRES}
      - POSTGRES_DB=${POSTGRES_DB:-argilla}
    volumes:
      - "pg_data:/var/lib/postgresql/data"
    healthcheck:
      # `$$` defers expansion to the container shell, which sees the
      # POSTGRES_USER / POSTGRES_DB values set in `environment` above.
      test:
        - CMD-SHELL
        - "pg_isready -h localhost -U $${POSTGRES_USER} -d $${POSTGRES_DB}"
      interval: 5s
      timeout: 5s
      retries: 3

  # Redis instance referenced by ARGILLA_REDIS_URL.
  redis:
    image: "redis:7"
    restart: always
    volumes:
      - "redis_data:/data"
    healthcheck:
      test:
        - CMD-SHELL
        - "redis-cli -h localhost -p 6379 ping"
      interval: 5s
      timeout: 5s
      retries: 3

  # Single-node Elasticsearch referenced by ARGILLA_ELASTICSEARCH.
  elasticsearch:
    image: "docker.elastic.co/elasticsearch/elasticsearch:8.12.2"
    restart: always
    environment:
      - node.name=elasticsearch
      - cluster.name=es-argilla-local
      - discovery.type=single-node
      - "ES_JAVA_OPTS=-Xms512m -Xmx512m"
      - cluster.routing.allocation.disk.threshold_enabled=false
      # Security is off, matching the plain-HTTP, credential-free URLs used by
      # the other services and by the healthcheck below.
      - xpack.security.enabled=false
    ulimits:
      memlock:
        soft: -1
        hard: -1
    volumes:
      # This named volume must be declared under the top-level `volumes:` key.
      - "elasticsearch_data:/usr/share/elasticsearch/data/"
    healthcheck:
      test:
        - CMD-SHELL
        - "curl --silent --fail http://elasticsearch:9200"
      interval: 10s
      timeout: 10s
      retries: 5
# Named volumes mounted by the services above.
volumes:
  argilla_data: null
  # Declared under the name the elasticsearch service actually mounts
  # (`elasticsearch_data`); the previous `elastic_data` entry matched no mount.
  elasticsearch_data: null
  redis_data: null
  pg_data: null
0 commit comments