zenml-io
diff --git a/‎flux-dreambooth/.gitignore‎
Lines changed: 174 additions & 0 deletions b/‎flux-dreambooth/.gitignore‎
Lines changed: 174 additions & 0 deletions
diff --git a/‎flux-dreambooth/README.md‎
Lines changed: 72 additions & 0 deletions b/‎flux-dreambooth/README.md‎
Lines changed: 72 additions & 0 deletions
diff --git a/‎flux-dreambooth/assets/app_screenshot_1.png‎
855 KB b/‎flux-dreambooth/assets/app_screenshot_1.png‎
855 KB
diff --git a/‎flux-dreambooth/assets/app_screenshot_2.png‎
64 KB b/‎flux-dreambooth/assets/app_screenshot_2.png‎
64 KB
diff --git a/‎flux-dreambooth/assets/app_screenshot_3.png‎
363 KB b/‎flux-dreambooth/assets/app_screenshot_3.png‎
363 KB
diff --git a/‎flux-dreambooth/assets/batch-dreambooth.png‎
1.03 MB b/‎flux-dreambooth/assets/batch-dreambooth.png‎
1.03 MB
diff --git a/‎flux-dreambooth/assets/blupus-demo.png‎
593 KB b/‎flux-dreambooth/assets/blupus-demo.png‎
593 KB
diff --git a/‎flux-dreambooth/assets/hamza_superman.mp4‎
211 KB b/‎flux-dreambooth/assets/hamza_superman.mp4‎
211 KB
diff --git a/‎flux-dreambooth/configs/k8s_run_refactored_multi_video.yaml‎
Lines changed: 143 additions & 0 deletions b/‎flux-dreambooth/configs/k8s_run_refactored_multi_video.yaml‎
Lines changed: 143 additions & 0 deletions
diff --git a/‎flux-dreambooth/constants.py‎ b/‎flux-dreambooth/constants.py‎
@@ -0,0 +1,174 @@
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+
+# C extensions
+*.so
+
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+share/python-wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+
+# PyInstaller
+#  Usually these files are written by a python script from a template
+#  before PyInstaller builds the exe, so as to inject date/other infos into it.
+*.manifest
+*.spec
+
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.nox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+*.py,cover
+.hypothesis/
+.pytest_cache/
+cover/
+
+# Translations
+*.mo
+*.pot
+
+# Django stuff:
+*.log
+local_settings.py
+db.sqlite3
+db.sqlite3-journal
+
+# Flask stuff:
+instance/
+.webassets-cache
+
+# Scrapy stuff:
+.scrapy
+
+# Sphinx documentation
+docs/_build/
+
+# PyBuilder
+.pybuilder/
+target/
+
+# Jupyter Notebook
+.ipynb_checkpoints
+
+# IPython
+profile_default/
+ipython_config.py
+
+# pyenv
+#   For a library or package, you might want to ignore these files since the code is
+#   intended to run in multiple environments; otherwise, check them in:
+# .python-version
+
+# pipenv
+#   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
+#   However, in case of collaboration, if having platform-specific dependencies or dependencies
+#   having no cross-platform support, pipenv may install dependencies that don't work, or not
+#   install all needed dependencies.
+#Pipfile.lock
+
+# poetry
+#   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
+#   This is especially recommended for binary packages to ensure reproducibility, and is more
+#   commonly ignored for libraries.
+#   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
+#poetry.lock
+
+# pdm
+#   Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
+#pdm.lock
+#   pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
+#   in version control.
+#   https://pdm.fming.dev/latest/usage/project/#working-with-version-control
+.pdm.toml
+.pdm-python
+.pdm-build/
+
+# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
+__pypackages__/
+
+# Celery stuff
+celerybeat-schedule
+celerybeat.pid
+
+# SageMath parsed files
+*.sage.py
+
+# Environments
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+
+# Spyder project settings
+.spyderproject
+.spyproject
+
+# Rope project settings
+.ropeproject
+
+# mkdocs documentation
+/site
+
+# mypy
+.mypy_cache/
+.dmypy.json
+dmypy.json
+
+# Pyre type checker
+.pyre/
+
+# pytype static type analyzer
+.pytype/
+
+# Cython debug symbols
+cython_debug/
+
+# PyCharm
+#  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
+#  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
+#  and can be added to the global gitignore or merged into this file.  For a more nuclear
+#  option (not recommended) you can uncomment the following to ignore the entire idea folder.
+#.idea/
+
+
+# Specific to this project
+# (`.venv` is already covered by the "Environments" section above, so it is
+# not repeated here.)
+models/
+diffusers/
+sd-dreambooth-blupus/
+
+# Local dataset directories
+data/aria/
+data/cat-class/
+data/dog/
+data/dog-class/
+data/hamza-faces/
@@ -0,0 +1,72 @@
+# Flux DreamBooth: Personalized AI with ZenML
+
+This project was motivated by a desire to explore the limits of the latest AI
+technologies, particularly the Flux models and the Stable Diffusion img2vid
+model. By finetuning the Flux.1-dev model on images of the ZenML co-founder
+using DreamBooth, we aimed to showcase the potential for personalized AI
+applications.
+
+![](assets/batch-dreambooth.png)
+
+[DreamBooth](https://huggingface.co/docs/diffusers/v0.30.2/training/dreambooth) is a technique that allows for the creation of custom text-to-image models by finetuning a pre-trained model on a small dataset of images featuring a specific subject. In this case, we used a dataset of cropped portrait photos of the ZenML co-founder to create a personalized model capable of generating novel images of him in various styles and contexts.
+
+To make the finetuning process more efficient, we employed LoRA (Low-Rank Adaptation) adapters. LoRA allows for faster finetuning by only updating a small fraction of the model's weights, which can then be saved separately from the original model. The resulting LoRA adapters for this project have been pushed to the Hugging Face repository at [https://huggingface.co/strickvl/flux-dreambooth-hamza](https://huggingface.co/strickvl/flux-dreambooth-hamza).
+
+While we used the [Flux.1-dev](https://huggingface.co/black-forest-labs/FLUX.1-dev) model for finetuning, we switched to the [Flux-Schnell](https://huggingface.co/spaces/black-forest-labs/FLUX.1-schnell) model for inference. Flux-Schnell is a faster variant of the Flux model that maintains comparable quality, making it an excellent choice for efficient batch inference. The LoRA adapters worked seamlessly with Flux-Schnell, allowing us to generate high-quality personalized images quickly.
+
+Crafting effective prompts was a crucial aspect of this project. We experimented
+with various prompts to find those that worked best with the finetuned model.
+Additionally, we had to tailor the prompts to the limitations of our dataset,
+which consisted primarily of cropped portrait photos. By carefully designing
+prompts that played to the strengths of the available data, we were able to
+generate impressive personalized images and short animated videos.
+
+<video width="512" height="512" controls autoplay loop>
+  <source src="assets/hamza_superman.mp4" type="video/mp4">
+  Your browser does not support the video tag.
+</video>
+
+
+The pipeline outputs a grouped image showcasing the results of various prompts
+and generates short 3-second animated videos using the
+[stable-video-diffusion-img2vid-xt](https://huggingface.co/stabilityai/stable-video-diffusion-img2vid-xt)
+img2vid model. These outputs demonstrate the potential for creating engaging,
+personalized content using state-of-the-art AI technologies.
+
+## Getting Started
+
+To get started with this project, follow these steps:
+
+1. Clone the ZenML Projects repository: `git clone https://github.com/zenml-io/zenml-projects.git`
+2. Navigate to the `flux-dreambooth` directory: `cd zenml-projects/flux-dreambooth`
+3. Install the required dependencies: `pip install -r requirements.txt`
+4. For a guided walkthrough of the code, check out the `walkthrough.ipynb` notebook.
+
+## Stack Setup
+
+You'll need a cloud stack to run these pipelines, along with enough GPU quota
+to run the training and batch inference steps. You can get started
+with a 1-click deployment on all the major cloud providers using [our simple
+guide](https://docs.zenml.io/how-to/stack-deployment/deploy-a-cloud-stack).
+
+## Running the pipeline
+
+To run the pipeline, use one of the following commands depending on your stack:
+   - For Kubernetes: `python k8s_run.py`
+   - For Modal: `python modal_run.py`
+
+## Project Structure
+
+The project contains the following files, each with a short description:
+
+- `configs/k8s_run_refactored_multi_video.yaml`: Configuration file used in the notebooks
+- `k8s_run.py`: Script to run the pipeline on a Kubernetes stack
+- `modal_run.py`: Script to run the pipeline on a Modal stack
+- `test_examples_utils.py`: Related to the diffusers script used in older versions of the pipeline
+- `train_dreambooth_lora_flux.py`: From the diffusers library, used in older versions of the pipeline
+- `train_dreambooth.py`: From the diffusers library, used in older versions of the pipeline
+- `walkthrough.ipynb`: Jupyter Notebook providing a guided walkthrough of the code
+
+## Contributing
+
+Contributions to this project are welcome! If you find any issues or have suggestions for improvements, please open an issue or submit a pull request.
@@ -0,0 +1,143 @@
+# Declares the "ZenML Model" that this run configuration refers to.
+model:
+  name: 'flux_personalized_model'
+  audience: 'ML Engineers and Researchers'
+  description: 'Personalized image generation model using DreamBooth and Flux.1'
+  ethics: 'Ensure responsible use of generated images'
+  license: 'Apache 2.0'
+  limitations: 'Limited to the trained subject and style'
+  tags:
+    - 'dreambooth'
+    - 'flux'
+    - 'stable-diffusion-image2video'
+
+# Parameters of the pipeline
+parameters:
+  # Where the instance example images are read from, and how the subject is named.
+  instance_example_dir: "az://demo-zenmlartifactstore/hamza-faces"
+  instance_name: "sks htahir1"
+  class_name: "man"
+  # Base model and the Hugging Face destination settings.
+  model_name: "black-forest-labs/FLUX.1-dev"
+  hf_username: "htahir1"
+  hf_repo_suffix: "flux-dreambooth-hamza"
+  prefix: "A portrait photo of"
+  # Training settings.
+  resolution: 512
+  train_batch_size: 1
+  rank: 32
+  gradient_accumulation_steps: 1
+  learning_rate: 0.0002
+  lr_scheduler: "constant"
+  lr_warmup_steps: 0
+  max_train_steps: 1300
+  # Canonical lowercase boolean so every YAML loader reads the same value.
+  push_to_hub: true
+  checkpointing_steps: 1000
+  seed: 117
+
+# Per step configuration
+steps:
+  train_model:
+    enable_cache: true
+    # Runtime settings for the Docker image and the Kubernetes pod
+    settings:
+      # Controls Docker building
+      docker:
+        parent_image: "pytorch/pytorch:2.2.2-cuda11.8-cudnn8-runtime"
+        environment:
+          PJRT_DEVICE: "CUDA"
+          USE_TORCH_XLA: "false"
+          # Environment values are strings; quote so the loader does not type it as int.
+          MKL_SERVICE_FORCE_INTEL: "1"
+          # SECURITY: never commit the Hugging Face token to version control.
+          # The value is taken from the HF_TOKEN environment variable of the
+          # client that launches the run. The token that used to be hard-coded
+          # here was exposed and must be revoked.
+          # NOTE(review): relies on ZenML's `${ENV_VAR}` configuration
+          # placeholder; confirm the pinned ZenML version supports it.
+          HF_TOKEN: "${HF_TOKEN}"
+          # Same path as the volume mount below.
+          HF_HOME: "/mnt/data"
+        python_package_installer: "uv"
+        requirements: "requirements.txt"
+        python_package_installer_args:
+          # presumably rendered as a bare `--system` flag for uv; TODO confirm
+          system: null
+        apt_packages: ["git", "ffmpeg", "gifsicle"]
+
+      # Kubernetes settings
+      orchestrator.kubernetes:
+        pod_settings:
+          # Only schedule on nodes labelled zenml.io/gpu=yes.
+          affinity:
+            nodeAffinity:
+              requiredDuringSchedulingIgnoredDuringExecution:
+                nodeSelectorTerms:
+                  - matchExpressions:
+                      - key: "zenml.io/gpu"
+                        operator: "In"
+                        values: ["yes"]
+          # Persistent volume mounted at /mnt/data.
+          volumes:
+            - name: "data-volume"
+              persistentVolumeClaim:
+                claimName: "pvc-managed-premium"
+          volume_mounts:
+            - name: "data-volume"
+              mountPath: "/mnt/data"
+
+  batch_inference:
+    # Runtime settings for the Docker image and the Kubernetes pod
+    settings:
+      # Controls Docker building
+      docker:
+        parent_image: "pytorch/pytorch:2.2.2-cuda11.8-cudnn8-runtime"
+        environment:
+          PJRT_DEVICE: "CUDA"
+          USE_TORCH_XLA: "false"
+          # Environment values are strings; quote so the loader does not type it as int.
+          MKL_SERVICE_FORCE_INTEL: "1"
+          # SECURITY: never commit the Hugging Face token to version control.
+          # The value is taken from the HF_TOKEN environment variable of the
+          # client that launches the run. The token that used to be hard-coded
+          # here was exposed and must be revoked.
+          # NOTE(review): relies on ZenML's `${ENV_VAR}` configuration
+          # placeholder; confirm the pinned ZenML version supports it.
+          HF_TOKEN: "${HF_TOKEN}"
+          # Same path as the volume mount below.
+          HF_HOME: "/mnt/data"
+        python_package_installer: "uv"
+        requirements: "requirements.txt"
+        python_package_installer_args:
+          # presumably rendered as a bare `--system` flag for uv; TODO confirm
+          system: null
+        apt_packages: ["git", "ffmpeg", "gifsicle"]
+
+      # Kubernetes settings
+      orchestrator.kubernetes:
+        pod_settings:
+          # Only schedule on nodes labelled zenml.io/gpu=yes.
+          affinity:
+            nodeAffinity:
+              requiredDuringSchedulingIgnoredDuringExecution:
+                nodeSelectorTerms:
+                  - matchExpressions:
+                      - key: "zenml.io/gpu"
+                        operator: "In"
+                        values: ["yes"]
+          # Persistent volume mounted at /mnt/data.
+          volumes:
+            - name: "data-volume"
+              persistentVolumeClaim:
+                claimName: "pvc-managed-premium"
+          volume_mounts:
+            - name: "data-volume"
+              mountPath: "/mnt/data"
+
+  image_to_video:
+    enable_cache: false
+    # Runtime settings for the Docker image and the Kubernetes pod
+    settings:
+      # Controls Docker building
+      docker:
+        parent_image: "pytorch/pytorch:2.2.2-cuda11.8-cudnn8-runtime"
+        environment:
+          PJRT_DEVICE: "CUDA"
+          USE_TORCH_XLA: "false"
+          # Environment values are strings; quote so the loader does not type it as int.
+          MKL_SERVICE_FORCE_INTEL: "1"
+          # SECURITY: never commit the Hugging Face token to version control.
+          # The value is taken from the HF_TOKEN environment variable of the
+          # client that launches the run. The token that used to be hard-coded
+          # here was exposed and must be revoked.
+          # NOTE(review): relies on ZenML's `${ENV_VAR}` configuration
+          # placeholder; confirm the pinned ZenML version supports it.
+          HF_TOKEN: "${HF_TOKEN}"
+          # Same path as the volume mount below.
+          HF_HOME: "/mnt/data"
+        python_package_installer: "uv"
+        requirements: "requirements.txt"
+        python_package_installer_args:
+          # presumably rendered as a bare `--system` flag for uv; TODO confirm
+          system: null
+        apt_packages: ["git", "ffmpeg", "gifsicle"]
+
+      # Kubernetes settings
+      orchestrator.kubernetes:
+        pod_settings:
+          # Only schedule on nodes labelled zenml.io/gpu=yes.
+          affinity:
+            nodeAffinity:
+              requiredDuringSchedulingIgnoredDuringExecution:
+                nodeSelectorTerms:
+                  - matchExpressions:
+                      - key: "zenml.io/gpu"
+                        operator: "In"
+                        values: ["yes"]
+          # Persistent volume mounted at /mnt/data.
+          volumes:
+            - name: "data-volume"
+              persistentVolumeClaim:
+                claimName: "pvc-managed-premium"
+          volume_mounts:
+            - name: "data-volume"
+              mountPath: "/mnt/data"