From 83caf92a5cf317dbb48f6b36b673c86dba7cec3c Mon Sep 17 00:00:00 2001 From: Meptl Date: Tue, 20 Feb 2024 11:01:38 -0500 Subject: [PATCH] Support network volumes (#16) * Support network volumes * README tweaks * docs: added comment on what is happening * feat: don't overwrite the default paths, but add "runpod_worker_comfy" to have additional paths * docs: updated "bring your own models" --------- Co-authored-by: Tim Pietrusky --- Dockerfile | 18 ++++++++-------- README.md | 44 +++++++++++++++++++++++++++++++++++++- src/extra_model_paths.yaml | 11 ++++++++++ 3 files changed, 63 insertions(+), 10 deletions(-) create mode 100644 src/extra_model_paths.yaml diff --git a/Dockerfile b/Dockerfile index 01409b4c..0180e220 100644 --- a/Dockerfile +++ b/Dockerfile @@ -32,15 +32,15 @@ RUN pip3 install --no-cache-dir torch torchvision torchaudio --index-url https:/ # Install runpod RUN pip3 install runpod requests -# Download checkpoints/vae/LoRA to include in image -RUN wget -O models/checkpoints/sd_xl_base_1.0.safetensors https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0/resolve/main/sd_xl_base_1.0.safetensors -RUN wget -O models/vae/sdxl_vae.safetensors https://huggingface.co/stabilityai/sdxl-vae/resolve/main/sdxl_vae.safetensors -RUN wget -O models/vae/sdxl-vae-fp16-fix.safetensors https://huggingface.co/madebyollin/sdxl-vae-fp16-fix/resolve/main/sdxl_vae.safetensors -RUN wget -O models/loras/xl_more_art-full_v1.safetensors https://civitai.com/api/download/models/152309 - -# Example for adding specific models into image -# ADD models/checkpoints/sd_xl_base_1.0.safetensors models/checkpoints/ -# ADD models/vae/sdxl_vae.safetensors models/vae/ +ARG SKIP_DEFAULT_MODELS +# Download checkpoints/vae/LoRA to include in image. +RUN if [ -z "$SKIP_DEFAULT_MODELS" ]; then wget -O models/checkpoints/sd_xl_base_1.0.safetensors https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0/resolve/main/sd_xl_base_1.0.safetensors; fi +RUN if [ -z "$SKIP_DEFAULT_MODELS" ]; then wget -O models/vae/sdxl_vae.safetensors https://huggingface.co/stabilityai/sdxl-vae/resolve/main/sdxl_vae.safetensors; fi +RUN if [ -z "$SKIP_DEFAULT_MODELS" ]; then wget -O models/vae/sdxl-vae-fp16-fix.safetensors https://huggingface.co/madebyollin/sdxl-vae-fp16-fix/resolve/main/sdxl_vae.safetensors; fi +RUN if [ -z "$SKIP_DEFAULT_MODELS" ]; then wget -O models/loras/xl_more_art-full_v1.safetensors https://civitai.com/api/download/models/152309; fi + +# Support for the network volume +ADD src/extra_model_paths.yaml ./ # Go back to the root WORKDIR / diff --git a/README.md b/README.md index 105771eb..80d51aae 100644 --- a/README.md +++ b/README.md @@ -19,6 +19,9 @@ Read our article here: https://blib.la/blog/comfyui-on-runpod - [Config](#config) - [Upload image to AWS S3](#upload-image-to-aws-s3) - [Use the Docker image on RunPod](#use-the-docker-image-on-runpod) + * [Bring your own models](#bring-your-own-models) + + [Network Volume](#network-volume) + + [Custom Docker Image](#custom-docker-image) - [API specification](#api-specification) - [JSON Request Body](#json-request-body) - [Fields](#fields) @@ -61,6 +64,7 @@ Read our article here: https://blib.la/blog/comfyui-on-runpod - [sdxl-vae-fp16-fix](https://huggingface.co/madebyollin/sdxl-vae-fp16-fix/) - Build-in LoRA: - [xl_more_art-full_v1.safetensors](https://civitai.com/models/124347?modelVersionId=152309) (Enhancer) +- [Bring your own models](#bring-your-own-models) - Based on [Ubuntu + NVIDIA CUDA](https://hub.docker.com/r/nvidia/cuda) ## Config @@ -103,12 +107,46 @@ This is only needed if you want to upload the generated picture to AWS S3. If yo - Max Workers: `3` (whatever makes sense for you) - Idle Timeout: `5` (you can leave the default) - Flash Boot: `enabled` (doesn't cost more, but provides faster boot of our worker, which is good) - - Advanced: Leave the defaults + - Advanced: If you are using a Network Volume, select it under `Select Network Volume`. Otherwise leave the defaults. - Select a GPU that has some availability - GPUs/Worker: `1` - Click `deploy` - Your endpoint will be created, you can click on it to see the dashboard +### Bring your own models + +#### Network Volume + +This is possible because of [RunPod Network Volumes](https://docs.runpod.io/docs/create-a-network-volume), which also works for [serverless](https://docs.runpod.io/serverless/references/endpoint-configurations#select-network-volume). + +- [Create a Network Volume](https://docs.runpod.io/docs/create-a-network-volume) +- Create a temporary GPU instance to populate the volume. + Navigate to `Manage > Storage`, click `Deploy` under the volume, deploy any GPU instance +- Navigate to `Manage > Pods`. Under the new GPU instance, click `Connect`. This + will give you either a Jupyter notebook where you can select `Shell` or an address you can ssh to. +- Within a shell on the GPU instance, populate the Network Volume. By default, the volume + is mounted at `/workspace`. In this example, we create the ComfyUI model + structure and download a single checkpoint. + ``` + cd /workspace + for i in checkpoints clip clip_vision configs controlnet embeddings loras upscale_models vae; do mkdir -p models/$i; done + wget -O models/checkpoints/sd_xl_turbo_1.0_fp16.safetensors https://huggingface.co/stabilityai/sdxl-turbo/blob/main/sd_xl_turbo_1.0_fp16.safetensors + ``` +- [Delete the temporary GPU instance](https://docs.runpod.io/docs/pods#terminating-a-pod) +- Configure your Endpoint to use the Network Volume. Either [create a new endpoint](#use-the-docker-image-on-runpod) or update + `Advanced > Select Network Volume (optional)` on an existing endpoint + +#### Custom Docker Image + +- Fork the repository +- Add your models directly into the [Dockerfile](./Dockerfile) like this: + +```Dockerfile +RUN wget -O models/checkpoints/sd_xl_base_1.0.safetensors https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0/resolve/main/sd_xl_base_1.0.safetensors +``` + +- [Build your Docker Image](#build-the-image) + ## API specification The following describes which fields exist when doing requests to the API. We only describe the fields that are sent via `input` as those are needed by the worker itself. For a full list of fields, please take a look at the [official documentation](https://docs.runpod.io/docs/serverless-usage). @@ -197,6 +235,10 @@ You can now take the content of this file and put it into your `workflow` when i You can build the image locally: `docker build -t timpietruskyblibla/runpod-worker-comfy:dev --platform linux/amd64 .` +If you plan to bring your own ComfyUI models, you can add the `SKIP_DEFAULT_MODELS` build arg to reduce image size: +`docker build --build-arg SKIP_DEFAULT_MODELS=1 -t timpietruskyblibla/runpod-worker-comfy:dev --platform linux/amd64 .`. +This will skip downloading the default models for this image. + 🚨 It's important to specify the `--platform linux/amd64`, otherwise you will get an error on RunPod, see [#13](https://github.com/blib-la/runpod-worker-comfy/issues/13) ## Local testing diff --git a/src/extra_model_paths.yaml b/src/extra_model_paths.yaml new file mode 100644 index 00000000..f2c82f9e --- /dev/null +++ b/src/extra_model_paths.yaml @@ -0,0 +1,11 @@ +runpod_worker_comfy: + base_path: /runpod-volume + checkpoints: models/checkpoints/ + clip: models/clip/ + clip_vision: models/clip_vision/ + configs: models/configs/ + controlnet: models/controlnet/ + embeddings: models/embeddings/ + loras: models/loras/ + upscale_models: models/upscale_models/ + vae: models/vae/