rapidrabbit76
diff --git a/‎.gitignore
Lines changed: 4 additions & 1 deletion b/‎.gitignore
Lines changed: 4 additions & 1 deletion
diff --git a/‎README.md
Lines changed: 19 additions & 27 deletions b/‎README.md
Lines changed: 19 additions & 27 deletions
diff --git a/‎app/stable_diffusion/manager/manager.py
Lines changed: 45 additions & 13 deletions b/‎app/stable_diffusion/manager/manager.py
Lines changed: 45 additions & 13 deletions
diff --git a/‎app/stable_diffusion/manager/schema.py
Lines changed: 2 additions & 2 deletions b/‎app/stable_diffusion/manager/schema.py
Lines changed: 2 additions & 2 deletions
diff --git a/‎app/stable_diffusion/model.py
Lines changed: 0 additions & 149 deletions b/‎app/stable_diffusion/model.py
Lines changed: 0 additions & 149 deletions
diff --git a/‎app/stable_diffusion/service.py
Lines changed: 1 addition & 1 deletion b/‎app/stable_diffusion/service.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎core/settings/settings.py
Lines changed: 3 additions & 2 deletions b/‎core/settings/settings.py
Lines changed: 3 additions & 2 deletions
@@ -25,4 +25,7 @@ temp/
 
 # DEV
 debug.py
-*.ipynb
+*.ipynb
+
+static/
+lpw_stable_diffusion/
@@ -87,17 +87,18 @@ outputs:
 >> ./core/settings/settings.py
 ```
 
-| Name               | Default                       | Desc                                              |
-| ------------------ | ----------------------------- | ------------------------------------------------- |
-| MODEL_ID           | CompVis/stable-diffusion-v1-4 | tagger embedding model part                       |
-| CUDA_DEVICE        | "cpu"                         | target cuda device                                |
-| CUDA_DEVICES       | [0]                           | visible cuda device                               |
-| MB_BATCH_SIZE      | 1                             | Micro Batch: MAX Batch size                       |
-| MB_TIMEOUT         | 120                           | Micro Batch: timeout sec                          |
-| HUGGINGFACE_TOKEN  | None                          | huggingface access token                          |
-| IMAGESERVER_URL    | None                          | result image base url                             |
-| SAVE_DIR           | static                        | result image save dir                             |
-| CORS_ALLOW_ORIGINS | [*]                           | cross origin resource sharing setting for FastAPI |
+| Name                     | Default                       | Desc                                                                                                                                                                    |
+| ------------------------ | ----------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| MODEL_ID                 | CompVis/stable-diffusion-v1-4 | huggingface repo id or model path                                                                                                                                       |
+| ENABLE_ATTENTION_SLICING | True                          | [Enable sliced attention computation.](https://huggingface.co/docs/diffusers/api/pipelines/stable_diffusion#diffusers.StableDiffusionPipeline.enable_attention_slicing) |
+| CUDA_DEVICE              | "cuda"                        | target cuda device                                                                                                                                                      |
+| CUDA_DEVICES             | [0]                           | visible cuda device                                                                                                                                                     |
+| MB_BATCH_SIZE            | 1                             | Micro Batch: MAX Batch size                                                                                                                                             |
+| MB_TIMEOUT               | 120                           | Micro Batch: timeout sec                                                                                                                                                |
+| HUGGINGFACE_TOKEN        | None                          | huggingface access token                                                                                                                                                |
+| IMAGESERVER_URL          | None                          | result image base url                                                                                                                                                   |
+| SAVE_DIR                 | static                        | result image save dir                                                                                                                                                   |
+| CORS_ALLOW_ORIGINS       | [*]                           | cross origin resource sharing setting for FastAPI                                                                                                                       |
 
 # RUN from code (API)
 
@@ -117,6 +118,9 @@ python huggingface_model_download.py
 ## 3. update settings.py in ./core/settings/settings.py
 ```python
 # example
+class ModelSetting(BaseSettings):
+    MODEL_ID: str = "CompVis/stable-diffusion-v1-4" # huggingface repo id or model path
+    ENABLE_ATTENTION_SLICING: bool = True
 ...
 class Settings(
     ...
@@ -127,13 +131,9 @@ class Settings(
     ...
 ```
 
-## 4. RUN API by uvicorn
+## 4. RUN API from code
 ```bash
-cd /REPO/ROOT/DIR/PATH
-python3 -m uvicorn app.server:app \
-    --host 0.0.0.0 \
-    --port 3000 \
-    --workers 1 
+bash docker/api/start.sh
 ```
 
 # RUN from code (frontend)
@@ -161,27 +161,19 @@ streamlit run inpaint.py
 docker-compose build
 ```
 
-## 2. downlaod and caching huggingface model
-```bash
-python huggingface_model_download.py
-# check stable-diffusion model in huggingface cache dir 
-[[ -d ~/.cache/huggingface/diffusers/models--CompVis--stable-diffusion-v1-4 ]] && echo "exist"
->> exist
-```
-
 ## 3. update docker-compose.yaml file in repo root
 ```yaml
 version: "3.7"
-
 services:
   api:
     ...
     volumes:
       # mount huggingface model cache dir path to container root user home dir
-      - /home/{USER NAME}/.cache/huggingface:/root/.cache/huggingface
+      - /model:/model  # if you load a pretrained model
       - ...
     environment:
       ...
+      MODEL_ID: "CompVis/stable-diffusion-v1-4" 
       HUGGINGFACE_TOKEN: {YOUR HUGGINGFACE ACCESS TOKEN}
       ...
 
 
@@ -6,17 +6,15 @@
 import sys
 from random import randint
 from service_streamer import ThreadedStreamer
-from app.stable_diffusion.model import (
-    build_text2image_pipeline,
-    build_image2image_pipeline,
-    build_inpaint_pipeline,
-)
+from diffusers import DiffusionPipeline, DPMSolverMultistepScheduler
+
 from app.stable_diffusion.manager.schema import (
     InpaintTask,
     Text2ImageTask,
     Image2ImageTask,
 )
 from core.settings import get_settings
+from functools import lru_cache
 
 env = get_settings()
 
@@ -27,30 +25,64 @@
 ]
 
 
+@lru_cache()
+def build_pipeline(repo: str, device: str, enable_attention_slicing: bool):
+    pipe = DiffusionPipeline.from_pretrained(
+        repo,
+        torch_dtype=torch.float16,
+        revision="fp16",
+        custom_pipeline="lpw_stable_diffusion",
+    )
+    pipe.scheduler = DPMSolverMultistepScheduler.from_config(
+        pipe.scheduler.config
+    )
+    pipe.safety_checker = lambda images, clip_input: (images, False)
+
+    if enable_attention_slicing:
+        pipe.enable_attention_slicing()
+
+    pipe = pipe.to(device)
+    return pipe
+
+
+build_pipeline(
+    repo=env.MODEL_ID,
+    device=env.CUDA_DEVICE,
+    enable_attention_slicing=env.ENABLE_ATTENTION_SLICING,
+)
+
+
 class StableDiffusionManager:
     def __init__(self):
-        self.text2image = build_text2image_pipeline()
-        self.image2image = build_image2image_pipeline()
-        self.inpaint = build_inpaint_pipeline()
+        self.pipe = build_pipeline(
+            repo=env.MODEL_ID,
+            device=env.CUDA_DEVICE,
+            enable_attention_slicing=env.ENABLE_ATTENTION_SLICING,
+        )
 
+    @torch.inference_mode()
     def predict(
         self,
         batch: T.List[_StableDiffusionTask],
     ):
         task = batch[0]
-        pipeline = self.text2image
+        pipeline = self.pipe
         if isinstance(task, Text2ImageTask):
-            pipeline = self.text2image
+            pipeline = self.pipe.text2img
         elif isinstance(task, Image2ImageTask):
-            pipeline = self.image2image
+            pipeline = self.pipe.img2img
         elif isinstance(task, InpaintTask):
-            pipeline = self.inpaint
+            pipeline = self.pipe.inpaint
+        else:
+            raise NotImplementedError
 
         device = env.CUDA_DEVICE
 
         generator = self._get_generator(task, device)
         with torch.autocast("cuda" if device != "cpu" else "cpu"):
-            images = pipeline(**task.dict(), generator=generator)
+            task = task.dict()
+            del task["seed"]
+            images = pipeline(**task, generator=generator).images
             if device != "cpu":
                 torch.cuda.empty_cache()
 
 
@@ -23,7 +23,7 @@ def size_constraint(cls, size):
 class Image2ImageTask(BaseModel):
     prompt: T.Union[str, T.List[str]] = Field(...)
     negative_prompt: T.Union[str, T.List[str]] = Field(...)
-    init_image: T.Any
+    image: T.Any
     strength: float = Field(..., ge=0.0, le=1.0)
     num_inference_steps: int = Field(..., gt=0)
     guidance_scale: float = Field(..., ge=0.0)
@@ -33,7 +33,7 @@ class Image2ImageTask(BaseModel):
 class InpaintTask(BaseModel):
     prompt: T.Union[str, T.List[str]] = Field(...)
     negative_prompt: T.Union[str, T.List[str]] = Field(...)
-    init_image: T.Any
+    image: T.Any
     mask_image: T.Any
     strength: float = Field(..., ge=0.0, le=1.0)
     num_inference_steps: int = Field(..., gt=0)
 
@@ -92,7 +92,7 @@ def image2image(
             Image2ImageTask(
                 prompt=prompt,
                 negative_prompt=[negative_prompt] * len(prompt),
-                init_image=init_image,
+                image=init_image,
                 strength=strength,
                 num_inference_steps=num_inference_steps,
                 guidance_scale=guidance_scale,
 
@@ -6,6 +6,7 @@
 
 class ModelSetting(BaseSettings):
     MODEL_ID: str = "CompVis/stable-diffusion-v1-4"
+    ENABLE_ATTENTION_SLICING: bool = True
 
 
 class DeviceSettings(BaseSettings):
@@ -23,8 +24,8 @@ class Settings(
     DeviceSettings,
     MicroBatchSettings,
 ):
-    HUGGINGFACE_TOKEN: str
-    IMAGESERVER_URL: str = 'http://localhost:3000/images'
+    HUGGINGFACE_TOKEN: str = "HUGGINGFACE_TOKEN"
+    IMAGESERVER_URL: str = "http://localhost:3000/images"
     SAVE_DIR: str = "static"
 
     CORS_ALLOW_ORIGINS: T.List[str] = ["*"]