add back enable_attention_slicing for mps device
This commit is contained in:
@@ -50,6 +50,11 @@ class SDXL(DiffusionInpaintModel):
|
||||
variant="fp16",
|
||||
)
|
||||
|
||||
if torch.backends.mps.is_available():
|
||||
# MPS: Recommended RAM < 64 GB https://huggingface.co/docs/diffusers/optimization/mps
|
||||
# CUDA: Don't enable attention slicing if you're already using `scaled_dot_product_attention` (SDPA) from PyTorch 2.0 or xFormers. https://huggingface.co/docs/diffusers/v0.25.0/en/api/pipelines/stable_diffusion/image_variation#diffusers.StableDiffusionImageVariationPipeline.enable_attention_slicing
|
||||
self.model.enable_attention_slicing()
|
||||
|
||||
if kwargs.get("cpu_offload", False) and use_gpu:
|
||||
logger.info("Enable sequential cpu offload")
|
||||
self.model.enable_sequential_cpu_offload(gpu_id=0)
|
||||
|
||||
Reference in New Issue
Block a user