multimodalart HF Staff committed on
Commit
3a7a77c
·
verified ·
1 Parent(s): 37d511b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +30 -0
app.py CHANGED
@@ -1,9 +1,39 @@
 
 
 
 
 
 
1
  import gradio as gr
2
  import spaces
3
  import torch
4
  from diffusers import Cosmos2TextToImagePipeline, EDMEulerScheduler
 
5
  import random
6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  model_2b_id = "nvidia/Cosmos-Predict2-2B-Text2Image"
8
 
9
  pipe_2b = Cosmos2TextToImagePipeline.from_pretrained(
 
1
import subprocess
import os

# Install flash-attn at app startup (Hugging Face Spaces pattern).
# FLASH_ATTENTION_SKIP_CUDA_BUILD=TRUE makes pip skip compiling the CUDA
# kernels and use the prebuilt wheel, which is far faster on Spaces.
# Fix: the original passed env={...} alone, which REPLACES the whole process
# environment (dropping PATH and CUDA variables) — merge with os.environ.
# Also pass an argv list with the default shell=False; no shell parsing needed.
# Best-effort on purpose: no check=True, a failed install should not crash
# startup here (matching the original's behavior of ignoring the return code).
subprocess.run(
    ["pip", "install", "flash-attn", "--no-build-isolation"],
    env={**os.environ, "FLASH_ATTENTION_SKIP_CUDA_BUILD": "TRUE"},
)
7
  import gradio as gr
8
  import spaces
9
  import torch
10
  from diffusers import Cosmos2TextToImagePipeline, EDMEulerScheduler
11
+ from transformers import AutoModelForCausalLM, SiglipProcessor
12
  import random
13
 
14
# Add flash_attention_2 to the safeguard model: the pipeline loads its safety
# LLM internally via AutoModelForCausalLM.from_pretrained, so we cannot pass
# kwargs directly — monkeypatch the loader's defaults instead.
def patch_from_pretrained(cls):
    """Monkeypatch ``cls.from_pretrained`` to default to flash-attn + bf16.

    Only fills in missing kwargs (``dict.setdefault``), so any explicit
    ``attn_implementation`` or ``torch_dtype`` passed by a caller still wins.

    Args:
        cls: a class exposing a ``from_pretrained`` classmethod (e.g.
            ``AutoModelForCausalLM``). Patched in place; returns nothing.
    """
    from functools import wraps

    orig_method = cls.from_pretrained

    @wraps(orig_method)  # preserve the wrapped loader's name/docstring
    def new_from_pretrained(*args, **kwargs):
        kwargs.setdefault("attn_implementation", "flash_attention_2")
        kwargs.setdefault("torch_dtype", torch.bfloat16)
        return orig_method(*args, **kwargs)

    cls.from_pretrained = new_from_pretrained
24
+
25
+ patch_from_pretrained(AutoModelForCausalLM)
26
+
27
# Add a `use_fast` to the safeguard image processor
def patch_processor_fast(cls):
    """Wrap ``cls.from_pretrained`` so the fast image processor is the default.

    A caller-supplied ``use_fast`` kwarg is left untouched; only a missing
    key is filled in. Patches ``cls`` in place.
    """
    original = cls.from_pretrained

    def wrapper(*args, **kwargs):
        if "use_fast" not in kwargs:
            kwargs["use_fast"] = True
        return original(*args, **kwargs)

    cls.from_pretrained = wrapper
34
+
35
+ patch_processor_fast(SiglipProcessor)
36
+
37
  model_2b_id = "nvidia/Cosmos-Predict2-2B-Text2Image"
38
 
39
  pipe_2b = Cosmos2TextToImagePipeline.from_pretrained(