lysandre (HF Staff) committed
Commit 357de9f · 0 Parent(s)

Duplicate from huggingface-tools/text-to-video


Co-authored-by: Lysandre <[email protected]>

Files changed (7)
  1. .gitattributes +34 -0
  2. README.md +13 -0
  3. __init__.py +0 -0
  4. app.py +4 -0
  5. requirements.txt +4 -0
  6. text_to_video.py +48 -0
  7. tool_config.json +5 -0
.gitattributes ADDED
@@ -0,0 +1,34 @@
+ *.7z filter=lfs diff=lfs merge=lfs -text
+ *.arrow filter=lfs diff=lfs merge=lfs -text
+ *.bin filter=lfs diff=lfs merge=lfs -text
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
+ *.ftz filter=lfs diff=lfs merge=lfs -text
+ *.gz filter=lfs diff=lfs merge=lfs -text
+ *.h5 filter=lfs diff=lfs merge=lfs -text
+ *.joblib filter=lfs diff=lfs merge=lfs -text
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
+ *.model filter=lfs diff=lfs merge=lfs -text
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
+ *.npy filter=lfs diff=lfs merge=lfs -text
+ *.npz filter=lfs diff=lfs merge=lfs -text
+ *.onnx filter=lfs diff=lfs merge=lfs -text
+ *.ot filter=lfs diff=lfs merge=lfs -text
+ *.parquet filter=lfs diff=lfs merge=lfs -text
+ *.pb filter=lfs diff=lfs merge=lfs -text
+ *.pickle filter=lfs diff=lfs merge=lfs -text
+ *.pkl filter=lfs diff=lfs merge=lfs -text
+ *.pt filter=lfs diff=lfs merge=lfs -text
+ *.pth filter=lfs diff=lfs merge=lfs -text
+ *.rar filter=lfs diff=lfs merge=lfs -text
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
+ *.tflite filter=lfs diff=lfs merge=lfs -text
+ *.tgz filter=lfs diff=lfs merge=lfs -text
+ *.wasm filter=lfs diff=lfs merge=lfs -text
+ *.xz filter=lfs diff=lfs merge=lfs -text
+ *.zip filter=lfs diff=lfs merge=lfs -text
+ *.zst filter=lfs diff=lfs merge=lfs -text
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,13 @@
+ ---
+ title: Text to Video
+ emoji: ⚡
+ colorFrom: red
+ colorTo: green
+ sdk: gradio
+ sdk_version: 3.27.0
+ app_file: app.py
+ pinned: false
+ tags:
+ - tool
+ duplicated_from: huggingface-tools/text-to-video
+ ---
__init__.py ADDED
File without changes
app.py ADDED
@@ -0,0 +1,4 @@
+ from transformers.tools.base import launch_gradio_demo
+ from text_to_video import TextToVideoTool
+
+ launch_gradio_demo(TextToVideoTool)
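
For context: `launch_gradio_demo` inspects the tool class and wires its class-level `inputs` and `outputs` into a Gradio interface. A rough, simplified sketch of what it does (illustrative only; the actual implementation lives in `transformers.tools.base`):

import gradio as gr

def launch_gradio_demo_sketch(tool_class):
    # Instantiate the tool; calling it runs setup() lazily on first use.
    tool = tool_class()

    # Gradio accepts component names as strings, so the tool's
    # inputs (['text']) and outputs (['video']) map straight through.
    gr.Interface(
        fn=lambda *args, **kwargs: tool(*args, **kwargs),
        inputs=tool.inputs,
        outputs=tool.outputs,
        title=tool_class.__name__,
    ).launch()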
requirements.txt ADDED
@@ -0,0 +1,4 @@
+ transformers @ git+https://github.com/huggingface/transformers@test_composition
+ diffusers
+ accelerate
+ torch
text_to_video.py ADDED
@@ -0,0 +1,48 @@
+ import torch
+
+ from transformers.tools.base import Tool, get_default_device
+ from transformers.utils import is_accelerate_available
+
+ from diffusers import DiffusionPipeline
+
+
+ TEXT_TO_VIDEO_DESCRIPTION = (
+     "This is a tool that creates a video according to a text description. It takes an input named `prompt` which "
+     "contains the video description, as well as an optional input `seconds` which sets the duration of the video. "
+     "The default is two seconds. The tool outputs a video object."
+ )
+
+
+ class TextToVideoTool(Tool):
+     default_checkpoint = "damo-vilab/text-to-video-ms-1.7b"
+     description = TEXT_TO_VIDEO_DESCRIPTION
+     inputs = ['text']
+     outputs = ['video']
+
+     def __init__(self, device=None, **hub_kwargs) -> None:
+         if not is_accelerate_available():
+             raise ImportError("Accelerate should be installed in order to use tools.")
+
+         super().__init__()
+
+         self.device = device
+         self.pipeline = None
+         self.hub_kwargs = hub_kwargs
+
+     def setup(self):
+         if self.device is None:
+             self.device = get_default_device()
+
+         self.pipeline = DiffusionPipeline.from_pretrained(
+             self.default_checkpoint, variant="fp16"
+         )
+         self.pipeline.to(self.device)
+
+         self.is_initialized = True
+
+     def __call__(self, prompt, seconds=2):
+         if not self.is_initialized:
+             self.setup()
+
+         return self.pipeline(prompt, num_frames=8 * seconds).frames
+
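
A minimal sketch of exercising the tool directly, without the Gradio app (hypothetical usage; assumes the pinned transformers branch is installed and a device with enough memory for the fp16 checkpoint; `export_to_video` is a diffusers utility that writes a list of frames to an mp4):

from diffusers.utils import export_to_video

from text_to_video import TextToVideoTool

tool = TextToVideoTool()
# num_frames = 8 * seconds, so seconds=2 yields 16 frames.
frames = tool("A panda surfing on a wave", seconds=2)  # hypothetical prompt
export_to_video(frames, "panda.mp4")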
tool_config.json ADDED
@@ -0,0 +1,5 @@
+ {
+     "description": "This is a tool that creates a video according to a text description. It takes an input named `prompt` which contains the video description, as well as an optional input `seconds` which sets the duration of the video. The default is two seconds. The tool outputs a video object.",
+     "name": "video_generator",
+     "tool_class": "text_to_video.TextToVideoTool"
+ }
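
Because tool_config.json registers the class under the name `video_generator`, the tool can also be pulled from the Hub by repo id through the Transformers tools API. A sketch, assuming a transformers version that exposes `load_tool` (as the pinned branch does):

from transformers import load_tool

tool = load_tool("huggingface-tools/text-to-video")
video = tool("A panda surfing on a wave", seconds=2)  # hypothetical prompt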