jree423
/

svgdreamer

vector-graphics

Model card Files Files and versions Community

xingxm committed on Mar 28, 2024

Commit

1e2958e

·

1 Parent(s): 8c557ad

feat(readme): delete unused import and add cases

Files changed (30) hide show

README.md +40 -6
assets/Lowpoly-BaldEagle/init_p0.svg +0 -0
assets/Lowpoly-BaldEagle/init_p1.svg +0 -0
assets/Lowpoly-BaldEagle/init_p2.svg +0 -0
assets/Lowpoly-BaldEagle/init_p3.svg +0 -0
assets/Lowpoly-BaldEagle/init_p4.svg +0 -0
assets/Lowpoly-BaldEagle/init_p5.svg +0 -0
assets/Lowpoly-BaldEagle/p0.svg +0 -0
assets/Lowpoly-BaldEagle/p1.svg +0 -0
assets/Lowpoly-BaldEagle/p2.svg +0 -0
assets/Lowpoly-BaldEagle/p3.svg +0 -0
assets/Lowpoly-BaldEagle/p4.svg +0 -0
assets/Lowpoly-BaldEagle/p5.svg +0 -0
assets/Sketch-Lamborghini/init_p0.svg +70 -0
assets/Sketch-Lamborghini/init_p1.svg +70 -0
assets/Sketch-Lamborghini/init_p2.svg +70 -0
assets/Sketch-Lamborghini/init_p3.svg +70 -0
assets/Sketch-Lamborghini/init_p4.svg +70 -0
assets/Sketch-Lamborghini/init_p5.svg +70 -0
assets/Sketch-Lamborghini/p0.svg +70 -0
assets/Sketch-Lamborghini/p1.svg +70 -0
assets/Sketch-Lamborghini/p2.svg +70 -0
assets/Sketch-Lamborghini/p3.svg +70 -0
assets/Sketch-Lamborghini/p4.svg +70 -0
assets/Sketch-Lamborghini/p5.svg +70 -0
assets/post.md +2 -1
conf/x/ink.yaml +2 -2
conf/x/lowpoly.yaml +1 -1
conf/x/sketch.yaml +1 -1
svgdreamer/svgtools/__init__.py +0 -2

README.md CHANGED Viewed

@@ -37,9 +37,11 @@ or using docker,
 docker run --name svgdreamer --gpus all -it --ipc=host ximingxing/svgrender:v1 /bin/bash
 ```
-## 🔥 Quickstart
-Before running the code, download the stable diffusion model. Append `diffuser.download=True` to the end of the script.
 ### SIVE + VPSD
@@ -142,15 +144,47 @@ python svgdreamer.py x=painting "prompt='Abstract Vincent van Gogh Oil Painting
 python svgdreamer.py x=pixelart "prompt='Darth vader with lightsaber.'" result_path='./logs/DarthVader'
 ```
-#### Other Styles
 ```shell
-# Style: low-ploy
 python svgdreamer.py x=lowpoly "prompt='A picture of a bald eagle. low-ploy. polygon. minimal flat 2d vector'" neg_prompt='' result_path='./logs/BaldEagle'
-# Style: sketch
 python svgdreamer.py x=sketch "prompt='A free-hand drawing of A speeding Lamborghini. black and white drawing.'" neg_prompt='' result_path='./logs/Lamborghini'
 # Style: ink and wash
-python svgdreamer.py x=ink "prompt='Big Wild Goose Pagoda. ink style. Minimalist abstract art grayscale watercolor.'" neg_prompt='' result_path='./logs/BigWildGoosePagoda'
 ```
 #### More Cases

 docker run --name svgdreamer --gpus all -it --ipc=host ximingxing/svgrender:v1 /bin/bash
 ```
+and **download pretrained models** by setting `diffuser.download=True` in `/conf/config.yaml` the first time you run it.
+(Alternatively, you can append `diffuser.download=True` to the end of the script.)
+## 🔥 Quickstart
 ### SIVE + VPSD
 python svgdreamer.py x=pixelart "prompt='Darth vader with lightsaber.'" result_path='./logs/DarthVader'
 ```
+#### Low-poly style
+**Prompt:** A picture of a bald eagle. low-ploy. polygon. minimal flat 2d vector <br/>
+**Preview:**
+|                     Particle 1                     |                     Particle 2                     |                     Particle 3                     |                     Particle 4                     |                     Particle 5                     |                     Particle 6                     |
+|:--------------------------------------------------:|:--------------------------------------------------:|:--------------------------------------------------:|:--------------------------------------------------:|:--------------------------------------------------:|:--------------------------------------------------:|
+|                      init p1                       |                      init p2                       |                      init p3                       |                      init p4                       |                      init p5                       |                      init p6                       |
+| <img src="./assets/Lowpoly-BaldEagle/init_p0.svg"> | <img src="./assets/Lowpoly-BaldEagle/init_p1.svg"> | <img src="./assets/Lowpoly-BaldEagle/init_p2.svg"> | <img src="./assets/Lowpoly-BaldEagle/init_p3.svg"> | <img src="./assets/Lowpoly-BaldEagle/init_p4.svg"> | <img src="./assets/Lowpoly-BaldEagle/init_p5.svg"> |
+|                      final p1                      |                      final p2                      |                      final p3                      |                      final p4                      |                      final p5                      |                      final p6                      |
+|   <img src="./assets/Lowpoly-BaldEagle/p0.svg">    |   <img src="./assets/Lowpoly-BaldEagle/p1.svg">    |   <img src="./assets/Lowpoly-BaldEagle/p2.svg">    |   <img src="./assets/Lowpoly-BaldEagle/p3.svg">    |   <img src="./assets/Lowpoly-BaldEagle/p4.svg">    |   <img src="./assets/Lowpoly-BaldEagle/p5.svg">    |
+**Script:**
 ```shell
 python svgdreamer.py x=lowpoly "prompt='A picture of a bald eagle. low-ploy. polygon. minimal flat 2d vector'" neg_prompt='' result_path='./logs/BaldEagle'
+```
+#### Sketch style
+**Prompt:** A free-hand drawing of A speeding Lamborghini. black and white drawing. <br/>
+**Preview:**
+|                     Particle 1                      |                     Particle 2                      |                     Particle 3                      |                     Particle 4                      |                     Particle 5                      |                     Particle 6                      |
+|:---------------------------------------------------:|:---------------------------------------------------:|:---------------------------------------------------:|:---------------------------------------------------:|:---------------------------------------------------:|:---------------------------------------------------:|
+|                       init p1                       |                       init p2                       |                       init p3                       |                       init p4                       |                       init p5                       |                       init p6                       |
+| <img src="./assets/Sketch-Lamborghini/init_p0.svg"> | <img src="./assets/Sketch-Lamborghini/init_p1.svg"> | <img src="./assets/Sketch-Lamborghini/init_p2.svg"> | <img src="./assets/Sketch-Lamborghini/init_p3.svg"> | <img src="./assets/Sketch-Lamborghini/init_p4.svg"> | <img src="./assets/Sketch-Lamborghini/init_p5.svg"> |
+|                      final p1                       |                      final p2                       |                      final p3                       |                      final p4                       |                      final p5                       |                      final p6                       |
+|   <img src="./assets/Sketch-Lamborghini/p0.svg">    |   <img src="./assets/Sketch-Lamborghini/p1.svg">    |   <img src="./assets/Sketch-Lamborghini/p2.svg">    |   <img src="./assets/Sketch-Lamborghini/p3.svg">    |   <img src="./assets/Sketch-Lamborghini/p4.svg">    |   <img src="./assets/Sketch-Lamborghini/p5.svg">    |
+**Script:**
+```shell
 python svgdreamer.py x=sketch "prompt='A free-hand drawing of A speeding Lamborghini. black and white drawing.'" neg_prompt='' result_path='./logs/Lamborghini'
+```
+#### Other Styles
+```shell
 # Style: ink and wash
+python svgdreamer.py x=ink "prompt='Big Wild Goose Pagoda. ink style. Minimalist abstract art grayscale watercolor. empty background'" neg_prompt='' result_path='./logs/BigWildGoosePagoda'
 ```
 #### More Cases

assets/Lowpoly-BaldEagle/init_p0.svg ADDED Viewed

assets/Lowpoly-BaldEagle/init_p1.svg ADDED Viewed

assets/Lowpoly-BaldEagle/init_p2.svg ADDED Viewed

assets/Lowpoly-BaldEagle/init_p3.svg ADDED Viewed

assets/Lowpoly-BaldEagle/init_p4.svg ADDED Viewed

assets/Lowpoly-BaldEagle/init_p5.svg ADDED Viewed

assets/Lowpoly-BaldEagle/p0.svg ADDED Viewed

assets/Lowpoly-BaldEagle/p1.svg ADDED Viewed

assets/Lowpoly-BaldEagle/p2.svg ADDED Viewed

assets/Lowpoly-BaldEagle/p3.svg ADDED Viewed

assets/Lowpoly-BaldEagle/p4.svg ADDED Viewed

assets/Lowpoly-BaldEagle/p5.svg ADDED Viewed

assets/Sketch-Lamborghini/init_p0.svg ADDED Viewed

assets/Sketch-Lamborghini/init_p1.svg ADDED Viewed

assets/Sketch-Lamborghini/init_p2.svg ADDED Viewed

assets/Sketch-Lamborghini/init_p3.svg ADDED Viewed

assets/Sketch-Lamborghini/init_p4.svg ADDED Viewed

assets/Sketch-Lamborghini/init_p5.svg ADDED Viewed

assets/Sketch-Lamborghini/p0.svg ADDED Viewed

assets/Sketch-Lamborghini/p1.svg ADDED Viewed

assets/Sketch-Lamborghini/p2.svg ADDED Viewed

assets/Sketch-Lamborghini/p3.svg ADDED Viewed

assets/Sketch-Lamborghini/p4.svg ADDED Viewed

assets/Sketch-Lamborghini/p5.svg ADDED Viewed

assets/post.md CHANGED Viewed

@@ -1,6 +1,7 @@
 🌟 New Research Alert - CVPR 2024! 🌟
 📄 Title: "SVGDreamer: Text-Guided SVG Generation with Diffusion Model"
-📝 Description: Animatable Gaussians - a novel method for creating lifelike human avatars from RGB videos, utilizing 2D CNNs and 3D Gaussian splatting to capture pose-dependent garment details and dynamic appearances with high fidelity.
 👥 Authors: [Ximing Xing](https://ximinng.github.io/), Haitao Zhou, Chuang Wang, [Jing Zhang](https://hellojing89.github.io/), [Dong Xu](https://www.cs.hku.hk/index.php/people/academic-staff/dongxu), and [Qian Yu](https://yuqian1023.github.io/)
 📅 Conference: CVPR, Jun 17-21, 2024 | Seattle WA, USA 🇺🇸
 🔍 Keywords: #SVGDreamer #Text-to-SVG #SVG #Diffusion #CVPR2024

 🌟 New Research Alert - CVPR 2024! 🌟
 📄 Title: "SVGDreamer: Text-Guided SVG Generation with Diffusion Model"
+📝 TL;DR: Given a text prompt, SVGDreamer can generate editable and versatile high-fidelity vector graphics.
+📝 Description: In this work, the authors introduce SVGDreamer, an innovative model for text-guided vector graphics synthesis. SVGDreamer incorporates two crucial technical designs: semantic-driven image vectorization (SIVE) and vectorized particle-based score distillation (VPSD), which empower the model to generate vector graphics with high editability, superior visual quality, and notable diversity.
 👥 Authors: [Ximing Xing](https://ximinng.github.io/), Haitao Zhou, Chuang Wang, [Jing Zhang](https://hellojing89.github.io/), [Dong Xu](https://www.cs.hku.hk/index.php/people/academic-staff/dongxu), and [Qian Yu](https://yuqian1023.github.io/)
 📅 Conference: CVPR, Jun 17-21, 2024 | Seattle WA, USA 🇺🇸
 🔍 Keywords: #SVGDreamer #Text-to-SVG #SVG #Diffusion #CVPR2024

conf/x/ink.yaml CHANGED Viewed

@@ -84,7 +84,7 @@ sive:
     num_iter: 10
 # VPSD primitives
-num_paths: 64 # number of strokes
 trainable_bg: False # set the background to be trainable
 width: 6 # stroke width
 num_segments: 4
@@ -142,7 +142,7 @@ vpsd:
   t_range: [ 0.02, 0.98 ]
   # 'randint': random time steps, this may have a more authentic style.
   # 'max_0.5_900': annealing from 0.98 to 0.5 after 900 steps; this may produce more colorful results.
-  t_schedule: 'randint' # or 'randint'
   # phi model config
   phi_single: False # if False, create a new UNet model to estimate noise
   phi_model: 'lora' # 'lora', 'unet_simple'

     num_iter: 10
 # VPSD primitives
+num_paths: 84 # number of strokes
 trainable_bg: False # set the background to be trainable
 width: 6 # stroke width
 num_segments: 4
   t_range: [ 0.02, 0.98 ]
   # 'randint': random time steps, this may have a more authentic style.
   # 'max_0.5_900': annealing from 0.98 to 0.5 after 900 steps; this may produce more colorful results.
+  t_schedule: 'max_0.5_1000' # or 'randint'
   # phi model config
   phi_single: False # if False, create a new UNet model to estimate noise
   phi_model: 'lora' # 'lora', 'unet_simple'

conf/x/lowpoly.yaml CHANGED Viewed

@@ -135,7 +135,7 @@ vpsd:
   n_particle: 6 # 4, 8, 16
   vsd_n_particle: 4 # the batch size of particles
   particle_aug: False # apply data augmentation to the input particles
-  num_iter: 1500 # total iterations
   guidance_scale: 7.5 # CFG value
   grad_scale: 1.0 # increase or decrease the gradient
   grad_clip_val: ~ # eg: 10, clip the gradient of VPSD

   n_particle: 6 # 4, 8, 16
   vsd_n_particle: 4 # the batch size of particles
   particle_aug: False # apply data augmentation to the input particles
+  num_iter: 2000 # total iterations
   guidance_scale: 7.5 # CFG value
   grad_scale: 1.0 # increase or decrease the gradient
   grad_clip_val: ~ # eg: 10, clip the gradient of VPSD

conf/x/sketch.yaml CHANGED Viewed

@@ -142,7 +142,7 @@ vpsd:
   t_range: [ 0.02, 0.98 ]
   # 'randint': random time steps, this may have a more authentic style.
   # 'max_0.5_900': annealing from 0.98 to 0.5 after 900 steps; this may produce more colorful results.
-  t_schedule: 'randint' # or 'randint'
   # phi model config
   phi_single: False # if False, create a new UNet model to estimate noise
   phi_model: 'lora' # 'lora', 'unet_simple'

   t_range: [ 0.02, 0.98 ]
   # 'randint': random time steps, this may have a more authentic style.
   # 'max_0.5_900': annealing from 0.98 to 0.5 after 900 steps; this may produce more colorful results.
+  t_schedule: 'max_0.5_1300' # or 'randint'
   # phi model config
   phi_single: False # if False, create a new UNet model to estimate noise
   phi_model: 'lora' # 'lora', 'unet_simple'

svgdreamer/svgtools/__init__.py CHANGED Viewed

@@ -3,7 +3,6 @@
 # Copyright (c) 2023, XiMing Xing.
 # License: MIT License
-#from .tff import FONT_LIST
 from .type import is_valid_svg
 from .merge import merge_svg_files
 from .process import delete_empty_path, add_def_tag
@@ -11,6 +10,5 @@ from .process import delete_empty_path, add_def_tag
 __all__ = [
     'is_valid_svg',
     'merge_svg_files',
-#    'FONT_LIST',
     'delete_empty_path', 'add_def_tag'
 ]

 # Copyright (c) 2023, XiMing Xing.
 # License: MIT License
 from .type import is_valid_svg
 from .merge import merge_svg_files
 from .process import delete_empty_path, add_def_tag
 __all__ = [
     'is_valid_svg',
     'merge_svg_files',
     'delete_empty_path', 'add_def_tag'
 ]