infinity1096 committed on
Commit
01e5ffd
·
verified ·
1 Parent(s): 747bf57

Push model using huggingface_hub.

Browse files
Files changed (3) hide show
  1. README.md +4 -41
  2. config.json +144 -0
  3. model.safetensors +3 -0
README.md CHANGED
@@ -2,46 +2,9 @@
2
  tags:
3
  - model_hub_mixin
4
  - pytorch_model_hub_mixin
5
- license: cc-by-nc-4.0
6
- language:
7
- - en
8
- pipeline_tag: other
9
  ---
10
 
11
- <div align="center">
12
- <h1>UFM: A Simple Path towards Unified Dense Correspondence with Flow</h1>
13
-
14
- <a href="https://arxiv.org/abs/0000.00000"><img src="https://img.shields.io/badge/arXiv-2503.11651-b31b1b" alt="arXiv"></a>
15
- <a href="https://uniflowmatch.github.io/"><img src="https://img.shields.io/badge/Project_Page-green" alt="Project Page"></a>
16
- <a href='https://huggingface.co/spaces/infinity1096/UFM'><img src='https://img.shields.io/badge/%F0%9F%A4%97%20Hugging%20Face-Demo-blue'></a>
17
-
18
-
19
- **Carnegie Mellon University**
20
-
21
- [Yuchen Zhang](https://infinity1096.github.io/), [Nikhil Keetha](https://nik-v9.github.io/), [Chenwei Lyu](https://www.linkedin.com/in/chenwei-lyu/), [Bhuvan Jhamb](https://www.linkedin.com/in/bhuvanjhamb/), [Yutian Chen](https://www.yutianchen.blog/about/)
22
- [Yuheng Qiu](https://haleqiu.github.io), [Jay Karhade](https://jaykarhade.github.io/), [Shreyas Jha](https://www.linkedin.com/in/shreyasjha/), [Yaoyu Hu](http://www.huyaoyu.com/)
23
- [Deva Ramanan](https://www.cs.cmu.edu/~deva/), [Sebastian Scherer](https://theairlab.org/team/sebastian/), [Wenshan Wang](http://www.wangwenshan.com/)
24
- </div>
25
-
26
- ## Overview
27
-
28
- UFM (UniFlowMatch) is a simple, end-to-end trained transformer model that directly regresses a pixel displacement image and applies to both optical flow and wide-baseline matching tasks.
29
-
30
- This model space contains the base model (without refinement).
31
-
32
- ## Quick Start
33
-
34
- Check out our [GitHub repo](https://github.com/UniFlowMatch/UFM) and the Hugging Face [demo](https://huggingface.co/spaces/infinity1096/UFM).
35
-
36
-
37
- ## Citation
38
- If you find our repository useful, please consider giving it a star ⭐ and citing our paper in your work:
39
-
40
- ```bibtex
41
- @inproceedings{zhang2025ufm,
42
- title={UFM: A Simple Path towards Unified Dense Correspondence with Flow},
43
- author={Zhang, Yuchen and Keetha, Nikhil and Lyu, Chenwei and Jhamb, Bhuvan and Chen, Yutian and Qiu, Yuheng and Karhade, Jay and Jha, Shreyas and Hu, Yaoyu and Ramanan, Deva and Scherer, Sebastian and Wang, Wenshan},
44
- booktitle={TBD},
45
- year={2025}
46
- }
47
- ```
 
2
  tags:
3
  - model_hub_mixin
4
  - pytorch_model_hub_mixin
 
 
 
 
5
  ---
6
 
7
+ This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
8
+ - Code: [More Information Needed]
9
+ - Paper: [More Information Needed]
10
+ - Docs: [More Information Needed]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
config.json ADDED
@@ -0,0 +1,144 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "adaptors_kwargs": {
3
+ "flow": {
4
+ "class": "FlowAdaptor",
5
+ "kwargs": {
6
+ "base_shape": [
7
+ 224,
8
+ 224
9
+ ],
10
+ "flow_mean": [
11
+ 0.0,
12
+ 0.0
13
+ ],
14
+ "flow_std": [
15
+ 25,
16
+ 25
17
+ ],
18
+ "name": "flow",
19
+ "output_normalized_coordinate": false,
20
+ "scale_strategy": "scale_both"
21
+ }
22
+ }
23
+ },
24
+ "detach_uncertainty_head": false,
25
+ "encoder_kwargs": {
26
+ "data_norm_type": "dinov2",
27
+ "name": "dinov2_encoder",
28
+ "patch_size": 14,
29
+ "size": "large",
30
+ "with_registers": false
31
+ },
32
+ "encoder_str": "dinov2",
33
+ "feature_head_kwargs": {
34
+ "dpt_feature": {
35
+ "feature_dim": 256,
36
+ "hooks": [
37
+ 0,
38
+ 1,
39
+ 2,
40
+ 3
41
+ ],
42
+ "input_feature_dims": [
43
+ 1024,
44
+ 768,
45
+ 768,
46
+ 768
47
+ ],
48
+ "layer_dims": [
49
+ 96,
50
+ 192,
51
+ 384,
52
+ 768
53
+ ],
54
+ "output_width_ratio": 1,
55
+ "patch_size": 14,
56
+ "pretrained_checkpoint_path": null,
57
+ "use_bn": false
58
+ },
59
+ "dpt_processor": {
60
+ "hidden_dims": [
61
+ 128,
62
+ 128
63
+ ],
64
+ "input_feature_dim": 256,
65
+ "output_dim": 2,
66
+ "pretrained_checkpoint_path": null
67
+ }
68
+ },
69
+ "head_type": "dpt",
70
+ "info_sharing_and_head_structure": "dual+single",
71
+ "info_sharing_kwargs": {
72
+ "attn_drop": 0.0,
73
+ "custom_positional_encoding": null,
74
+ "depth": 12,
75
+ "dim": 768,
76
+ "drop_path": 0.0,
77
+ "gradient_checkpointing": false,
78
+ "indices": [
79
+ 5,
80
+ 8
81
+ ],
82
+ "init_values": null,
83
+ "input_embed_dim": 1024,
84
+ "max_num_views": 2,
85
+ "mlp_ratio": 4.0,
86
+ "name": "global_attention",
87
+ "norm_intermediate": true,
88
+ "num_heads": 12,
89
+ "pretrained_checkpoint_path": null,
90
+ "proj_drop": 0.0,
91
+ "qk_norm": false,
92
+ "qkv_bias": true,
93
+ "size": "base",
94
+ "use_rand_idx_pe_for_non_reference_views": false
95
+ },
96
+ "info_sharing_str": "global_attention",
97
+ "pretrained_backbone_checkpoint_path": null,
98
+ "pretrained_checkpoint_path": null,
99
+ "uncertainty_adaptors_kwargs": {
100
+ "non_occluded_mask": {
101
+ "class": "MaskAdaptor",
102
+ "kwargs": {
103
+ "name": "non_occluded_mask"
104
+ }
105
+ }
106
+ },
107
+ "uncertainty_head_kwargs": {
108
+ "dpt_feature": {
109
+ "feature_dim": 256,
110
+ "hooks": [
111
+ 0,
112
+ 1,
113
+ 2,
114
+ 3
115
+ ],
116
+ "input_feature_dims": [
117
+ 1024,
118
+ 768,
119
+ 768,
120
+ 768
121
+ ],
122
+ "layer_dims": [
123
+ 96,
124
+ 192,
125
+ 384,
126
+ 768
127
+ ],
128
+ "output_width_ratio": 1,
129
+ "patch_size": 14,
130
+ "pretrained_checkpoint_path": null,
131
+ "use_bn": false
132
+ },
133
+ "dpt_processor": {
134
+ "hidden_dims": [
135
+ 128,
136
+ 128
137
+ ],
138
+ "input_feature_dim": 256,
139
+ "output_dim": 1,
140
+ "pretrained_checkpoint_path": null
141
+ }
142
+ },
143
+ "uncertainty_head_type": "dpt"
144
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46915ba9c2e022a73e843c5eb2595795ef5932f4c4c975035b6baeaee984e0cb
3
+ size 1713090876