NikV09 committed on
Commit
8da7be0
·
verified ·
1 Parent(s): 510e5ca

Push model using huggingface_hub.

Browse files
Files changed (3) hide show
  1. README.md +10 -3
  2. config.json +191 -0
  3. model.safetensors +3 -0
README.md CHANGED
@@ -1,3 +1,10 @@
1
- ---
2
- license: apache-2.0
3
- ---
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - model_hub_mixin
4
+ - pytorch_model_hub_mixin
5
+ ---
6
+
7
+ This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
8
+ - Code: [More Information Needed]
9
+ - Paper: [More Information Needed]
10
+ - Docs: [More Information Needed]
config.json ADDED
@@ -0,0 +1,191 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "encoder_config": {
3
+ "data_norm_type": "dinov2",
4
+ "encoder_str": "dinov2",
5
+ "gradient_checkpointing": true,
6
+ "name": "dinov2_large",
7
+ "size": "large",
8
+ "torch_hub_force_reload": false,
9
+ "uses_torch_hub": true,
10
+ "with_registers": false
11
+ },
12
+ "geometric_input_config": {
13
+ "cam_prob": 1.0,
14
+ "cam_rot_encoder_config": {
15
+ "enc_embed_dim": 1024,
16
+ "encoder_str": "global_rep_encoder",
17
+ "in_chans": 4,
18
+ "name": "cam_rot_quats_encoder"
19
+ },
20
+ "cam_trans_encoder_config": {
21
+ "enc_embed_dim": 1024,
22
+ "encoder_str": "global_rep_encoder",
23
+ "in_chans": 3,
24
+ "name": "cam_trans_encoder"
25
+ },
26
+ "depth_encoder_config": {
27
+ "apply_pe": false,
28
+ "enc_embed_dim": 1024,
29
+ "encoder_str": "dense_rep_encoder",
30
+ "in_chans": 1,
31
+ "name": "depth_encoder",
32
+ "patch_size": 14
33
+ },
34
+ "depth_prob": 1.0,
35
+ "depth_scale_norm_all_prob": 0.0,
36
+ "dropout_prob": 0.0,
37
+ "overall_prob": 1.0,
38
+ "pose_scale_norm_all_prob": 0.0,
39
+ "ray_dirs_encoder_config": {
40
+ "apply_pe": false,
41
+ "enc_embed_dim": 1024,
42
+ "encoder_str": "dense_rep_encoder",
43
+ "in_chans": 3,
44
+ "name": "ray_dirs_encoder",
45
+ "patch_size": 14
46
+ },
47
+ "ray_dirs_prob": 1.0,
48
+ "scale_encoder_config": {
49
+ "enc_embed_dim": 1024,
50
+ "encoder_str": "global_rep_encoder",
51
+ "in_chans": 1,
52
+ "name": "scale_encoder"
53
+ },
54
+ "sparse_depth_prob": 0.0,
55
+ "sparsification_removal_percent": 0.9
56
+ },
57
+ "info_sharing_config": {
58
+ "custom_positional_encoding": null,
59
+ "model_return_type": "intermediate_features",
60
+ "model_type": "alternating_attention",
61
+ "module_args": {
62
+ "custom_positional_encoding": null,
63
+ "depth": 24,
64
+ "distinguish_ref_and_non_ref_views": true,
65
+ "gradient_checkpointing": false,
66
+ "indices": [
67
+ 11,
68
+ 17
69
+ ],
70
+ "input_embed_dim": 1024,
71
+ "mlp_layer": "dummy",
72
+ "name": "aat_24_layers_ifr",
73
+ "norm_intermediate": true,
74
+ "size": "24_layers"
75
+ }
76
+ },
77
+ "info_sharing_mlp_layer_str": "mlp",
78
+ "load_specific_pretrained_submodules": false,
79
+ "name": "mapanything",
80
+ "pred_head_config": {
81
+ "adaptor_config": {
82
+ "dense_pred_init_dict": {
83
+ "confidence_type": "exp",
84
+ "confidence_vmax": Infinity,
85
+ "confidence_vmin": 1,
86
+ "depth_mode": "exp",
87
+ "depth_vmax": Infinity,
88
+ "depth_vmin": 0,
89
+ "name": "raydirs+depth+pose+confidence+mask+scale",
90
+ "ray_directions_clamp_min_of_z_dir": false,
91
+ "ray_directions_mode": "linear",
92
+ "ray_directions_normalize_to_unit_image_plane": false,
93
+ "ray_directions_normalize_to_unit_sphere": true,
94
+ "ray_directions_vmax": Infinity,
95
+ "ray_directions_vmin": -Infinity,
96
+ "ray_directions_z_dir_min": -Infinity
97
+ },
98
+ "input_dim": 6,
99
+ "pose_pred_init_dict": {
100
+ "cam_trans_mode": "linear",
101
+ "cam_trans_vmax": Infinity,
102
+ "cam_trans_vmin": -Infinity,
103
+ "name": "raydirs+depth+pose+confidence+mask+scale",
104
+ "quaternions_mode": "linear",
105
+ "quaternions_normalize": true,
106
+ "quaternions_vmax": Infinity,
107
+ "quaternions_vmin": -Infinity
108
+ },
109
+ "scale_pred_init_dict": {
110
+ "mode": "exp",
111
+ "name": "raydirs+depth+pose+confidence+mask+scale",
112
+ "vmax": Infinity,
113
+ "vmin": 1e-08
114
+ },
115
+ "scene_rep_dim": 4,
116
+ "scene_rep_type": "raydirs+depth+pose",
117
+ "type": "raydirs+depth+pose+confidence+mask"
118
+ },
119
+ "adaptor_type": "raydirs+depth+pose+confidence+mask",
120
+ "dpt_adaptor": {
121
+ "confidence_type": "exp",
122
+ "confidence_vmax": Infinity,
123
+ "confidence_vmin": 1,
124
+ "depth_mode": "exp",
125
+ "depth_vmax": Infinity,
126
+ "depth_vmin": 0,
127
+ "name": "raydirs+depth+pose+confidence+mask+scale",
128
+ "ray_directions_clamp_min_of_z_dir": false,
129
+ "ray_directions_mode": "linear",
130
+ "ray_directions_normalize_to_unit_image_plane": false,
131
+ "ray_directions_normalize_to_unit_sphere": true,
132
+ "ray_directions_vmax": Infinity,
133
+ "ray_directions_vmin": -Infinity,
134
+ "ray_directions_z_dir_min": -Infinity
135
+ },
136
+ "feature_head": {
137
+ "checkpoint_gradient": false,
138
+ "feature_dim": 256,
139
+ "hooks": [
140
+ 0,
141
+ 1,
142
+ 2,
143
+ 3
144
+ ],
145
+ "input_feature_dims": [
146
+ 1024,
147
+ 768,
148
+ 768,
149
+ 768
150
+ ],
151
+ "patch_size": 14
152
+ },
153
+ "gradient_checkpointing": false,
154
+ "pose_adaptor": {
155
+ "cam_trans_mode": "linear",
156
+ "cam_trans_vmax": Infinity,
157
+ "cam_trans_vmin": -Infinity,
158
+ "name": "raydirs+depth+pose+confidence+mask+scale",
159
+ "quaternions_mode": "linear",
160
+ "quaternions_normalize": true,
161
+ "quaternions_vmax": Infinity,
162
+ "quaternions_vmin": -Infinity
163
+ },
164
+ "pose_head": {
165
+ "input_feature_dim": 768,
166
+ "num_resconv_block": 2,
167
+ "patch_size": 14,
168
+ "rot_representation_dim": 4
169
+ },
170
+ "regressor_head": {
171
+ "checkpoint_gradient": false,
172
+ "input_feature_dim": 256,
173
+ "output_dim": 6
174
+ },
175
+ "scale_adaptor": {
176
+ "mode": "exp",
177
+ "name": "raydirs+depth+pose+confidence+mask+scale",
178
+ "vmax": Infinity,
179
+ "vmin": 1e-08
180
+ },
181
+ "scale_head": {
182
+ "input_feature_dim": 768,
183
+ "output_dim": 1
184
+ },
185
+ "type": "dpt+pose"
186
+ },
187
+ "pretrained_checkpoint_path": null,
188
+ "specific_pretrained_submodules": [],
189
+ "torch_hub_force_reload": false,
190
+ "use_register_tokens_from_encoder": false
191
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c77ba70391067e4a8e525117a2cafdfe34605130d04edd213ed429630ab82283
3
+ size 2253444224