facebook
/

map-anything-apache-v1

+---
+tags:
+- model_hub_mixin
+- pytorch_model_hub_mixin
+---
+This model has been pushed to the Hub using the [PytorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
+- Code: [More Information Needed]
+- Paper: [More Information Needed]
+- Docs: [More Information Needed]

config.json ADDED Viewed

	@@ -0,0 +1,191 @@

+{
+  "encoder_config": {
+    "data_norm_type": "dinov2",
+    "encoder_str": "dinov2",
+    "gradient_checkpointing": true,
+    "name": "dinov2_large",
+    "size": "large",
+    "torch_hub_force_reload": false,
+    "uses_torch_hub": true,
+    "with_registers": false
+  },
+  "geometric_input_config": {
+    "cam_prob": 1.0,
+    "cam_rot_encoder_config": {
+      "enc_embed_dim": 1024,
+      "encoder_str": "global_rep_encoder",
+      "in_chans": 4,
+      "name": "cam_rot_quats_encoder"
+    },
+    "cam_trans_encoder_config": {
+      "enc_embed_dim": 1024,
+      "encoder_str": "global_rep_encoder",
+      "in_chans": 3,
+      "name": "cam_trans_encoder"
+    },
+    "depth_encoder_config": {
+      "apply_pe": false,
+      "enc_embed_dim": 1024,
+      "encoder_str": "dense_rep_encoder",
+      "in_chans": 1,
+      "name": "depth_encoder",
+      "patch_size": 14
+    },
+    "depth_prob": 1.0,
+    "depth_scale_norm_all_prob": 0.0,
+    "dropout_prob": 0.0,
+    "overall_prob": 1.0,
+    "pose_scale_norm_all_prob": 0.0,
+    "ray_dirs_encoder_config": {
+      "apply_pe": false,
+      "enc_embed_dim": 1024,
+      "encoder_str": "dense_rep_encoder",
+      "in_chans": 3,
+      "name": "ray_dirs_encoder",
+      "patch_size": 14
+    },
+    "ray_dirs_prob": 1.0,
+    "scale_encoder_config": {
+      "enc_embed_dim": 1024,
+      "encoder_str": "global_rep_encoder",
+      "in_chans": 1,
+      "name": "scale_encoder"
+    },
+    "sparse_depth_prob": 0.0,
+    "sparsification_removal_percent": 0.9
+  },
+  "info_sharing_config": {
+    "custom_positional_encoding": null,
+    "model_return_type": "intermediate_features",
+    "model_type": "alternating_attention",
+    "module_args": {
+      "custom_positional_encoding": null,
+      "depth": 24,
+      "distinguish_ref_and_non_ref_views": true,
+      "gradient_checkpointing": false,
+      "indices": [
+        11,
+        17
+      ],
+      "input_embed_dim": 1024,
+      "mlp_layer": "dummy",
+      "name": "aat_24_layers_ifr",
+      "norm_intermediate": true,
+      "size": "24_layers"
+    }
+  },
+  "info_sharing_mlp_layer_str": "mlp",
+  "load_specific_pretrained_submodules": false,
+  "name": "mapanything",
+  "pred_head_config": {
+    "adaptor_config": {
+      "dense_pred_init_dict": {
+        "confidence_type": "exp",
+        "confidence_vmax": Infinity,
+        "confidence_vmin": 1,
+        "depth_mode": "exp",
+        "depth_vmax": Infinity,
+        "depth_vmin": 0,
+        "name": "raydirs+depth+pose+confidence+mask+scale",
+        "ray_directions_clamp_min_of_z_dir": false,
+        "ray_directions_mode": "linear",
+        "ray_directions_normalize_to_unit_image_plane": false,
+        "ray_directions_normalize_to_unit_sphere": true,
+        "ray_directions_vmax": Infinity,
+        "ray_directions_vmin": -Infinity,
+        "ray_directions_z_dir_min": -Infinity
+      },
+      "input_dim": 6,
+      "pose_pred_init_dict": {
+        "cam_trans_mode": "linear",
+        "cam_trans_vmax": Infinity,
+        "cam_trans_vmin": -Infinity,
+        "name": "raydirs+depth+pose+confidence+mask+scale",
+        "quaternions_mode": "linear",
+        "quaternions_normalize": true,
+        "quaternions_vmax": Infinity,
+        "quaternions_vmin": -Infinity
+      },
+      "scale_pred_init_dict": {
+        "mode": "exp",
+        "name": "raydirs+depth+pose+confidence+mask+scale",
+        "vmax": Infinity,
+        "vmin": 1e-08
+      },
+      "scene_rep_dim": 4,
+      "scene_rep_type": "raydirs+depth+pose",
+      "type": "raydirs+depth+pose+confidence+mask"
+    },
+    "adaptor_type": "raydirs+depth+pose+confidence+mask",
+    "dpt_adaptor": {
+      "confidence_type": "exp",
+      "confidence_vmax": Infinity,
+      "confidence_vmin": 1,
+      "depth_mode": "exp",
+      "depth_vmax": Infinity,
+      "depth_vmin": 0,
+      "name": "raydirs+depth+pose+confidence+mask+scale",
+      "ray_directions_clamp_min_of_z_dir": false,
+      "ray_directions_mode": "linear",
+      "ray_directions_normalize_to_unit_image_plane": false,
+      "ray_directions_normalize_to_unit_sphere": true,
+      "ray_directions_vmax": Infinity,
+      "ray_directions_vmin": -Infinity,
+      "ray_directions_z_dir_min": -Infinity
+    },
+    "feature_head": {
+      "checkpoint_gradient": false,
+      "feature_dim": 256,
+      "hooks": [
+        0,
+        1,
+        2,
+        3
+      ],
+      "input_feature_dims": [
+        1024,
+        768,
+        768,
+        768
+      ],
+      "patch_size": 14
+    },
+    "gradient_checkpointing": false,
+    "pose_adaptor": {
+      "cam_trans_mode": "linear",
+      "cam_trans_vmax": Infinity,
+      "cam_trans_vmin": -Infinity,
+      "name": "raydirs+depth+pose+confidence+mask+scale",
+      "quaternions_mode": "linear",
+      "quaternions_normalize": true,
+      "quaternions_vmax": Infinity,
+      "quaternions_vmin": -Infinity
+    },
+    "pose_head": {
+      "input_feature_dim": 768,
+      "num_resconv_block": 2,
+      "patch_size": 14,
+      "rot_representation_dim": 4
+    },
+    "regressor_head": {
+      "checkpoint_gradient": false,
+      "input_feature_dim": 256,
+      "output_dim": 6
+    },
+    "scale_adaptor": {
+      "mode": "exp",
+      "name": "raydirs+depth+pose+confidence+mask+scale",
+      "vmax": Infinity,
+      "vmin": 1e-08
+    },
+    "scale_head": {
+      "input_feature_dim": 768,
+      "output_dim": 1
+    },
+    "type": "dpt+pose"
+  },
+  "pretrained_checkpoint_path": null,
+  "specific_pretrained_submodules": [],
+  "torch_hub_force_reload": false,
+  "use_register_tokens_from_encoder": false
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c77ba70391067e4a8e525117a2cafdfe34605130d04edd213ed429630ab82283
+size 2253444224