vismatch 1.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (2042) hide show
  1. vismatch/TEMPLATE.py +101 -0
  2. vismatch/__init__.py +475 -0
  3. vismatch/assets/example_pairs/false_positive/chartres.jpg +0 -0
  4. vismatch/assets/example_pairs/false_positive/notre_dame.jpg +0 -0
  5. vismatch/assets/example_pairs/fresco/fsm.jpg +0 -0
  6. vismatch/assets/example_pairs/fresco/sist_chapel.jpg +0 -0
  7. vismatch/assets/example_pairs/indoor/gcs_close.jpg +0 -0
  8. vismatch/assets/example_pairs/indoor/gcs_far.jpg +0 -0
  9. vismatch/assets/example_pairs/outdoor/montmartre_close.jpg +0 -0
  10. vismatch/assets/example_pairs/outdoor/montmartre_far.jpg +0 -0
  11. vismatch/assets/example_pairs/sat2iss/photo_from_iss.jpg +0 -0
  12. vismatch/assets/example_pairs/sat2iss/satellite_img.jpg +0 -0
  13. vismatch/assets/example_pairs/sphereglue/barbershop-00000000.jpg +0 -0
  14. vismatch/assets/example_pairs/sphereglue/barbershop-00000001.jpg +0 -0
  15. vismatch/assets/example_pairs/thermal/thermal.jpg +0 -0
  16. vismatch/assets/example_pairs/thermal/visible.jpg +0 -0
  17. vismatch/assets/example_test/original.jpg +0 -0
  18. vismatch/assets/example_test/warped.jpg +0 -0
  19. vismatch/base_matcher.py +242 -0
  20. vismatch/im_models/__init__.py +0 -0
  21. vismatch/im_models/aff_steerers.py +143 -0
  22. vismatch/im_models/aspanformer.py +74 -0
  23. vismatch/im_models/dedode.py +150 -0
  24. vismatch/im_models/duster.py +104 -0
  25. vismatch/im_models/edm.py +64 -0
  26. vismatch/im_models/efficient_loftr.py +60 -0
  27. vismatch/im_models/gim.py +187 -0
  28. vismatch/im_models/handcrafted.py +81 -0
  29. vismatch/im_models/keypt2subpx.py +154 -0
  30. vismatch/im_models/kornia.py +72 -0
  31. vismatch/im_models/liftfeat.py +44 -0
  32. vismatch/im_models/lightglue.py +75 -0
  33. vismatch/im_models/lisrd.py +98 -0
  34. vismatch/im_models/loftr.py +23 -0
  35. vismatch/im_models/master.py +107 -0
  36. vismatch/im_models/matchanything.py +221 -0
  37. vismatch/im_models/matchformer.py +61 -0
  38. vismatch/im_models/matching_toolbox.py +238 -0
  39. vismatch/im_models/minima.py +164 -0
  40. vismatch/im_models/omniglue.py +91 -0
  41. vismatch/im_models/rdd.py +250 -0
  42. vismatch/im_models/ripe.py +55 -0
  43. vismatch/im_models/roma.py +92 -0
  44. vismatch/im_models/romav2.py +62 -0
  45. vismatch/im_models/se2loftr.py +71 -0
  46. vismatch/im_models/silk.py +405 -0
  47. vismatch/im_models/sphereglue.py +97 -0
  48. vismatch/im_models/steerers.py +140 -0
  49. vismatch/im_models/topicfm.py +93 -0
  50. vismatch/im_models/ufm.py +57 -0
  51. vismatch/im_models/xfeat.py +78 -0
  52. vismatch/im_models/xfeat_steerers.py +151 -0
  53. vismatch/im_models/xoftr.py +71 -0
  54. vismatch/third_party/DeDoDe/DeDoDe/__init__.py +2 -0
  55. vismatch/third_party/DeDoDe/DeDoDe/benchmarks/__init__.py +4 -0
  56. vismatch/third_party/DeDoDe/DeDoDe/benchmarks/mega_pose_est.py +114 -0
  57. vismatch/third_party/DeDoDe/DeDoDe/benchmarks/mega_pose_est_mnn.py +119 -0
  58. vismatch/third_party/DeDoDe/DeDoDe/benchmarks/nll_benchmark.py +57 -0
  59. vismatch/third_party/DeDoDe/DeDoDe/benchmarks/num_inliers.py +76 -0
  60. vismatch/third_party/DeDoDe/DeDoDe/checkpoint.py +59 -0
  61. vismatch/third_party/DeDoDe/DeDoDe/datasets/__init__.py +0 -0
  62. vismatch/third_party/DeDoDe/DeDoDe/datasets/megadepth.py +269 -0
  63. vismatch/third_party/DeDoDe/DeDoDe/decoder.py +90 -0
  64. vismatch/third_party/DeDoDe/DeDoDe/descriptors/__init__.py +0 -0
  65. vismatch/third_party/DeDoDe/DeDoDe/descriptors/dedode_descriptor.py +50 -0
  66. vismatch/third_party/DeDoDe/DeDoDe/descriptors/descriptor_loss.py +68 -0
  67. vismatch/third_party/DeDoDe/DeDoDe/detectors/__init__.py +0 -0
  68. vismatch/third_party/DeDoDe/DeDoDe/detectors/dedode_detector.py +76 -0
  69. vismatch/third_party/DeDoDe/DeDoDe/detectors/keypoint_loss.py +185 -0
  70. vismatch/third_party/DeDoDe/DeDoDe/encoder.py +87 -0
  71. vismatch/third_party/DeDoDe/DeDoDe/matchers/__init__.py +0 -0
  72. vismatch/third_party/DeDoDe/DeDoDe/matchers/dual_softmax_matcher.py +38 -0
  73. vismatch/third_party/DeDoDe/DeDoDe/model_zoo/__init__.py +3 -0
  74. vismatch/third_party/DeDoDe/DeDoDe/model_zoo/dedode_models.py +249 -0
  75. vismatch/third_party/DeDoDe/DeDoDe/train.py +76 -0
  76. vismatch/third_party/DeDoDe/DeDoDe/transformer/__init__.py +8 -0
  77. vismatch/third_party/DeDoDe/DeDoDe/transformer/dinov2.py +359 -0
  78. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/__init__.py +12 -0
  79. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/attention.py +81 -0
  80. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/block.py +252 -0
  81. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/dino_head.py +59 -0
  82. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/drop_path.py +35 -0
  83. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/layer_scale.py +28 -0
  84. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/mlp.py +41 -0
  85. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/patch_embed.py +89 -0
  86. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/swiglu_ffn.py +63 -0
  87. vismatch/third_party/DeDoDe/DeDoDe/utils.py +717 -0
  88. vismatch/third_party/DeDoDe/data_prep/prep_keypoints.py +103 -0
  89. vismatch/third_party/DeDoDe/demo/demo_kpts.py +24 -0
  90. vismatch/third_party/DeDoDe/demo/demo_match.py +46 -0
  91. vismatch/third_party/DeDoDe/demo/demo_match_dedode_G.py +45 -0
  92. vismatch/third_party/DeDoDe/demo/demo_scoremap.py +23 -0
  93. vismatch/third_party/DeDoDe/experiments/dedode_descriptor-B.py +135 -0
  94. vismatch/third_party/DeDoDe/experiments/dedode_descriptor-G.py +145 -0
  95. vismatch/third_party/DeDoDe/experiments/dedode_detector.py +126 -0
  96. vismatch/third_party/DeDoDe/experiments/eval/eval_dedode_descriptor-B.py +38 -0
  97. vismatch/third_party/DeDoDe/experiments/eval/eval_dedode_descriptor-G.py +38 -0
  98. vismatch/third_party/DeDoDe/setup.py +11 -0
  99. vismatch/third_party/EDM/configs/data/__init__.py +0 -0
  100. vismatch/third_party/EDM/configs/data/base.py +37 -0
  101. vismatch/third_party/EDM/configs/data/megadepth_test_1500.py +23 -0
  102. vismatch/third_party/EDM/configs/data/megadepth_trainval_832.py +32 -0
  103. vismatch/third_party/EDM/configs/data/scannet_test_1500.py +24 -0
  104. vismatch/third_party/EDM/configs/data/scannet_trainval.py +31 -0
  105. vismatch/third_party/EDM/configs/edm/indoor/edm_base.py +15 -0
  106. vismatch/third_party/EDM/configs/edm/outdoor/edm_base.py +17 -0
  107. vismatch/third_party/EDM/deploy/export_onnx.py +69 -0
  108. vismatch/third_party/EDM/deploy/run_onnx.py +138 -0
  109. vismatch/third_party/EDM/runtime_single_pair.py +73 -0
  110. vismatch/third_party/EDM/src/__init__.py +0 -0
  111. vismatch/third_party/EDM/src/config/default.py +184 -0
  112. vismatch/third_party/EDM/src/datasets/megadepth.py +164 -0
  113. vismatch/third_party/EDM/src/datasets/sampler.py +95 -0
  114. vismatch/third_party/EDM/src/datasets/scannet.py +147 -0
  115. vismatch/third_party/EDM/src/edm/__init__.py +2 -0
  116. vismatch/third_party/EDM/src/edm/backbone/resnet.py +116 -0
  117. vismatch/third_party/EDM/src/edm/edm.py +204 -0
  118. vismatch/third_party/EDM/src/edm/head/coarse_matching.py +158 -0
  119. vismatch/third_party/EDM/src/edm/head/fine_matching.py +383 -0
  120. vismatch/third_party/EDM/src/edm/neck/__init__.py +1 -0
  121. vismatch/third_party/EDM/src/edm/neck/loftr_module/__init__.py +1 -0
  122. vismatch/third_party/EDM/src/edm/neck/loftr_module/transformer.py +418 -0
  123. vismatch/third_party/EDM/src/edm/neck/neck.py +156 -0
  124. vismatch/third_party/EDM/src/edm/utils/geometry.py +58 -0
  125. vismatch/third_party/EDM/src/edm/utils/supervision.py +255 -0
  126. vismatch/third_party/EDM/src/lightning/data.py +450 -0
  127. vismatch/third_party/EDM/src/lightning/lightning_edm.py +379 -0
  128. vismatch/third_party/EDM/src/losses/edm_loss.py +206 -0
  129. vismatch/third_party/EDM/src/optimizers/__init__.py +57 -0
  130. vismatch/third_party/EDM/src/utils/augment.py +65 -0
  131. vismatch/third_party/EDM/src/utils/comm.py +271 -0
  132. vismatch/third_party/EDM/src/utils/dataloader.py +24 -0
  133. vismatch/third_party/EDM/src/utils/dataset.py +192 -0
  134. vismatch/third_party/EDM/src/utils/metrics.py +299 -0
  135. vismatch/third_party/EDM/src/utils/misc.py +113 -0
  136. vismatch/third_party/EDM/src/utils/plotting.py +186 -0
  137. vismatch/third_party/EDM/src/utils/profiler.py +40 -0
  138. vismatch/third_party/EDM/src/utils/warppers.py +428 -0
  139. vismatch/third_party/EDM/src/utils/warppers_utils.py +172 -0
  140. vismatch/third_party/EDM/test.py +132 -0
  141. vismatch/third_party/EDM/train.py +156 -0
  142. vismatch/third_party/EfficientLoFTR/configs/data/__init__.py +0 -0
  143. vismatch/third_party/EfficientLoFTR/configs/data/base.py +35 -0
  144. vismatch/third_party/EfficientLoFTR/configs/data/megadepth_test_1500.py +13 -0
  145. vismatch/third_party/EfficientLoFTR/configs/data/megadepth_trainval_832.py +24 -0
  146. vismatch/third_party/EfficientLoFTR/configs/data/scannet_test_1500.py +16 -0
  147. vismatch/third_party/EfficientLoFTR/configs/loftr/eloftr_full.py +36 -0
  148. vismatch/third_party/EfficientLoFTR/configs/loftr/eloftr_optimized.py +37 -0
  149. vismatch/third_party/EfficientLoFTR/src/__init__.py +0 -0
  150. vismatch/third_party/EfficientLoFTR/src/config/default.py +182 -0
  151. vismatch/third_party/EfficientLoFTR/src/datasets/megadepth.py +133 -0
  152. vismatch/third_party/EfficientLoFTR/src/datasets/sampler.py +77 -0
  153. vismatch/third_party/EfficientLoFTR/src/datasets/scannet.py +129 -0
  154. vismatch/third_party/EfficientLoFTR/src/lightning/data.py +357 -0
  155. vismatch/third_party/EfficientLoFTR/src/lightning/lightning_loftr.py +272 -0
  156. vismatch/third_party/EfficientLoFTR/src/loftr/__init__.py +4 -0
  157. vismatch/third_party/EfficientLoFTR/src/loftr/backbone/__init__.py +11 -0
  158. vismatch/third_party/EfficientLoFTR/src/loftr/backbone/backbone.py +37 -0
  159. vismatch/third_party/EfficientLoFTR/src/loftr/backbone/repvgg.py +224 -0
  160. vismatch/third_party/EfficientLoFTR/src/loftr/loftr.py +124 -0
  161. vismatch/third_party/EfficientLoFTR/src/loftr/loftr_module/__init__.py +2 -0
  162. vismatch/third_party/EfficientLoFTR/src/loftr/loftr_module/fine_preprocess.py +112 -0
  163. vismatch/third_party/EfficientLoFTR/src/loftr/loftr_module/linear_attention.py +103 -0
  164. vismatch/third_party/EfficientLoFTR/src/loftr/loftr_module/transformer.py +164 -0
  165. vismatch/third_party/EfficientLoFTR/src/loftr/utils/coarse_matching.py +241 -0
  166. vismatch/third_party/EfficientLoFTR/src/loftr/utils/fine_matching.py +156 -0
  167. vismatch/third_party/EfficientLoFTR/src/loftr/utils/full_config.py +50 -0
  168. vismatch/third_party/EfficientLoFTR/src/loftr/utils/geometry.py +54 -0
  169. vismatch/third_party/EfficientLoFTR/src/loftr/utils/opt_config.py +50 -0
  170. vismatch/third_party/EfficientLoFTR/src/loftr/utils/position_encoding.py +50 -0
  171. vismatch/third_party/EfficientLoFTR/src/loftr/utils/supervision.py +275 -0
  172. vismatch/third_party/EfficientLoFTR/src/losses/loftr_loss.py +229 -0
  173. vismatch/third_party/EfficientLoFTR/src/optimizers/__init__.py +42 -0
  174. vismatch/third_party/EfficientLoFTR/src/utils/augment.py +55 -0
  175. vismatch/third_party/EfficientLoFTR/src/utils/comm.py +265 -0
  176. vismatch/third_party/EfficientLoFTR/src/utils/dataloader.py +23 -0
  177. vismatch/third_party/EfficientLoFTR/src/utils/dataset.py +186 -0
  178. vismatch/third_party/EfficientLoFTR/src/utils/metrics.py +264 -0
  179. vismatch/third_party/EfficientLoFTR/src/utils/misc.py +106 -0
  180. vismatch/third_party/EfficientLoFTR/src/utils/plotting.py +154 -0
  181. vismatch/third_party/EfficientLoFTR/src/utils/profiler.py +39 -0
  182. vismatch/third_party/EfficientLoFTR/src/utils/warppers.py +426 -0
  183. vismatch/third_party/EfficientLoFTR/src/utils/warppers_utils.py +171 -0
  184. vismatch/third_party/EfficientLoFTR/test.py +143 -0
  185. vismatch/third_party/EfficientLoFTR/train.py +154 -0
  186. vismatch/third_party/LISRD/lisrd/__init__.py +0 -0
  187. vismatch/third_party/LISRD/lisrd/datasets/__init__.py +7 -0
  188. vismatch/third_party/LISRD/lisrd/datasets/base_dataset.py +38 -0
  189. vismatch/third_party/LISRD/lisrd/datasets/coco.py +148 -0
  190. vismatch/third_party/LISRD/lisrd/datasets/flashes.py +170 -0
  191. vismatch/third_party/LISRD/lisrd/datasets/hpatches.py +135 -0
  192. vismatch/third_party/LISRD/lisrd/datasets/mixed_dataset.py +53 -0
  193. vismatch/third_party/LISRD/lisrd/datasets/rdnim.py +117 -0
  194. vismatch/third_party/LISRD/lisrd/datasets/utils/data_augmentation.py +168 -0
  195. vismatch/third_party/LISRD/lisrd/datasets/utils/data_reader.py +48 -0
  196. vismatch/third_party/LISRD/lisrd/datasets/utils/homographies.py +215 -0
  197. vismatch/third_party/LISRD/lisrd/datasets/vidit.py +152 -0
  198. vismatch/third_party/LISRD/lisrd/evaluation/__init__.py +0 -0
  199. vismatch/third_party/LISRD/lisrd/evaluation/descriptor_evaluation.py +142 -0
  200. vismatch/third_party/LISRD/lisrd/experiment.py +129 -0
  201. vismatch/third_party/LISRD/lisrd/export_features.py +148 -0
  202. vismatch/third_party/LISRD/lisrd/models/__init__.py +7 -0
  203. vismatch/third_party/LISRD/lisrd/models/backbones/__init__.py +0 -0
  204. vismatch/third_party/LISRD/lisrd/models/backbones/net_vlad.py +62 -0
  205. vismatch/third_party/LISRD/lisrd/models/backbones/vgg.py +46 -0
  206. vismatch/third_party/LISRD/lisrd/models/base_model.py +336 -0
  207. vismatch/third_party/LISRD/lisrd/models/keypoint_detectors.py +34 -0
  208. vismatch/third_party/LISRD/lisrd/models/lisrd.py +328 -0
  209. vismatch/third_party/LISRD/lisrd/models/lisrd_sift.py +289 -0
  210. vismatch/third_party/LISRD/lisrd/third_party/super_point_magic_leap/demo_superpoint.py +734 -0
  211. vismatch/third_party/LISRD/lisrd/utils/geometry_utils.py +123 -0
  212. vismatch/third_party/LISRD/lisrd/utils/losses.py +191 -0
  213. vismatch/third_party/LISRD/lisrd/utils/metrics.py +66 -0
  214. vismatch/third_party/LISRD/lisrd/utils/pytorch_utils.py +14 -0
  215. vismatch/third_party/LISRD/lisrd/utils/stdout_capturing.py +81 -0
  216. vismatch/third_party/LISRD/notebooks/utils.py +103 -0
  217. vismatch/third_party/LISRD/setup.py +4 -0
  218. vismatch/third_party/LiftFeat/dataset/__init__.py +0 -0
  219. vismatch/third_party/LiftFeat/dataset/coco_augmentor.py +298 -0
  220. vismatch/third_party/LiftFeat/dataset/coco_wrapper.py +175 -0
  221. vismatch/third_party/LiftFeat/dataset/dataset_utils.py +183 -0
  222. vismatch/third_party/LiftFeat/dataset/megadepth.py +177 -0
  223. vismatch/third_party/LiftFeat/dataset/megadepth_wrapper.py +167 -0
  224. vismatch/third_party/LiftFeat/demo.py +116 -0
  225. vismatch/third_party/LiftFeat/evaluation/HPatch_evaluation.py +182 -0
  226. vismatch/third_party/LiftFeat/evaluation/MegaDepth1500_evaluation.py +105 -0
  227. vismatch/third_party/LiftFeat/evaluation/eval_utils.py +127 -0
  228. vismatch/third_party/LiftFeat/loss/loss.py +291 -0
  229. vismatch/third_party/LiftFeat/models/interpolator.py +34 -0
  230. vismatch/third_party/LiftFeat/models/liftfeat_wrapper.py +172 -0
  231. vismatch/third_party/LiftFeat/models/model.py +419 -0
  232. vismatch/third_party/LiftFeat/tools/demo_match_video.py +145 -0
  233. vismatch/third_party/LiftFeat/tools/demo_vo.py +163 -0
  234. vismatch/third_party/LiftFeat/train.py +369 -0
  235. vismatch/third_party/LiftFeat/utils/VisualOdometry.py +339 -0
  236. vismatch/third_party/LiftFeat/utils/__init__.py +0 -0
  237. vismatch/third_party/LiftFeat/utils/alike_wrapper.py +45 -0
  238. vismatch/third_party/LiftFeat/utils/config.py +16 -0
  239. vismatch/third_party/LiftFeat/utils/depth_anything_wrapper.py +150 -0
  240. vismatch/third_party/LiftFeat/utils/featurebooster.py +247 -0
  241. vismatch/third_party/LiftFeat/utils/post_process.py +21 -0
  242. vismatch/third_party/LightGlue/benchmark.py +255 -0
  243. vismatch/third_party/LightGlue/lightglue/__init__.py +7 -0
  244. vismatch/third_party/LightGlue/lightglue/aliked.py +760 -0
  245. vismatch/third_party/LightGlue/lightglue/disk.py +55 -0
  246. vismatch/third_party/LightGlue/lightglue/dog_hardnet.py +41 -0
  247. vismatch/third_party/LightGlue/lightglue/lightglue.py +662 -0
  248. vismatch/third_party/LightGlue/lightglue/sift.py +216 -0
  249. vismatch/third_party/LightGlue/lightglue/superpoint.py +227 -0
  250. vismatch/third_party/LightGlue/lightglue/utils.py +165 -0
  251. vismatch/third_party/LightGlue/lightglue/viz2d.py +203 -0
  252. vismatch/third_party/MINIMA/demo.py +201 -0
  253. vismatch/third_party/MINIMA/src/__init__.py +0 -0
  254. vismatch/third_party/MINIMA/src/config/default.py +203 -0
  255. vismatch/third_party/MINIMA/src/config/default_for_megadepth_dense.py +203 -0
  256. vismatch/third_party/MINIMA/src/config/default_for_megadepth_sparse.py +203 -0
  257. vismatch/third_party/MINIMA/src/utils/__init__.py +0 -0
  258. vismatch/third_party/MINIMA/src/utils/culculate_auc.py +28 -0
  259. vismatch/third_party/MINIMA/src/utils/data_io.py +156 -0
  260. vismatch/third_party/MINIMA/src/utils/data_io_loftr.py +152 -0
  261. vismatch/third_party/MINIMA/src/utils/data_io_roma.py +186 -0
  262. vismatch/third_party/MINIMA/src/utils/data_io_sp_lg.py +158 -0
  263. vismatch/third_party/MINIMA/src/utils/load_model.py +164 -0
  264. vismatch/third_party/MINIMA/src/utils/metrics.py +214 -0
  265. vismatch/third_party/MINIMA/src/utils/misc.py +101 -0
  266. vismatch/third_party/MINIMA/src/utils/plotting.py +291 -0
  267. vismatch/third_party/MINIMA/src/utils/sample_h.py +142 -0
  268. vismatch/third_party/MINIMA/test_relative_homo_depth.py +683 -0
  269. vismatch/third_party/MINIMA/test_relative_homo_event.py +722 -0
  270. vismatch/third_party/MINIMA/test_relative_homo_mmim.py +669 -0
  271. vismatch/third_party/MINIMA/test_relative_pose_infrared.py +500 -0
  272. vismatch/third_party/MINIMA/test_relative_pose_mega_1500.py +487 -0
  273. vismatch/third_party/MINIMA/test_relative_pose_mega_1500_syn.py +516 -0
  274. vismatch/third_party/MINIMA/third_party/LightGlue/benchmark.py +255 -0
  275. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/__init__.py +7 -0
  276. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/aliked.py +758 -0
  277. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/disk.py +55 -0
  278. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/dog_hardnet.py +41 -0
  279. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/lightglue.py +655 -0
  280. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/sift.py +216 -0
  281. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/superpoint.py +227 -0
  282. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/utils.py +165 -0
  283. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/viz2d.py +184 -0
  284. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/__init__.py +0 -0
  285. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/base.py +35 -0
  286. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/megadepth_test_1500.py +11 -0
  287. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/megadepth_trainval_640.py +22 -0
  288. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/megadepth_trainval_840.py +22 -0
  289. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/scannet_test_1500.py +11 -0
  290. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/scannet_trainval.py +17 -0
  291. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ds.py +6 -0
  292. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ds_dense.py +8 -0
  293. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ot.py +6 -0
  294. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ot_dense.py +8 -0
  295. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/loftr_ds.py +5 -0
  296. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/loftr_ds_dense.py +7 -0
  297. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/loftr_ot.py +5 -0
  298. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/loftr_ot_dense.py +7 -0
  299. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/scannet/loftr_ds_eval.py +16 -0
  300. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/scannet/loftr_ds_eval_new.py +18 -0
  301. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ds.py +16 -0
  302. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ds_dense.py +17 -0
  303. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ot.py +16 -0
  304. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ot_dense.py +17 -0
  305. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/loftr_ds.py +15 -0
  306. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/loftr_ds_dense.py +16 -0
  307. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/loftr_ot.py +15 -0
  308. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/loftr_ot_dense.py +16 -0
  309. vismatch/third_party/MINIMA/third_party/LoFTR/demo/demo_loftr.py +240 -0
  310. vismatch/third_party/MINIMA/third_party/LoFTR/src/__init__.py +0 -0
  311. vismatch/third_party/MINIMA/third_party/LoFTR/src/config/default.py +171 -0
  312. vismatch/third_party/MINIMA/third_party/LoFTR/src/datasets/megadepth.py +127 -0
  313. vismatch/third_party/MINIMA/third_party/LoFTR/src/datasets/sampler.py +77 -0
  314. vismatch/third_party/MINIMA/third_party/LoFTR/src/datasets/scannet.py +114 -0
  315. vismatch/third_party/MINIMA/third_party/LoFTR/src/lightning/data.py +320 -0
  316. vismatch/third_party/MINIMA/third_party/LoFTR/src/lightning/lightning_loftr.py +249 -0
  317. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/__init__.py +2 -0
  318. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/backbone/__init__.py +11 -0
  319. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/backbone/resnet_fpn.py +199 -0
  320. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/loftr.py +81 -0
  321. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/loftr_module/__init__.py +2 -0
  322. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/loftr_module/fine_preprocess.py +59 -0
  323. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/loftr_module/linear_attention.py +81 -0
  324. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/loftr_module/transformer.py +101 -0
  325. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/utils/coarse_matching.py +261 -0
  326. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/utils/cvpr_ds_config.py +50 -0
  327. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/utils/fine_matching.py +74 -0
  328. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/utils/geometry.py +54 -0
  329. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/utils/position_encoding.py +42 -0
  330. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/utils/supervision.py +151 -0
  331. vismatch/third_party/MINIMA/third_party/LoFTR/src/losses/loftr_loss.py +192 -0
  332. vismatch/third_party/MINIMA/third_party/LoFTR/src/optimizers/__init__.py +42 -0
  333. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/augment.py +55 -0
  334. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/comm.py +265 -0
  335. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/dataloader.py +23 -0
  336. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/dataset.py +185 -0
  337. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/metrics.py +193 -0
  338. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/misc.py +101 -0
  339. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/plotting.py +154 -0
  340. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/profiler.py +39 -0
  341. vismatch/third_party/MINIMA/third_party/LoFTR/test.py +68 -0
  342. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/demo_superglue.py +259 -0
  343. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/match_pairs.py +425 -0
  344. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/models/__init__.py +0 -0
  345. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/models/matching.py +84 -0
  346. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/models/superglue.py +283 -0
  347. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/models/superpoint.py +202 -0
  348. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/models/utils.py +555 -0
  349. vismatch/third_party/MINIMA/third_party/LoFTR/train.py +123 -0
  350. vismatch/third_party/MINIMA/third_party/RoMa/demo/demo_3D_effect.py +47 -0
  351. vismatch/third_party/MINIMA/third_party/RoMa/demo/demo_fundamental.py +34 -0
  352. vismatch/third_party/MINIMA/third_party/RoMa/demo/demo_match.py +50 -0
  353. vismatch/third_party/MINIMA/third_party/RoMa/demo/demo_match_opencv_sift.py +43 -0
  354. vismatch/third_party/MINIMA/third_party/RoMa/demo/demo_match_tiny.py +77 -0
  355. vismatch/third_party/MINIMA/third_party/RoMa/experiments/eval_roma_outdoor.py +57 -0
  356. vismatch/third_party/MINIMA/third_party/RoMa/experiments/eval_tiny_roma_v1_outdoor.py +84 -0
  357. vismatch/third_party/MINIMA/third_party/RoMa/experiments/roma_indoor.py +320 -0
  358. vismatch/third_party/MINIMA/third_party/RoMa/experiments/train_roma_outdoor.py +307 -0
  359. vismatch/third_party/MINIMA/third_party/RoMa/experiments/train_tiny_roma_v1_outdoor.py +498 -0
  360. vismatch/third_party/MINIMA/third_party/RoMa/romatch/__init__.py +8 -0
  361. vismatch/third_party/MINIMA/third_party/RoMa/romatch/benchmarks/__init__.py +6 -0
  362. vismatch/third_party/MINIMA/third_party/RoMa/romatch/benchmarks/hpatches_sequences_homog_benchmark.py +113 -0
  363. vismatch/third_party/MINIMA/third_party/RoMa/romatch/benchmarks/megadepth_dense_benchmark.py +106 -0
  364. vismatch/third_party/MINIMA/third_party/RoMa/romatch/benchmarks/megadepth_pose_estimation_benchmark.py +118 -0
  365. vismatch/third_party/MINIMA/third_party/RoMa/romatch/benchmarks/megadepth_pose_estimation_benchmark_poselib.py +119 -0
  366. vismatch/third_party/MINIMA/third_party/RoMa/romatch/benchmarks/scannet_benchmark.py +143 -0
  367. vismatch/third_party/MINIMA/third_party/RoMa/romatch/checkpointing/__init__.py +1 -0
  368. vismatch/third_party/MINIMA/third_party/RoMa/romatch/checkpointing/checkpoint.py +60 -0
  369. vismatch/third_party/MINIMA/third_party/RoMa/romatch/datasets/__init__.py +2 -0
  370. vismatch/third_party/MINIMA/third_party/RoMa/romatch/datasets/megadepth.py +232 -0
  371. vismatch/third_party/MINIMA/third_party/RoMa/romatch/datasets/scannet.py +160 -0
  372. vismatch/third_party/MINIMA/third_party/RoMa/romatch/losses/__init__.py +1 -0
  373. vismatch/third_party/MINIMA/third_party/RoMa/romatch/losses/robust_loss.py +161 -0
  374. vismatch/third_party/MINIMA/third_party/RoMa/romatch/losses/robust_loss_tiny_roma.py +160 -0
  375. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/__init__.py +1 -0
  376. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/encoders.py +122 -0
  377. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/matcher.py +766 -0
  378. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/model_zoo/__init__.py +73 -0
  379. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/model_zoo/roma_models.py +170 -0
  380. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/tiny.py +304 -0
  381. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/__init__.py +48 -0
  382. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/dinov2.py +359 -0
  383. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/__init__.py +12 -0
  384. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/attention.py +81 -0
  385. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/block.py +252 -0
  386. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/dino_head.py +59 -0
  387. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/drop_path.py +35 -0
  388. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/layer_scale.py +28 -0
  389. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/mlp.py +41 -0
  390. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/patch_embed.py +89 -0
  391. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/swiglu_ffn.py +63 -0
  392. vismatch/third_party/MINIMA/third_party/RoMa/romatch/train/__init__.py +1 -0
  393. vismatch/third_party/MINIMA/third_party/RoMa/romatch/train/train.py +102 -0
  394. vismatch/third_party/MINIMA/third_party/RoMa/romatch/utils/__init__.py +16 -0
  395. vismatch/third_party/MINIMA/third_party/RoMa/romatch/utils/kde.py +13 -0
  396. vismatch/third_party/MINIMA/third_party/RoMa/romatch/utils/local_correlation.py +48 -0
  397. vismatch/third_party/MINIMA/third_party/RoMa/romatch/utils/transforms.py +118 -0
  398. vismatch/third_party/MINIMA/third_party/RoMa/romatch/utils/utils.py +662 -0
  399. vismatch/third_party/MINIMA/third_party/RoMa/setup.py +9 -0
  400. vismatch/third_party/MINIMA/third_party/XoFTR/configs/data/__init__.py +0 -0
  401. vismatch/third_party/MINIMA/third_party/XoFTR/configs/data/base.py +35 -0
  402. vismatch/third_party/MINIMA/third_party/XoFTR/configs/data/megadepth_trainval_840.py +22 -0
  403. vismatch/third_party/MINIMA/third_party/XoFTR/configs/data/megadepth_vistir_trainval_640.py +23 -0
  404. vismatch/third_party/MINIMA/third_party/XoFTR/configs/data/pretrain.py +8 -0
  405. vismatch/third_party/MINIMA/third_party/XoFTR/configs/xoftr/outdoor/visible_thermal.py +17 -0
  406. vismatch/third_party/MINIMA/third_party/XoFTR/configs/xoftr/pretrain/pretrain.py +12 -0
  407. vismatch/third_party/MINIMA/third_party/XoFTR/pretrain.py +125 -0
  408. vismatch/third_party/MINIMA/third_party/XoFTR/src/__init__.py +0 -0
  409. vismatch/third_party/MINIMA/third_party/XoFTR/src/config/default.py +203 -0
  410. vismatch/third_party/MINIMA/third_party/XoFTR/src/datasets/megadepth.py +143 -0
  411. vismatch/third_party/MINIMA/third_party/XoFTR/src/datasets/pretrain_dataset.py +156 -0
  412. vismatch/third_party/MINIMA/third_party/XoFTR/src/datasets/sampler.py +77 -0
  413. vismatch/third_party/MINIMA/third_party/XoFTR/src/datasets/scannet.py +114 -0
  414. vismatch/third_party/MINIMA/third_party/XoFTR/src/datasets/vistir.py +109 -0
  415. vismatch/third_party/MINIMA/third_party/XoFTR/src/lightning/data.py +346 -0
  416. vismatch/third_party/MINIMA/third_party/XoFTR/src/lightning/data_pretrain.py +125 -0
  417. vismatch/third_party/MINIMA/third_party/XoFTR/src/lightning/lightning_xoftr.py +334 -0
  418. vismatch/third_party/MINIMA/third_party/XoFTR/src/lightning/lightning_xoftr_pretrain.py +171 -0
  419. vismatch/third_party/MINIMA/third_party/XoFTR/src/losses/xoftr_loss.py +170 -0
  420. vismatch/third_party/MINIMA/third_party/XoFTR/src/losses/xoftr_loss_pretrain.py +37 -0
  421. vismatch/third_party/MINIMA/third_party/XoFTR/src/optimizers/__init__.py +42 -0
  422. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/augment.py +113 -0
  423. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/comm.py +265 -0
  424. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/data_io.py +144 -0
  425. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/dataloader.py +23 -0
  426. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/dataset.py +279 -0
  427. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/metrics.py +211 -0
  428. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/misc.py +101 -0
  429. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/plotting.py +227 -0
  430. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/pretrain_utils.py +83 -0
  431. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/profiler.py +39 -0
  432. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/__init__.py +2 -0
  433. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/backbone/__init__.py +1 -0
  434. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/backbone/resnet.py +95 -0
  435. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/utils/geometry.py +107 -0
  436. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/utils/position_encoding.py +36 -0
  437. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/utils/supervision.py +290 -0
  438. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr.py +94 -0
  439. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_module/__init__.py +4 -0
  440. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_module/coarse_matching.py +305 -0
  441. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_module/fine_matching.py +170 -0
  442. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_module/fine_process.py +321 -0
  443. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_module/linear_attention.py +81 -0
  444. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_module/transformer.py +101 -0
  445. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_pretrain.py +209 -0
  446. vismatch/third_party/MINIMA/third_party/XoFTR/test.py +68 -0
  447. vismatch/third_party/MINIMA/third_party/XoFTR/test_relative_pose.py +330 -0
  448. vismatch/third_party/MINIMA/third_party/XoFTR/train.py +126 -0
  449. vismatch/third_party/MatchAnything/app.py +27 -0
  450. vismatch/third_party/MatchAnything/imcui/__init__.py +0 -0
  451. vismatch/third_party/MatchAnything/imcui/api/__init__.py +47 -0
  452. vismatch/third_party/MatchAnything/imcui/api/client.py +232 -0
  453. vismatch/third_party/MatchAnything/imcui/api/core.py +308 -0
  454. vismatch/third_party/MatchAnything/imcui/api/server.py +170 -0
  455. vismatch/third_party/MatchAnything/imcui/hloc/__init__.py +65 -0
  456. vismatch/third_party/MatchAnything/imcui/hloc/colmap_from_nvm.py +216 -0
  457. vismatch/third_party/MatchAnything/imcui/hloc/extract_features.py +607 -0
  458. vismatch/third_party/MatchAnything/imcui/hloc/extractors/__init__.py +0 -0
  459. vismatch/third_party/MatchAnything/imcui/hloc/extractors/alike.py +61 -0
  460. vismatch/third_party/MatchAnything/imcui/hloc/extractors/aliked.py +32 -0
  461. vismatch/third_party/MatchAnything/imcui/hloc/extractors/cosplace.py +44 -0
  462. vismatch/third_party/MatchAnything/imcui/hloc/extractors/d2net.py +60 -0
  463. vismatch/third_party/MatchAnything/imcui/hloc/extractors/darkfeat.py +44 -0
  464. vismatch/third_party/MatchAnything/imcui/hloc/extractors/dedode.py +86 -0
  465. vismatch/third_party/MatchAnything/imcui/hloc/extractors/dir.py +78 -0
  466. vismatch/third_party/MatchAnything/imcui/hloc/extractors/disk.py +35 -0
  467. vismatch/third_party/MatchAnything/imcui/hloc/extractors/dog.py +135 -0
  468. vismatch/third_party/MatchAnything/imcui/hloc/extractors/eigenplaces.py +57 -0
  469. vismatch/third_party/MatchAnything/imcui/hloc/extractors/example.py +56 -0
  470. vismatch/third_party/MatchAnything/imcui/hloc/extractors/fire.py +72 -0
  471. vismatch/third_party/MatchAnything/imcui/hloc/extractors/fire_local.py +84 -0
  472. vismatch/third_party/MatchAnything/imcui/hloc/extractors/lanet.py +63 -0
  473. vismatch/third_party/MatchAnything/imcui/hloc/extractors/netvlad.py +146 -0
  474. vismatch/third_party/MatchAnything/imcui/hloc/extractors/openibl.py +26 -0
  475. vismatch/third_party/MatchAnything/imcui/hloc/extractors/r2d2.py +73 -0
  476. vismatch/third_party/MatchAnything/imcui/hloc/extractors/rekd.py +60 -0
  477. vismatch/third_party/MatchAnything/imcui/hloc/extractors/rord.py +59 -0
  478. vismatch/third_party/MatchAnything/imcui/hloc/extractors/sfd2.py +44 -0
  479. vismatch/third_party/MatchAnything/imcui/hloc/extractors/sift.py +216 -0
  480. vismatch/third_party/MatchAnything/imcui/hloc/extractors/superpoint.py +51 -0
  481. vismatch/third_party/MatchAnything/imcui/hloc/extractors/xfeat.py +33 -0
  482. vismatch/third_party/MatchAnything/imcui/hloc/localize_inloc.py +179 -0
  483. vismatch/third_party/MatchAnything/imcui/hloc/localize_sfm.py +243 -0
  484. vismatch/third_party/MatchAnything/imcui/hloc/match_dense.py +1158 -0
  485. vismatch/third_party/MatchAnything/imcui/hloc/match_features.py +459 -0
  486. vismatch/third_party/MatchAnything/imcui/hloc/matchers/__init__.py +3 -0
  487. vismatch/third_party/MatchAnything/imcui/hloc/matchers/adalam.py +68 -0
  488. vismatch/third_party/MatchAnything/imcui/hloc/matchers/aspanformer.py +66 -0
  489. vismatch/third_party/MatchAnything/imcui/hloc/matchers/cotr.py +77 -0
  490. vismatch/third_party/MatchAnything/imcui/hloc/matchers/dkm.py +53 -0
  491. vismatch/third_party/MatchAnything/imcui/hloc/matchers/dual_softmax.py +71 -0
  492. vismatch/third_party/MatchAnything/imcui/hloc/matchers/duster.py +109 -0
  493. vismatch/third_party/MatchAnything/imcui/hloc/matchers/eloftr.py +97 -0
  494. vismatch/third_party/MatchAnything/imcui/hloc/matchers/gim.py +200 -0
  495. vismatch/third_party/MatchAnything/imcui/hloc/matchers/gluestick.py +99 -0
  496. vismatch/third_party/MatchAnything/imcui/hloc/matchers/imp.py +50 -0
  497. vismatch/third_party/MatchAnything/imcui/hloc/matchers/lightglue.py +67 -0
  498. vismatch/third_party/MatchAnything/imcui/hloc/matchers/loftr.py +58 -0
  499. vismatch/third_party/MatchAnything/imcui/hloc/matchers/mast3r.py +96 -0
  500. vismatch/third_party/MatchAnything/imcui/hloc/matchers/matchanything.py +191 -0
  501. vismatch/third_party/MatchAnything/imcui/hloc/matchers/mickey.py +50 -0
  502. vismatch/third_party/MatchAnything/imcui/hloc/matchers/nearest_neighbor.py +66 -0
  503. vismatch/third_party/MatchAnything/imcui/hloc/matchers/omniglue.py +80 -0
  504. vismatch/third_party/MatchAnything/imcui/hloc/matchers/roma.py +80 -0
  505. vismatch/third_party/MatchAnything/imcui/hloc/matchers/sgmnet.py +106 -0
  506. vismatch/third_party/MatchAnything/imcui/hloc/matchers/sold2.py +144 -0
  507. vismatch/third_party/MatchAnything/imcui/hloc/matchers/superglue.py +33 -0
  508. vismatch/third_party/MatchAnything/imcui/hloc/matchers/topicfm.py +60 -0
  509. vismatch/third_party/MatchAnything/imcui/hloc/matchers/xfeat_dense.py +54 -0
  510. vismatch/third_party/MatchAnything/imcui/hloc/matchers/xfeat_lightglue.py +48 -0
  511. vismatch/third_party/MatchAnything/imcui/hloc/matchers/xoftr.py +90 -0
  512. vismatch/third_party/MatchAnything/imcui/hloc/pairs_from_covisibility.py +60 -0
  513. vismatch/third_party/MatchAnything/imcui/hloc/pairs_from_exhaustive.py +64 -0
  514. vismatch/third_party/MatchAnything/imcui/hloc/pairs_from_poses.py +68 -0
  515. vismatch/third_party/MatchAnything/imcui/hloc/pairs_from_retrieval.py +133 -0
  516. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/4Seasons/__init__.py +0 -0
  517. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/4Seasons/localize.py +89 -0
  518. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/4Seasons/prepare_reference.py +51 -0
  519. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/4Seasons/utils.py +231 -0
  520. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/7Scenes/__init__.py +0 -0
  521. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/7Scenes/create_gt_sfm.py +134 -0
  522. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/7Scenes/pipeline.py +139 -0
  523. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/7Scenes/utils.py +34 -0
  524. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Aachen/__init__.py +0 -0
  525. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Aachen/pipeline.py +109 -0
  526. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Aachen_v1_1/__init__.py +0 -0
  527. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Aachen_v1_1/pipeline.py +104 -0
  528. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Aachen_v1_1/pipeline_loftr.py +104 -0
  529. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/CMU/__init__.py +0 -0
  530. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/CMU/pipeline.py +133 -0
  531. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Cambridge/__init__.py +0 -0
  532. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Cambridge/pipeline.py +140 -0
  533. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Cambridge/utils.py +145 -0
  534. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/RobotCar/__init__.py +0 -0
  535. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/RobotCar/colmap_from_nvm.py +176 -0
  536. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/RobotCar/pipeline.py +143 -0
  537. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/__init__.py +0 -0
  538. vismatch/third_party/MatchAnything/imcui/hloc/reconstruction.py +194 -0
  539. vismatch/third_party/MatchAnything/imcui/hloc/triangulation.py +311 -0
  540. vismatch/third_party/MatchAnything/imcui/hloc/utils/__init__.py +12 -0
  541. vismatch/third_party/MatchAnything/imcui/hloc/utils/base_model.py +56 -0
  542. vismatch/third_party/MatchAnything/imcui/hloc/utils/database.py +412 -0
  543. vismatch/third_party/MatchAnything/imcui/hloc/utils/geometry.py +16 -0
  544. vismatch/third_party/MatchAnything/imcui/hloc/utils/io.py +77 -0
  545. vismatch/third_party/MatchAnything/imcui/hloc/utils/parsers.py +59 -0
  546. vismatch/third_party/MatchAnything/imcui/hloc/utils/read_write_model.py +588 -0
  547. vismatch/third_party/MatchAnything/imcui/hloc/utils/viz.py +146 -0
  548. vismatch/third_party/MatchAnything/imcui/hloc/utils/viz_3d.py +203 -0
  549. vismatch/third_party/MatchAnything/imcui/hloc/visualization.py +178 -0
  550. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/configs/models/eloftr_model.py +128 -0
  551. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/configs/models/roma_model.py +27 -0
  552. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/notebooks/notebooks_utils/__init__.py +1 -0
  553. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/notebooks/notebooks_utils/plotting.py +344 -0
  554. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/__init__.py +0 -0
  555. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/config/default.py +344 -0
  556. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/datasets/common_data_pair.py +214 -0
  557. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/lightning/lightning_loftr.py +343 -0
  558. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/__init__.py +1 -0
  559. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/backbone/__init__.py +61 -0
  560. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/backbone/repvgg.py +319 -0
  561. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/backbone/resnet_fpn.py +1094 -0
  562. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/backbone/s2dnet.py +131 -0
  563. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/loftr.py +273 -0
  564. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/loftr_module/__init__.py +2 -0
  565. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/loftr_module/fine_preprocess.py +350 -0
  566. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/loftr_module/linear_attention.py +217 -0
  567. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/loftr_module/transformer.py +1768 -0
  568. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/loftr_module/transformer_utils.py +76 -0
  569. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/utils/coarse_matching.py +266 -0
  570. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/utils/fine_matching.py +493 -0
  571. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/utils/geometry.py +298 -0
  572. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/utils/position_encoding.py +131 -0
  573. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/utils/supervision.py +475 -0
  574. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/optimizers/__init__.py +50 -0
  575. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/__init__.py +0 -0
  576. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/augment.py +55 -0
  577. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/colmap/__init__.py +0 -0
  578. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/colmap/database.py +417 -0
  579. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/colmap/eval_helper.py +232 -0
  580. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/colmap/read_write_model.py +509 -0
  581. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/colmap.py +530 -0
  582. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/comm.py +265 -0
  583. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/dataloader.py +23 -0
  584. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/dataset.py +518 -0
  585. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/easydict.py +148 -0
  586. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/geometry.py +366 -0
  587. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/homography_utils.py +366 -0
  588. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/metrics.py +445 -0
  589. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/misc.py +101 -0
  590. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/plotting.py +248 -0
  591. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/profiler.py +39 -0
  592. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/ray_utils.py +134 -0
  593. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/sample_homo.py +58 -0
  594. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/utils.py +600 -0
  595. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/demo/demo_3D_effect.py +46 -0
  596. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/demo/demo_fundamental.py +32 -0
  597. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/demo/demo_fundamental_model_warpper.py +34 -0
  598. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/demo/demo_match.py +50 -0
  599. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/demo/demo_match_opencv_sift.py +43 -0
  600. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/demo_single_pair.py +329 -0
  601. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/experiments/roma_indoor.py +320 -0
  602. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/experiments/roma_outdoor.py +327 -0
  603. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/notebooks/notebooks_utils/__init__.py +1 -0
  604. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/notebooks/notebooks_utils/plotting.py +331 -0
  605. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/__init__.py +8 -0
  606. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/benchmarks/__init__.py +4 -0
  607. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/benchmarks/hpatches_sequences_homog_benchmark.py +113 -0
  608. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/benchmarks/megadepth_dense_benchmark.py +106 -0
  609. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/benchmarks/megadepth_pose_estimation_benchmark.py +140 -0
  610. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/benchmarks/scannet_benchmark.py +143 -0
  611. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/checkpointing/__init__.py +1 -0
  612. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/checkpointing/checkpoint.py +60 -0
  613. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/datasets/__init__.py +2 -0
  614. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/datasets/megadepth.py +230 -0
  615. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/datasets/scannet.py +160 -0
  616. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/losses/__init__.py +1 -0
  617. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/losses/robust_loss.py +157 -0
  618. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/matchanything_roma_model.py +104 -0
  619. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/__init__.py +1 -0
  620. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/blocks.py +241 -0
  621. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/criterion.py +37 -0
  622. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/croco.py +253 -0
  623. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/croco_downstream.py +122 -0
  624. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/curope/__init__.py +4 -0
  625. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/curope/curope2d.py +40 -0
  626. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/curope/setup.py +34 -0
  627. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/dpt_block.py +450 -0
  628. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/head_downstream.py +58 -0
  629. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/masking.py +25 -0
  630. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/pos_embed.py +159 -0
  631. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/__init__.py +2 -0
  632. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/cloud_opt/__init__.py +29 -0
  633. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/cloud_opt/base_opt.py +375 -0
  634. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/cloud_opt/commons.py +90 -0
  635. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/cloud_opt/init_im_poses.py +312 -0
  636. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/cloud_opt/optimizer.py +230 -0
  637. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/cloud_opt/pair_viewer.py +125 -0
  638. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/__init__.py +42 -0
  639. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/base/__init__.py +2 -0
  640. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/base/base_stereo_view_dataset.py +220 -0
  641. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/base/batched_sampler.py +74 -0
  642. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/base/easy_dataset.py +157 -0
  643. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/co3d.py +146 -0
  644. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/utils/__init__.py +2 -0
  645. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/utils/cropping.py +119 -0
  646. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/utils/transforms.py +11 -0
  647. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/heads/__init__.py +19 -0
  648. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/heads/dpt_head.py +114 -0
  649. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/heads/linear_head.py +41 -0
  650. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/heads/postprocess.py +58 -0
  651. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/image_pairs.py +83 -0
  652. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/inference.py +165 -0
  653. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/losses.py +297 -0
  654. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/model.py +167 -0
  655. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/optim_factory.py +14 -0
  656. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/patch_embed.py +70 -0
  657. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/post_process.py +60 -0
  658. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/utils/__init__.py +2 -0
  659. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/utils/device.py +76 -0
  660. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/utils/geometry.py +361 -0
  661. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/utils/image.py +104 -0
  662. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/utils/misc.py +121 -0
  663. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/utils/path_to_croco.py +19 -0
  664. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/viz.py +320 -0
  665. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/encoders.py +137 -0
  666. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/matcher.py +937 -0
  667. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/model_zoo/__init__.py +53 -0
  668. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/model_zoo/roma_models.py +162 -0
  669. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/__init__.py +47 -0
  670. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/dinov2.py +359 -0
  671. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/__init__.py +12 -0
  672. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/attention.py +81 -0
  673. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/block.py +252 -0
  674. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/dino_head.py +59 -0
  675. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/drop_path.py +35 -0
  676. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/layer_scale.py +28 -0
  677. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/mlp.py +41 -0
  678. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/patch_embed.py +89 -0
  679. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/swiglu_ffn.py +63 -0
  680. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/roma_adpat_model.py +32 -0
  681. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/train/__init__.py +1 -0
  682. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/train/train.py +102 -0
  683. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/utils/__init__.py +18 -0
  684. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/utils/kde.py +8 -0
  685. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/utils/local_correlation.py +44 -0
  686. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/utils/transforms.py +118 -0
  687. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/utils/utils.py +661 -0
  688. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/setup.py +9 -0
  689. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/tools/__init__.py +0 -0
  690. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/tools/evaluate_datasets.py +239 -0
  691. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/tools/tools_utils/data_io.py +94 -0
  692. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/tools/tools_utils/plot.py +77 -0
  693. vismatch/third_party/MatchAnything/imcui/ui/__init__.py +5 -0
  694. vismatch/third_party/MatchAnything/imcui/ui/app_class.py +824 -0
  695. vismatch/third_party/MatchAnything/imcui/ui/sfm.py +164 -0
  696. vismatch/third_party/MatchAnything/imcui/ui/utils.py +1085 -0
  697. vismatch/third_party/MatchAnything/imcui/ui/viz.py +511 -0
  698. vismatch/third_party/MatchAnything/tests/test_basic.py +111 -0
  699. vismatch/third_party/MatchFormer/config/data/__init__.py +0 -0
  700. vismatch/third_party/MatchFormer/config/data/base.py +35 -0
  701. vismatch/third_party/MatchFormer/config/data/megadepth_test_1500.py +11 -0
  702. vismatch/third_party/MatchFormer/config/data/scannet_test_1500.py +11 -0
  703. vismatch/third_party/MatchFormer/config/defaultmf.py +88 -0
  704. vismatch/third_party/MatchFormer/model/backbone/__init__.py +17 -0
  705. vismatch/third_party/MatchFormer/model/backbone/coarse_matching.py +228 -0
  706. vismatch/third_party/MatchFormer/model/backbone/fine_matching.py +74 -0
  707. vismatch/third_party/MatchFormer/model/backbone/fine_preprocess.py +59 -0
  708. vismatch/third_party/MatchFormer/model/backbone/match_LA_large.py +254 -0
  709. vismatch/third_party/MatchFormer/model/backbone/match_LA_lite.py +254 -0
  710. vismatch/third_party/MatchFormer/model/backbone/match_SEA_large.py +291 -0
  711. vismatch/third_party/MatchFormer/model/backbone/match_SEA_lite.py +291 -0
  712. vismatch/third_party/MatchFormer/model/data.py +320 -0
  713. vismatch/third_party/MatchFormer/model/datasets/dataset.py +231 -0
  714. vismatch/third_party/MatchFormer/model/datasets/megadepth.py +126 -0
  715. vismatch/third_party/MatchFormer/model/datasets/sampler.py +77 -0
  716. vismatch/third_party/MatchFormer/model/datasets/scannet.py +113 -0
  717. vismatch/third_party/MatchFormer/model/lightning_loftr.py +102 -0
  718. vismatch/third_party/MatchFormer/model/matchformer.py +54 -0
  719. vismatch/third_party/MatchFormer/model/utils/augment.py +55 -0
  720. vismatch/third_party/MatchFormer/model/utils/comm.py +265 -0
  721. vismatch/third_party/MatchFormer/model/utils/dataloader.py +23 -0
  722. vismatch/third_party/MatchFormer/model/utils/metrics.py +193 -0
  723. vismatch/third_party/MatchFormer/model/utils/misc.py +101 -0
  724. vismatch/third_party/MatchFormer/model/utils/profiler.py +39 -0
  725. vismatch/third_party/MatchFormer/test.py +55 -0
  726. vismatch/third_party/RIPE/app.py +272 -0
  727. vismatch/third_party/RIPE/demo.py +51 -0
  728. vismatch/third_party/RIPE/ripe/__init__.py +1 -0
  729. vismatch/third_party/RIPE/ripe/benchmarks/imw_2020.py +320 -0
  730. vismatch/third_party/RIPE/ripe/data/__init__.py +0 -0
  731. vismatch/third_party/RIPE/ripe/data/data_transforms.py +204 -0
  732. vismatch/third_party/RIPE/ripe/data/datasets/__init__.py +0 -0
  733. vismatch/third_party/RIPE/ripe/data/datasets/acdc.py +154 -0
  734. vismatch/third_party/RIPE/ripe/data/datasets/dataset_combinator.py +88 -0
  735. vismatch/third_party/RIPE/ripe/data/datasets/disk_imw.py +160 -0
  736. vismatch/third_party/RIPE/ripe/data/datasets/disk_megadepth.py +157 -0
  737. vismatch/third_party/RIPE/ripe/data/datasets/tokyo247.py +134 -0
  738. vismatch/third_party/RIPE/ripe/data/datasets/tokyo_query_v3.py +78 -0
  739. vismatch/third_party/RIPE/ripe/losses/__init__.py +0 -0
  740. vismatch/third_party/RIPE/ripe/losses/contrastive_loss.py +88 -0
  741. vismatch/third_party/RIPE/ripe/matcher/__init__.py +0 -0
  742. vismatch/third_party/RIPE/ripe/matcher/concurrent_matcher.py +97 -0
  743. vismatch/third_party/RIPE/ripe/matcher/pose_estimator_poselib.py +31 -0
  744. vismatch/third_party/RIPE/ripe/model_zoo/__init__.py +1 -0
  745. vismatch/third_party/RIPE/ripe/model_zoo/vgg_hyper.py +39 -0
  746. vismatch/third_party/RIPE/ripe/models/__init__.py +0 -0
  747. vismatch/third_party/RIPE/ripe/models/backbones/__init__.py +0 -0
  748. vismatch/third_party/RIPE/ripe/models/backbones/backbone_base.py +61 -0
  749. vismatch/third_party/RIPE/ripe/models/backbones/vgg.py +99 -0
  750. vismatch/third_party/RIPE/ripe/models/backbones/vgg_utils.py +143 -0
  751. vismatch/third_party/RIPE/ripe/models/ripe.py +303 -0
  752. vismatch/third_party/RIPE/ripe/models/upsampler/hypercolumn_features.py +54 -0
  753. vismatch/third_party/RIPE/ripe/models/upsampler/interpolate_sparse2d.py +37 -0
  754. vismatch/third_party/RIPE/ripe/scheduler/__init__.py +0 -0
  755. vismatch/third_party/RIPE/ripe/scheduler/constant.py +6 -0
  756. vismatch/third_party/RIPE/ripe/scheduler/expDecay.py +26 -0
  757. vismatch/third_party/RIPE/ripe/scheduler/linearLR.py +37 -0
  758. vismatch/third_party/RIPE/ripe/scheduler/linear_with_plateaus.py +44 -0
  759. vismatch/third_party/RIPE/ripe/train.py +410 -0
  760. vismatch/third_party/RIPE/ripe/utils/__init__.py +2 -0
  761. vismatch/third_party/RIPE/ripe/utils/image_utils.py +62 -0
  762. vismatch/third_party/RIPE/ripe/utils/pose_error.py +62 -0
  763. vismatch/third_party/RIPE/ripe/utils/pylogger.py +32 -0
  764. vismatch/third_party/RIPE/ripe/utils/utils.py +192 -0
  765. vismatch/third_party/RIPE/ripe/utils/wandb_utils.py +16 -0
  766. vismatch/third_party/RoMa/demo/demo_3D_effect.py +47 -0
  767. vismatch/third_party/RoMa/demo/demo_fundamental.py +34 -0
  768. vismatch/third_party/RoMa/demo/demo_match.py +50 -0
  769. vismatch/third_party/RoMa/demo/demo_match_opencv_sift.py +43 -0
  770. vismatch/third_party/RoMa/demo/demo_match_tiny.py +77 -0
  771. vismatch/third_party/RoMa/experiments/eval_roma_outdoor.py +57 -0
  772. vismatch/third_party/RoMa/experiments/eval_tiny_roma_v1_outdoor.py +84 -0
  773. vismatch/third_party/RoMa/experiments/roma_indoor.py +320 -0
  774. vismatch/third_party/RoMa/experiments/train_roma_outdoor.py +307 -0
  775. vismatch/third_party/RoMa/experiments/train_tiny_roma_v1_outdoor.py +498 -0
  776. vismatch/third_party/RoMa/romatch/__init__.py +8 -0
  777. vismatch/third_party/RoMa/romatch/benchmarks/__init__.py +6 -0
  778. vismatch/third_party/RoMa/romatch/benchmarks/hpatches_sequences_homog_benchmark.py +113 -0
  779. vismatch/third_party/RoMa/romatch/benchmarks/megadepth_dense_benchmark.py +106 -0
  780. vismatch/third_party/RoMa/romatch/benchmarks/megadepth_pose_estimation_benchmark.py +118 -0
  781. vismatch/third_party/RoMa/romatch/benchmarks/megadepth_pose_estimation_benchmark_poselib.py +119 -0
  782. vismatch/third_party/RoMa/romatch/benchmarks/scannet_benchmark.py +143 -0
  783. vismatch/third_party/RoMa/romatch/checkpointing/__init__.py +1 -0
  784. vismatch/third_party/RoMa/romatch/checkpointing/checkpoint.py +60 -0
  785. vismatch/third_party/RoMa/romatch/datasets/__init__.py +2 -0
  786. vismatch/third_party/RoMa/romatch/datasets/megadepth.py +232 -0
  787. vismatch/third_party/RoMa/romatch/datasets/scannet.py +160 -0
  788. vismatch/third_party/RoMa/romatch/losses/__init__.py +1 -0
  789. vismatch/third_party/RoMa/romatch/losses/robust_loss.py +161 -0
  790. vismatch/third_party/RoMa/romatch/losses/robust_loss_tiny_roma.py +160 -0
  791. vismatch/third_party/RoMa/romatch/models/__init__.py +1 -0
  792. vismatch/third_party/RoMa/romatch/models/encoders.py +122 -0
  793. vismatch/third_party/RoMa/romatch/models/matcher.py +748 -0
  794. vismatch/third_party/RoMa/romatch/models/model_zoo/__init__.py +73 -0
  795. vismatch/third_party/RoMa/romatch/models/model_zoo/roma_models.py +170 -0
  796. vismatch/third_party/RoMa/romatch/models/tiny.py +304 -0
  797. vismatch/third_party/RoMa/romatch/models/transformer/__init__.py +48 -0
  798. vismatch/third_party/RoMa/romatch/models/transformer/dinov2.py +359 -0
  799. vismatch/third_party/RoMa/romatch/models/transformer/layers/__init__.py +12 -0
  800. vismatch/third_party/RoMa/romatch/models/transformer/layers/attention.py +81 -0
  801. vismatch/third_party/RoMa/romatch/models/transformer/layers/block.py +252 -0
  802. vismatch/third_party/RoMa/romatch/models/transformer/layers/dino_head.py +59 -0
  803. vismatch/third_party/RoMa/romatch/models/transformer/layers/drop_path.py +35 -0
  804. vismatch/third_party/RoMa/romatch/models/transformer/layers/layer_scale.py +28 -0
  805. vismatch/third_party/RoMa/romatch/models/transformer/layers/mlp.py +41 -0
  806. vismatch/third_party/RoMa/romatch/models/transformer/layers/patch_embed.py +89 -0
  807. vismatch/third_party/RoMa/romatch/models/transformer/layers/swiglu_ffn.py +63 -0
  808. vismatch/third_party/RoMa/romatch/train/__init__.py +1 -0
  809. vismatch/third_party/RoMa/romatch/train/train.py +102 -0
  810. vismatch/third_party/RoMa/romatch/utils/__init__.py +16 -0
  811. vismatch/third_party/RoMa/romatch/utils/kde.py +13 -0
  812. vismatch/third_party/RoMa/romatch/utils/local_correlation.py +48 -0
  813. vismatch/third_party/RoMa/romatch/utils/transforms.py +118 -0
  814. vismatch/third_party/RoMa/romatch/utils/utils.py +654 -0
  815. vismatch/third_party/RoMa/setup.py +9 -0
  816. vismatch/third_party/RoMaV2/demo/demo_covariance.py +52 -0
  817. vismatch/third_party/RoMaV2/demo/demo_match.py +55 -0
  818. vismatch/third_party/RoMaV2/src/romav2/__init__.py +8 -0
  819. vismatch/third_party/RoMaV2/src/romav2/benchmarks/__init__.py +4 -0
  820. vismatch/third_party/RoMaV2/src/romav2/benchmarks/mega1500.py +115 -0
  821. vismatch/third_party/RoMaV2/src/romav2/benchmarks/satast.py +463 -0
  822. vismatch/third_party/RoMaV2/src/romav2/benchmarks/scannet1500.py +125 -0
  823. vismatch/third_party/RoMaV2/src/romav2/benchmarks/wxbs.py +104 -0
  824. vismatch/third_party/RoMaV2/src/romav2/device.py +9 -0
  825. vismatch/third_party/RoMaV2/src/romav2/dpt.py +516 -0
  826. vismatch/third_party/RoMaV2/src/romav2/features.py +190 -0
  827. vismatch/third_party/RoMaV2/src/romav2/geometry.py +261 -0
  828. vismatch/third_party/RoMaV2/src/romav2/io.py +24 -0
  829. vismatch/third_party/RoMaV2/src/romav2/local_correlation.py +152 -0
  830. vismatch/third_party/RoMaV2/src/romav2/logging.py +97 -0
  831. vismatch/third_party/RoMaV2/src/romav2/matcher.py +207 -0
  832. vismatch/third_party/RoMaV2/src/romav2/normalizers.py +17 -0
  833. vismatch/third_party/RoMaV2/src/romav2/refiner.py +277 -0
  834. vismatch/third_party/RoMaV2/src/romav2/romav2.py +533 -0
  835. vismatch/third_party/RoMaV2/src/romav2/types.py +75 -0
  836. vismatch/third_party/RoMaV2/src/romav2/vis.py +36 -0
  837. vismatch/third_party/RoMaV2/src/romav2/vit/__init__.py +304 -0
  838. vismatch/third_party/RoMaV2/src/romav2/vit/attention.py +181 -0
  839. vismatch/third_party/RoMaV2/src/romav2/vit/block.py +293 -0
  840. vismatch/third_party/RoMaV2/src/romav2/vit/ffn_layers.py +83 -0
  841. vismatch/third_party/RoMaV2/src/romav2/vit/layer_scale.py +29 -0
  842. vismatch/third_party/RoMaV2/src/romav2/vit/patch_embed.py +94 -0
  843. vismatch/third_party/RoMaV2/src/romav2/vit/rms_norm.py +24 -0
  844. vismatch/third_party/RoMaV2/src/romav2/vit/rope.py +133 -0
  845. vismatch/third_party/RoMaV2/src/romav2/vit/rope_mixed.py +111 -0
  846. vismatch/third_party/RoMaV2/src/romav2/vit/utils.py +48 -0
  847. vismatch/third_party/RoMaV2/tests/test_bidirectional.py +93 -0
  848. vismatch/third_party/RoMaV2/tests/test_fps.py +49 -0
  849. vismatch/third_party/RoMaV2/tests/test_mega1500.py +22 -0
  850. vismatch/third_party/RoMaV2/tests/test_scannet1500.py +21 -0
  851. vismatch/third_party/RoMaV2/tests/test_smoke.py +15 -0
  852. vismatch/third_party/Se2_LoFTR/configs/data/__init__.py +0 -0
  853. vismatch/third_party/Se2_LoFTR/configs/data/base.py +35 -0
  854. vismatch/third_party/Se2_LoFTR/configs/data/megadepth_test_1500.py +11 -0
  855. vismatch/third_party/Se2_LoFTR/configs/data/megadepth_trainval_640.py +22 -0
  856. vismatch/third_party/Se2_LoFTR/configs/data/megadepth_trainval_840.py +22 -0
  857. vismatch/third_party/Se2_LoFTR/configs/data/scannet_test_1500.py +11 -0
  858. vismatch/third_party/Se2_LoFTR/configs/data/scannet_trainval.py +17 -0
  859. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ds.py +6 -0
  860. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ds_dense.py +8 -0
  861. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ot.py +6 -0
  862. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ot_dense.py +8 -0
  863. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/loftr_ds.py +5 -0
  864. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/loftr_ds_dense.py +7 -0
  865. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/loftr_ot.py +5 -0
  866. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/loftr_ot_dense.py +7 -0
  867. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/scannet/loftr_ds_eval.py +16 -0
  868. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/scannet/loftr_ds_eval_new.py +18 -0
  869. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ds.py +16 -0
  870. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ds_dense.py +17 -0
  871. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ot.py +16 -0
  872. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ot_dense.py +17 -0
  873. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ds.py +17 -0
  874. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ds_dense.py +17 -0
  875. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ds_e2.py +20 -0
  876. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ds_e2_dense.py +23 -0
  877. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ds_e2_dense_8rot.py +23 -0
  878. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ds_e2_dense_big.py +22 -0
  879. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ot.py +17 -0
  880. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ot_dense.py +18 -0
  881. vismatch/third_party/Se2_LoFTR/demo/demo_loftr.py +240 -0
  882. vismatch/third_party/Se2_LoFTR/src/__init__.py +0 -0
  883. vismatch/third_party/Se2_LoFTR/src/config/default.py +173 -0
  884. vismatch/third_party/Se2_LoFTR/src/datasets/megadepth.py +127 -0
  885. vismatch/third_party/Se2_LoFTR/src/datasets/sampler.py +77 -0
  886. vismatch/third_party/Se2_LoFTR/src/datasets/scannet.py +114 -0
  887. vismatch/third_party/Se2_LoFTR/src/lightning/data.py +320 -0
  888. vismatch/third_party/Se2_LoFTR/src/lightning/lightning_loftr.py +249 -0
  889. vismatch/third_party/Se2_LoFTR/src/loftr/__init__.py +2 -0
  890. vismatch/third_party/Se2_LoFTR/src/loftr/backbone/__init__.py +17 -0
  891. vismatch/third_party/Se2_LoFTR/src/loftr/backbone/resnet_e2.py +170 -0
  892. vismatch/third_party/Se2_LoFTR/src/loftr/backbone/resnet_fpn.py +199 -0
  893. vismatch/third_party/Se2_LoFTR/src/loftr/loftr.py +81 -0
  894. vismatch/third_party/Se2_LoFTR/src/loftr/loftr_module/__init__.py +2 -0
  895. vismatch/third_party/Se2_LoFTR/src/loftr/loftr_module/fine_preprocess.py +59 -0
  896. vismatch/third_party/Se2_LoFTR/src/loftr/loftr_module/linear_attention.py +81 -0
  897. vismatch/third_party/Se2_LoFTR/src/loftr/loftr_module/transformer.py +101 -0
  898. vismatch/third_party/Se2_LoFTR/src/loftr/utils/coarse_matching.py +261 -0
  899. vismatch/third_party/Se2_LoFTR/src/loftr/utils/cvpr_ds_config.py +50 -0
  900. vismatch/third_party/Se2_LoFTR/src/loftr/utils/fine_matching.py +74 -0
  901. vismatch/third_party/Se2_LoFTR/src/loftr/utils/geometry.py +54 -0
  902. vismatch/third_party/Se2_LoFTR/src/loftr/utils/position_encoding.py +42 -0
  903. vismatch/third_party/Se2_LoFTR/src/loftr/utils/supervision.py +151 -0
  904. vismatch/third_party/Se2_LoFTR/src/losses/loftr_loss.py +192 -0
  905. vismatch/third_party/Se2_LoFTR/src/optimizers/__init__.py +42 -0
  906. vismatch/third_party/Se2_LoFTR/src/utils/augment.py +55 -0
  907. vismatch/third_party/Se2_LoFTR/src/utils/comm.py +265 -0
  908. vismatch/third_party/Se2_LoFTR/src/utils/dataloader.py +23 -0
  909. vismatch/third_party/Se2_LoFTR/src/utils/dataset.py +185 -0
  910. vismatch/third_party/Se2_LoFTR/src/utils/metrics.py +193 -0
  911. vismatch/third_party/Se2_LoFTR/src/utils/misc.py +104 -0
  912. vismatch/third_party/Se2_LoFTR/src/utils/plotting.py +154 -0
  913. vismatch/third_party/Se2_LoFTR/src/utils/profiler.py +39 -0
  914. vismatch/third_party/Se2_LoFTR/test.py +68 -0
  915. vismatch/third_party/Se2_LoFTR/train.py +123 -0
  916. vismatch/third_party/SphereGlue/demo_SphereGlue.py +141 -0
  917. vismatch/third_party/SphereGlue/model/sphereglue.py +230 -0
  918. vismatch/third_party/SphereGlue/utils/Utils.py +191 -0
  919. vismatch/third_party/SphereGlue/utils/demo_mydataset.py +119 -0
  920. vismatch/third_party/Steerers/rotation_steerers/matchers/dual_softmax_matcher.py +44 -0
  921. vismatch/third_party/Steerers/rotation_steerers/matchers/max_matches.py +205 -0
  922. vismatch/third_party/Steerers/rotation_steerers/matchers/max_similarity.py +115 -0
  923. vismatch/third_party/Steerers/rotation_steerers/steerers.py +37 -0
  924. vismatch/third_party/Steerers/setup.py +14 -0
  925. vismatch/third_party/TopicFM/configs/megadepth_test.py +17 -0
  926. vismatch/third_party/TopicFM/configs/megadepth_test_topicfmfast.py +17 -0
  927. vismatch/third_party/TopicFM/configs/megadepth_test_topicfmplus.py +20 -0
  928. vismatch/third_party/TopicFM/configs/megadepth_train.py +36 -0
  929. vismatch/third_party/TopicFM/configs/megadepth_train_topicfmfast.py +34 -0
  930. vismatch/third_party/TopicFM/configs/megadepth_train_topicfmplus.py +37 -0
  931. vismatch/third_party/TopicFM/configs/scannet_test.py +15 -0
  932. vismatch/third_party/TopicFM/configs/scannet_test_topicfmfast.py +15 -0
  933. vismatch/third_party/TopicFM/configs/scannet_test_topicfmplus.py +19 -0
  934. vismatch/third_party/TopicFM/src/__init__.py +11 -0
  935. vismatch/third_party/TopicFM/src/config/default.py +174 -0
  936. vismatch/third_party/TopicFM/src/datasets/aachen.py +29 -0
  937. vismatch/third_party/TopicFM/src/datasets/custom_dataloader.py +126 -0
  938. vismatch/third_party/TopicFM/src/datasets/inloc.py +29 -0
  939. vismatch/third_party/TopicFM/src/datasets/megadepth.py +170 -0
  940. vismatch/third_party/TopicFM/src/datasets/sampler.py +77 -0
  941. vismatch/third_party/TopicFM/src/datasets/scannet.py +115 -0
  942. vismatch/third_party/TopicFM/src/lightning_trainer/data.py +292 -0
  943. vismatch/third_party/TopicFM/src/lightning_trainer/trainer.py +244 -0
  944. vismatch/third_party/TopicFM/src/losses/loss.py +228 -0
  945. vismatch/third_party/TopicFM/src/models/__init__.py +1 -0
  946. vismatch/third_party/TopicFM/src/models/backbone/__init__.py +12 -0
  947. vismatch/third_party/TopicFM/src/models/backbone/convnext.py +165 -0
  948. vismatch/third_party/TopicFM/src/models/backbone/fpn.py +114 -0
  949. vismatch/third_party/TopicFM/src/models/modules/__init__.py +2 -0
  950. vismatch/third_party/TopicFM/src/models/modules/encoder.py +266 -0
  951. vismatch/third_party/TopicFM/src/models/modules/fine_preprocess.py +59 -0
  952. vismatch/third_party/TopicFM/src/models/modules/linear_attention.py +84 -0
  953. vismatch/third_party/TopicFM/src/models/topic_fm.py +100 -0
  954. vismatch/third_party/TopicFM/src/models/utils/coarse_matching.py +213 -0
  955. vismatch/third_party/TopicFM/src/models/utils/fine_matching.py +172 -0
  956. vismatch/third_party/TopicFM/src/models/utils/geometry.py +54 -0
  957. vismatch/third_party/TopicFM/src/models/utils/supervision.py +167 -0
  958. vismatch/third_party/TopicFM/src/optimizers/__init__.py +42 -0
  959. vismatch/third_party/TopicFM/src/utils/augment.py +55 -0
  960. vismatch/third_party/TopicFM/src/utils/comm.py +265 -0
  961. vismatch/third_party/TopicFM/src/utils/dataloader.py +23 -0
  962. vismatch/third_party/TopicFM/src/utils/dataset.py +206 -0
  963. vismatch/third_party/TopicFM/src/utils/metrics.py +193 -0
  964. vismatch/third_party/TopicFM/src/utils/misc.py +101 -0
  965. vismatch/third_party/TopicFM/src/utils/plotting.py +313 -0
  966. vismatch/third_party/TopicFM/src/utils/profiler.py +39 -0
  967. vismatch/third_party/TopicFM/test.py +70 -0
  968. vismatch/third_party/TopicFM/third_party/__init__.py +0 -0
  969. vismatch/third_party/TopicFM/third_party/aspanformer/configs/aspan/indoor/aspan_test.py +7 -0
  970. vismatch/third_party/TopicFM/third_party/aspanformer/configs/aspan/indoor/aspan_train.py +8 -0
  971. vismatch/third_party/TopicFM/third_party/aspanformer/configs/aspan/outdoor/aspan_test.py +18 -0
  972. vismatch/third_party/TopicFM/third_party/aspanformer/configs/aspan/outdoor/aspan_train.py +17 -0
  973. vismatch/third_party/TopicFM/third_party/aspanformer/configs/data/__init__.py +0 -0
  974. vismatch/third_party/TopicFM/third_party/aspanformer/configs/data/base.py +35 -0
  975. vismatch/third_party/TopicFM/third_party/aspanformer/configs/data/megadepth_test_1500.py +13 -0
  976. vismatch/third_party/TopicFM/third_party/aspanformer/configs/data/megadepth_trainval_832.py +22 -0
  977. vismatch/third_party/TopicFM/third_party/aspanformer/configs/data/scannet_test_1500.py +11 -0
  978. vismatch/third_party/TopicFM/third_party/aspanformer/configs/data/scannet_trainval.py +17 -0
  979. vismatch/third_party/TopicFM/third_party/aspanformer/demo/demo.py +63 -0
  980. vismatch/third_party/TopicFM/third_party/aspanformer/demo/demo_utils.py +44 -0
  981. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/__init__.py +2 -0
  982. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/aspan_module/__init__.py +3 -0
  983. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/aspan_module/attention.py +198 -0
  984. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/aspan_module/fine_preprocess.py +59 -0
  985. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/aspan_module/loftr.py +112 -0
  986. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/aspan_module/transformer.py +244 -0
  987. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/aspanformer.py +133 -0
  988. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/backbone/__init__.py +11 -0
  989. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/backbone/resnet_fpn.py +199 -0
  990. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/utils/coarse_matching.py +331 -0
  991. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/utils/cvpr_ds_config.py +50 -0
  992. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/utils/fine_matching.py +74 -0
  993. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/utils/geometry.py +54 -0
  994. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/utils/position_encoding.py +61 -0
  995. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/utils/supervision.py +151 -0
  996. vismatch/third_party/TopicFM/third_party/aspanformer/src/__init__.py +0 -0
  997. vismatch/third_party/TopicFM/third_party/aspanformer/src/config/default.py +180 -0
  998. vismatch/third_party/TopicFM/third_party/aspanformer/src/datasets/__init__.py +3 -0
  999. vismatch/third_party/TopicFM/third_party/aspanformer/src/datasets/megadepth.py +127 -0
  1000. vismatch/third_party/TopicFM/third_party/aspanformer/src/datasets/sampler.py +77 -0
  1001. vismatch/third_party/TopicFM/third_party/aspanformer/src/datasets/scannet.py +113 -0
  1002. vismatch/third_party/TopicFM/third_party/aspanformer/src/lightning/data.py +326 -0
  1003. vismatch/third_party/TopicFM/third_party/aspanformer/src/lightning/lightning_aspanformer.py +276 -0
  1004. vismatch/third_party/TopicFM/third_party/aspanformer/src/losses/aspan_loss.py +231 -0
  1005. vismatch/third_party/TopicFM/third_party/aspanformer/src/optimizers/__init__.py +42 -0
  1006. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/augment.py +55 -0
  1007. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/comm.py +265 -0
  1008. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/dataloader.py +23 -0
  1009. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/dataset.py +222 -0
  1010. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/metrics.py +260 -0
  1011. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/misc.py +139 -0
  1012. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/plotting.py +219 -0
  1013. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/profiler.py +39 -0
  1014. vismatch/third_party/TopicFM/third_party/aspanformer/test.py +69 -0
  1015. vismatch/third_party/TopicFM/third_party/aspanformer/tools/SensorData.py +125 -0
  1016. vismatch/third_party/TopicFM/third_party/aspanformer/tools/extract.py +47 -0
  1017. vismatch/third_party/TopicFM/third_party/aspanformer/tools/preprocess_scene.py +242 -0
  1018. vismatch/third_party/TopicFM/third_party/aspanformer/tools/reader.py +39 -0
  1019. vismatch/third_party/TopicFM/third_party/aspanformer/tools/undistort_mega.py +69 -0
  1020. vismatch/third_party/TopicFM/third_party/aspanformer/train.py +134 -0
  1021. vismatch/third_party/TopicFM/third_party/loftr/configs/data/__init__.py +0 -0
  1022. vismatch/third_party/TopicFM/third_party/loftr/configs/data/base.py +35 -0
  1023. vismatch/third_party/TopicFM/third_party/loftr/configs/data/megadepth_test_1500.py +11 -0
  1024. vismatch/third_party/TopicFM/third_party/loftr/configs/data/megadepth_trainval_640.py +22 -0
  1025. vismatch/third_party/TopicFM/third_party/loftr/configs/data/megadepth_trainval_840.py +22 -0
  1026. vismatch/third_party/TopicFM/third_party/loftr/configs/data/scannet_test_1500.py +11 -0
  1027. vismatch/third_party/TopicFM/third_party/loftr/configs/data/scannet_trainval.py +17 -0
  1028. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/buggy_pos_enc/loftr_ds.py +6 -0
  1029. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/buggy_pos_enc/loftr_ds_dense.py +8 -0
  1030. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/buggy_pos_enc/loftr_ot.py +6 -0
  1031. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/buggy_pos_enc/loftr_ot_dense.py +8 -0
  1032. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/loftr_ds.py +5 -0
  1033. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/loftr_ds_dense.py +7 -0
  1034. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/loftr_ot.py +5 -0
  1035. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/loftr_ot_dense.py +7 -0
  1036. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/scannet/loftr_ds_eval.py +16 -0
  1037. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/scannet/loftr_ds_eval_new.py +18 -0
  1038. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/buggy_pos_enc/loftr_ds.py +16 -0
  1039. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/buggy_pos_enc/loftr_ds_dense.py +17 -0
  1040. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/buggy_pos_enc/loftr_ot.py +16 -0
  1041. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/buggy_pos_enc/loftr_ot_dense.py +17 -0
  1042. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/loftr_ds.py +15 -0
  1043. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/loftr_ds_dense.py +16 -0
  1044. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/loftr_ot.py +15 -0
  1045. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/loftr_ot_dense.py +16 -0
  1046. vismatch/third_party/TopicFM/third_party/loftr/demo/demo_loftr.py +240 -0
  1047. vismatch/third_party/TopicFM/third_party/loftr/src/__init__.py +0 -0
  1048. vismatch/third_party/TopicFM/third_party/loftr/src/config/default.py +171 -0
  1049. vismatch/third_party/TopicFM/third_party/loftr/src/datasets/megadepth.py +127 -0
  1050. vismatch/third_party/TopicFM/third_party/loftr/src/datasets/sampler.py +77 -0
  1051. vismatch/third_party/TopicFM/third_party/loftr/src/datasets/scannet.py +114 -0
  1052. vismatch/third_party/TopicFM/third_party/loftr/src/lightning/data.py +320 -0
  1053. vismatch/third_party/TopicFM/third_party/loftr/src/lightning/lightning_loftr.py +249 -0
  1054. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/__init__.py +2 -0
  1055. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/backbone/__init__.py +11 -0
  1056. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/backbone/resnet_fpn.py +199 -0
  1057. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/loftr.py +81 -0
  1058. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/loftr_module/__init__.py +2 -0
  1059. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/loftr_module/fine_preprocess.py +59 -0
  1060. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/loftr_module/linear_attention.py +81 -0
  1061. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/loftr_module/transformer.py +101 -0
  1062. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/utils/coarse_matching.py +261 -0
  1063. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/utils/cvpr_ds_config.py +50 -0
  1064. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/utils/fine_matching.py +74 -0
  1065. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/utils/geometry.py +54 -0
  1066. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/utils/position_encoding.py +42 -0
  1067. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/utils/supervision.py +151 -0
  1068. vismatch/third_party/TopicFM/third_party/loftr/src/losses/loftr_loss.py +192 -0
  1069. vismatch/third_party/TopicFM/third_party/loftr/src/optimizers/__init__.py +42 -0
  1070. vismatch/third_party/TopicFM/third_party/loftr/src/utils/augment.py +55 -0
  1071. vismatch/third_party/TopicFM/third_party/loftr/src/utils/comm.py +265 -0
  1072. vismatch/third_party/TopicFM/third_party/loftr/src/utils/dataloader.py +23 -0
  1073. vismatch/third_party/TopicFM/third_party/loftr/src/utils/dataset.py +185 -0
  1074. vismatch/third_party/TopicFM/third_party/loftr/src/utils/metrics.py +193 -0
  1075. vismatch/third_party/TopicFM/third_party/loftr/src/utils/misc.py +101 -0
  1076. vismatch/third_party/TopicFM/third_party/loftr/src/utils/plotting.py +154 -0
  1077. vismatch/third_party/TopicFM/third_party/loftr/src/utils/profiler.py +39 -0
  1078. vismatch/third_party/TopicFM/third_party/loftr/test.py +68 -0
  1079. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/demo_superglue.py +259 -0
  1080. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/match_pairs.py +425 -0
  1081. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/models/__init__.py +0 -0
  1082. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/models/matching.py +84 -0
  1083. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/models/superglue.py +283 -0
  1084. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/models/superpoint.py +202 -0
  1085. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/models/utils.py +555 -0
  1086. vismatch/third_party/TopicFM/third_party/loftr/train.py +123 -0
  1087. vismatch/third_party/TopicFM/third_party/matchformer/config/data/__init__.py +0 -0
  1088. vismatch/third_party/TopicFM/third_party/matchformer/config/data/base.py +35 -0
  1089. vismatch/third_party/TopicFM/third_party/matchformer/config/data/megadepth_test_1500.py +11 -0
  1090. vismatch/third_party/TopicFM/third_party/matchformer/config/data/scannet_test_1500.py +11 -0
  1091. vismatch/third_party/TopicFM/third_party/matchformer/config/defaultmf.py +88 -0
  1092. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/__init__.py +17 -0
  1093. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/coarse_matching.py +228 -0
  1094. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/fine_matching.py +74 -0
  1095. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/fine_preprocess.py +59 -0
  1096. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/match_LA_large.py +254 -0
  1097. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/match_LA_lite.py +254 -0
  1098. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/match_SEA_large.py +291 -0
  1099. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/match_SEA_lite.py +291 -0
  1100. vismatch/third_party/TopicFM/third_party/matchformer/model/data.py +320 -0
  1101. vismatch/third_party/TopicFM/third_party/matchformer/model/datasets/dataset.py +231 -0
  1102. vismatch/third_party/TopicFM/third_party/matchformer/model/datasets/megadepth.py +126 -0
  1103. vismatch/third_party/TopicFM/third_party/matchformer/model/datasets/sampler.py +77 -0
  1104. vismatch/third_party/TopicFM/third_party/matchformer/model/datasets/scannet.py +113 -0
  1105. vismatch/third_party/TopicFM/third_party/matchformer/model/lightning_loftr.py +102 -0
  1106. vismatch/third_party/TopicFM/third_party/matchformer/model/matchformer.py +54 -0
  1107. vismatch/third_party/TopicFM/third_party/matchformer/model/utils/augment.py +55 -0
  1108. vismatch/third_party/TopicFM/third_party/matchformer/model/utils/comm.py +265 -0
  1109. vismatch/third_party/TopicFM/third_party/matchformer/model/utils/dataloader.py +23 -0
  1110. vismatch/third_party/TopicFM/third_party/matchformer/model/utils/metrics.py +193 -0
  1111. vismatch/third_party/TopicFM/third_party/matchformer/model/utils/misc.py +101 -0
  1112. vismatch/third_party/TopicFM/third_party/matchformer/model/utils/profiler.py +39 -0
  1113. vismatch/third_party/TopicFM/third_party/matchformer/test.py +55 -0
  1114. vismatch/third_party/TopicFM/train.py +123 -0
  1115. vismatch/third_party/TopicFM/visualization.py +123 -0
  1116. vismatch/third_party/TopicFM/viz/__init__.py +1 -0
  1117. vismatch/third_party/TopicFM/viz/configs/__init__.py +0 -0
  1118. vismatch/third_party/TopicFM/viz/methods/__init__.py +0 -0
  1119. vismatch/third_party/TopicFM/viz/methods/base.py +70 -0
  1120. vismatch/third_party/TopicFM/viz/methods/topicfmv2.py +208 -0
  1121. vismatch/third_party/UFM/UniCeption/examples/models/cosmos/autoencoding.py +48 -0
  1122. vismatch/third_party/UFM/UniCeption/examples/models/dust3r/convert_dust3r_weights_to_uniception.py +331 -0
  1123. vismatch/third_party/UFM/UniCeption/examples/models/dust3r/dust3r.py +261 -0
  1124. vismatch/third_party/UFM/UniCeption/examples/models/dust3r/profile_dust3r.py +47 -0
  1125. vismatch/third_party/UFM/UniCeption/scripts/check_dependencies.py +48 -0
  1126. vismatch/third_party/UFM/UniCeption/scripts/download_checkpoints.py +50 -0
  1127. vismatch/third_party/UFM/UniCeption/scripts/install_croco_rope.py +61 -0
  1128. vismatch/third_party/UFM/UniCeption/scripts/prepare_offline_install.py +398 -0
  1129. vismatch/third_party/UFM/UniCeption/scripts/validate_installation.py +212 -0
  1130. vismatch/third_party/UFM/UniCeption/setup.py +185 -0
  1131. vismatch/third_party/UFM/UniCeption/tests/models/encoders/conftest.py +26 -0
  1132. vismatch/third_party/UFM/UniCeption/tests/models/encoders/test_encoders.py +202 -0
  1133. vismatch/third_party/UFM/UniCeption/tests/models/encoders/viz_image_encoders.py +294 -0
  1134. vismatch/third_party/UFM/UniCeption/tests/models/info_sharing/viz_mulit_view_cross_attn_transformers.py +337 -0
  1135. vismatch/third_party/UFM/UniCeption/uniception/__init__.py +0 -0
  1136. vismatch/third_party/UFM/UniCeption/uniception/models/__init__.py +0 -0
  1137. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/__init__.py +225 -0
  1138. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/base.py +157 -0
  1139. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/cosmos.py +137 -0
  1140. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/croco.py +457 -0
  1141. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/dense_rep_encoder.py +344 -0
  1142. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/dinov2.py +333 -0
  1143. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/global_rep_encoder.py +115 -0
  1144. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/image_normalizations.py +35 -0
  1145. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/list.py +10 -0
  1146. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/patch_embedder.py +235 -0
  1147. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/radio.py +367 -0
  1148. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/utils.py +86 -0
  1149. vismatch/third_party/UFM/UniCeption/uniception/models/factory/__init__.py +3 -0
  1150. vismatch/third_party/UFM/UniCeption/uniception/models/factory/dust3r.py +332 -0
  1151. vismatch/third_party/UFM/UniCeption/uniception/models/info_sharing/__init__.py +39 -0
  1152. vismatch/third_party/UFM/UniCeption/uniception/models/info_sharing/alternating_attention_transformer.py +973 -0
  1153. vismatch/third_party/UFM/UniCeption/uniception/models/info_sharing/base.py +116 -0
  1154. vismatch/third_party/UFM/UniCeption/uniception/models/info_sharing/cross_attention_transformer.py +612 -0
  1155. vismatch/third_party/UFM/UniCeption/uniception/models/info_sharing/diff_cross_attention_transformer.py +588 -0
  1156. vismatch/third_party/UFM/UniCeption/uniception/models/info_sharing/global_attention_transformer.py +1154 -0
  1157. vismatch/third_party/UFM/UniCeption/uniception/models/libs/__init__.py +0 -0
  1158. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/__init__.py +14 -0
  1159. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/image_cli.py +175 -0
  1160. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/image_lib.py +123 -0
  1161. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/__init__.py +60 -0
  1162. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/distributions.py +41 -0
  1163. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/layers2d.py +326 -0
  1164. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/layers3d.py +965 -0
  1165. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/patching.py +310 -0
  1166. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/quantizers.py +510 -0
  1167. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/utils.py +115 -0
  1168. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/networks/__init__.py +39 -0
  1169. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/networks/configs.py +146 -0
  1170. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/networks/continuous_image.py +86 -0
  1171. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/networks/continuous_video.py +98 -0
  1172. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/networks/discrete_image.py +113 -0
  1173. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/networks/discrete_video.py +115 -0
  1174. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/utils.py +402 -0
  1175. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/video_cli.py +195 -0
  1176. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/video_lib.py +145 -0
  1177. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/__init__.py +0 -0
  1178. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/blocks.py +249 -0
  1179. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/curope/__init__.py +4 -0
  1180. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/curope/curope2d.py +39 -0
  1181. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/curope/setup.py +33 -0
  1182. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/dpt_block.py +530 -0
  1183. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/patch_embed.py +127 -0
  1184. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/pos_embed.py +155 -0
  1185. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/__init__.py +18 -0
  1186. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/adaptors.py +1765 -0
  1187. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/base.py +210 -0
  1188. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/cosmos.py +211 -0
  1189. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/dpt.py +676 -0
  1190. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/global_head.py +142 -0
  1191. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/linear.py +95 -0
  1192. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/mlp_feature.py +114 -0
  1193. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/mlp_head.py +114 -0
  1194. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/moge_conv.py +342 -0
  1195. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/pose_head.py +181 -0
  1196. vismatch/third_party/UFM/UniCeption/uniception/models/utils/__init__.py +0 -0
  1197. vismatch/third_party/UFM/UniCeption/uniception/models/utils/config.py +34 -0
  1198. vismatch/third_party/UFM/UniCeption/uniception/models/utils/intermediate_feature_return.py +85 -0
  1199. vismatch/third_party/UFM/UniCeption/uniception/models/utils/positional_encoding.py +23 -0
  1200. vismatch/third_party/UFM/UniCeption/uniception/models/utils/transformer_blocks.py +1072 -0
  1201. vismatch/third_party/UFM/UniCeption/uniception/utils/__init__.py +0 -0
  1202. vismatch/third_party/UFM/UniCeption/uniception/utils/profile.py +13 -0
  1203. vismatch/third_party/UFM/UniCeption/uniception/utils/viz.py +99 -0
  1204. vismatch/third_party/UFM/example_inference.py +138 -0
  1205. vismatch/third_party/UFM/gradio_demo.py +238 -0
  1206. vismatch/third_party/UFM/setup.py +86 -0
  1207. vismatch/third_party/UFM/uniflowmatch/__init__.py +16 -0
  1208. vismatch/third_party/UFM/uniflowmatch/cli.py +217 -0
  1209. vismatch/third_party/UFM/uniflowmatch/models/__init__.py +25 -0
  1210. vismatch/third_party/UFM/uniflowmatch/models/base.py +334 -0
  1211. vismatch/third_party/UFM/uniflowmatch/models/ufm.py +1323 -0
  1212. vismatch/third_party/UFM/uniflowmatch/models/unet_encoder.py +90 -0
  1213. vismatch/third_party/UFM/uniflowmatch/models/utils.py +16 -0
  1214. vismatch/third_party/UFM/uniflowmatch/utils/__init__.py +63 -0
  1215. vismatch/third_party/UFM/uniflowmatch/utils/flow_resizing.py +1091 -0
  1216. vismatch/third_party/UFM/uniflowmatch/utils/geometry.py +612 -0
  1217. vismatch/third_party/UFM/uniflowmatch/utils/viz.py +97 -0
  1218. vismatch/third_party/XoFTR/configs/data/__init__.py +0 -0
  1219. vismatch/third_party/XoFTR/configs/data/base.py +35 -0
  1220. vismatch/third_party/XoFTR/configs/data/megadepth_trainval_840.py +22 -0
  1221. vismatch/third_party/XoFTR/configs/data/megadepth_vistir_trainval_640.py +23 -0
  1222. vismatch/third_party/XoFTR/configs/data/pretrain.py +8 -0
  1223. vismatch/third_party/XoFTR/configs/xoftr/outdoor/visible_thermal.py +17 -0
  1224. vismatch/third_party/XoFTR/configs/xoftr/pretrain/pretrain.py +12 -0
  1225. vismatch/third_party/XoFTR/pretrain.py +125 -0
  1226. vismatch/third_party/XoFTR/src/__init__.py +0 -0
  1227. vismatch/third_party/XoFTR/src/config/default.py +203 -0
  1228. vismatch/third_party/XoFTR/src/datasets/megadepth.py +143 -0
  1229. vismatch/third_party/XoFTR/src/datasets/pretrain_dataset.py +156 -0
  1230. vismatch/third_party/XoFTR/src/datasets/sampler.py +77 -0
  1231. vismatch/third_party/XoFTR/src/datasets/scannet.py +114 -0
  1232. vismatch/third_party/XoFTR/src/datasets/vistir.py +109 -0
  1233. vismatch/third_party/XoFTR/src/lightning/data.py +346 -0
  1234. vismatch/third_party/XoFTR/src/lightning/data_pretrain.py +125 -0
  1235. vismatch/third_party/XoFTR/src/lightning/lightning_xoftr.py +334 -0
  1236. vismatch/third_party/XoFTR/src/lightning/lightning_xoftr_pretrain.py +171 -0
  1237. vismatch/third_party/XoFTR/src/losses/xoftr_loss.py +170 -0
  1238. vismatch/third_party/XoFTR/src/losses/xoftr_loss_pretrain.py +37 -0
  1239. vismatch/third_party/XoFTR/src/optimizers/__init__.py +42 -0
  1240. vismatch/third_party/XoFTR/src/utils/augment.py +113 -0
  1241. vismatch/third_party/XoFTR/src/utils/comm.py +265 -0
  1242. vismatch/third_party/XoFTR/src/utils/data_io.py +144 -0
  1243. vismatch/third_party/XoFTR/src/utils/dataloader.py +23 -0
  1244. vismatch/third_party/XoFTR/src/utils/dataset.py +279 -0
  1245. vismatch/third_party/XoFTR/src/utils/metrics.py +211 -0
  1246. vismatch/third_party/XoFTR/src/utils/misc.py +101 -0
  1247. vismatch/third_party/XoFTR/src/utils/plotting.py +227 -0
  1248. vismatch/third_party/XoFTR/src/utils/pretrain_utils.py +83 -0
  1249. vismatch/third_party/XoFTR/src/utils/profiler.py +39 -0
  1250. vismatch/third_party/XoFTR/src/xoftr/__init__.py +2 -0
  1251. vismatch/third_party/XoFTR/src/xoftr/backbone/__init__.py +1 -0
  1252. vismatch/third_party/XoFTR/src/xoftr/backbone/resnet.py +95 -0
  1253. vismatch/third_party/XoFTR/src/xoftr/utils/geometry.py +107 -0
  1254. vismatch/third_party/XoFTR/src/xoftr/utils/position_encoding.py +36 -0
  1255. vismatch/third_party/XoFTR/src/xoftr/utils/supervision.py +290 -0
  1256. vismatch/third_party/XoFTR/src/xoftr/xoftr.py +94 -0
  1257. vismatch/third_party/XoFTR/src/xoftr/xoftr_module/__init__.py +4 -0
  1258. vismatch/third_party/XoFTR/src/xoftr/xoftr_module/coarse_matching.py +305 -0
  1259. vismatch/third_party/XoFTR/src/xoftr/xoftr_module/fine_matching.py +170 -0
  1260. vismatch/third_party/XoFTR/src/xoftr/xoftr_module/fine_process.py +321 -0
  1261. vismatch/third_party/XoFTR/src/xoftr/xoftr_module/linear_attention.py +81 -0
  1262. vismatch/third_party/XoFTR/src/xoftr/xoftr_module/transformer.py +101 -0
  1263. vismatch/third_party/XoFTR/src/xoftr/xoftr_pretrain.py +209 -0
  1264. vismatch/third_party/XoFTR/test.py +68 -0
  1265. vismatch/third_party/XoFTR/test_relative_pose.py +330 -0
  1266. vismatch/third_party/XoFTR/train.py +126 -0
  1267. vismatch/third_party/accelerated_features/hubconf.py +15 -0
  1268. vismatch/third_party/accelerated_features/minimal_example.py +49 -0
  1269. vismatch/third_party/accelerated_features/modules/__init__.py +4 -0
  1270. vismatch/third_party/accelerated_features/modules/dataset/__init__.py +5 -0
  1271. vismatch/third_party/accelerated_features/modules/dataset/augmentation.py +314 -0
  1272. vismatch/third_party/accelerated_features/modules/dataset/megadepth/__init__.py +7 -0
  1273. vismatch/third_party/accelerated_features/modules/dataset/megadepth/megadepth.py +174 -0
  1274. vismatch/third_party/accelerated_features/modules/dataset/megadepth/megadepth_warper.py +170 -0
  1275. vismatch/third_party/accelerated_features/modules/dataset/megadepth/utils.py +160 -0
  1276. vismatch/third_party/accelerated_features/modules/interpolator.py +33 -0
  1277. vismatch/third_party/accelerated_features/modules/lighterglue.py +56 -0
  1278. vismatch/third_party/accelerated_features/modules/model.py +154 -0
  1279. vismatch/third_party/accelerated_features/modules/training/__init__.py +4 -0
  1280. vismatch/third_party/accelerated_features/modules/training/losses.py +224 -0
  1281. vismatch/third_party/accelerated_features/modules/training/train.py +311 -0
  1282. vismatch/third_party/accelerated_features/modules/training/utils.py +200 -0
  1283. vismatch/third_party/accelerated_features/modules/xfeat.py +402 -0
  1284. vismatch/third_party/accelerated_features/realtime_demo.py +295 -0
  1285. vismatch/third_party/accelerated_features/third_party/ALIKE/alike.py +143 -0
  1286. vismatch/third_party/accelerated_features/third_party/ALIKE/alnet.py +164 -0
  1287. vismatch/third_party/accelerated_features/third_party/ALIKE/demo.py +167 -0
  1288. vismatch/third_party/accelerated_features/third_party/ALIKE/hseq/eval.py +162 -0
  1289. vismatch/third_party/accelerated_features/third_party/ALIKE/hseq/extract.py +159 -0
  1290. vismatch/third_party/accelerated_features/third_party/ALIKE/soft_detect.py +194 -0
  1291. vismatch/third_party/accelerated_features/third_party/__init__.py +4 -0
  1292. vismatch/third_party/accelerated_features/third_party/alike_wrapper.py +110 -0
  1293. vismatch/third_party/affine-steerers/affine_steerers/__init__.py +7 -0
  1294. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/__init__.py +5 -0
  1295. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/hpatches.py +92 -0
  1296. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/hpatches_oracle_steer.py +108 -0
  1297. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/mega_pose_est.py +116 -0
  1298. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/mega_pose_est_mnn.py +162 -0
  1299. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/nll_benchmark.py +57 -0
  1300. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/num_inliers.py +76 -0
  1301. vismatch/third_party/affine-steerers/affine_steerers/checkpoint.py +82 -0
  1302. vismatch/third_party/affine-steerers/affine_steerers/datasets/__init__.py +0 -0
  1303. vismatch/third_party/affine-steerers/affine_steerers/datasets/homog.py +284 -0
  1304. vismatch/third_party/affine-steerers/affine_steerers/datasets/megadepth.py +408 -0
  1305. vismatch/third_party/affine-steerers/affine_steerers/decoder.py +90 -0
  1306. vismatch/third_party/affine-steerers/affine_steerers/descriptors/__init__.py +0 -0
  1307. vismatch/third_party/affine-steerers/affine_steerers/descriptors/dedode_descriptor.py +77 -0
  1308. vismatch/third_party/affine-steerers/affine_steerers/descriptors/descriptor_loss.py +358 -0
  1309. vismatch/third_party/affine-steerers/affine_steerers/detectors/__init__.py +0 -0
  1310. vismatch/third_party/affine-steerers/affine_steerers/detectors/dedode_detector.py +75 -0
  1311. vismatch/third_party/affine-steerers/affine_steerers/detectors/keypoint_loss.py +215 -0
  1312. vismatch/third_party/affine-steerers/affine_steerers/encoder.py +87 -0
  1313. vismatch/third_party/affine-steerers/affine_steerers/matchers/__init__.py +0 -0
  1314. vismatch/third_party/affine-steerers/affine_steerers/matchers/dual_softmax_matcher.py +816 -0
  1315. vismatch/third_party/affine-steerers/affine_steerers/model_zoo/__init__.py +3 -0
  1316. vismatch/third_party/affine-steerers/affine_steerers/model_zoo/dedode_models.py +298 -0
  1317. vismatch/third_party/affine-steerers/affine_steerers/steerers.py +732 -0
  1318. vismatch/third_party/affine-steerers/affine_steerers/train.py +90 -0
  1319. vismatch/third_party/affine-steerers/affine_steerers/transformer/__init__.py +8 -0
  1320. vismatch/third_party/affine-steerers/affine_steerers/transformer/dinov2.py +359 -0
  1321. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/__init__.py +12 -0
  1322. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/attention.py +81 -0
  1323. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/block.py +252 -0
  1324. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/dino_head.py +59 -0
  1325. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/drop_path.py +35 -0
  1326. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/layer_scale.py +28 -0
  1327. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/mlp.py +41 -0
  1328. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/patch_embed.py +89 -0
  1329. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/swiglu_ffn.py +63 -0
  1330. vismatch/third_party/affine-steerers/affine_steerers/utils.py +1422 -0
  1331. vismatch/third_party/affine-steerers/experiments/aff_equi_B.py +182 -0
  1332. vismatch/third_party/affine-steerers/experiments/aff_equi_G.py +193 -0
  1333. vismatch/third_party/affine-steerers/experiments/aff_steer_B.py +213 -0
  1334. vismatch/third_party/affine-steerers/experiments/aff_steer_G.py +223 -0
  1335. vismatch/third_party/affine-steerers/experiments/aff_steer_pretrain_B.py +187 -0
  1336. vismatch/third_party/affine-steerers/experiments/aff_steer_pretrain_G.py +198 -0
  1337. vismatch/third_party/affine-steerers/setup.py +15 -0
  1338. vismatch/third_party/aspanformer/configs/aspan/indoor/aspan_test.py +7 -0
  1339. vismatch/third_party/aspanformer/configs/aspan/indoor/aspan_train.py +8 -0
  1340. vismatch/third_party/aspanformer/configs/aspan/outdoor/aspan_test.py +19 -0
  1341. vismatch/third_party/aspanformer/configs/aspan/outdoor/aspan_train.py +17 -0
  1342. vismatch/third_party/aspanformer/configs/data/__init__.py +0 -0
  1343. vismatch/third_party/aspanformer/configs/data/base.py +35 -0
  1344. vismatch/third_party/aspanformer/configs/data/megadepth_test_1500.py +13 -0
  1345. vismatch/third_party/aspanformer/configs/data/megadepth_trainval_832.py +22 -0
  1346. vismatch/third_party/aspanformer/configs/data/scannet_test_1500.py +11 -0
  1347. vismatch/third_party/aspanformer/configs/data/scannet_trainval.py +17 -0
  1348. vismatch/third_party/aspanformer/demo/demo.py +63 -0
  1349. vismatch/third_party/aspanformer/demo/demo_utils.py +44 -0
  1350. vismatch/third_party/aspanformer/src/ASpanFormer/__init__.py +2 -0
  1351. vismatch/third_party/aspanformer/src/ASpanFormer/aspan_module/__init__.py +3 -0
  1352. vismatch/third_party/aspanformer/src/ASpanFormer/aspan_module/attention.py +198 -0
  1353. vismatch/third_party/aspanformer/src/ASpanFormer/aspan_module/fine_preprocess.py +59 -0
  1354. vismatch/third_party/aspanformer/src/ASpanFormer/aspan_module/loftr.py +112 -0
  1355. vismatch/third_party/aspanformer/src/ASpanFormer/aspan_module/transformer.py +244 -0
  1356. vismatch/third_party/aspanformer/src/ASpanFormer/aspanformer.py +152 -0
  1357. vismatch/third_party/aspanformer/src/ASpanFormer/backbone/__init__.py +11 -0
  1358. vismatch/third_party/aspanformer/src/ASpanFormer/backbone/resnet_fpn.py +199 -0
  1359. vismatch/third_party/aspanformer/src/ASpanFormer/utils/coarse_matching.py +331 -0
  1360. vismatch/third_party/aspanformer/src/ASpanFormer/utils/cvpr_ds_config.py +50 -0
  1361. vismatch/third_party/aspanformer/src/ASpanFormer/utils/fine_matching.py +74 -0
  1362. vismatch/third_party/aspanformer/src/ASpanFormer/utils/geometry.py +54 -0
  1363. vismatch/third_party/aspanformer/src/ASpanFormer/utils/position_encoding.py +61 -0
  1364. vismatch/third_party/aspanformer/src/ASpanFormer/utils/supervision.py +151 -0
  1365. vismatch/third_party/aspanformer/src/__init__.py +0 -0
  1366. vismatch/third_party/aspanformer/src/config/default.py +180 -0
  1367. vismatch/third_party/aspanformer/src/datasets/__init__.py +3 -0
  1368. vismatch/third_party/aspanformer/src/datasets/megadepth.py +127 -0
  1369. vismatch/third_party/aspanformer/src/datasets/sampler.py +77 -0
  1370. vismatch/third_party/aspanformer/src/datasets/scannet.py +113 -0
  1371. vismatch/third_party/aspanformer/src/lightning/data.py +326 -0
  1372. vismatch/third_party/aspanformer/src/lightning/lightning_aspanformer.py +276 -0
  1373. vismatch/third_party/aspanformer/src/losses/aspan_loss.py +231 -0
  1374. vismatch/third_party/aspanformer/src/optimizers/__init__.py +42 -0
  1375. vismatch/third_party/aspanformer/src/utils/augment.py +55 -0
  1376. vismatch/third_party/aspanformer/src/utils/comm.py +265 -0
  1377. vismatch/third_party/aspanformer/src/utils/dataloader.py +23 -0
  1378. vismatch/third_party/aspanformer/src/utils/dataset.py +222 -0
  1379. vismatch/third_party/aspanformer/src/utils/metrics.py +260 -0
  1380. vismatch/third_party/aspanformer/src/utils/misc.py +139 -0
  1381. vismatch/third_party/aspanformer/src/utils/plotting.py +219 -0
  1382. vismatch/third_party/aspanformer/src/utils/profiler.py +39 -0
  1383. vismatch/third_party/aspanformer/test.py +69 -0
  1384. vismatch/third_party/aspanformer/tools/SensorData.py +125 -0
  1385. vismatch/third_party/aspanformer/tools/extract.py +47 -0
  1386. vismatch/third_party/aspanformer/tools/preprocess_scene.py +242 -0
  1387. vismatch/third_party/aspanformer/tools/reader.py +39 -0
  1388. vismatch/third_party/aspanformer/tools/undistort_mega.py +69 -0
  1389. vismatch/third_party/aspanformer/train.py +134 -0
  1390. vismatch/third_party/duster/croco/datasets/__init__.py +0 -0
  1391. vismatch/third_party/duster/croco/datasets/crops/extract_crops_from_images.py +159 -0
  1392. vismatch/third_party/duster/croco/datasets/habitat_sim/__init__.py +0 -0
  1393. vismatch/third_party/duster/croco/datasets/habitat_sim/generate_from_metadata.py +92 -0
  1394. vismatch/third_party/duster/croco/datasets/habitat_sim/generate_from_metadata_files.py +27 -0
  1395. vismatch/third_party/duster/croco/datasets/habitat_sim/generate_multiview_images.py +177 -0
  1396. vismatch/third_party/duster/croco/datasets/habitat_sim/multiview_habitat_sim_generator.py +390 -0
  1397. vismatch/third_party/duster/croco/datasets/habitat_sim/pack_metadata_files.py +69 -0
  1398. vismatch/third_party/duster/croco/datasets/habitat_sim/paths.py +129 -0
  1399. vismatch/third_party/duster/croco/datasets/pairs_dataset.py +109 -0
  1400. vismatch/third_party/duster/croco/datasets/transforms.py +95 -0
  1401. vismatch/third_party/duster/croco/demo.py +55 -0
  1402. vismatch/third_party/duster/croco/models/blocks.py +241 -0
  1403. vismatch/third_party/duster/croco/models/criterion.py +37 -0
  1404. vismatch/third_party/duster/croco/models/croco.py +249 -0
  1405. vismatch/third_party/duster/croco/models/croco_downstream.py +122 -0
  1406. vismatch/third_party/duster/croco/models/curope/__init__.py +4 -0
  1407. vismatch/third_party/duster/croco/models/curope/curope2d.py +40 -0
  1408. vismatch/third_party/duster/croco/models/curope/setup.py +34 -0
  1409. vismatch/third_party/duster/croco/models/dpt_block.py +450 -0
  1410. vismatch/third_party/duster/croco/models/head_downstream.py +58 -0
  1411. vismatch/third_party/duster/croco/models/masking.py +25 -0
  1412. vismatch/third_party/duster/croco/models/pos_embed.py +157 -0
  1413. vismatch/third_party/duster/croco/pretrain.py +254 -0
  1414. vismatch/third_party/duster/croco/stereoflow/augmentor.py +290 -0
  1415. vismatch/third_party/duster/croco/stereoflow/criterion.py +251 -0
  1416. vismatch/third_party/duster/croco/stereoflow/datasets_flow.py +630 -0
  1417. vismatch/third_party/duster/croco/stereoflow/datasets_stereo.py +674 -0
  1418. vismatch/third_party/duster/croco/stereoflow/engine.py +280 -0
  1419. vismatch/third_party/duster/croco/stereoflow/test.py +216 -0
  1420. vismatch/third_party/duster/croco/stereoflow/train.py +253 -0
  1421. vismatch/third_party/duster/croco/utils/misc.py +463 -0
  1422. vismatch/third_party/duster/datasets_preprocess/habitat/find_scenes.py +78 -0
  1423. vismatch/third_party/duster/datasets_preprocess/habitat/habitat_renderer/__init__.py +2 -0
  1424. vismatch/third_party/duster/datasets_preprocess/habitat/habitat_renderer/habitat_sim_envmaps_renderer.py +170 -0
  1425. vismatch/third_party/duster/datasets_preprocess/habitat/habitat_renderer/multiview_crop_generator.py +93 -0
  1426. vismatch/third_party/duster/datasets_preprocess/habitat/habitat_renderer/projections.py +151 -0
  1427. vismatch/third_party/duster/datasets_preprocess/habitat/habitat_renderer/projections_conversions.py +45 -0
  1428. vismatch/third_party/duster/datasets_preprocess/habitat/preprocess_habitat.py +121 -0
  1429. vismatch/third_party/duster/datasets_preprocess/path_to_root.py +13 -0
  1430. vismatch/third_party/duster/datasets_preprocess/preprocess_arkitscenes.py +355 -0
  1431. vismatch/third_party/duster/datasets_preprocess/preprocess_blendedMVS.py +149 -0
  1432. vismatch/third_party/duster/datasets_preprocess/preprocess_co3d.py +295 -0
  1433. vismatch/third_party/duster/datasets_preprocess/preprocess_megadepth.py +198 -0
  1434. vismatch/third_party/duster/datasets_preprocess/preprocess_scannetpp.py +400 -0
  1435. vismatch/third_party/duster/datasets_preprocess/preprocess_staticthings3d.py +130 -0
  1436. vismatch/third_party/duster/datasets_preprocess/preprocess_waymo.py +257 -0
  1437. vismatch/third_party/duster/datasets_preprocess/preprocess_wildrgbd.py +209 -0
  1438. vismatch/third_party/duster/demo.py +45 -0
  1439. vismatch/third_party/duster/dust3r/__init__.py +2 -0
  1440. vismatch/third_party/duster/dust3r/cloud_opt/__init__.py +33 -0
  1441. vismatch/third_party/duster/dust3r/cloud_opt/base_opt.py +405 -0
  1442. vismatch/third_party/duster/dust3r/cloud_opt/commons.py +90 -0
  1443. vismatch/third_party/duster/dust3r/cloud_opt/init_im_poses.py +316 -0
  1444. vismatch/third_party/duster/dust3r/cloud_opt/modular_optimizer.py +145 -0
  1445. vismatch/third_party/duster/dust3r/cloud_opt/optimizer.py +248 -0
  1446. vismatch/third_party/duster/dust3r/cloud_opt/pair_viewer.py +127 -0
  1447. vismatch/third_party/duster/dust3r/datasets/__init__.py +50 -0
  1448. vismatch/third_party/duster/dust3r/datasets/arkitscenes.py +102 -0
  1449. vismatch/third_party/duster/dust3r/datasets/base/__init__.py +2 -0
  1450. vismatch/third_party/duster/dust3r/datasets/base/base_stereo_view_dataset.py +220 -0
  1451. vismatch/third_party/duster/dust3r/datasets/base/batched_sampler.py +74 -0
  1452. vismatch/third_party/duster/dust3r/datasets/base/easy_dataset.py +157 -0
  1453. vismatch/third_party/duster/dust3r/datasets/blendedmvs.py +104 -0
  1454. vismatch/third_party/duster/dust3r/datasets/co3d.py +165 -0
  1455. vismatch/third_party/duster/dust3r/datasets/habitat.py +107 -0
  1456. vismatch/third_party/duster/dust3r/datasets/megadepth.py +123 -0
  1457. vismatch/third_party/duster/dust3r/datasets/scannetpp.py +96 -0
  1458. vismatch/third_party/duster/dust3r/datasets/staticthings3d.py +96 -0
  1459. vismatch/third_party/duster/dust3r/datasets/utils/__init__.py +2 -0
  1460. vismatch/third_party/duster/dust3r/datasets/utils/cropping.py +124 -0
  1461. vismatch/third_party/duster/dust3r/datasets/utils/transforms.py +11 -0
  1462. vismatch/third_party/duster/dust3r/datasets/waymo.py +93 -0
  1463. vismatch/third_party/duster/dust3r/datasets/wildrgbd.py +67 -0
  1464. vismatch/third_party/duster/dust3r/demo.py +287 -0
  1465. vismatch/third_party/duster/dust3r/heads/__init__.py +19 -0
  1466. vismatch/third_party/duster/dust3r/heads/dpt_head.py +115 -0
  1467. vismatch/third_party/duster/dust3r/heads/linear_head.py +41 -0
  1468. vismatch/third_party/duster/dust3r/heads/postprocess.py +58 -0
  1469. vismatch/third_party/duster/dust3r/image_pairs.py +104 -0
  1470. vismatch/third_party/duster/dust3r/inference.py +150 -0
  1471. vismatch/third_party/duster/dust3r/losses.py +299 -0
  1472. vismatch/third_party/duster/dust3r/model.py +211 -0
  1473. vismatch/third_party/duster/dust3r/optim_factory.py +14 -0
  1474. vismatch/third_party/duster/dust3r/patch_embed.py +70 -0
  1475. vismatch/third_party/duster/dust3r/post_process.py +60 -0
  1476. vismatch/third_party/duster/dust3r/training.py +377 -0
  1477. vismatch/third_party/duster/dust3r/utils/__init__.py +2 -0
  1478. vismatch/third_party/duster/dust3r/utils/device.py +76 -0
  1479. vismatch/third_party/duster/dust3r/utils/geometry.py +366 -0
  1480. vismatch/third_party/duster/dust3r/utils/image.py +128 -0
  1481. vismatch/third_party/duster/dust3r/utils/misc.py +121 -0
  1482. vismatch/third_party/duster/dust3r/utils/parallel.py +79 -0
  1483. vismatch/third_party/duster/dust3r/utils/path_to_croco.py +19 -0
  1484. vismatch/third_party/duster/dust3r/viz.py +381 -0
  1485. vismatch/third_party/duster/dust3r_visloc/__init__.py +2 -0
  1486. vismatch/third_party/duster/dust3r_visloc/datasets/__init__.py +6 -0
  1487. vismatch/third_party/duster/dust3r_visloc/datasets/aachen_day_night.py +24 -0
  1488. vismatch/third_party/duster/dust3r_visloc/datasets/base_colmap.py +282 -0
  1489. vismatch/third_party/duster/dust3r_visloc/datasets/base_dataset.py +19 -0
  1490. vismatch/third_party/duster/dust3r_visloc/datasets/cambridge_landmarks.py +19 -0
  1491. vismatch/third_party/duster/dust3r_visloc/datasets/inloc.py +167 -0
  1492. vismatch/third_party/duster/dust3r_visloc/datasets/sevenscenes.py +123 -0
  1493. vismatch/third_party/duster/dust3r_visloc/datasets/utils.py +118 -0
  1494. vismatch/third_party/duster/dust3r_visloc/evaluation.py +65 -0
  1495. vismatch/third_party/duster/dust3r_visloc/localization.py +140 -0
  1496. vismatch/third_party/duster/train.py +13 -0
  1497. vismatch/third_party/duster/visloc.py +193 -0
  1498. vismatch/third_party/gim/demo.py +479 -0
  1499. vismatch/third_party/gim/dkm/__init__.py +4 -0
  1500. vismatch/third_party/gim/dkm/benchmarks/__init__.py +4 -0
  1501. vismatch/third_party/gim/dkm/benchmarks/hpatches_sequences_homog_benchmark.py +114 -0
  1502. vismatch/third_party/gim/dkm/benchmarks/megadepth1500_benchmark.py +124 -0
  1503. vismatch/third_party/gim/dkm/benchmarks/megadepth_dense_benchmark.py +86 -0
  1504. vismatch/third_party/gim/dkm/benchmarks/scannet_benchmark.py +143 -0
  1505. vismatch/third_party/gim/dkm/checkpointing/__init__.py +1 -0
  1506. vismatch/third_party/gim/dkm/checkpointing/checkpoint.py +31 -0
  1507. vismatch/third_party/gim/dkm/datasets/__init__.py +1 -0
  1508. vismatch/third_party/gim/dkm/datasets/megadepth.py +177 -0
  1509. vismatch/third_party/gim/dkm/datasets/scannet.py +151 -0
  1510. vismatch/third_party/gim/dkm/losses/__init__.py +1 -0
  1511. vismatch/third_party/gim/dkm/losses/depth_match_regression_loss.py +128 -0
  1512. vismatch/third_party/gim/dkm/models/__init__.py +4 -0
  1513. vismatch/third_party/gim/dkm/models/dkm.py +745 -0
  1514. vismatch/third_party/gim/dkm/models/encoders.py +148 -0
  1515. vismatch/third_party/gim/dkm/models/model_zoo/DKMv3.py +148 -0
  1516. vismatch/third_party/gim/dkm/models/model_zoo/__init__.py +39 -0
  1517. vismatch/third_party/gim/dkm/train/__init__.py +1 -0
  1518. vismatch/third_party/gim/dkm/train/train.py +67 -0
  1519. vismatch/third_party/gim/dkm/utils/__init__.py +13 -0
  1520. vismatch/third_party/gim/dkm/utils/kde.py +26 -0
  1521. vismatch/third_party/gim/dkm/utils/local_correlation.py +40 -0
  1522. vismatch/third_party/gim/dkm/utils/transforms.py +104 -0
  1523. vismatch/third_party/gim/dkm/utils/utils.py +341 -0
  1524. vismatch/third_party/gim/gluefactory/__init__.py +17 -0
  1525. vismatch/third_party/gim/gluefactory/datasets/__init__.py +25 -0
  1526. vismatch/third_party/gim/gluefactory/datasets/augmentations.py +244 -0
  1527. vismatch/third_party/gim/gluefactory/datasets/base_dataset.py +206 -0
  1528. vismatch/third_party/gim/gluefactory/datasets/eth3d.py +254 -0
  1529. vismatch/third_party/gim/gluefactory/datasets/homographies.py +311 -0
  1530. vismatch/third_party/gim/gluefactory/datasets/hpatches.py +145 -0
  1531. vismatch/third_party/gim/gluefactory/datasets/image_folder.py +59 -0
  1532. vismatch/third_party/gim/gluefactory/datasets/image_pairs.py +100 -0
  1533. vismatch/third_party/gim/gluefactory/datasets/megadepth.py +514 -0
  1534. vismatch/third_party/gim/gluefactory/datasets/utils.py +131 -0
  1535. vismatch/third_party/gim/gluefactory/eval/__init__.py +20 -0
  1536. vismatch/third_party/gim/gluefactory/eval/eth3d.py +202 -0
  1537. vismatch/third_party/gim/gluefactory/eval/eval_pipeline.py +109 -0
  1538. vismatch/third_party/gim/gluefactory/eval/hpatches.py +203 -0
  1539. vismatch/third_party/gim/gluefactory/eval/inspect.py +61 -0
  1540. vismatch/third_party/gim/gluefactory/eval/io.py +109 -0
  1541. vismatch/third_party/gim/gluefactory/eval/megadepth1500.py +189 -0
  1542. vismatch/third_party/gim/gluefactory/eval/utils.py +272 -0
  1543. vismatch/third_party/gim/gluefactory/geometry/depth.py +88 -0
  1544. vismatch/third_party/gim/gluefactory/geometry/epipolar.py +155 -0
  1545. vismatch/third_party/gim/gluefactory/geometry/gt_generation.py +558 -0
  1546. vismatch/third_party/gim/gluefactory/geometry/homography.py +342 -0
  1547. vismatch/third_party/gim/gluefactory/geometry/utils.py +167 -0
  1548. vismatch/third_party/gim/gluefactory/geometry/wrappers.py +425 -0
  1549. vismatch/third_party/gim/gluefactory/models/__init__.py +30 -0
  1550. vismatch/third_party/gim/gluefactory/models/backbones/__init__.py +0 -0
  1551. vismatch/third_party/gim/gluefactory/models/backbones/dinov2.py +30 -0
  1552. vismatch/third_party/gim/gluefactory/models/base_model.py +157 -0
  1553. vismatch/third_party/gim/gluefactory/models/cache_loader.py +139 -0
  1554. vismatch/third_party/gim/gluefactory/models/extractors/__init__.py +0 -0
  1555. vismatch/third_party/gim/gluefactory/models/extractors/aliked.py +786 -0
  1556. vismatch/third_party/gim/gluefactory/models/extractors/disk_kornia.py +108 -0
  1557. vismatch/third_party/gim/gluefactory/models/extractors/grid_extractor.py +60 -0
  1558. vismatch/third_party/gim/gluefactory/models/extractors/keynet_affnet_hardnet.py +74 -0
  1559. vismatch/third_party/gim/gluefactory/models/extractors/mixed.py +76 -0
  1560. vismatch/third_party/gim/gluefactory/models/extractors/sift.py +234 -0
  1561. vismatch/third_party/gim/gluefactory/models/extractors/sift_kornia.py +46 -0
  1562. vismatch/third_party/gim/gluefactory/models/extractors/superpoint_open.py +210 -0
  1563. vismatch/third_party/gim/gluefactory/models/lines/__init__.py +0 -0
  1564. vismatch/third_party/gim/gluefactory/models/lines/deeplsd.py +106 -0
  1565. vismatch/third_party/gim/gluefactory/models/lines/lsd.py +88 -0
  1566. vismatch/third_party/gim/gluefactory/models/lines/wireframe.py +312 -0
  1567. vismatch/third_party/gim/gluefactory/models/matchers/__init__.py +0 -0
  1568. vismatch/third_party/gim/gluefactory/models/matchers/adalam.py +0 -0
  1569. vismatch/third_party/gim/gluefactory/models/matchers/depth_matcher.py +82 -0
  1570. vismatch/third_party/gim/gluefactory/models/matchers/gluestick.py +776 -0
  1571. vismatch/third_party/gim/gluefactory/models/matchers/homography_matcher.py +66 -0
  1572. vismatch/third_party/gim/gluefactory/models/matchers/kornia_loftr.py +66 -0
  1573. vismatch/third_party/gim/gluefactory/models/matchers/lightglue.py +632 -0
  1574. vismatch/third_party/gim/gluefactory/models/matchers/lightglue_pretrained.py +36 -0
  1575. vismatch/third_party/gim/gluefactory/models/matchers/nearest_neighbor_matcher.py +97 -0
  1576. vismatch/third_party/gim/gluefactory/models/triplet_pipeline.py +99 -0
  1577. vismatch/third_party/gim/gluefactory/models/two_view_pipeline.py +114 -0
  1578. vismatch/third_party/gim/gluefactory/models/utils/__init__.py +0 -0
  1579. vismatch/third_party/gim/gluefactory/models/utils/losses.py +73 -0
  1580. vismatch/third_party/gim/gluefactory/models/utils/metrics.py +50 -0
  1581. vismatch/third_party/gim/gluefactory/models/utils/misc.py +70 -0
  1582. vismatch/third_party/gim/gluefactory/robust_estimators/__init__.py +15 -0
  1583. vismatch/third_party/gim/gluefactory/robust_estimators/base_estimator.py +33 -0
  1584. vismatch/third_party/gim/gluefactory/robust_estimators/homography/__init__.py +0 -0
  1585. vismatch/third_party/gim/gluefactory/robust_estimators/homography/homography_est.py +74 -0
  1586. vismatch/third_party/gim/gluefactory/robust_estimators/homography/opencv.py +53 -0
  1587. vismatch/third_party/gim/gluefactory/robust_estimators/homography/poselib.py +40 -0
  1588. vismatch/third_party/gim/gluefactory/robust_estimators/relative_pose/__init__.py +0 -0
  1589. vismatch/third_party/gim/gluefactory/robust_estimators/relative_pose/opencv.py +64 -0
  1590. vismatch/third_party/gim/gluefactory/robust_estimators/relative_pose/poselib.py +44 -0
  1591. vismatch/third_party/gim/gluefactory/robust_estimators/relative_pose/pycolmap.py +52 -0
  1592. vismatch/third_party/gim/gluefactory/scripts/__init__.py +0 -0
  1593. vismatch/third_party/gim/gluefactory/scripts/export_local_features.py +127 -0
  1594. vismatch/third_party/gim/gluefactory/scripts/export_megadepth.py +173 -0
  1595. vismatch/third_party/gim/gluefactory/settings.py +6 -0
  1596. vismatch/third_party/gim/gluefactory/superpoint.py +361 -0
  1597. vismatch/third_party/gim/gluefactory/train.py +691 -0
  1598. vismatch/third_party/gim/gluefactory/utils/__init__.py +0 -0
  1599. vismatch/third_party/gim/gluefactory/utils/benchmark.py +33 -0
  1600. vismatch/third_party/gim/gluefactory/utils/experiments.py +134 -0
  1601. vismatch/third_party/gim/gluefactory/utils/export_predictions.py +81 -0
  1602. vismatch/third_party/gim/gluefactory/utils/image.py +130 -0
  1603. vismatch/third_party/gim/gluefactory/utils/misc.py +44 -0
  1604. vismatch/third_party/gim/gluefactory/utils/patches.py +50 -0
  1605. vismatch/third_party/gim/gluefactory/utils/stdout_capturing.py +134 -0
  1606. vismatch/third_party/gim/gluefactory/utils/tensor.py +48 -0
  1607. vismatch/third_party/gim/gluefactory/utils/tools.py +269 -0
  1608. vismatch/third_party/gim/gluefactory/visualization/global_frame.py +289 -0
  1609. vismatch/third_party/gim/gluefactory/visualization/tools.py +465 -0
  1610. vismatch/third_party/gim/gluefactory/visualization/two_view_frame.py +158 -0
  1611. vismatch/third_party/gim/gluefactory/visualization/visualize_batch.py +57 -0
  1612. vismatch/third_party/gim/gluefactory/visualization/viz2d.py +486 -0
  1613. vismatch/third_party/imatch-toolbox/configs/d2net.yml +26 -0
  1614. vismatch/third_party/imatch-toolbox/configs/dogaffnethardnet.yml +10 -0
  1615. vismatch/third_party/imatch-toolbox/configs/ncnet.yml +7 -0
  1616. vismatch/third_party/imatch-toolbox/configs/patch2pix.yml +56 -0
  1617. vismatch/third_party/imatch-toolbox/configs/patch2pix_superglue.yml +58 -0
  1618. vismatch/third_party/imatch-toolbox/configs/r2d2.yml +31 -0
  1619. vismatch/third_party/imatch-toolbox/configs/sift.yml +27 -0
  1620. vismatch/third_party/imatch-toolbox/configs/superglue.yml +69 -0
  1621. vismatch/third_party/imatch-toolbox/configs/superpoint.yml +21 -0
  1622. vismatch/third_party/imatch-toolbox/environment.yml +14 -0
  1623. vismatch/third_party/imatch-toolbox/immatch/__init__.py +8 -0
  1624. vismatch/third_party/imatch-toolbox/immatch/eval_aachen.py +88 -0
  1625. vismatch/third_party/imatch-toolbox/immatch/eval_hpatches.py +117 -0
  1626. vismatch/third_party/imatch-toolbox/immatch/eval_inloc.py +45 -0
  1627. vismatch/third_party/imatch-toolbox/immatch/eval_relapose.py +231 -0
  1628. vismatch/third_party/imatch-toolbox/immatch/eval_robotcar.py +83 -0
  1629. vismatch/third_party/imatch-toolbox/immatch/modules/__init__.py +0 -0
  1630. vismatch/third_party/imatch-toolbox/immatch/modules/base.py +89 -0
  1631. vismatch/third_party/imatch-toolbox/immatch/modules/d2net.py +69 -0
  1632. vismatch/third_party/imatch-toolbox/immatch/modules/dogaffnethardnet.py +94 -0
  1633. vismatch/third_party/imatch-toolbox/immatch/modules/nn_matching.py +31 -0
  1634. vismatch/third_party/imatch-toolbox/immatch/modules/patch2pix.py +126 -0
  1635. vismatch/third_party/imatch-toolbox/immatch/modules/r2d2.py +64 -0
  1636. vismatch/third_party/imatch-toolbox/immatch/modules/sift.py +67 -0
  1637. vismatch/third_party/imatch-toolbox/immatch/modules/superglue.py +62 -0
  1638. vismatch/third_party/imatch-toolbox/immatch/modules/superpoint.py +56 -0
  1639. vismatch/third_party/imatch-toolbox/immatch/utils/__init__.py +13 -0
  1640. vismatch/third_party/imatch-toolbox/immatch/utils/colmap/data_parsing.py +257 -0
  1641. vismatch/third_party/imatch-toolbox/immatch/utils/colmap/database.py +362 -0
  1642. vismatch/third_party/imatch-toolbox/immatch/utils/colmap/read_write_model.py +506 -0
  1643. vismatch/third_party/imatch-toolbox/immatch/utils/data_io.py +111 -0
  1644. vismatch/third_party/imatch-toolbox/immatch/utils/hpatches_helper.py +242 -0
  1645. vismatch/third_party/imatch-toolbox/immatch/utils/localize_sfm_helper.py +403 -0
  1646. vismatch/third_party/imatch-toolbox/immatch/utils/metrics.py +90 -0
  1647. vismatch/third_party/imatch-toolbox/immatch/utils/model_helper.py +27 -0
  1648. vismatch/third_party/imatch-toolbox/setup.py +36 -0
  1649. vismatch/third_party/imatch-toolbox/third_party/d2net/extract_features.py +156 -0
  1650. vismatch/third_party/imatch-toolbox/third_party/d2net/extract_kapture.py +248 -0
  1651. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/dataset.py +239 -0
  1652. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/exceptions.py +6 -0
  1653. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/loss.py +340 -0
  1654. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/model.py +121 -0
  1655. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/model_test.py +187 -0
  1656. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/pyramid.py +129 -0
  1657. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/utils.py +167 -0
  1658. vismatch/third_party/imatch-toolbox/third_party/d2net/megadepth_utils/preprocess_scene.py +242 -0
  1659. vismatch/third_party/imatch-toolbox/third_party/d2net/megadepth_utils/undistort_reconstructions.py +69 -0
  1660. vismatch/third_party/imatch-toolbox/third_party/d2net/train.py +279 -0
  1661. vismatch/third_party/imatch-toolbox/third_party/patch2pix/data_pairs/precompute_immatch_val_ovs.py +20 -0
  1662. vismatch/third_party/imatch-toolbox/third_party/patch2pix/environment.yml +21 -0
  1663. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/modules.py +167 -0
  1664. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/ncn/conv4d.py +91 -0
  1665. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/ncn/extract_ncmatches.py +158 -0
  1666. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/ncn/model.py +333 -0
  1667. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/patch2pix.py +403 -0
  1668. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/resnet.py +191 -0
  1669. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/utils.py +111 -0
  1670. vismatch/third_party/imatch-toolbox/third_party/patch2pix/train_patch2pix.py +374 -0
  1671. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/colmap/data_loading.py +169 -0
  1672. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/colmap/read_database.py +175 -0
  1673. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/colmap/read_write_model.py +483 -0
  1674. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/common/plotting.py +393 -0
  1675. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/common/setup_helper.py +59 -0
  1676. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/common/visdom_helper.py +95 -0
  1677. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/datasets/__init__.py +1 -0
  1678. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/datasets/data_parsing.py +145 -0
  1679. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/datasets/dataset_megadepth.py +141 -0
  1680. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/datasets/preprocess.py +184 -0
  1681. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/eval/geometry.py +90 -0
  1682. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/eval/measure.py +161 -0
  1683. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/eval/model_helper.py +129 -0
  1684. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/train/eval_epoch_immatch.py +99 -0
  1685. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/train/helper.py +196 -0
  1686. vismatch/third_party/imatch-toolbox/third_party/r2d2/datasets/__init__.py +33 -0
  1687. vismatch/third_party/imatch-toolbox/third_party/r2d2/datasets/aachen.py +146 -0
  1688. vismatch/third_party/imatch-toolbox/third_party/r2d2/datasets/dataset.py +77 -0
  1689. vismatch/third_party/imatch-toolbox/third_party/r2d2/datasets/imgfolder.py +23 -0
  1690. vismatch/third_party/imatch-toolbox/third_party/r2d2/datasets/pair_dataset.py +287 -0
  1691. vismatch/third_party/imatch-toolbox/third_party/r2d2/datasets/web_images.py +64 -0
  1692. vismatch/third_party/imatch-toolbox/third_party/r2d2/extract.py +183 -0
  1693. vismatch/third_party/imatch-toolbox/third_party/r2d2/extract_kapture.py +194 -0
  1694. vismatch/third_party/imatch-toolbox/third_party/r2d2/nets/ap_loss.py +67 -0
  1695. vismatch/third_party/imatch-toolbox/third_party/r2d2/nets/losses.py +56 -0
  1696. vismatch/third_party/imatch-toolbox/third_party/r2d2/nets/patchnet.py +134 -0
  1697. vismatch/third_party/imatch-toolbox/third_party/r2d2/nets/reliability_loss.py +59 -0
  1698. vismatch/third_party/imatch-toolbox/third_party/r2d2/nets/repeatability_loss.py +66 -0
  1699. vismatch/third_party/imatch-toolbox/third_party/r2d2/nets/sampler.py +390 -0
  1700. vismatch/third_party/imatch-toolbox/third_party/r2d2/tools/common.py +41 -0
  1701. vismatch/third_party/imatch-toolbox/third_party/r2d2/tools/dataloader.py +367 -0
  1702. vismatch/third_party/imatch-toolbox/third_party/r2d2/tools/trainer.py +76 -0
  1703. vismatch/third_party/imatch-toolbox/third_party/r2d2/tools/transforms.py +513 -0
  1704. vismatch/third_party/imatch-toolbox/third_party/r2d2/tools/transforms_tools.py +230 -0
  1705. vismatch/third_party/imatch-toolbox/third_party/r2d2/tools/viz.py +191 -0
  1706. vismatch/third_party/imatch-toolbox/third_party/r2d2/train.py +138 -0
  1707. vismatch/third_party/imatch-toolbox/third_party/r2d2/viz_heatmaps.py +122 -0
  1708. vismatch/third_party/imatch-toolbox/third_party/superglue/demo_superglue.py +259 -0
  1709. vismatch/third_party/imatch-toolbox/third_party/superglue/match_pairs.py +425 -0
  1710. vismatch/third_party/imatch-toolbox/third_party/superglue/models/__init__.py +0 -0
  1711. vismatch/third_party/imatch-toolbox/third_party/superglue/models/matching.py +84 -0
  1712. vismatch/third_party/imatch-toolbox/third_party/superglue/models/superglue.py +283 -0
  1713. vismatch/third_party/imatch-toolbox/third_party/superglue/models/superpoint.py +202 -0
  1714. vismatch/third_party/imatch-toolbox/third_party/superglue/models/utils.py +555 -0
  1715. vismatch/third_party/keypt2subpx/dataprocess/aliked.py +163 -0
  1716. vismatch/third_party/keypt2subpx/dataprocess/dedode.py +215 -0
  1717. vismatch/third_party/keypt2subpx/dataprocess/splg.py +162 -0
  1718. vismatch/third_party/keypt2subpx/dataprocess/spnn.py +157 -0
  1719. vismatch/third_party/keypt2subpx/dataprocess/superpoint_densescore.py +357 -0
  1720. vismatch/third_party/keypt2subpx/dataprocess/xfeat.py +187 -0
  1721. vismatch/third_party/keypt2subpx/dataset.py +145 -0
  1722. vismatch/third_party/keypt2subpx/hubconf.py +38 -0
  1723. vismatch/third_party/keypt2subpx/logger.py +127 -0
  1724. vismatch/third_party/keypt2subpx/model.py +183 -0
  1725. vismatch/third_party/keypt2subpx/settings.py +108 -0
  1726. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/__init__.py +17 -0
  1727. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/__init__.py +25 -0
  1728. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/augmentations.py +244 -0
  1729. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/base_dataset.py +206 -0
  1730. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/eth3d.py +254 -0
  1731. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/homographies.py +311 -0
  1732. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/hpatches.py +145 -0
  1733. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/image_folder.py +59 -0
  1734. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/image_pairs.py +100 -0
  1735. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/megadepth.py +510 -0
  1736. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/utils.py +131 -0
  1737. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/__init__.py +20 -0
  1738. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/eth3d.py +202 -0
  1739. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/eval_pipeline.py +109 -0
  1740. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/hpatches.py +203 -0
  1741. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/inspect.py +61 -0
  1742. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/io.py +109 -0
  1743. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/megadepth1500.py +189 -0
  1744. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/utils.py +272 -0
  1745. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/__init__.py +0 -0
  1746. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/depth.py +88 -0
  1747. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/epipolar.py +155 -0
  1748. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/gt_generation.py +558 -0
  1749. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/homography.py +342 -0
  1750. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/utils.py +167 -0
  1751. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/wrappers.py +425 -0
  1752. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/__init__.py +30 -0
  1753. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/backbones/__init__.py +0 -0
  1754. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/backbones/dinov2.py +30 -0
  1755. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/base_model.py +157 -0
  1756. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/cache_loader.py +139 -0
  1757. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/__init__.py +0 -0
  1758. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/aliked.py +786 -0
  1759. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/disk_kornia.py +108 -0
  1760. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/grid_extractor.py +60 -0
  1761. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/keynet_affnet_hardnet.py +74 -0
  1762. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/mixed.py +76 -0
  1763. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/sift.py +234 -0
  1764. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/sift_kornia.py +46 -0
  1765. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/superpoint_open.py +210 -0
  1766. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/lines/__init__.py +0 -0
  1767. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/lines/deeplsd.py +106 -0
  1768. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/lines/lsd.py +88 -0
  1769. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/lines/wireframe.py +312 -0
  1770. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/__init__.py +0 -0
  1771. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/adalam.py +0 -0
  1772. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/depth_matcher.py +82 -0
  1773. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/gluestick.py +776 -0
  1774. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/homography_matcher.py +66 -0
  1775. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/kornia_loftr.py +66 -0
  1776. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/lightglue.py +612 -0
  1777. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/lightglue_pretrained.py +36 -0
  1778. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/nearest_neighbor_matcher.py +97 -0
  1779. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/triplet_pipeline.py +99 -0
  1780. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/two_view_pipeline.py +114 -0
  1781. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/utils/__init__.py +0 -0
  1782. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/utils/losses.py +73 -0
  1783. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/utils/metrics.py +50 -0
  1784. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/utils/misc.py +70 -0
  1785. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/__init__.py +15 -0
  1786. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/base_estimator.py +33 -0
  1787. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/homography/__init__.py +0 -0
  1788. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/homography/homography_est.py +74 -0
  1789. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/homography/opencv.py +53 -0
  1790. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/homography/poselib.py +40 -0
  1791. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/relative_pose/__init__.py +0 -0
  1792. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/relative_pose/opencv.py +64 -0
  1793. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/relative_pose/poselib.py +44 -0
  1794. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/relative_pose/pycolmap.py +52 -0
  1795. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/scripts/__init__.py +0 -0
  1796. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/scripts/export_local_features.py +127 -0
  1797. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/scripts/export_megadepth.py +173 -0
  1798. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/settings.py +6 -0
  1799. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/train.py +691 -0
  1800. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/__init__.py +0 -0
  1801. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/benchmark.py +33 -0
  1802. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/experiments.py +134 -0
  1803. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/export_predictions.py +81 -0
  1804. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/image.py +130 -0
  1805. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/misc.py +44 -0
  1806. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/patches.py +50 -0
  1807. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/stdout_capturing.py +134 -0
  1808. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/tensor.py +48 -0
  1809. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/tools.py +269 -0
  1810. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/visualization/global_frame.py +289 -0
  1811. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/visualization/tools.py +465 -0
  1812. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/visualization/two_view_frame.py +158 -0
  1813. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/visualization/visualize_batch.py +57 -0
  1814. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/visualization/viz2d.py +486 -0
  1815. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory_nonfree/__init__.py +0 -0
  1816. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory_nonfree/superglue.py +342 -0
  1817. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory_nonfree/superpoint.py +356 -0
  1818. vismatch/third_party/keypt2subpx/submodules/glue_factory/tests/__init__.py +0 -0
  1819. vismatch/third_party/keypt2subpx/submodules/glue_factory/tests/test_eval_utils.py +88 -0
  1820. vismatch/third_party/keypt2subpx/submodules/glue_factory/tests/test_integration.py +132 -0
  1821. vismatch/third_party/keypt2subpx/summarize.py +44 -0
  1822. vismatch/third_party/keypt2subpx/test.py +225 -0
  1823. vismatch/third_party/keypt2subpx/train.py +180 -0
  1824. vismatch/third_party/keypt2subpx/utils.py +150 -0
  1825. vismatch/third_party/mast3r/demo.py +51 -0
  1826. vismatch/third_party/mast3r/demo_dust3r_ga.py +99 -0
  1827. vismatch/third_party/mast3r/demo_glomap.py +52 -0
  1828. vismatch/third_party/mast3r/dust3r/croco/datasets/__init__.py +0 -0
  1829. vismatch/third_party/mast3r/dust3r/croco/datasets/crops/extract_crops_from_images.py +159 -0
  1830. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/__init__.py +0 -0
  1831. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/generate_from_metadata.py +92 -0
  1832. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/generate_from_metadata_files.py +27 -0
  1833. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/generate_multiview_images.py +177 -0
  1834. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/multiview_habitat_sim_generator.py +390 -0
  1835. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/pack_metadata_files.py +69 -0
  1836. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/paths.py +129 -0
  1837. vismatch/third_party/mast3r/dust3r/croco/datasets/pairs_dataset.py +109 -0
  1838. vismatch/third_party/mast3r/dust3r/croco/datasets/transforms.py +95 -0
  1839. vismatch/third_party/mast3r/dust3r/croco/demo.py +55 -0
  1840. vismatch/third_party/mast3r/dust3r/croco/models/blocks.py +241 -0
  1841. vismatch/third_party/mast3r/dust3r/croco/models/criterion.py +37 -0
  1842. vismatch/third_party/mast3r/dust3r/croco/models/croco.py +249 -0
  1843. vismatch/third_party/mast3r/dust3r/croco/models/croco_downstream.py +122 -0
  1844. vismatch/third_party/mast3r/dust3r/croco/models/curope/__init__.py +4 -0
  1845. vismatch/third_party/mast3r/dust3r/croco/models/curope/curope2d.py +40 -0
  1846. vismatch/third_party/mast3r/dust3r/croco/models/curope/setup.py +34 -0
  1847. vismatch/third_party/mast3r/dust3r/croco/models/dpt_block.py +450 -0
  1848. vismatch/third_party/mast3r/dust3r/croco/models/head_downstream.py +58 -0
  1849. vismatch/third_party/mast3r/dust3r/croco/models/masking.py +25 -0
  1850. vismatch/third_party/mast3r/dust3r/croco/models/pos_embed.py +157 -0
  1851. vismatch/third_party/mast3r/dust3r/croco/pretrain.py +254 -0
  1852. vismatch/third_party/mast3r/dust3r/croco/stereoflow/augmentor.py +290 -0
  1853. vismatch/third_party/mast3r/dust3r/croco/stereoflow/criterion.py +251 -0
  1854. vismatch/third_party/mast3r/dust3r/croco/stereoflow/datasets_flow.py +630 -0
  1855. vismatch/third_party/mast3r/dust3r/croco/stereoflow/datasets_stereo.py +674 -0
  1856. vismatch/third_party/mast3r/dust3r/croco/stereoflow/engine.py +280 -0
  1857. vismatch/third_party/mast3r/dust3r/croco/stereoflow/test.py +216 -0
  1858. vismatch/third_party/mast3r/dust3r/croco/stereoflow/train.py +253 -0
  1859. vismatch/third_party/mast3r/dust3r/croco/utils/misc.py +463 -0
  1860. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/find_scenes.py +78 -0
  1861. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/habitat_renderer/__init__.py +2 -0
  1862. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/habitat_renderer/habitat_sim_envmaps_renderer.py +170 -0
  1863. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/habitat_renderer/multiview_crop_generator.py +93 -0
  1864. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/habitat_renderer/projections.py +151 -0
  1865. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/habitat_renderer/projections_conversions.py +45 -0
  1866. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/preprocess_habitat.py +121 -0
  1867. vismatch/third_party/mast3r/dust3r/datasets_preprocess/path_to_root.py +13 -0
  1868. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_arkitscenes.py +355 -0
  1869. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_blendedMVS.py +149 -0
  1870. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_co3d.py +295 -0
  1871. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_megadepth.py +198 -0
  1872. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_scannetpp.py +390 -0
  1873. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_staticthings3d.py +130 -0
  1874. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_waymo.py +257 -0
  1875. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_wildrgbd.py +209 -0
  1876. vismatch/third_party/mast3r/dust3r/demo.py +45 -0
  1877. vismatch/third_party/mast3r/dust3r/dust3r/__init__.py +2 -0
  1878. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/__init__.py +33 -0
  1879. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/base_opt.py +405 -0
  1880. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/commons.py +90 -0
  1881. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/init_im_poses.py +316 -0
  1882. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/modular_optimizer.py +145 -0
  1883. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/optimizer.py +248 -0
  1884. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/pair_viewer.py +127 -0
  1885. vismatch/third_party/mast3r/dust3r/dust3r/datasets/__init__.py +50 -0
  1886. vismatch/third_party/mast3r/dust3r/dust3r/datasets/arkitscenes.py +102 -0
  1887. vismatch/third_party/mast3r/dust3r/dust3r/datasets/base/__init__.py +2 -0
  1888. vismatch/third_party/mast3r/dust3r/dust3r/datasets/base/base_stereo_view_dataset.py +220 -0
  1889. vismatch/third_party/mast3r/dust3r/dust3r/datasets/base/batched_sampler.py +74 -0
  1890. vismatch/third_party/mast3r/dust3r/dust3r/datasets/base/easy_dataset.py +157 -0
  1891. vismatch/third_party/mast3r/dust3r/dust3r/datasets/blendedmvs.py +104 -0
  1892. vismatch/third_party/mast3r/dust3r/dust3r/datasets/co3d.py +165 -0
  1893. vismatch/third_party/mast3r/dust3r/dust3r/datasets/habitat.py +107 -0
  1894. vismatch/third_party/mast3r/dust3r/dust3r/datasets/megadepth.py +123 -0
  1895. vismatch/third_party/mast3r/dust3r/dust3r/datasets/scannetpp.py +96 -0
  1896. vismatch/third_party/mast3r/dust3r/dust3r/datasets/staticthings3d.py +96 -0
  1897. vismatch/third_party/mast3r/dust3r/dust3r/datasets/utils/__init__.py +2 -0
  1898. vismatch/third_party/mast3r/dust3r/dust3r/datasets/utils/cropping.py +124 -0
  1899. vismatch/third_party/mast3r/dust3r/dust3r/datasets/utils/transforms.py +11 -0
  1900. vismatch/third_party/mast3r/dust3r/dust3r/datasets/waymo.py +93 -0
  1901. vismatch/third_party/mast3r/dust3r/dust3r/datasets/wildrgbd.py +67 -0
  1902. vismatch/third_party/mast3r/dust3r/dust3r/demo.py +287 -0
  1903. vismatch/third_party/mast3r/dust3r/dust3r/heads/__init__.py +19 -0
  1904. vismatch/third_party/mast3r/dust3r/dust3r/heads/dpt_head.py +115 -0
  1905. vismatch/third_party/mast3r/dust3r/dust3r/heads/linear_head.py +41 -0
  1906. vismatch/third_party/mast3r/dust3r/dust3r/heads/postprocess.py +58 -0
  1907. vismatch/third_party/mast3r/dust3r/dust3r/image_pairs.py +104 -0
  1908. vismatch/third_party/mast3r/dust3r/dust3r/inference.py +150 -0
  1909. vismatch/third_party/mast3r/dust3r/dust3r/losses.py +299 -0
  1910. vismatch/third_party/mast3r/dust3r/dust3r/model.py +211 -0
  1911. vismatch/third_party/mast3r/dust3r/dust3r/optim_factory.py +14 -0
  1912. vismatch/third_party/mast3r/dust3r/dust3r/patch_embed.py +70 -0
  1913. vismatch/third_party/mast3r/dust3r/dust3r/post_process.py +60 -0
  1914. vismatch/third_party/mast3r/dust3r/dust3r/training.py +377 -0
  1915. vismatch/third_party/mast3r/dust3r/dust3r/utils/__init__.py +2 -0
  1916. vismatch/third_party/mast3r/dust3r/dust3r/utils/device.py +76 -0
  1917. vismatch/third_party/mast3r/dust3r/dust3r/utils/geometry.py +366 -0
  1918. vismatch/third_party/mast3r/dust3r/dust3r/utils/image.py +128 -0
  1919. vismatch/third_party/mast3r/dust3r/dust3r/utils/misc.py +121 -0
  1920. vismatch/third_party/mast3r/dust3r/dust3r/utils/parallel.py +79 -0
  1921. vismatch/third_party/mast3r/dust3r/dust3r/utils/path_to_croco.py +19 -0
  1922. vismatch/third_party/mast3r/dust3r/dust3r/viz.py +381 -0
  1923. vismatch/third_party/mast3r/dust3r/dust3r_visloc/__init__.py +2 -0
  1924. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/__init__.py +6 -0
  1925. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/aachen_day_night.py +24 -0
  1926. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/base_colmap.py +282 -0
  1927. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/base_dataset.py +19 -0
  1928. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/cambridge_landmarks.py +19 -0
  1929. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/inloc.py +167 -0
  1930. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/sevenscenes.py +123 -0
  1931. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/utils.py +118 -0
  1932. vismatch/third_party/mast3r/dust3r/dust3r_visloc/evaluation.py +65 -0
  1933. vismatch/third_party/mast3r/dust3r/dust3r_visloc/localization.py +140 -0
  1934. vismatch/third_party/mast3r/dust3r/train.py +13 -0
  1935. vismatch/third_party/mast3r/dust3r/visloc.py +193 -0
  1936. vismatch/third_party/mast3r/kapture_mast3r_mapping.py +127 -0
  1937. vismatch/third_party/mast3r/make_pairs.py +105 -0
  1938. vismatch/third_party/mast3r/mast3r/__init__.py +2 -0
  1939. vismatch/third_party/mast3r/mast3r/catmlp_dpt_head.py +239 -0
  1940. vismatch/third_party/mast3r/mast3r/cloud_opt/__init__.py +2 -0
  1941. vismatch/third_party/mast3r/mast3r/cloud_opt/sparse_ga.py +1078 -0
  1942. vismatch/third_party/mast3r/mast3r/cloud_opt/triangulation.py +80 -0
  1943. vismatch/third_party/mast3r/mast3r/cloud_opt/tsdf_optimizer.py +273 -0
  1944. vismatch/third_party/mast3r/mast3r/cloud_opt/utils/__init__.py +2 -0
  1945. vismatch/third_party/mast3r/mast3r/cloud_opt/utils/losses.py +32 -0
  1946. vismatch/third_party/mast3r/mast3r/cloud_opt/utils/schedules.py +17 -0
  1947. vismatch/third_party/mast3r/mast3r/colmap/__init__.py +2 -0
  1948. vismatch/third_party/mast3r/mast3r/colmap/database.py +383 -0
  1949. vismatch/third_party/mast3r/mast3r/colmap/mapping.py +196 -0
  1950. vismatch/third_party/mast3r/mast3r/datasets/__init__.py +62 -0
  1951. vismatch/third_party/mast3r/mast3r/datasets/base/__init__.py +2 -0
  1952. vismatch/third_party/mast3r/mast3r/datasets/base/mast3r_base_stereo_view_dataset.py +355 -0
  1953. vismatch/third_party/mast3r/mast3r/datasets/utils/__init__.py +2 -0
  1954. vismatch/third_party/mast3r/mast3r/datasets/utils/cropping.py +219 -0
  1955. vismatch/third_party/mast3r/mast3r/demo.py +381 -0
  1956. vismatch/third_party/mast3r/mast3r/demo_glomap.py +343 -0
  1957. vismatch/third_party/mast3r/mast3r/fast_nn.py +223 -0
  1958. vismatch/third_party/mast3r/mast3r/image_pairs.py +115 -0
  1959. vismatch/third_party/mast3r/mast3r/losses.py +508 -0
  1960. vismatch/third_party/mast3r/mast3r/model.py +213 -0
  1961. vismatch/third_party/mast3r/mast3r/retrieval/graph.py +77 -0
  1962. vismatch/third_party/mast3r/mast3r/retrieval/model.py +271 -0
  1963. vismatch/third_party/mast3r/mast3r/retrieval/processor.py +129 -0
  1964. vismatch/third_party/mast3r/mast3r/utils/__init__.py +2 -0
  1965. vismatch/third_party/mast3r/mast3r/utils/coarse_to_fine.py +214 -0
  1966. vismatch/third_party/mast3r/mast3r/utils/collate.py +62 -0
  1967. vismatch/third_party/mast3r/mast3r/utils/misc.py +17 -0
  1968. vismatch/third_party/mast3r/mast3r/utils/path_to_dust3r.py +19 -0
  1969. vismatch/third_party/mast3r/train.py +48 -0
  1970. vismatch/third_party/mast3r/visloc.py +538 -0
  1971. vismatch/third_party/omniglue/__init__.py +19 -0
  1972. vismatch/third_party/omniglue/demo.py +89 -0
  1973. vismatch/third_party/omniglue/src/omniglue/__init__.py +17 -0
  1974. vismatch/third_party/omniglue/src/omniglue/dino_extract.py +215 -0
  1975. vismatch/third_party/omniglue/src/omniglue/omniglue_extract.py +159 -0
  1976. vismatch/third_party/omniglue/src/omniglue/superpoint_extract.py +214 -0
  1977. vismatch/third_party/omniglue/src/omniglue/utils.py +274 -0
  1978. vismatch/third_party/omniglue/third_party/dinov2/__init__.py +0 -0
  1979. vismatch/third_party/omniglue/third_party/dinov2/dino.py +411 -0
  1980. vismatch/third_party/omniglue/third_party/dinov2/dino_utils.py +341 -0
  1981. vismatch/third_party/rdd/RDD/RDD.py +262 -0
  1982. vismatch/third_party/rdd/RDD/RDD_helper.py +181 -0
  1983. vismatch/third_party/rdd/RDD/dataset/__init__.py +0 -0
  1984. vismatch/third_party/rdd/RDD/dataset/megadepth/__init__.py +2 -0
  1985. vismatch/third_party/rdd/RDD/dataset/megadepth/megadepth.py +313 -0
  1986. vismatch/third_party/rdd/RDD/dataset/megadepth/megadepth_warper.py +75 -0
  1987. vismatch/third_party/rdd/RDD/dataset/megadepth/utils.py +848 -0
  1988. vismatch/third_party/rdd/RDD/matchers/__init__.py +3 -0
  1989. vismatch/third_party/rdd/RDD/matchers/dense_matcher.py +137 -0
  1990. vismatch/third_party/rdd/RDD/matchers/dual_softmax_matcher.py +31 -0
  1991. vismatch/third_party/rdd/RDD/matchers/lightglue.py +667 -0
  1992. vismatch/third_party/rdd/RDD/models/backbone.py +147 -0
  1993. vismatch/third_party/rdd/RDD/models/deformable_transformer.py +270 -0
  1994. vismatch/third_party/rdd/RDD/models/descriptor.py +116 -0
  1995. vismatch/third_party/rdd/RDD/models/detector.py +141 -0
  1996. vismatch/third_party/rdd/RDD/models/interpolator.py +33 -0
  1997. vismatch/third_party/rdd/RDD/models/ops/functions/__init__.py +13 -0
  1998. vismatch/third_party/rdd/RDD/models/ops/functions/ms_deform_attn_func.py +74 -0
  1999. vismatch/third_party/rdd/RDD/models/ops/modules/__init__.py +12 -0
  2000. vismatch/third_party/rdd/RDD/models/ops/modules/ms_deform_attn.py +125 -0
  2001. vismatch/third_party/rdd/RDD/models/ops/setup.py +78 -0
  2002. vismatch/third_party/rdd/RDD/models/ops/test.py +92 -0
  2003. vismatch/third_party/rdd/RDD/models/position_encoding.py +48 -0
  2004. vismatch/third_party/rdd/RDD/models/soft_detect.py +176 -0
  2005. vismatch/third_party/rdd/RDD/utils/__init__.py +1 -0
  2006. vismatch/third_party/rdd/RDD/utils/misc.py +531 -0
  2007. vismatch/third_party/rdd/benchmarks/air_ground.py +250 -0
  2008. vismatch/third_party/rdd/benchmarks/mega_1500.py +259 -0
  2009. vismatch/third_party/rdd/benchmarks/mega_view.py +252 -0
  2010. vismatch/third_party/rdd/benchmarks/scannet_1500.py +251 -0
  2011. vismatch/third_party/rdd/benchmarks/utils.py +112 -0
  2012. vismatch/third_party/rdd/configs/default.yaml +19 -0
  2013. vismatch/third_party/rdd/sfm/extract_rdd.py +145 -0
  2014. vismatch/third_party/rdd/sfm/match_rdd.py +259 -0
  2015. vismatch/third_party/rdd/third_party/LightGlue/.github/workflows/code-quality.yml +24 -0
  2016. vismatch/third_party/rdd/third_party/LightGlue/benchmark.py +255 -0
  2017. vismatch/third_party/rdd/third_party/LightGlue/lightglue/__init__.py +7 -0
  2018. vismatch/third_party/rdd/third_party/LightGlue/lightglue/aliked.py +760 -0
  2019. vismatch/third_party/rdd/third_party/LightGlue/lightglue/disk.py +55 -0
  2020. vismatch/third_party/rdd/third_party/LightGlue/lightglue/dog_hardnet.py +41 -0
  2021. vismatch/third_party/rdd/third_party/LightGlue/lightglue/lightglue.py +662 -0
  2022. vismatch/third_party/rdd/third_party/LightGlue/lightglue/sift.py +216 -0
  2023. vismatch/third_party/rdd/third_party/LightGlue/lightglue/superpoint.py +227 -0
  2024. vismatch/third_party/rdd/third_party/LightGlue/lightglue/utils.py +165 -0
  2025. vismatch/third_party/rdd/third_party/LightGlue/lightglue/viz2d.py +203 -0
  2026. vismatch/third_party/rdd/third_party/__init__.py +1 -0
  2027. vismatch/third_party/rdd/third_party/aliked_wrapper.py +17 -0
  2028. vismatch/third_party/rdd/training/losses/descriptor_loss.py +73 -0
  2029. vismatch/third_party/rdd/training/losses/detector_loss.py +499 -0
  2030. vismatch/third_party/rdd/training/train.py +473 -0
  2031. vismatch/third_party/rdd/training/utils.py +246 -0
  2032. vismatch/utils.py +390 -0
  2033. vismatch/viz.py +222 -0
  2034. vismatch-1.1.1.dist-info/METADATA +265 -0
  2035. vismatch-1.1.1.dist-info/RECORD +2042 -0
  2036. vismatch-1.1.1.dist-info/WHEEL +5 -0
  2037. vismatch-1.1.1.dist-info/entry_points.txt +4 -0
  2038. vismatch-1.1.1.dist-info/licenses/LICENSE +28 -0
  2039. vismatch-1.1.1.dist-info/top_level.txt +4 -0
  2040. vismatch_extract.py +103 -0
  2041. vismatch_match.py +114 -0
  2042. vismatch_test.py +186 -0
@@ -0,0 +1,973 @@
1
+ """
2
+ UniCeption Alternating-Attention Transformer for Information Sharing
3
+ """
4
+
5
+ from functools import partial
6
+ from typing import Callable, List, Optional, Tuple, Type, Union
7
+
8
+ import numpy as np
9
+ import torch
10
+ import torch.nn as nn
11
+
12
+ from uniception.models.info_sharing.base import (
13
+ MultiViewTransformerInput,
14
+ MultiViewTransformerOutput,
15
+ UniCeptionInfoSharingBase,
16
+ )
17
+ from uniception.models.utils.intermediate_feature_return import IntermediateFeatureReturner, feature_take_indices
18
+ from uniception.models.utils.positional_encoding import PositionGetter
19
+ from uniception.models.utils.transformer_blocks import Mlp, SelfAttentionBlock
20
+
21
+
22
+ class MultiViewAlternatingAttentionTransformer(UniCeptionInfoSharingBase):
23
+ "UniCeption Multi-View Alternating-Attention Transformer for information sharing across image features from different views."
24
+
25
def __init__(
    self,
    name: str,
    input_embed_dim: int,
    use_pe_for_non_reference_views: bool = False,
    max_num_views_for_pe: int = 1000,
    use_rand_idx_pe_for_non_reference_views: bool = True,
    size: Optional[str] = None,
    depth: int = 12,
    dim: int = 768,
    num_heads: int = 12,
    mlp_ratio: float = 4.0,
    qkv_bias: bool = True,
    qk_norm: bool = False,
    proj_drop: float = 0.0,
    attn_drop: float = 0.0,
    init_values: Optional[float] = None,
    drop_path: float = 0.0,
    act_layer: Type[nn.Module] = nn.GELU,
    norm_layer: Union[Type[nn.Module], Callable[..., nn.Module]] = partial(nn.LayerNorm, eps=1e-6),
    mlp_layer: Type[nn.Module] = Mlp,
    custom_positional_encoding: Optional[Callable] = None,
    use_scalable_softmax: bool = False,
    use_entropy_scaling: bool = False,
    base_token_count_for_entropy_scaling: int = 444,
    entropy_scaling_growth_factor: float = 1.4,
    pretrained_checkpoint_path: Optional[str] = None,
    gradient_checkpointing: bool = False,
    *args,
    **kwargs,
):
    """
    Initialize the Multi-View Alternating-Attention Transformer for information sharing across image features from different views.
    Alternates between global and frame-level attention.

    Args:
        name (str): Name of the module, forwarded to the base class.
        input_embed_dim (int): Dimension of input embeddings.
        use_pe_for_non_reference_views (bool): Whether to use view positional encoding for input non-reference views. (default: False)
        max_num_views_for_pe (int): Maximum number of views for positional encoding. (default: 1000)
        use_rand_idx_pe_for_non_reference_views (bool): Whether to use random index positional encoding for non-reference views. (default: True)
        size (str): String to indicate interpretable size of the transformer (for e.g., base, large, ...). (default: None)
        depth (int): Number of transformer layers. (default: 12, base size)
        dim (int): Dimension of the transformer. (default: 768, base size)
        num_heads (int): Number of attention heads. (default: 12, base size)
        mlp_ratio (float): Ratio of hidden to input dimension in MLP (default: 4.)
        qkv_bias (bool): Whether to include bias in qkv projection (default: True)
        qk_norm (bool): Whether to normalize q and k (default: False)
        proj_drop (float): Dropout rate for output (default: 0.)
        attn_drop (float): Dropout rate for attention weights (default: 0.)
        init_values (float): Initial value for LayerScale gamma (default: None)
        drop_path (float): Dropout rate for stochastic depth (default: 0.)
        act_layer (nn.Module): Activation layer (default: nn.GELU)
        norm_layer (nn.Module): Normalization layer (default: nn.LayerNorm with eps=1e-6)
        mlp_layer (nn.Module): MLP layer (default: Mlp)
        custom_positional_encoding (Callable): Custom positional encoding function (default: None)
        use_scalable_softmax (bool): Whether to use scalable softmax (default: False)
        use_entropy_scaling (bool): Whether to use entropy scaling (default: False)
        base_token_count_for_entropy_scaling (int): Base token count for entropy scaling (default: 444)
            Computed using (518, 168) as base resolution with 14 patch size
        entropy_scaling_growth_factor (float): Growth factor for entropy scaling (default: 1.4)
        pretrained_checkpoint_path (str, optional): Path to the pretrained checkpoint. (default: None)
        gradient_checkpointing (bool, optional): Whether to use gradient checkpointing for memory efficiency. (default: False)
        *args, **kwargs: Forwarded unchanged to the base class initializer.
    """
    # Initialize the base class
    super().__init__(name=name, size=size, *args, **kwargs)

    # Initialize the specific attributes of the transformer
    self.input_embed_dim = input_embed_dim
    self.use_pe_for_non_reference_views = use_pe_for_non_reference_views
    self.max_num_views_for_pe = max_num_views_for_pe
    self.use_rand_idx_pe_for_non_reference_views = use_rand_idx_pe_for_non_reference_views
    self.depth = depth
    self.dim = dim
    self.num_heads = num_heads
    self.mlp_ratio = mlp_ratio
    self.qkv_bias = qkv_bias
    self.qk_norm = qk_norm
    self.proj_drop = proj_drop
    self.attn_drop = attn_drop
    self.init_values = init_values
    self.drop_path = drop_path
    self.act_layer = act_layer
    self.norm_layer = norm_layer
    self.mlp_layer = mlp_layer
    self.custom_positional_encoding = custom_positional_encoding
    self.use_scalable_softmax = use_scalable_softmax
    self.use_entropy_scaling = use_entropy_scaling
    self.base_token_count_for_entropy_scaling = base_token_count_for_entropy_scaling
    self.entropy_scaling_growth_factor = entropy_scaling_growth_factor
    self.pretrained_checkpoint_path = pretrained_checkpoint_path
    self.gradient_checkpointing = gradient_checkpointing

    # Initialize the projection layer for input embeddings (only needed when the widths differ)
    if self.input_embed_dim != self.dim:
        self.proj_embed = nn.Linear(self.input_embed_dim, self.dim, bias=True)
    else:
        self.proj_embed = nn.Identity()

    # Initialize the self-attention blocks; forward() alternates their use between
    # global attention (even indices) and frame-level attention (odd indices)
    self.self_attention_blocks = nn.ModuleList(
        [
            SelfAttentionBlock(
                dim=self.dim,
                num_heads=self.num_heads,
                mlp_ratio=self.mlp_ratio,
                qkv_bias=self.qkv_bias,
                qk_norm=self.qk_norm,
                proj_drop=self.proj_drop,
                attn_drop=self.attn_drop,
                init_values=self.init_values,
                drop_path=self.drop_path,
                act_layer=self.act_layer,
                norm_layer=self.norm_layer,
                mlp_layer=self.mlp_layer,
                custom_positional_encoding=self.custom_positional_encoding,
                use_scalable_softmax=self.use_scalable_softmax,
                use_entropy_scaling=self.use_entropy_scaling,
                base_token_count_for_entropy_scaling=self.base_token_count_for_entropy_scaling,
                entropy_scaling_growth_factor=self.entropy_scaling_growth_factor,
            )
            for _ in range(self.depth)
        ]
    )

    # Initialize the final normalization layer
    self.norm = self.norm_layer(self.dim)

    # Initialize the position getter for patch positions if required
    if self.custom_positional_encoding is not None:
        self.position_getter = PositionGetter()

    # Initialize the view positional encoding table: one row per view index when non-reference
    # views are encoded too, otherwise only the single row used for the reference view
    num_view_pe_entries = self.max_num_views_for_pe if self.use_pe_for_non_reference_views else 1
    self.register_buffer(
        "view_pos_table",
        self._get_sinusoid_encoding_table(num_view_pe_entries, self.dim, 10000),
    )

    # Initialize random weights
    self.initialize_weights()

    # Apply gradient checkpointing if enabled
    if self.gradient_checkpointing:
        for i, block in enumerate(self.self_attention_blocks):
            self.self_attention_blocks[i] = self.wrap_module_with_gradient_checkpointing(block)

    # Load pretrained weights if provided
    if self.pretrained_checkpoint_path is not None:
        print(
            f"Loading pretrained multi-view Alternating-Attention transformer weights from {self.pretrained_checkpoint_path} ..."
        )
        # SECURITY NOTE: weights_only=False unpickles arbitrary Python objects, so only load
        # checkpoints from trusted sources.
        # map_location="cpu" lets checkpoints saved on an accelerator load on hosts without that
        # device; load_state_dict then copies the values into the existing parameters.
        ckpt = torch.load(self.pretrained_checkpoint_path, map_location="cpu", weights_only=False)
        print(self.load_state_dict(ckpt["model"]))
184
+
185
def _get_sinusoid_encoding_table(self, n_position, d_hid, base):
    "Build the (n_position, d_hid) sinusoid position encoding table as a float tensor."
    # Channels 2k and 2k + 1 share the divisor base ** (2k / d_hid); compute each one once
    channel_divisors = [np.power(base, 2 * (channel // 2) / d_hid) for channel in range(d_hid)]

    # One row of raw angles per position index
    angle_rows = []
    for position in range(n_position):
        angle_rows.append([position / divisor for divisor in channel_divisors])
    encoding = np.array(angle_rows)

    # Even channels hold the sine of the angle, odd channels the cosine
    even_channels = slice(0, None, 2)
    odd_channels = slice(1, None, 2)
    encoding[:, even_channels] = np.sin(encoding[:, even_channels])
    encoding[:, odd_channels] = np.cos(encoding[:, odd_channels])

    return torch.FloatTensor(encoding)
196
+
197
def initialize_weights(self):
    "Run the per-module initializer over the transformer via `apply`."
    # `_init_weights` handles the linear and layer norm modules and ignores everything else
    per_module_init = self._init_weights
    self.apply(per_module_init)
201
+
202
def _init_weights(self, m):
    """
    Initialize the weights of a single module; used as the callback passed to `apply`.

    Args:
        m (nn.Module): Module to initialize. nn.Linear gets Xavier-uniform weights and a zero bias,
            nn.LayerNorm gets unit weight and zero bias. Any other module is left untouched.
    """
    if isinstance(m, nn.Linear):
        # We use xavier_uniform following official JAX ViT
        torch.nn.init.xavier_uniform_(m.weight)
        if m.bias is not None:
            nn.init.constant_(m.bias, 0)
    elif isinstance(m, nn.LayerNorm):
        # weight and/or bias are None when the layer was built with elementwise_affine=False
        # (or bias=False), so only reset the parameters that actually exist
        if m.bias is not None:
            nn.init.constant_(m.bias, 0)
        if m.weight is not None:
            nn.init.constant_(m.weight, 1.0)
212
+
213
def forward(
    self,
    model_input: MultiViewTransformerInput,
) -> MultiViewTransformerOutput:
    """
    Forward interface for the Multi-View Alternating-Attention Transformer.

    Blocks with an even index attend globally over the tokens of all views (plus any additional
    tokens). Blocks with an odd index attend within each view separately; additional tokens are
    set aside for those blocks and re-attached unchanged afterwards.

    Args:
        model_input (MultiViewTransformerInput): Input to the model.
            Expects the features to be a list of size (batch, input_embed_dim, height, width),
            where each entry corresponds to a different view.
            Optionally, the input can also include additional_input_tokens (e.g., class token, registers, pose tokens, scale token)
            which are appended to the token set from the multi-view features. The tokens are of size (batch, input_embed_dim, num_of_additional_tokens).

    Returns:
        MultiViewTransformerOutput: Output of the model post information sharing.
            `features` is a list with one (batch, dim, height, width) tensor per view;
            `additional_token_features` of size (batch, dim, num_of_additional_tokens) is set only when
            additional input tokens were provided.

    Raises:
        NotImplementedError: If additional input tokens are combined with a custom positional encoding.
            No patch positions are defined for the additional tokens in that configuration.
    """
    view_feature_list = model_input.features
    additional_tokens = model_input.additional_input_tokens
    has_additional_tokens = additional_tokens is not None
    uses_custom_pe = self.custom_positional_encoding is not None

    # Check that the number of views matches the input and the features are of expected shape
    if self.use_pe_for_non_reference_views:
        assert (
            len(view_feature_list) <= self.max_num_views_for_pe
        ), f"Expected at most {self.max_num_views_for_pe} views, got {len(view_feature_list)}"
    assert all(
        view_features.shape[1] == self.input_embed_dim for view_features in view_feature_list
    ), f"All views must have input dimension {self.input_embed_dim}"
    assert all(
        view_features.ndim == 4 for view_features in view_feature_list
    ), "All views must have 4 dimensions (N, C, H, W)"

    # Token bookkeeping for the current input
    num_of_views = len(view_feature_list)
    batch_size, _, height, width = view_feature_list[0].shape
    num_of_tokens_per_view = height * width
    num_of_view_tokens = num_of_views * num_of_tokens_per_view

    # Stack the multi-view features (N, C, H, W) to (N, V, C, H, W) (assumes all V views have same shape)
    multi_view_features = torch.stack(view_feature_list, dim=1)

    # Resize the multi-view features from NVCHW to NLC, where L = V * H * W
    multi_view_features = multi_view_features.permute(0, 1, 3, 4, 2)  # (N, V, H, W, C)
    multi_view_features = multi_view_features.reshape(
        batch_size, num_of_view_tokens, self.input_embed_dim
    ).contiguous()

    # Process additional input tokens if provided
    num_of_additional_tokens = 0
    if has_additional_tokens:
        assert additional_tokens.ndim == 3, "Additional tokens must have 3 dimensions (N, C, T)"
        assert (
            additional_tokens.shape[1] == self.input_embed_dim
        ), f"Additional tokens must have input dimension {self.input_embed_dim}"
        assert additional_tokens.shape[0] == batch_size, "Batch size mismatch for additional tokens"

        if uses_custom_pe:
            # The patch positions form a tensor covering only the view tokens; previously this
            # combination failed later with an opaque TypeError (tensor + list of None).
            raise NotImplementedError(
                "additional_input_tokens are not supported together with custom_positional_encoding: "
                "no patch positions are defined for the additional tokens"
            )

        # Layout is (N, C, T), so the token count is the last dimension
        num_of_additional_tokens = additional_tokens.shape[2]

        # Reshape to channel-last format for transformer processing
        additional_tokens = additional_tokens.permute(0, 2, 1).contiguous()  # (N, C, T) -> (N, T, C)

        # Concatenate the additional tokens to the multi-view features
        multi_view_features = torch.cat([multi_view_features, additional_tokens], dim=1)

    # Project input features to the transformer dimension
    multi_view_features = self.proj_embed(multi_view_features)

    # Build the positions handed to the attention blocks once, in both layouts used by the loop below
    if uses_custom_pe:
        per_view_positions = self.position_getter(batch_size, height, width, multi_view_features.device)
        # The same patch positions are reused for every view
        global_positions = torch.cat([per_view_positions] * num_of_views, dim=1)  # (N, V * H * W, 2)
        # NOTE(review): the trailing size of 2 is carried over from the original reshape and
        # presumably is the (y, x) patch coordinate; confirm against PositionGetter
        frame_positions = global_positions.reshape(
            batch_size * num_of_views, num_of_tokens_per_view, 2
        ).contiguous()  # (N * V, H * W, 2)
    else:
        # Placeholder positions: one None per view plus one per additional token
        global_positions = [None] * num_of_views + [None] * num_of_additional_tokens
        frame_positions = global_positions

    # Add positional encoding for reference view (idx 0); broadcast over batch and tokens
    ref_view_pe = self.view_pos_table[0].reshape(1, 1, self.dim)
    ref_view_features = multi_view_features[:, :num_of_tokens_per_view, :] + ref_view_pe

    non_ref_view_features = multi_view_features[:, num_of_tokens_per_view:num_of_view_tokens, :]
    if self.use_pe_for_non_reference_views:
        # Add positional encoding for non-reference views (sequential indices starting from idx 1
        # or random indices which are uniformly sampled)
        if self.use_rand_idx_pe_for_non_reference_views:
            non_ref_view_pe_indices = torch.randint(low=1, high=self.max_num_views_for_pe, size=(num_of_views - 1,))
        else:
            non_ref_view_pe_indices = torch.arange(1, num_of_views)
        non_ref_view_pe = self.view_pos_table[non_ref_view_pe_indices].reshape(1, num_of_views - 1, self.dim)
        # Every token of a view shares that view's encoding; the batch dimension is broadcast
        non_ref_view_pe = non_ref_view_pe.repeat_interleave(num_of_tokens_per_view, dim=1)
        non_ref_view_features = non_ref_view_features + non_ref_view_pe

    # Concatenate the reference and non-reference view features
    # Additional tokens get no view-based positional encoding
    token_groups = [ref_view_features, non_ref_view_features]
    if has_additional_tokens:
        token_groups.append(multi_view_features[:, num_of_view_tokens:, :])
    multi_view_features = torch.cat(token_groups, dim=1)

    # Loop over the depth of the transformer
    for depth_idx in range(self.depth):
        attention_block = self.self_attention_blocks[depth_idx]

        if depth_idx % 2 == 0:
            # Global attention across all views (and additional tokens)
            multi_view_features = attention_block(multi_view_features, global_positions)
            continue

        # Frame-level attention: set the additional tokens aside, they do not belong to any view
        additional_features = None
        if has_additional_tokens:
            additional_features = multi_view_features[:, num_of_view_tokens:, :]
            multi_view_features = multi_view_features[:, :num_of_view_tokens, :]

        # Reshape the multi-view features from (N, V * H * W, C) to (N * V, H * W, C)
        multi_view_features = multi_view_features.reshape(
            batch_size * num_of_views, num_of_tokens_per_view, self.dim
        ).contiguous()

        # Frame-level attention within each view
        multi_view_features = attention_block(multi_view_features, frame_positions)

        # Reshape the multi-view features from (N * V, H * W, C) back to (N, V * H * W, C)
        multi_view_features = multi_view_features.reshape(
            batch_size, num_of_view_tokens, self.dim
        ).contiguous()

        # Reattach additional tokens if they exist
        if additional_features is not None:
            multi_view_features = torch.cat([multi_view_features, additional_features], dim=1)

    # Normalize the output features
    output_multi_view_features = self.norm(multi_view_features)

    # Extract only the view features (excluding additional tokens)
    view_features = output_multi_view_features[:, :num_of_view_tokens, :]

    # Reshape the output multi-view features (N, V * H * W, C) back to (N, V, C, H, W)
    view_features = view_features.reshape(batch_size, num_of_views, height, width, self.dim)  # (N, V, H, W, C)
    view_features = view_features.permute(0, 1, 4, 2, 3).contiguous()  # (N, V, C, H, W)

    # Split the output multi-view features into separate views
    view_features = [
        output_view_features.squeeze(dim=1) for output_view_features in view_features.split(1, dim=1)
    ]

    if not has_additional_tokens:
        return MultiViewTransformerOutput(features=view_features)

    # Extract and return additional token features in channel-first layout
    additional_token_features = output_multi_view_features[:, num_of_view_tokens:, :]
    additional_token_features = additional_token_features.permute(0, 2, 1).contiguous()  # (N, C, T)
    return MultiViewTransformerOutput(
        features=view_features, additional_token_features=additional_token_features
    )
401
+
402
+
403
class MultiViewAlternatingAttentionTransformerIFR(
    MultiViewAlternatingAttentionTransformer, IntermediateFeatureReturner
):
    """
    Multi-View Alternating-Attention Transformer that also returns intermediate layer features.

    Combines the alternating-attention transformer with the IntermediateFeatureReturner
    configuration (indices, norm_intermediate, intermediates_only).
    """

    def __init__(
        self,
        name: str,
        input_embed_dim: int,
        use_pe_for_non_reference_views: bool = False,
        max_num_views_for_pe: int = 1000,
        use_rand_idx_pe_for_non_reference_views: bool = True,
        size: Optional[str] = None,
        depth: int = 12,
        dim: int = 768,
        num_heads: int = 12,
        mlp_ratio: float = 4.0,
        qkv_bias: bool = True,
        qk_norm: bool = False,
        proj_drop: float = 0.0,
        attn_drop: float = 0.0,
        init_values: Optional[float] = None,
        drop_path: float = 0.0,
        act_layer: nn.Module = nn.GELU,
        norm_layer: nn.Module = partial(nn.LayerNorm, eps=1e-6),
        mlp_layer: nn.Module = Mlp,
        custom_positional_encoding: Callable = None,
        use_scalable_softmax: bool = False,
        use_entropy_scaling: bool = False,
        base_token_count_for_entropy_scaling: int = 444,
        entropy_scaling_growth_factor: float = 1.4,
        pretrained_checkpoint_path: str = None,
        indices: Optional[Union[int, List[int]]] = None,
        norm_intermediate: bool = True,
        intermediates_only: bool = False,
        gradient_checkpointing: bool = False,
        *args,
        **kwargs,
    ):
        """
        Set up the alternating-attention transformer together with the intermediate-feature options.

        All transformer arguments are forwarded unchanged to
        MultiViewAlternatingAttentionTransformer.__init__; the last three options below are
        forwarded to IntermediateFeatureReturner.__init__.

        Args:
            name (str): Name forwarded to the base transformer.
            input_embed_dim (int): Dimension of input embeddings.
            use_pe_for_non_reference_views (bool): Whether to use view positional encoding for non-reference views. (default: False)
            max_num_views_for_pe (int): Maximum number of views for positional encoding. (default: 1000)
            use_rand_idx_pe_for_non_reference_views (bool): Whether to use random index positional encoding for non-reference views. (default: True)
            size (str): Interpretable size label of the transformer (e.g., base, large, ...). (default: None)
            depth (int): Number of transformer layers. (default: 12)
            dim (int): Dimension of the transformer. (default: 768)
            num_heads (int): Number of attention heads. (default: 12)
            mlp_ratio (float): Ratio of hidden to input dimension in MLP. (default: 4.0)
            qkv_bias (bool): Whether to include bias in qkv projection. (default: True)
            qk_norm (bool): Whether to normalize q and k. (default: False)
            proj_drop (float): Dropout rate for output. (default: 0.0)
            attn_drop (float): Dropout rate for attention weights. (default: 0.0)
            init_values (float): Initial value for LayerScale gamma. (default: None)
            drop_path (float): Dropout rate for stochastic depth. (default: 0.0)
            act_layer (nn.Module): Activation layer. (default: nn.GELU)
            norm_layer (nn.Module): Normalization layer. (default: nn.LayerNorm with eps=1e-6)
            mlp_layer (nn.Module): MLP layer. (default: Mlp)
            custom_positional_encoding (Callable): Custom positional encoding function. (default: None)
            use_scalable_softmax (bool): Whether to use scalable softmax. (default: False)
            use_entropy_scaling (bool): Whether to use entropy scaling. (default: False)
            base_token_count_for_entropy_scaling (int): Base token count for entropy scaling. (default: 444)
                Computed using (518, 168) as base resolution with 14 patch size.
            entropy_scaling_growth_factor (float): Growth factor for entropy scaling. (default: 1.4)
            pretrained_checkpoint_path (str, optional): Path to the pretrained checkpoint. (default: None)
            indices (Optional[Union[int, List[int]]], optional): Layers whose features are returned. (default: None)
                - None: Return all intermediate layers.
                - int: Return the last n layers.
                - List[int]: Return the intermediate layers at the specified indices.
            norm_intermediate (bool, optional): Whether to normalize the intermediate features. (default: True)
            intermediates_only (bool, optional): Whether to return only the intermediate features. (default: False)
            gradient_checkpointing (bool, optional): Whether to use gradient checkpointing. (default: False)
        """
        # Both parents are initialised explicitly (no cooperative super() chain)
        MultiViewAlternatingAttentionTransformer.__init__(
            self,
            *args,
            name=name,
            input_embed_dim=input_embed_dim,
            use_pe_for_non_reference_views=use_pe_for_non_reference_views,
            max_num_views_for_pe=max_num_views_for_pe,
            use_rand_idx_pe_for_non_reference_views=use_rand_idx_pe_for_non_reference_views,
            size=size,
            depth=depth,
            dim=dim,
            num_heads=num_heads,
            mlp_ratio=mlp_ratio,
            qkv_bias=qkv_bias,
            qk_norm=qk_norm,
            proj_drop=proj_drop,
            attn_drop=attn_drop,
            init_values=init_values,
            drop_path=drop_path,
            act_layer=act_layer,
            norm_layer=norm_layer,
            mlp_layer=mlp_layer,
            custom_positional_encoding=custom_positional_encoding,
            use_scalable_softmax=use_scalable_softmax,
            use_entropy_scaling=use_entropy_scaling,
            base_token_count_for_entropy_scaling=base_token_count_for_entropy_scaling,
            entropy_scaling_growth_factor=entropy_scaling_growth_factor,
            pretrained_checkpoint_path=pretrained_checkpoint_path,
            gradient_checkpointing=gradient_checkpointing,
            **kwargs,
        )
        IntermediateFeatureReturner.__init__(
            self,
            indices=indices,
            norm_intermediate=norm_intermediate,
            intermediates_only=intermediates_only,
        )

    def forward(
        self,
        model_input: MultiViewTransformerInput,
    ) -> Union[
        List[MultiViewTransformerOutput],
        Tuple[MultiViewTransformerOutput, List[MultiViewTransformerOutput]],
    ]:
        """
        Run the alternating-attention transformer and collect features at the selected layers.

        Args:
            model_input (MultiViewTransformerInput): Input to the model.
                features is a list with one (batch, input_embed_dim, height, width) tensor per view;
                all views are stacked, so they must share one shape.
                additional_input_tokens, if given, is a (batch, input_embed_dim, num_of_additional_tokens)
                tensor whose tokens are appended after the view tokens.

        Returns:
            Union[List[MultiViewTransformerOutput], Tuple[MultiViewTransformerOutput, List[MultiViewTransformerOutput]]]:
                If intermediates_only is True, the list of intermediate outputs.
                Otherwise a tuple of (final output, list of intermediate outputs).
        """
        views = model_input.features
        extra_tokens = model_input.additional_input_tokens

        # Validate the view count (only relevant when view PE is used) and the per-view shapes
        if self.use_pe_for_non_reference_views:
            assert (
                len(views) <= self.max_num_views_for_pe
            ), f"Expected less than {self.max_num_views_for_pe} views, got {len(views)}"
        assert all(
            view.shape[1] == self.input_embed_dim for view in views
        ), f"All views must have input dimension {self.input_embed_dim}"
        assert all(view.ndim == 4 for view in views), "All views must have 4 dimensions (N, C, H, W)"

        # Layers whose outputs are collected
        collected = []
        take_indices, _ = feature_take_indices(self.depth, self.indices)

        # Sizes derived from the first view
        num_of_views = len(views)
        batch_size, _, height, width = views[0].shape
        tokens_per_view = height * width
        num_view_tokens = num_of_views * tokens_per_view

        # (N, C, H, W) per view -> (N, V, C, H, W) -> (N, V, H, W, C) -> (N, V * H * W, C)
        tokens = torch.stack(views, dim=1)
        tokens = tokens.permute(0, 1, 3, 4, 2)
        tokens = tokens.reshape(batch_size, num_of_views * height * width, self.input_embed_dim).contiguous()

        # Append the additional tokens (if any) behind the view tokens
        if extra_tokens is not None:
            assert extra_tokens.ndim == 3, "Additional tokens must have 3 dimensions (N, C, T)"
            assert (
                extra_tokens.shape[1] == self.input_embed_dim
            ), f"Additional tokens must have input dimension {self.input_embed_dim}"
            assert extra_tokens.shape[0] == batch_size, "Batch size mismatch for additional tokens"

            # (N, C, T) -> (N, T, C) so the tokens are channel-last like the view tokens
            extra_tokens_channel_last = extra_tokens.permute(0, 2, 1).contiguous()
            tokens = torch.cat([tokens, extra_tokens_channel_last], dim=1)

        # Project input features to the transformer dimension
        tokens = self.proj_embed(tokens)

        # Patch positions: one position grid reused for every view, or a list of None placeholders
        if self.custom_positional_encoding is not None:
            single_view_positions = self.position_getter(batch_size, height, width, tokens.device)
            positions = torch.cat([single_view_positions] * num_of_views, dim=1)  # (N, V * H * W, C)
        else:
            positions = [None] * num_of_views

        if extra_tokens is not None:
            # NOTE(review): shape[1] is the channel dimension (the token count is shape[2]), and when
            # custom positional encoding is enabled `positions` is a tensor here, so adding a list of
            # None looks like it cannot work -- confirm the intended behaviour with the attention blocks.
            positions = positions + [None] * extra_tokens.shape[1]

        # View positional encoding for the reference view (table index 0)
        ref_view_pe = self.view_pos_table[0].clone().detach().reshape((1, 1, self.dim))
        ref_view_pe = ref_view_pe.repeat(batch_size, tokens_per_view, 1)
        ref_view_tokens = tokens[:, :tokens_per_view, :] + ref_view_pe

        # Non-reference views optionally receive a view positional encoding as well
        if self.use_pe_for_non_reference_views:
            # Table indices are either drawn at random from [1, max_num_views_for_pe) or sequential from 1
            if self.use_rand_idx_pe_for_non_reference_views:
                pe_indices = torch.randint(low=1, high=self.max_num_views_for_pe, size=(num_of_views - 1,))
            else:
                pe_indices = torch.arange(1, num_of_views)
            non_ref_view_pe = self.view_pos_table[pe_indices].clone().detach()
            non_ref_view_pe = non_ref_view_pe.reshape((1, num_of_views - 1, self.dim))
            non_ref_view_pe = non_ref_view_pe.repeat_interleave(tokens_per_view, dim=1)
            non_ref_view_pe = non_ref_view_pe.repeat(batch_size, 1, 1)
            non_ref_view_tokens = tokens[:, tokens_per_view:num_view_tokens, :] + non_ref_view_pe
        else:
            non_ref_view_tokens = tokens[:, tokens_per_view:num_view_tokens, :]

        # Reassemble the sequence; additional tokens get no view positional encoding
        sequence_parts = [ref_view_tokens, non_ref_view_tokens]
        if extra_tokens is not None:
            sequence_parts.append(tokens[:, num_view_tokens:, :])
        tokens = torch.cat(sequence_parts, dim=1)

        # Even layers attend globally across all tokens, odd layers attend within each view
        for depth_idx in range(self.depth):
            block = self.self_attention_blocks[depth_idx]
            if depth_idx % 2 == 0:
                tokens = block(tokens, positions)
            else:
                # Additional tokens are set aside during frame-level attention
                extra_features = None
                extra_positions = None
                if extra_tokens is not None:
                    extra_features = tokens[:, num_view_tokens:, :]
                    tokens = tokens[:, :num_view_tokens, :]

                    if self.custom_positional_encoding is not None:
                        extra_positions = positions[:, num_view_tokens:, :]
                        positions = positions[:, :num_view_tokens, :]

                # (N, V * H * W, C) -> (N * V, H * W, C)
                tokens = tokens.reshape(batch_size * num_of_views, tokens_per_view, self.dim).contiguous()
                if positions[0] is not None:
                    positions = positions.reshape(batch_size * num_of_views, tokens_per_view, 2).contiguous()

                tokens = block(tokens, positions)

                # (N * V, H * W, C) -> (N, V * H * W, C)
                tokens = tokens.reshape(batch_size, num_view_tokens, self.dim).contiguous()
                if positions[0] is not None:
                    positions = positions.reshape(batch_size, num_view_tokens, 2).contiguous()

                # Put the additional tokens (and their positions) back at the end of the sequence
                if extra_features is not None:
                    tokens = torch.cat([tokens, extra_features], dim=1)
                if extra_positions is not None:
                    positions = torch.cat([positions, extra_positions], dim=1)

            if depth_idx in take_indices:
                # Intermediate features optionally pass through the final norm layer
                collected.append(self.norm(tokens) if self.norm_intermediate else tokens)

        def to_output(token_features):
            "Convert a (N, V * H * W [+ T], C) token tensor into a MultiViewTransformerOutput"
            extra_token_features = None
            if extra_tokens is not None:
                extra_token_features = token_features[:, num_view_tokens:, :]
                extra_token_features = extra_token_features.permute(0, 2, 1).contiguous()  # (N, C, T)
                token_features = token_features[:, :num_view_tokens, :]

            # (N, V * H * W, C) -> (N, V, H, W, C) -> (N, V, C, H, W)
            per_view = token_features.reshape(batch_size, num_of_views, height, width, self.dim)
            per_view = per_view.permute(0, 1, 4, 2, 3).contiguous()

            # One (N, C, H, W) tensor per view
            view_list = [single_view.squeeze(dim=1) for single_view in per_view.split(1, dim=1)]
            return MultiViewTransformerOutput(features=view_list, additional_token_features=extra_token_features)

        intermediate_outputs = [to_output(layer_features) for layer_features in collected]

        if self.intermediates_only:
            return intermediate_outputs

        # The final output always goes through the norm layer
        final_output = to_output(self.norm(tokens))

        return final_output, intermediate_outputs
758
+
759
+
760
def dummy_positional_encoding(x, xpos):
    """
    Dummy function for positional encoding of tokens.

    Args:
        x: Token features; returned unchanged.
        xpos: Token positions; accepted for signature compatibility and ignored.

    Returns:
        The input x, untouched.
    """
    # Identity: the positions are deliberately unused
    return x
765
+
766
+
767
def test_reshape_for_frame_attention():
    """
    Check that reshaping (N, V * H * W, C) tokens to (N * V, H * W, C) groups tokens per view.

    Every token is tagged with its own (batch, view, row, column) indices so that the
    location of each token after the reshape can be verified, as well as the round trip.
    """
    batch_size, num_of_views = 2, 3
    height = width = 2
    dim = 4
    num_of_tokens_per_view = height * width

    # Tag layout for one batch element: token order is view-major, then row, then column
    view_row_col_tags = torch.tensor(
        [[v, h, w] for v in range(num_of_views) for h in range(height) for w in range(width)]
    )
    x = torch.zeros(batch_size, num_of_views * num_of_tokens_per_view, dim)
    for b in range(batch_size):
        x[b, :, 0] = b
        x[b, :, 1:] = view_row_col_tags

    # Reshape as done for frame-level attention
    reshaped = x.reshape(batch_size * num_of_views, num_of_tokens_per_view, dim).contiguous()

    # Shape check
    assert reshaped.shape == (batch_size * num_of_views, num_of_tokens_per_view, dim)

    # Content check: row (b * V + v) must hold exactly the tokens of view v of batch element b
    expected = torch.tensor(
        [
            [[b, v, h, w] for h in range(height) for w in range(width)]
            for b in range(batch_size)
            for v in range(num_of_views)
        ]
    )
    assert torch.all(reshaped == expected)

    # Round trip back to the original layout
    restored = reshaped.reshape(batch_size, num_of_views * num_of_tokens_per_view, dim)
    assert torch.all(x == restored)

    print("Reshape test passed!")
805
+
806
+
807
if __name__ == "__main__":
    # Sanity-check the reshape logic that frame-level attention relies on
    test_reshape_for_frame_attention()

    # Forward passes without custom positional encoding, for several view counts
    for num_views in [2, 3, 4]:
        print(f"Testing MultiViewAlternatingAttentionTransformer with {num_views} views ...")
        view_pe_configs = [
            # No positional encoding for non-reference views
            {},
            # Sequential idx based positional encoding
            {
                "use_pe_for_non_reference_views": True,
                "max_num_views_for_pe": 1000,
                "use_rand_idx_pe_for_non_reference_views": False,
            },
            # Random idx based positional encoding
            {
                "use_pe_for_non_reference_views": True,
                "max_num_views_for_pe": 1000,
                "use_rand_idx_pe_for_non_reference_views": True,
            },
        ]
        for view_pe_config in view_pe_configs:
            model = MultiViewAlternatingAttentionTransformer(
                name="MV-AAT",
                input_embed_dim=1024,
                **view_pe_config,
            )
            model_input = MultiViewTransformerInput(
                features=[torch.rand(1, 1024, 14, 14) for _ in range(num_views)]
            )
            model_output = model(model_input)
            assert len(model_output.features) == num_views
            assert all(f.shape == (1, model.dim, 14, 14) for f in model_output.features)

    # Forward passes with a custom positional encoding function
    for num_views in [2, 3, 4]:
        print(
            f"Testing MultiViewAlternatingAttentionTransformer with {num_views} views and custom positional encoding ..."
        )
        model = MultiViewAlternatingAttentionTransformer(
            name="MV-AAT",
            input_embed_dim=1024,
            custom_positional_encoding=dummy_positional_encoding,
        )
        model_input = MultiViewTransformerInput(
            features=[torch.rand(1, 1024, 14, 14) for _ in range(num_views)]
        )
        model_output = model(model_input)
        assert len(model_output.features) == num_views
        assert all(f.shape == (1, model.dim, 14, 14) for f in model_output.features)

    print("All multi-view alternating-attention transformers initialized and tested successfully!")

    # Intermediate Feature Returner Tests
    print("Running Intermediate Feature Returner Tests ...")

    # Layer selection: an int picks the last n layers, a list picks specific layer indices
    for layer_selection, expected_count in [(6, 6), ([0, 2, 4, 6], 4)]:
        ifr_model = MultiViewAlternatingAttentionTransformerIFR(
            name="MV-AAT-IFR",
            input_embed_dim=1024,
            indices=layer_selection,
        )
        model_input = MultiViewTransformerInput(features=[torch.rand(1, 1024, 14, 14) for _ in range(2)])
        output = ifr_model(model_input)
        assert isinstance(output, tuple)
        assert isinstance(output[0], MultiViewTransformerOutput)
        assert len(output[1]) == expected_count
        assert all(isinstance(intermediate, MultiViewTransformerOutput) for intermediate in output[1])
        assert len(output[1][0].features) == 2

    # Normalization of intermediates: the last-layer intermediate equals the final output
    # only when the intermediate features are normalized
    for normalize in (False, True):
        ifr_model = MultiViewAlternatingAttentionTransformerIFR(
            name="MV-AAT-IFR",
            input_embed_dim=1024,
            indices=[-1],  # Last layer
            norm_intermediate=normalize,
        )
        model_input = MultiViewTransformerInput(features=[torch.rand(1, 1024, 14, 14) for _ in range(2)])
        output = ifr_model(model_input)
        for view_idx in range(2):
            features_match = torch.equal(output[0].features[view_idx], output[1][-1].features[view_idx])
            if normalize:
                assert features_match, "Final features and intermediate features (last layer) must be same."
            else:
                assert (
                    not features_match
                ), "Final features and intermediate features (last layer) must be different."

    print("All Intermediate Feature Returner Tests passed!")

    # Test additional input tokens for MultiViewAlternatingAttentionTransformer
    print("Testing MultiViewAlternatingAttentionTransformer with additional input tokens ...")
    model = MultiViewAlternatingAttentionTransformer(
        name="MV-AAT",
        input_embed_dim=1024,
    )
    num_views = 2
    num_additional_tokens = 5
    view_features = [torch.rand(1, 1024, 14, 14) for _ in range(num_views)]
    additional_tokens = torch.rand(1, 1024, num_additional_tokens)
    model_input = MultiViewTransformerInput(features=view_features, additional_input_tokens=additional_tokens)
    model_output = model(model_input)
    assert len(model_output.features) == num_views
    assert all(f.shape == (1, model.dim, 14, 14) for f in model_output.features)
    assert model_output.additional_token_features is not None
    assert model_output.additional_token_features.shape == (1, model.dim, num_additional_tokens)

    # Test additional input tokens for MultiViewAlternatingAttentionTransformerIFR
    print("Testing MultiViewAlternatingAttentionTransformerIFR with additional input tokens ...")
    model_ifr = MultiViewAlternatingAttentionTransformerIFR(
        name="MV-AAT-IFR",
        input_embed_dim=1024,
        indices=[0, 2, 4],
    )
    view_features = [torch.rand(1, 1024, 14, 14) for _ in range(num_views)]
    additional_tokens = torch.rand(1, 1024, num_additional_tokens)
    model_input = MultiViewTransformerInput(features=view_features, additional_input_tokens=additional_tokens)
    output = model_ifr(model_input)
    final_output, intermediates = output[0], output[1]
    expected_token_shape = (1, model_ifr.dim, num_additional_tokens)
    assert isinstance(output, tuple)
    assert isinstance(final_output, MultiViewTransformerOutput)
    assert final_output.additional_token_features is not None
    assert final_output.additional_token_features.shape == expected_token_shape
    assert len(intermediates) == 3
    assert all(isinstance(intermediate, MultiViewTransformerOutput) for intermediate in intermediates)
    assert all(intermediate.additional_token_features is not None for intermediate in intermediates)
    assert all(
        intermediate.additional_token_features.shape == expected_token_shape for intermediate in intermediates
    )

    print("All tests using additional input tokens passed!")