vismatch 1.1.1__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (2042)
  1. vismatch/TEMPLATE.py +101 -0
  2. vismatch/__init__.py +475 -0
  3. vismatch/assets/example_pairs/false_positive/chartres.jpg +0 -0
  4. vismatch/assets/example_pairs/false_positive/notre_dame.jpg +0 -0
  5. vismatch/assets/example_pairs/fresco/fsm.jpg +0 -0
  6. vismatch/assets/example_pairs/fresco/sist_chapel.jpg +0 -0
  7. vismatch/assets/example_pairs/indoor/gcs_close.jpg +0 -0
  8. vismatch/assets/example_pairs/indoor/gcs_far.jpg +0 -0
  9. vismatch/assets/example_pairs/outdoor/montmartre_close.jpg +0 -0
  10. vismatch/assets/example_pairs/outdoor/montmartre_far.jpg +0 -0
  11. vismatch/assets/example_pairs/sat2iss/photo_from_iss.jpg +0 -0
  12. vismatch/assets/example_pairs/sat2iss/satellite_img.jpg +0 -0
  13. vismatch/assets/example_pairs/sphereglue/barbershop-00000000.jpg +0 -0
  14. vismatch/assets/example_pairs/sphereglue/barbershop-00000001.jpg +0 -0
  15. vismatch/assets/example_pairs/thermal/thermal.jpg +0 -0
  16. vismatch/assets/example_pairs/thermal/visible.jpg +0 -0
  17. vismatch/assets/example_test/original.jpg +0 -0
  18. vismatch/assets/example_test/warped.jpg +0 -0
  19. vismatch/base_matcher.py +242 -0
  20. vismatch/im_models/__init__.py +0 -0
  21. vismatch/im_models/aff_steerers.py +143 -0
  22. vismatch/im_models/aspanformer.py +74 -0
  23. vismatch/im_models/dedode.py +150 -0
  24. vismatch/im_models/duster.py +104 -0
  25. vismatch/im_models/edm.py +64 -0
  26. vismatch/im_models/efficient_loftr.py +60 -0
  27. vismatch/im_models/gim.py +187 -0
  28. vismatch/im_models/handcrafted.py +81 -0
  29. vismatch/im_models/keypt2subpx.py +154 -0
  30. vismatch/im_models/kornia.py +72 -0
  31. vismatch/im_models/liftfeat.py +44 -0
  32. vismatch/im_models/lightglue.py +75 -0
  33. vismatch/im_models/lisrd.py +98 -0
  34. vismatch/im_models/loftr.py +23 -0
  35. vismatch/im_models/master.py +107 -0
  36. vismatch/im_models/matchanything.py +221 -0
  37. vismatch/im_models/matchformer.py +61 -0
  38. vismatch/im_models/matching_toolbox.py +238 -0
  39. vismatch/im_models/minima.py +164 -0
  40. vismatch/im_models/omniglue.py +91 -0
  41. vismatch/im_models/rdd.py +250 -0
  42. vismatch/im_models/ripe.py +55 -0
  43. vismatch/im_models/roma.py +92 -0
  44. vismatch/im_models/romav2.py +62 -0
  45. vismatch/im_models/se2loftr.py +71 -0
  46. vismatch/im_models/silk.py +405 -0
  47. vismatch/im_models/sphereglue.py +97 -0
  48. vismatch/im_models/steerers.py +140 -0
  49. vismatch/im_models/topicfm.py +93 -0
  50. vismatch/im_models/ufm.py +57 -0
  51. vismatch/im_models/xfeat.py +78 -0
  52. vismatch/im_models/xfeat_steerers.py +151 -0
  53. vismatch/im_models/xoftr.py +71 -0
  54. vismatch/third_party/DeDoDe/DeDoDe/__init__.py +2 -0
  55. vismatch/third_party/DeDoDe/DeDoDe/benchmarks/__init__.py +4 -0
  56. vismatch/third_party/DeDoDe/DeDoDe/benchmarks/mega_pose_est.py +114 -0
  57. vismatch/third_party/DeDoDe/DeDoDe/benchmarks/mega_pose_est_mnn.py +119 -0
  58. vismatch/third_party/DeDoDe/DeDoDe/benchmarks/nll_benchmark.py +57 -0
  59. vismatch/third_party/DeDoDe/DeDoDe/benchmarks/num_inliers.py +76 -0
  60. vismatch/third_party/DeDoDe/DeDoDe/checkpoint.py +59 -0
  61. vismatch/third_party/DeDoDe/DeDoDe/datasets/__init__.py +0 -0
  62. vismatch/third_party/DeDoDe/DeDoDe/datasets/megadepth.py +269 -0
  63. vismatch/third_party/DeDoDe/DeDoDe/decoder.py +90 -0
  64. vismatch/third_party/DeDoDe/DeDoDe/descriptors/__init__.py +0 -0
  65. vismatch/third_party/DeDoDe/DeDoDe/descriptors/dedode_descriptor.py +50 -0
  66. vismatch/third_party/DeDoDe/DeDoDe/descriptors/descriptor_loss.py +68 -0
  67. vismatch/third_party/DeDoDe/DeDoDe/detectors/__init__.py +0 -0
  68. vismatch/third_party/DeDoDe/DeDoDe/detectors/dedode_detector.py +76 -0
  69. vismatch/third_party/DeDoDe/DeDoDe/detectors/keypoint_loss.py +185 -0
  70. vismatch/third_party/DeDoDe/DeDoDe/encoder.py +87 -0
  71. vismatch/third_party/DeDoDe/DeDoDe/matchers/__init__.py +0 -0
  72. vismatch/third_party/DeDoDe/DeDoDe/matchers/dual_softmax_matcher.py +38 -0
  73. vismatch/third_party/DeDoDe/DeDoDe/model_zoo/__init__.py +3 -0
  74. vismatch/third_party/DeDoDe/DeDoDe/model_zoo/dedode_models.py +249 -0
  75. vismatch/third_party/DeDoDe/DeDoDe/train.py +76 -0
  76. vismatch/third_party/DeDoDe/DeDoDe/transformer/__init__.py +8 -0
  77. vismatch/third_party/DeDoDe/DeDoDe/transformer/dinov2.py +359 -0
  78. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/__init__.py +12 -0
  79. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/attention.py +81 -0
  80. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/block.py +252 -0
  81. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/dino_head.py +59 -0
  82. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/drop_path.py +35 -0
  83. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/layer_scale.py +28 -0
  84. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/mlp.py +41 -0
  85. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/patch_embed.py +89 -0
  86. vismatch/third_party/DeDoDe/DeDoDe/transformer/layers/swiglu_ffn.py +63 -0
  87. vismatch/third_party/DeDoDe/DeDoDe/utils.py +717 -0
  88. vismatch/third_party/DeDoDe/data_prep/prep_keypoints.py +103 -0
  89. vismatch/third_party/DeDoDe/demo/demo_kpts.py +24 -0
  90. vismatch/third_party/DeDoDe/demo/demo_match.py +46 -0
  91. vismatch/third_party/DeDoDe/demo/demo_match_dedode_G.py +45 -0
  92. vismatch/third_party/DeDoDe/demo/demo_scoremap.py +23 -0
  93. vismatch/third_party/DeDoDe/experiments/dedode_descriptor-B.py +135 -0
  94. vismatch/third_party/DeDoDe/experiments/dedode_descriptor-G.py +145 -0
  95. vismatch/third_party/DeDoDe/experiments/dedode_detector.py +126 -0
  96. vismatch/third_party/DeDoDe/experiments/eval/eval_dedode_descriptor-B.py +38 -0
  97. vismatch/third_party/DeDoDe/experiments/eval/eval_dedode_descriptor-G.py +38 -0
  98. vismatch/third_party/DeDoDe/setup.py +11 -0
  99. vismatch/third_party/EDM/configs/data/__init__.py +0 -0
  100. vismatch/third_party/EDM/configs/data/base.py +37 -0
  101. vismatch/third_party/EDM/configs/data/megadepth_test_1500.py +23 -0
  102. vismatch/third_party/EDM/configs/data/megadepth_trainval_832.py +32 -0
  103. vismatch/third_party/EDM/configs/data/scannet_test_1500.py +24 -0
  104. vismatch/third_party/EDM/configs/data/scannet_trainval.py +31 -0
  105. vismatch/third_party/EDM/configs/edm/indoor/edm_base.py +15 -0
  106. vismatch/third_party/EDM/configs/edm/outdoor/edm_base.py +17 -0
  107. vismatch/third_party/EDM/deploy/export_onnx.py +69 -0
  108. vismatch/third_party/EDM/deploy/run_onnx.py +138 -0
  109. vismatch/third_party/EDM/runtime_single_pair.py +73 -0
  110. vismatch/third_party/EDM/src/__init__.py +0 -0
  111. vismatch/third_party/EDM/src/config/default.py +184 -0
  112. vismatch/third_party/EDM/src/datasets/megadepth.py +164 -0
  113. vismatch/third_party/EDM/src/datasets/sampler.py +95 -0
  114. vismatch/third_party/EDM/src/datasets/scannet.py +147 -0
  115. vismatch/third_party/EDM/src/edm/__init__.py +2 -0
  116. vismatch/third_party/EDM/src/edm/backbone/resnet.py +116 -0
  117. vismatch/third_party/EDM/src/edm/edm.py +204 -0
  118. vismatch/third_party/EDM/src/edm/head/coarse_matching.py +158 -0
  119. vismatch/third_party/EDM/src/edm/head/fine_matching.py +383 -0
  120. vismatch/third_party/EDM/src/edm/neck/__init__.py +1 -0
  121. vismatch/third_party/EDM/src/edm/neck/loftr_module/__init__.py +1 -0
  122. vismatch/third_party/EDM/src/edm/neck/loftr_module/transformer.py +418 -0
  123. vismatch/third_party/EDM/src/edm/neck/neck.py +156 -0
  124. vismatch/third_party/EDM/src/edm/utils/geometry.py +58 -0
  125. vismatch/third_party/EDM/src/edm/utils/supervision.py +255 -0
  126. vismatch/third_party/EDM/src/lightning/data.py +450 -0
  127. vismatch/third_party/EDM/src/lightning/lightning_edm.py +379 -0
  128. vismatch/third_party/EDM/src/losses/edm_loss.py +206 -0
  129. vismatch/third_party/EDM/src/optimizers/__init__.py +57 -0
  130. vismatch/third_party/EDM/src/utils/augment.py +65 -0
  131. vismatch/third_party/EDM/src/utils/comm.py +271 -0
  132. vismatch/third_party/EDM/src/utils/dataloader.py +24 -0
  133. vismatch/third_party/EDM/src/utils/dataset.py +192 -0
  134. vismatch/third_party/EDM/src/utils/metrics.py +299 -0
  135. vismatch/third_party/EDM/src/utils/misc.py +113 -0
  136. vismatch/third_party/EDM/src/utils/plotting.py +186 -0
  137. vismatch/third_party/EDM/src/utils/profiler.py +40 -0
  138. vismatch/third_party/EDM/src/utils/warppers.py +428 -0
  139. vismatch/third_party/EDM/src/utils/warppers_utils.py +172 -0
  140. vismatch/third_party/EDM/test.py +132 -0
  141. vismatch/third_party/EDM/train.py +156 -0
  142. vismatch/third_party/EfficientLoFTR/configs/data/__init__.py +0 -0
  143. vismatch/third_party/EfficientLoFTR/configs/data/base.py +35 -0
  144. vismatch/third_party/EfficientLoFTR/configs/data/megadepth_test_1500.py +13 -0
  145. vismatch/third_party/EfficientLoFTR/configs/data/megadepth_trainval_832.py +24 -0
  146. vismatch/third_party/EfficientLoFTR/configs/data/scannet_test_1500.py +16 -0
  147. vismatch/third_party/EfficientLoFTR/configs/loftr/eloftr_full.py +36 -0
  148. vismatch/third_party/EfficientLoFTR/configs/loftr/eloftr_optimized.py +37 -0
  149. vismatch/third_party/EfficientLoFTR/src/__init__.py +0 -0
  150. vismatch/third_party/EfficientLoFTR/src/config/default.py +182 -0
  151. vismatch/third_party/EfficientLoFTR/src/datasets/megadepth.py +133 -0
  152. vismatch/third_party/EfficientLoFTR/src/datasets/sampler.py +77 -0
  153. vismatch/third_party/EfficientLoFTR/src/datasets/scannet.py +129 -0
  154. vismatch/third_party/EfficientLoFTR/src/lightning/data.py +357 -0
  155. vismatch/third_party/EfficientLoFTR/src/lightning/lightning_loftr.py +272 -0
  156. vismatch/third_party/EfficientLoFTR/src/loftr/__init__.py +4 -0
  157. vismatch/third_party/EfficientLoFTR/src/loftr/backbone/__init__.py +11 -0
  158. vismatch/third_party/EfficientLoFTR/src/loftr/backbone/backbone.py +37 -0
  159. vismatch/third_party/EfficientLoFTR/src/loftr/backbone/repvgg.py +224 -0
  160. vismatch/third_party/EfficientLoFTR/src/loftr/loftr.py +124 -0
  161. vismatch/third_party/EfficientLoFTR/src/loftr/loftr_module/__init__.py +2 -0
  162. vismatch/third_party/EfficientLoFTR/src/loftr/loftr_module/fine_preprocess.py +112 -0
  163. vismatch/third_party/EfficientLoFTR/src/loftr/loftr_module/linear_attention.py +103 -0
  164. vismatch/third_party/EfficientLoFTR/src/loftr/loftr_module/transformer.py +164 -0
  165. vismatch/third_party/EfficientLoFTR/src/loftr/utils/coarse_matching.py +241 -0
  166. vismatch/third_party/EfficientLoFTR/src/loftr/utils/fine_matching.py +156 -0
  167. vismatch/third_party/EfficientLoFTR/src/loftr/utils/full_config.py +50 -0
  168. vismatch/third_party/EfficientLoFTR/src/loftr/utils/geometry.py +54 -0
  169. vismatch/third_party/EfficientLoFTR/src/loftr/utils/opt_config.py +50 -0
  170. vismatch/third_party/EfficientLoFTR/src/loftr/utils/position_encoding.py +50 -0
  171. vismatch/third_party/EfficientLoFTR/src/loftr/utils/supervision.py +275 -0
  172. vismatch/third_party/EfficientLoFTR/src/losses/loftr_loss.py +229 -0
  173. vismatch/third_party/EfficientLoFTR/src/optimizers/__init__.py +42 -0
  174. vismatch/third_party/EfficientLoFTR/src/utils/augment.py +55 -0
  175. vismatch/third_party/EfficientLoFTR/src/utils/comm.py +265 -0
  176. vismatch/third_party/EfficientLoFTR/src/utils/dataloader.py +23 -0
  177. vismatch/third_party/EfficientLoFTR/src/utils/dataset.py +186 -0
  178. vismatch/third_party/EfficientLoFTR/src/utils/metrics.py +264 -0
  179. vismatch/third_party/EfficientLoFTR/src/utils/misc.py +106 -0
  180. vismatch/third_party/EfficientLoFTR/src/utils/plotting.py +154 -0
  181. vismatch/third_party/EfficientLoFTR/src/utils/profiler.py +39 -0
  182. vismatch/third_party/EfficientLoFTR/src/utils/warppers.py +426 -0
  183. vismatch/third_party/EfficientLoFTR/src/utils/warppers_utils.py +171 -0
  184. vismatch/third_party/EfficientLoFTR/test.py +143 -0
  185. vismatch/third_party/EfficientLoFTR/train.py +154 -0
  186. vismatch/third_party/LISRD/lisrd/__init__.py +0 -0
  187. vismatch/third_party/LISRD/lisrd/datasets/__init__.py +7 -0
  188. vismatch/third_party/LISRD/lisrd/datasets/base_dataset.py +38 -0
  189. vismatch/third_party/LISRD/lisrd/datasets/coco.py +148 -0
  190. vismatch/third_party/LISRD/lisrd/datasets/flashes.py +170 -0
  191. vismatch/third_party/LISRD/lisrd/datasets/hpatches.py +135 -0
  192. vismatch/third_party/LISRD/lisrd/datasets/mixed_dataset.py +53 -0
  193. vismatch/third_party/LISRD/lisrd/datasets/rdnim.py +117 -0
  194. vismatch/third_party/LISRD/lisrd/datasets/utils/data_augmentation.py +168 -0
  195. vismatch/third_party/LISRD/lisrd/datasets/utils/data_reader.py +48 -0
  196. vismatch/third_party/LISRD/lisrd/datasets/utils/homographies.py +215 -0
  197. vismatch/third_party/LISRD/lisrd/datasets/vidit.py +152 -0
  198. vismatch/third_party/LISRD/lisrd/evaluation/__init__.py +0 -0
  199. vismatch/third_party/LISRD/lisrd/evaluation/descriptor_evaluation.py +142 -0
  200. vismatch/third_party/LISRD/lisrd/experiment.py +129 -0
  201. vismatch/third_party/LISRD/lisrd/export_features.py +148 -0
  202. vismatch/third_party/LISRD/lisrd/models/__init__.py +7 -0
  203. vismatch/third_party/LISRD/lisrd/models/backbones/__init__.py +0 -0
  204. vismatch/third_party/LISRD/lisrd/models/backbones/net_vlad.py +62 -0
  205. vismatch/third_party/LISRD/lisrd/models/backbones/vgg.py +46 -0
  206. vismatch/third_party/LISRD/lisrd/models/base_model.py +336 -0
  207. vismatch/third_party/LISRD/lisrd/models/keypoint_detectors.py +34 -0
  208. vismatch/third_party/LISRD/lisrd/models/lisrd.py +328 -0
  209. vismatch/third_party/LISRD/lisrd/models/lisrd_sift.py +289 -0
  210. vismatch/third_party/LISRD/lisrd/third_party/super_point_magic_leap/demo_superpoint.py +734 -0
  211. vismatch/third_party/LISRD/lisrd/utils/geometry_utils.py +123 -0
  212. vismatch/third_party/LISRD/lisrd/utils/losses.py +191 -0
  213. vismatch/third_party/LISRD/lisrd/utils/metrics.py +66 -0
  214. vismatch/third_party/LISRD/lisrd/utils/pytorch_utils.py +14 -0
  215. vismatch/third_party/LISRD/lisrd/utils/stdout_capturing.py +81 -0
  216. vismatch/third_party/LISRD/notebooks/utils.py +103 -0
  217. vismatch/third_party/LISRD/setup.py +4 -0
  218. vismatch/third_party/LiftFeat/dataset/__init__.py +0 -0
  219. vismatch/third_party/LiftFeat/dataset/coco_augmentor.py +298 -0
  220. vismatch/third_party/LiftFeat/dataset/coco_wrapper.py +175 -0
  221. vismatch/third_party/LiftFeat/dataset/dataset_utils.py +183 -0
  222. vismatch/third_party/LiftFeat/dataset/megadepth.py +177 -0
  223. vismatch/third_party/LiftFeat/dataset/megadepth_wrapper.py +167 -0
  224. vismatch/third_party/LiftFeat/demo.py +116 -0
  225. vismatch/third_party/LiftFeat/evaluation/HPatch_evaluation.py +182 -0
  226. vismatch/third_party/LiftFeat/evaluation/MegaDepth1500_evaluation.py +105 -0
  227. vismatch/third_party/LiftFeat/evaluation/eval_utils.py +127 -0
  228. vismatch/third_party/LiftFeat/loss/loss.py +291 -0
  229. vismatch/third_party/LiftFeat/models/interpolator.py +34 -0
  230. vismatch/third_party/LiftFeat/models/liftfeat_wrapper.py +172 -0
  231. vismatch/third_party/LiftFeat/models/model.py +419 -0
  232. vismatch/third_party/LiftFeat/tools/demo_match_video.py +145 -0
  233. vismatch/third_party/LiftFeat/tools/demo_vo.py +163 -0
  234. vismatch/third_party/LiftFeat/train.py +369 -0
  235. vismatch/third_party/LiftFeat/utils/VisualOdometry.py +339 -0
  236. vismatch/third_party/LiftFeat/utils/__init__.py +0 -0
  237. vismatch/third_party/LiftFeat/utils/alike_wrapper.py +45 -0
  238. vismatch/third_party/LiftFeat/utils/config.py +16 -0
  239. vismatch/third_party/LiftFeat/utils/depth_anything_wrapper.py +150 -0
  240. vismatch/third_party/LiftFeat/utils/featurebooster.py +247 -0
  241. vismatch/third_party/LiftFeat/utils/post_process.py +21 -0
  242. vismatch/third_party/LightGlue/benchmark.py +255 -0
  243. vismatch/third_party/LightGlue/lightglue/__init__.py +7 -0
  244. vismatch/third_party/LightGlue/lightglue/aliked.py +760 -0
  245. vismatch/third_party/LightGlue/lightglue/disk.py +55 -0
  246. vismatch/third_party/LightGlue/lightglue/dog_hardnet.py +41 -0
  247. vismatch/third_party/LightGlue/lightglue/lightglue.py +662 -0
  248. vismatch/third_party/LightGlue/lightglue/sift.py +216 -0
  249. vismatch/third_party/LightGlue/lightglue/superpoint.py +227 -0
  250. vismatch/third_party/LightGlue/lightglue/utils.py +165 -0
  251. vismatch/third_party/LightGlue/lightglue/viz2d.py +203 -0
  252. vismatch/third_party/MINIMA/demo.py +201 -0
  253. vismatch/third_party/MINIMA/src/__init__.py +0 -0
  254. vismatch/third_party/MINIMA/src/config/default.py +203 -0
  255. vismatch/third_party/MINIMA/src/config/default_for_megadepth_dense.py +203 -0
  256. vismatch/third_party/MINIMA/src/config/default_for_megadepth_sparse.py +203 -0
  257. vismatch/third_party/MINIMA/src/utils/__init__.py +0 -0
  258. vismatch/third_party/MINIMA/src/utils/culculate_auc.py +28 -0
  259. vismatch/third_party/MINIMA/src/utils/data_io.py +156 -0
  260. vismatch/third_party/MINIMA/src/utils/data_io_loftr.py +152 -0
  261. vismatch/third_party/MINIMA/src/utils/data_io_roma.py +186 -0
  262. vismatch/third_party/MINIMA/src/utils/data_io_sp_lg.py +158 -0
  263. vismatch/third_party/MINIMA/src/utils/load_model.py +164 -0
  264. vismatch/third_party/MINIMA/src/utils/metrics.py +214 -0
  265. vismatch/third_party/MINIMA/src/utils/misc.py +101 -0
  266. vismatch/third_party/MINIMA/src/utils/plotting.py +291 -0
  267. vismatch/third_party/MINIMA/src/utils/sample_h.py +142 -0
  268. vismatch/third_party/MINIMA/test_relative_homo_depth.py +683 -0
  269. vismatch/third_party/MINIMA/test_relative_homo_event.py +722 -0
  270. vismatch/third_party/MINIMA/test_relative_homo_mmim.py +669 -0
  271. vismatch/third_party/MINIMA/test_relative_pose_infrared.py +500 -0
  272. vismatch/third_party/MINIMA/test_relative_pose_mega_1500.py +487 -0
  273. vismatch/third_party/MINIMA/test_relative_pose_mega_1500_syn.py +516 -0
  274. vismatch/third_party/MINIMA/third_party/LightGlue/benchmark.py +255 -0
  275. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/__init__.py +7 -0
  276. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/aliked.py +758 -0
  277. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/disk.py +55 -0
  278. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/dog_hardnet.py +41 -0
  279. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/lightglue.py +655 -0
  280. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/sift.py +216 -0
  281. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/superpoint.py +227 -0
  282. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/utils.py +165 -0
  283. vismatch/third_party/MINIMA/third_party/LightGlue/lightglue/viz2d.py +184 -0
  284. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/__init__.py +0 -0
  285. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/base.py +35 -0
  286. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/megadepth_test_1500.py +11 -0
  287. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/megadepth_trainval_640.py +22 -0
  288. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/megadepth_trainval_840.py +22 -0
  289. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/scannet_test_1500.py +11 -0
  290. vismatch/third_party/MINIMA/third_party/LoFTR/configs/data/scannet_trainval.py +17 -0
  291. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ds.py +6 -0
  292. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ds_dense.py +8 -0
  293. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ot.py +6 -0
  294. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ot_dense.py +8 -0
  295. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/loftr_ds.py +5 -0
  296. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/loftr_ds_dense.py +7 -0
  297. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/loftr_ot.py +5 -0
  298. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/loftr_ot_dense.py +7 -0
  299. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/scannet/loftr_ds_eval.py +16 -0
  300. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/indoor/scannet/loftr_ds_eval_new.py +18 -0
  301. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ds.py +16 -0
  302. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ds_dense.py +17 -0
  303. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ot.py +16 -0
  304. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ot_dense.py +17 -0
  305. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/loftr_ds.py +15 -0
  306. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/loftr_ds_dense.py +16 -0
  307. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/loftr_ot.py +15 -0
  308. vismatch/third_party/MINIMA/third_party/LoFTR/configs/loftr/outdoor/loftr_ot_dense.py +16 -0
  309. vismatch/third_party/MINIMA/third_party/LoFTR/demo/demo_loftr.py +240 -0
  310. vismatch/third_party/MINIMA/third_party/LoFTR/src/__init__.py +0 -0
  311. vismatch/third_party/MINIMA/third_party/LoFTR/src/config/default.py +171 -0
  312. vismatch/third_party/MINIMA/third_party/LoFTR/src/datasets/megadepth.py +127 -0
  313. vismatch/third_party/MINIMA/third_party/LoFTR/src/datasets/sampler.py +77 -0
  314. vismatch/third_party/MINIMA/third_party/LoFTR/src/datasets/scannet.py +114 -0
  315. vismatch/third_party/MINIMA/third_party/LoFTR/src/lightning/data.py +320 -0
  316. vismatch/third_party/MINIMA/third_party/LoFTR/src/lightning/lightning_loftr.py +249 -0
  317. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/__init__.py +2 -0
  318. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/backbone/__init__.py +11 -0
  319. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/backbone/resnet_fpn.py +199 -0
  320. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/loftr.py +81 -0
  321. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/loftr_module/__init__.py +2 -0
  322. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/loftr_module/fine_preprocess.py +59 -0
  323. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/loftr_module/linear_attention.py +81 -0
  324. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/loftr_module/transformer.py +101 -0
  325. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/utils/coarse_matching.py +261 -0
  326. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/utils/cvpr_ds_config.py +50 -0
  327. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/utils/fine_matching.py +74 -0
  328. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/utils/geometry.py +54 -0
  329. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/utils/position_encoding.py +42 -0
  330. vismatch/third_party/MINIMA/third_party/LoFTR/src/loftr/utils/supervision.py +151 -0
  331. vismatch/third_party/MINIMA/third_party/LoFTR/src/losses/loftr_loss.py +192 -0
  332. vismatch/third_party/MINIMA/third_party/LoFTR/src/optimizers/__init__.py +42 -0
  333. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/augment.py +55 -0
  334. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/comm.py +265 -0
  335. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/dataloader.py +23 -0
  336. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/dataset.py +185 -0
  337. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/metrics.py +193 -0
  338. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/misc.py +101 -0
  339. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/plotting.py +154 -0
  340. vismatch/third_party/MINIMA/third_party/LoFTR/src/utils/profiler.py +39 -0
  341. vismatch/third_party/MINIMA/third_party/LoFTR/test.py +68 -0
  342. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/demo_superglue.py +259 -0
  343. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/match_pairs.py +425 -0
  344. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/models/__init__.py +0 -0
  345. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/models/matching.py +84 -0
  346. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/models/superglue.py +283 -0
  347. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/models/superpoint.py +202 -0
  348. vismatch/third_party/MINIMA/third_party/LoFTR/third_party/SuperGluePretrainedNetwork/models/utils.py +555 -0
  349. vismatch/third_party/MINIMA/third_party/LoFTR/train.py +123 -0
  350. vismatch/third_party/MINIMA/third_party/RoMa/demo/demo_3D_effect.py +47 -0
  351. vismatch/third_party/MINIMA/third_party/RoMa/demo/demo_fundamental.py +34 -0
  352. vismatch/third_party/MINIMA/third_party/RoMa/demo/demo_match.py +50 -0
  353. vismatch/third_party/MINIMA/third_party/RoMa/demo/demo_match_opencv_sift.py +43 -0
  354. vismatch/third_party/MINIMA/third_party/RoMa/demo/demo_match_tiny.py +77 -0
  355. vismatch/third_party/MINIMA/third_party/RoMa/experiments/eval_roma_outdoor.py +57 -0
  356. vismatch/third_party/MINIMA/third_party/RoMa/experiments/eval_tiny_roma_v1_outdoor.py +84 -0
  357. vismatch/third_party/MINIMA/third_party/RoMa/experiments/roma_indoor.py +320 -0
  358. vismatch/third_party/MINIMA/third_party/RoMa/experiments/train_roma_outdoor.py +307 -0
  359. vismatch/third_party/MINIMA/third_party/RoMa/experiments/train_tiny_roma_v1_outdoor.py +498 -0
  360. vismatch/third_party/MINIMA/third_party/RoMa/romatch/__init__.py +8 -0
  361. vismatch/third_party/MINIMA/third_party/RoMa/romatch/benchmarks/__init__.py +6 -0
  362. vismatch/third_party/MINIMA/third_party/RoMa/romatch/benchmarks/hpatches_sequences_homog_benchmark.py +113 -0
  363. vismatch/third_party/MINIMA/third_party/RoMa/romatch/benchmarks/megadepth_dense_benchmark.py +106 -0
  364. vismatch/third_party/MINIMA/third_party/RoMa/romatch/benchmarks/megadepth_pose_estimation_benchmark.py +118 -0
  365. vismatch/third_party/MINIMA/third_party/RoMa/romatch/benchmarks/megadepth_pose_estimation_benchmark_poselib.py +119 -0
  366. vismatch/third_party/MINIMA/third_party/RoMa/romatch/benchmarks/scannet_benchmark.py +143 -0
  367. vismatch/third_party/MINIMA/third_party/RoMa/romatch/checkpointing/__init__.py +1 -0
  368. vismatch/third_party/MINIMA/third_party/RoMa/romatch/checkpointing/checkpoint.py +60 -0
  369. vismatch/third_party/MINIMA/third_party/RoMa/romatch/datasets/__init__.py +2 -0
  370. vismatch/third_party/MINIMA/third_party/RoMa/romatch/datasets/megadepth.py +232 -0
  371. vismatch/third_party/MINIMA/third_party/RoMa/romatch/datasets/scannet.py +160 -0
  372. vismatch/third_party/MINIMA/third_party/RoMa/romatch/losses/__init__.py +1 -0
  373. vismatch/third_party/MINIMA/third_party/RoMa/romatch/losses/robust_loss.py +161 -0
  374. vismatch/third_party/MINIMA/third_party/RoMa/romatch/losses/robust_loss_tiny_roma.py +160 -0
  375. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/__init__.py +1 -0
  376. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/encoders.py +122 -0
  377. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/matcher.py +766 -0
  378. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/model_zoo/__init__.py +73 -0
  379. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/model_zoo/roma_models.py +170 -0
  380. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/tiny.py +304 -0
  381. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/__init__.py +48 -0
  382. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/dinov2.py +359 -0
  383. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/__init__.py +12 -0
  384. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/attention.py +81 -0
  385. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/block.py +252 -0
  386. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/dino_head.py +59 -0
  387. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/drop_path.py +35 -0
  388. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/layer_scale.py +28 -0
  389. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/mlp.py +41 -0
  390. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/patch_embed.py +89 -0
  391. vismatch/third_party/MINIMA/third_party/RoMa/romatch/models/transformer/layers/swiglu_ffn.py +63 -0
  392. vismatch/third_party/MINIMA/third_party/RoMa/romatch/train/__init__.py +1 -0
  393. vismatch/third_party/MINIMA/third_party/RoMa/romatch/train/train.py +102 -0
  394. vismatch/third_party/MINIMA/third_party/RoMa/romatch/utils/__init__.py +16 -0
  395. vismatch/third_party/MINIMA/third_party/RoMa/romatch/utils/kde.py +13 -0
  396. vismatch/third_party/MINIMA/third_party/RoMa/romatch/utils/local_correlation.py +48 -0
  397. vismatch/third_party/MINIMA/third_party/RoMa/romatch/utils/transforms.py +118 -0
  398. vismatch/third_party/MINIMA/third_party/RoMa/romatch/utils/utils.py +662 -0
  399. vismatch/third_party/MINIMA/third_party/RoMa/setup.py +9 -0
  400. vismatch/third_party/MINIMA/third_party/XoFTR/configs/data/__init__.py +0 -0
  401. vismatch/third_party/MINIMA/third_party/XoFTR/configs/data/base.py +35 -0
  402. vismatch/third_party/MINIMA/third_party/XoFTR/configs/data/megadepth_trainval_840.py +22 -0
  403. vismatch/third_party/MINIMA/third_party/XoFTR/configs/data/megadepth_vistir_trainval_640.py +23 -0
  404. vismatch/third_party/MINIMA/third_party/XoFTR/configs/data/pretrain.py +8 -0
  405. vismatch/third_party/MINIMA/third_party/XoFTR/configs/xoftr/outdoor/visible_thermal.py +17 -0
  406. vismatch/third_party/MINIMA/third_party/XoFTR/configs/xoftr/pretrain/pretrain.py +12 -0
  407. vismatch/third_party/MINIMA/third_party/XoFTR/pretrain.py +125 -0
  408. vismatch/third_party/MINIMA/third_party/XoFTR/src/__init__.py +0 -0
  409. vismatch/third_party/MINIMA/third_party/XoFTR/src/config/default.py +203 -0
  410. vismatch/third_party/MINIMA/third_party/XoFTR/src/datasets/megadepth.py +143 -0
  411. vismatch/third_party/MINIMA/third_party/XoFTR/src/datasets/pretrain_dataset.py +156 -0
  412. vismatch/third_party/MINIMA/third_party/XoFTR/src/datasets/sampler.py +77 -0
  413. vismatch/third_party/MINIMA/third_party/XoFTR/src/datasets/scannet.py +114 -0
  414. vismatch/third_party/MINIMA/third_party/XoFTR/src/datasets/vistir.py +109 -0
  415. vismatch/third_party/MINIMA/third_party/XoFTR/src/lightning/data.py +346 -0
  416. vismatch/third_party/MINIMA/third_party/XoFTR/src/lightning/data_pretrain.py +125 -0
  417. vismatch/third_party/MINIMA/third_party/XoFTR/src/lightning/lightning_xoftr.py +334 -0
  418. vismatch/third_party/MINIMA/third_party/XoFTR/src/lightning/lightning_xoftr_pretrain.py +171 -0
  419. vismatch/third_party/MINIMA/third_party/XoFTR/src/losses/xoftr_loss.py +170 -0
  420. vismatch/third_party/MINIMA/third_party/XoFTR/src/losses/xoftr_loss_pretrain.py +37 -0
  421. vismatch/third_party/MINIMA/third_party/XoFTR/src/optimizers/__init__.py +42 -0
  422. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/augment.py +113 -0
  423. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/comm.py +265 -0
  424. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/data_io.py +144 -0
  425. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/dataloader.py +23 -0
  426. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/dataset.py +279 -0
  427. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/metrics.py +211 -0
  428. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/misc.py +101 -0
  429. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/plotting.py +227 -0
  430. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/pretrain_utils.py +83 -0
  431. vismatch/third_party/MINIMA/third_party/XoFTR/src/utils/profiler.py +39 -0
  432. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/__init__.py +2 -0
  433. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/backbone/__init__.py +1 -0
  434. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/backbone/resnet.py +95 -0
  435. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/utils/geometry.py +107 -0
  436. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/utils/position_encoding.py +36 -0
  437. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/utils/supervision.py +290 -0
  438. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr.py +94 -0
  439. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_module/__init__.py +4 -0
  440. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_module/coarse_matching.py +305 -0
  441. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_module/fine_matching.py +170 -0
  442. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_module/fine_process.py +321 -0
  443. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_module/linear_attention.py +81 -0
  444. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_module/transformer.py +101 -0
  445. vismatch/third_party/MINIMA/third_party/XoFTR/src/xoftr/xoftr_pretrain.py +209 -0
  446. vismatch/third_party/MINIMA/third_party/XoFTR/test.py +68 -0
  447. vismatch/third_party/MINIMA/third_party/XoFTR/test_relative_pose.py +330 -0
  448. vismatch/third_party/MINIMA/third_party/XoFTR/train.py +126 -0
  449. vismatch/third_party/MatchAnything/app.py +27 -0
  450. vismatch/third_party/MatchAnything/imcui/__init__.py +0 -0
  451. vismatch/third_party/MatchAnything/imcui/api/__init__.py +47 -0
  452. vismatch/third_party/MatchAnything/imcui/api/client.py +232 -0
  453. vismatch/third_party/MatchAnything/imcui/api/core.py +308 -0
  454. vismatch/third_party/MatchAnything/imcui/api/server.py +170 -0
  455. vismatch/third_party/MatchAnything/imcui/hloc/__init__.py +65 -0
  456. vismatch/third_party/MatchAnything/imcui/hloc/colmap_from_nvm.py +216 -0
  457. vismatch/third_party/MatchAnything/imcui/hloc/extract_features.py +607 -0
  458. vismatch/third_party/MatchAnything/imcui/hloc/extractors/__init__.py +0 -0
  459. vismatch/third_party/MatchAnything/imcui/hloc/extractors/alike.py +61 -0
  460. vismatch/third_party/MatchAnything/imcui/hloc/extractors/aliked.py +32 -0
  461. vismatch/third_party/MatchAnything/imcui/hloc/extractors/cosplace.py +44 -0
  462. vismatch/third_party/MatchAnything/imcui/hloc/extractors/d2net.py +60 -0
  463. vismatch/third_party/MatchAnything/imcui/hloc/extractors/darkfeat.py +44 -0
  464. vismatch/third_party/MatchAnything/imcui/hloc/extractors/dedode.py +86 -0
  465. vismatch/third_party/MatchAnything/imcui/hloc/extractors/dir.py +78 -0
  466. vismatch/third_party/MatchAnything/imcui/hloc/extractors/disk.py +35 -0
  467. vismatch/third_party/MatchAnything/imcui/hloc/extractors/dog.py +135 -0
  468. vismatch/third_party/MatchAnything/imcui/hloc/extractors/eigenplaces.py +57 -0
  469. vismatch/third_party/MatchAnything/imcui/hloc/extractors/example.py +56 -0
  470. vismatch/third_party/MatchAnything/imcui/hloc/extractors/fire.py +72 -0
  471. vismatch/third_party/MatchAnything/imcui/hloc/extractors/fire_local.py +84 -0
  472. vismatch/third_party/MatchAnything/imcui/hloc/extractors/lanet.py +63 -0
  473. vismatch/third_party/MatchAnything/imcui/hloc/extractors/netvlad.py +146 -0
  474. vismatch/third_party/MatchAnything/imcui/hloc/extractors/openibl.py +26 -0
  475. vismatch/third_party/MatchAnything/imcui/hloc/extractors/r2d2.py +73 -0
  476. vismatch/third_party/MatchAnything/imcui/hloc/extractors/rekd.py +60 -0
  477. vismatch/third_party/MatchAnything/imcui/hloc/extractors/rord.py +59 -0
  478. vismatch/third_party/MatchAnything/imcui/hloc/extractors/sfd2.py +44 -0
  479. vismatch/third_party/MatchAnything/imcui/hloc/extractors/sift.py +216 -0
  480. vismatch/third_party/MatchAnything/imcui/hloc/extractors/superpoint.py +51 -0
  481. vismatch/third_party/MatchAnything/imcui/hloc/extractors/xfeat.py +33 -0
  482. vismatch/third_party/MatchAnything/imcui/hloc/localize_inloc.py +179 -0
  483. vismatch/third_party/MatchAnything/imcui/hloc/localize_sfm.py +243 -0
  484. vismatch/third_party/MatchAnything/imcui/hloc/match_dense.py +1158 -0
  485. vismatch/third_party/MatchAnything/imcui/hloc/match_features.py +459 -0
  486. vismatch/third_party/MatchAnything/imcui/hloc/matchers/__init__.py +3 -0
  487. vismatch/third_party/MatchAnything/imcui/hloc/matchers/adalam.py +68 -0
  488. vismatch/third_party/MatchAnything/imcui/hloc/matchers/aspanformer.py +66 -0
  489. vismatch/third_party/MatchAnything/imcui/hloc/matchers/cotr.py +77 -0
  490. vismatch/third_party/MatchAnything/imcui/hloc/matchers/dkm.py +53 -0
  491. vismatch/third_party/MatchAnything/imcui/hloc/matchers/dual_softmax.py +71 -0
  492. vismatch/third_party/MatchAnything/imcui/hloc/matchers/duster.py +109 -0
  493. vismatch/third_party/MatchAnything/imcui/hloc/matchers/eloftr.py +97 -0
  494. vismatch/third_party/MatchAnything/imcui/hloc/matchers/gim.py +200 -0
  495. vismatch/third_party/MatchAnything/imcui/hloc/matchers/gluestick.py +99 -0
  496. vismatch/third_party/MatchAnything/imcui/hloc/matchers/imp.py +50 -0
  497. vismatch/third_party/MatchAnything/imcui/hloc/matchers/lightglue.py +67 -0
  498. vismatch/third_party/MatchAnything/imcui/hloc/matchers/loftr.py +58 -0
  499. vismatch/third_party/MatchAnything/imcui/hloc/matchers/mast3r.py +96 -0
  500. vismatch/third_party/MatchAnything/imcui/hloc/matchers/matchanything.py +191 -0
  501. vismatch/third_party/MatchAnything/imcui/hloc/matchers/mickey.py +50 -0
  502. vismatch/third_party/MatchAnything/imcui/hloc/matchers/nearest_neighbor.py +66 -0
  503. vismatch/third_party/MatchAnything/imcui/hloc/matchers/omniglue.py +80 -0
  504. vismatch/third_party/MatchAnything/imcui/hloc/matchers/roma.py +80 -0
  505. vismatch/third_party/MatchAnything/imcui/hloc/matchers/sgmnet.py +106 -0
  506. vismatch/third_party/MatchAnything/imcui/hloc/matchers/sold2.py +144 -0
  507. vismatch/third_party/MatchAnything/imcui/hloc/matchers/superglue.py +33 -0
  508. vismatch/third_party/MatchAnything/imcui/hloc/matchers/topicfm.py +60 -0
  509. vismatch/third_party/MatchAnything/imcui/hloc/matchers/xfeat_dense.py +54 -0
  510. vismatch/third_party/MatchAnything/imcui/hloc/matchers/xfeat_lightglue.py +48 -0
  511. vismatch/third_party/MatchAnything/imcui/hloc/matchers/xoftr.py +90 -0
  512. vismatch/third_party/MatchAnything/imcui/hloc/pairs_from_covisibility.py +60 -0
  513. vismatch/third_party/MatchAnything/imcui/hloc/pairs_from_exhaustive.py +64 -0
  514. vismatch/third_party/MatchAnything/imcui/hloc/pairs_from_poses.py +68 -0
  515. vismatch/third_party/MatchAnything/imcui/hloc/pairs_from_retrieval.py +133 -0
  516. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/4Seasons/__init__.py +0 -0
  517. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/4Seasons/localize.py +89 -0
  518. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/4Seasons/prepare_reference.py +51 -0
  519. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/4Seasons/utils.py +231 -0
  520. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/7Scenes/__init__.py +0 -0
  521. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/7Scenes/create_gt_sfm.py +134 -0
  522. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/7Scenes/pipeline.py +139 -0
  523. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/7Scenes/utils.py +34 -0
  524. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Aachen/__init__.py +0 -0
  525. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Aachen/pipeline.py +109 -0
  526. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Aachen_v1_1/__init__.py +0 -0
  527. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Aachen_v1_1/pipeline.py +104 -0
  528. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Aachen_v1_1/pipeline_loftr.py +104 -0
  529. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/CMU/__init__.py +0 -0
  530. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/CMU/pipeline.py +133 -0
  531. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Cambridge/__init__.py +0 -0
  532. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Cambridge/pipeline.py +140 -0
  533. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/Cambridge/utils.py +145 -0
  534. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/RobotCar/__init__.py +0 -0
  535. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/RobotCar/colmap_from_nvm.py +176 -0
  536. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/RobotCar/pipeline.py +143 -0
  537. vismatch/third_party/MatchAnything/imcui/hloc/pipelines/__init__.py +0 -0
  538. vismatch/third_party/MatchAnything/imcui/hloc/reconstruction.py +194 -0
  539. vismatch/third_party/MatchAnything/imcui/hloc/triangulation.py +311 -0
  540. vismatch/third_party/MatchAnything/imcui/hloc/utils/__init__.py +12 -0
  541. vismatch/third_party/MatchAnything/imcui/hloc/utils/base_model.py +56 -0
  542. vismatch/third_party/MatchAnything/imcui/hloc/utils/database.py +412 -0
  543. vismatch/third_party/MatchAnything/imcui/hloc/utils/geometry.py +16 -0
  544. vismatch/third_party/MatchAnything/imcui/hloc/utils/io.py +77 -0
  545. vismatch/third_party/MatchAnything/imcui/hloc/utils/parsers.py +59 -0
  546. vismatch/third_party/MatchAnything/imcui/hloc/utils/read_write_model.py +588 -0
  547. vismatch/third_party/MatchAnything/imcui/hloc/utils/viz.py +146 -0
  548. vismatch/third_party/MatchAnything/imcui/hloc/utils/viz_3d.py +203 -0
  549. vismatch/third_party/MatchAnything/imcui/hloc/visualization.py +178 -0
  550. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/configs/models/eloftr_model.py +128 -0
  551. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/configs/models/roma_model.py +27 -0
  552. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/notebooks/notebooks_utils/__init__.py +1 -0
  553. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/notebooks/notebooks_utils/plotting.py +344 -0
  554. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/__init__.py +0 -0
  555. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/config/default.py +344 -0
  556. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/datasets/common_data_pair.py +214 -0
  557. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/lightning/lightning_loftr.py +343 -0
  558. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/__init__.py +1 -0
  559. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/backbone/__init__.py +61 -0
  560. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/backbone/repvgg.py +319 -0
  561. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/backbone/resnet_fpn.py +1094 -0
  562. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/backbone/s2dnet.py +131 -0
  563. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/loftr.py +273 -0
  564. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/loftr_module/__init__.py +2 -0
  565. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/loftr_module/fine_preprocess.py +350 -0
  566. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/loftr_module/linear_attention.py +217 -0
  567. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/loftr_module/transformer.py +1768 -0
  568. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/loftr_module/transformer_utils.py +76 -0
  569. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/utils/coarse_matching.py +266 -0
  570. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/utils/fine_matching.py +493 -0
  571. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/utils/geometry.py +298 -0
  572. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/utils/position_encoding.py +131 -0
  573. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/loftr/utils/supervision.py +475 -0
  574. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/optimizers/__init__.py +50 -0
  575. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/__init__.py +0 -0
  576. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/augment.py +55 -0
  577. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/colmap/__init__.py +0 -0
  578. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/colmap/database.py +417 -0
  579. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/colmap/eval_helper.py +232 -0
  580. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/colmap/read_write_model.py +509 -0
  581. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/colmap.py +530 -0
  582. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/comm.py +265 -0
  583. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/dataloader.py +23 -0
  584. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/dataset.py +518 -0
  585. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/easydict.py +148 -0
  586. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/geometry.py +366 -0
  587. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/homography_utils.py +366 -0
  588. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/metrics.py +445 -0
  589. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/misc.py +101 -0
  590. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/plotting.py +248 -0
  591. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/profiler.py +39 -0
  592. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/ray_utils.py +134 -0
  593. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/sample_homo.py +58 -0
  594. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/src/utils/utils.py +600 -0
  595. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/demo/demo_3D_effect.py +46 -0
  596. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/demo/demo_fundamental.py +32 -0
  597. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/demo/demo_fundamental_model_warpper.py +34 -0
  598. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/demo/demo_match.py +50 -0
  599. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/demo/demo_match_opencv_sift.py +43 -0
  600. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/demo_single_pair.py +329 -0
  601. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/experiments/roma_indoor.py +320 -0
  602. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/experiments/roma_outdoor.py +327 -0
  603. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/notebooks/notebooks_utils/__init__.py +1 -0
  604. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/notebooks/notebooks_utils/plotting.py +331 -0
  605. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/__init__.py +8 -0
  606. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/benchmarks/__init__.py +4 -0
  607. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/benchmarks/hpatches_sequences_homog_benchmark.py +113 -0
  608. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/benchmarks/megadepth_dense_benchmark.py +106 -0
  609. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/benchmarks/megadepth_pose_estimation_benchmark.py +140 -0
  610. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/benchmarks/scannet_benchmark.py +143 -0
  611. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/checkpointing/__init__.py +1 -0
  612. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/checkpointing/checkpoint.py +60 -0
  613. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/datasets/__init__.py +2 -0
  614. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/datasets/megadepth.py +230 -0
  615. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/datasets/scannet.py +160 -0
  616. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/losses/__init__.py +1 -0
  617. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/losses/robust_loss.py +157 -0
  618. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/matchanything_roma_model.py +104 -0
  619. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/__init__.py +1 -0
  620. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/blocks.py +241 -0
  621. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/criterion.py +37 -0
  622. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/croco.py +253 -0
  623. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/croco_downstream.py +122 -0
  624. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/curope/__init__.py +4 -0
  625. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/curope/curope2d.py +40 -0
  626. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/curope/setup.py +34 -0
  627. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/dpt_block.py +450 -0
  628. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/head_downstream.py +58 -0
  629. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/masking.py +25 -0
  630. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/croco/pos_embed.py +159 -0
  631. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/__init__.py +2 -0
  632. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/cloud_opt/__init__.py +29 -0
  633. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/cloud_opt/base_opt.py +375 -0
  634. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/cloud_opt/commons.py +90 -0
  635. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/cloud_opt/init_im_poses.py +312 -0
  636. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/cloud_opt/optimizer.py +230 -0
  637. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/cloud_opt/pair_viewer.py +125 -0
  638. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/__init__.py +42 -0
  639. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/base/__init__.py +2 -0
  640. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/base/base_stereo_view_dataset.py +220 -0
  641. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/base/batched_sampler.py +74 -0
  642. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/base/easy_dataset.py +157 -0
  643. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/co3d.py +146 -0
  644. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/utils/__init__.py +2 -0
  645. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/utils/cropping.py +119 -0
  646. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/datasets/utils/transforms.py +11 -0
  647. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/heads/__init__.py +19 -0
  648. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/heads/dpt_head.py +114 -0
  649. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/heads/linear_head.py +41 -0
  650. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/heads/postprocess.py +58 -0
  651. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/image_pairs.py +83 -0
  652. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/inference.py +165 -0
  653. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/losses.py +297 -0
  654. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/model.py +167 -0
  655. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/optim_factory.py +14 -0
  656. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/patch_embed.py +70 -0
  657. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/post_process.py +60 -0
  658. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/utils/__init__.py +2 -0
  659. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/utils/device.py +76 -0
  660. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/utils/geometry.py +361 -0
  661. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/utils/image.py +104 -0
  662. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/utils/misc.py +121 -0
  663. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/utils/path_to_croco.py +19 -0
  664. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/dust3r/viz.py +320 -0
  665. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/encoders.py +137 -0
  666. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/matcher.py +937 -0
  667. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/model_zoo/__init__.py +53 -0
  668. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/model_zoo/roma_models.py +162 -0
  669. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/__init__.py +47 -0
  670. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/dinov2.py +359 -0
  671. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/__init__.py +12 -0
  672. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/attention.py +81 -0
  673. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/block.py +252 -0
  674. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/dino_head.py +59 -0
  675. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/drop_path.py +35 -0
  676. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/layer_scale.py +28 -0
  677. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/mlp.py +41 -0
  678. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/patch_embed.py +89 -0
  679. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/models/transformer/layers/swiglu_ffn.py +63 -0
  680. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/roma_adpat_model.py +32 -0
  681. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/train/__init__.py +1 -0
  682. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/train/train.py +102 -0
  683. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/utils/__init__.py +18 -0
  684. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/utils/kde.py +8 -0
  685. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/utils/local_correlation.py +44 -0
  686. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/utils/transforms.py +118 -0
  687. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/roma/utils/utils.py +661 -0
  688. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/third_party/ROMA/setup.py +9 -0
  689. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/tools/__init__.py +0 -0
  690. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/tools/evaluate_datasets.py +239 -0
  691. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/tools/tools_utils/data_io.py +94 -0
  692. vismatch/third_party/MatchAnything/imcui/third_party/MatchAnything/tools/tools_utils/plot.py +77 -0
  693. vismatch/third_party/MatchAnything/imcui/ui/__init__.py +5 -0
  694. vismatch/third_party/MatchAnything/imcui/ui/app_class.py +824 -0
  695. vismatch/third_party/MatchAnything/imcui/ui/sfm.py +164 -0
  696. vismatch/third_party/MatchAnything/imcui/ui/utils.py +1085 -0
  697. vismatch/third_party/MatchAnything/imcui/ui/viz.py +511 -0
  698. vismatch/third_party/MatchAnything/tests/test_basic.py +111 -0
  699. vismatch/third_party/MatchFormer/config/data/__init__.py +0 -0
  700. vismatch/third_party/MatchFormer/config/data/base.py +35 -0
  701. vismatch/third_party/MatchFormer/config/data/megadepth_test_1500.py +11 -0
  702. vismatch/third_party/MatchFormer/config/data/scannet_test_1500.py +11 -0
  703. vismatch/third_party/MatchFormer/config/defaultmf.py +88 -0
  704. vismatch/third_party/MatchFormer/model/backbone/__init__.py +17 -0
  705. vismatch/third_party/MatchFormer/model/backbone/coarse_matching.py +228 -0
  706. vismatch/third_party/MatchFormer/model/backbone/fine_matching.py +74 -0
  707. vismatch/third_party/MatchFormer/model/backbone/fine_preprocess.py +59 -0
  708. vismatch/third_party/MatchFormer/model/backbone/match_LA_large.py +254 -0
  709. vismatch/third_party/MatchFormer/model/backbone/match_LA_lite.py +254 -0
  710. vismatch/third_party/MatchFormer/model/backbone/match_SEA_large.py +291 -0
  711. vismatch/third_party/MatchFormer/model/backbone/match_SEA_lite.py +291 -0
  712. vismatch/third_party/MatchFormer/model/data.py +320 -0
  713. vismatch/third_party/MatchFormer/model/datasets/dataset.py +231 -0
  714. vismatch/third_party/MatchFormer/model/datasets/megadepth.py +126 -0
  715. vismatch/third_party/MatchFormer/model/datasets/sampler.py +77 -0
  716. vismatch/third_party/MatchFormer/model/datasets/scannet.py +113 -0
  717. vismatch/third_party/MatchFormer/model/lightning_loftr.py +102 -0
  718. vismatch/third_party/MatchFormer/model/matchformer.py +54 -0
  719. vismatch/third_party/MatchFormer/model/utils/augment.py +55 -0
  720. vismatch/third_party/MatchFormer/model/utils/comm.py +265 -0
  721. vismatch/third_party/MatchFormer/model/utils/dataloader.py +23 -0
  722. vismatch/third_party/MatchFormer/model/utils/metrics.py +193 -0
  723. vismatch/third_party/MatchFormer/model/utils/misc.py +101 -0
  724. vismatch/third_party/MatchFormer/model/utils/profiler.py +39 -0
  725. vismatch/third_party/MatchFormer/test.py +55 -0
  726. vismatch/third_party/RIPE/app.py +272 -0
  727. vismatch/third_party/RIPE/demo.py +51 -0
  728. vismatch/third_party/RIPE/ripe/__init__.py +1 -0
  729. vismatch/third_party/RIPE/ripe/benchmarks/imw_2020.py +320 -0
  730. vismatch/third_party/RIPE/ripe/data/__init__.py +0 -0
  731. vismatch/third_party/RIPE/ripe/data/data_transforms.py +204 -0
  732. vismatch/third_party/RIPE/ripe/data/datasets/__init__.py +0 -0
  733. vismatch/third_party/RIPE/ripe/data/datasets/acdc.py +154 -0
  734. vismatch/third_party/RIPE/ripe/data/datasets/dataset_combinator.py +88 -0
  735. vismatch/third_party/RIPE/ripe/data/datasets/disk_imw.py +160 -0
  736. vismatch/third_party/RIPE/ripe/data/datasets/disk_megadepth.py +157 -0
  737. vismatch/third_party/RIPE/ripe/data/datasets/tokyo247.py +134 -0
  738. vismatch/third_party/RIPE/ripe/data/datasets/tokyo_query_v3.py +78 -0
  739. vismatch/third_party/RIPE/ripe/losses/__init__.py +0 -0
  740. vismatch/third_party/RIPE/ripe/losses/contrastive_loss.py +88 -0
  741. vismatch/third_party/RIPE/ripe/matcher/__init__.py +0 -0
  742. vismatch/third_party/RIPE/ripe/matcher/concurrent_matcher.py +97 -0
  743. vismatch/third_party/RIPE/ripe/matcher/pose_estimator_poselib.py +31 -0
  744. vismatch/third_party/RIPE/ripe/model_zoo/__init__.py +1 -0
  745. vismatch/third_party/RIPE/ripe/model_zoo/vgg_hyper.py +39 -0
  746. vismatch/third_party/RIPE/ripe/models/__init__.py +0 -0
  747. vismatch/third_party/RIPE/ripe/models/backbones/__init__.py +0 -0
  748. vismatch/third_party/RIPE/ripe/models/backbones/backbone_base.py +61 -0
  749. vismatch/third_party/RIPE/ripe/models/backbones/vgg.py +99 -0
  750. vismatch/third_party/RIPE/ripe/models/backbones/vgg_utils.py +143 -0
  751. vismatch/third_party/RIPE/ripe/models/ripe.py +303 -0
  752. vismatch/third_party/RIPE/ripe/models/upsampler/hypercolumn_features.py +54 -0
  753. vismatch/third_party/RIPE/ripe/models/upsampler/interpolate_sparse2d.py +37 -0
  754. vismatch/third_party/RIPE/ripe/scheduler/__init__.py +0 -0
  755. vismatch/third_party/RIPE/ripe/scheduler/constant.py +6 -0
  756. vismatch/third_party/RIPE/ripe/scheduler/expDecay.py +26 -0
  757. vismatch/third_party/RIPE/ripe/scheduler/linearLR.py +37 -0
  758. vismatch/third_party/RIPE/ripe/scheduler/linear_with_plateaus.py +44 -0
  759. vismatch/third_party/RIPE/ripe/train.py +410 -0
  760. vismatch/third_party/RIPE/ripe/utils/__init__.py +2 -0
  761. vismatch/third_party/RIPE/ripe/utils/image_utils.py +62 -0
  762. vismatch/third_party/RIPE/ripe/utils/pose_error.py +62 -0
  763. vismatch/third_party/RIPE/ripe/utils/pylogger.py +32 -0
  764. vismatch/third_party/RIPE/ripe/utils/utils.py +192 -0
  765. vismatch/third_party/RIPE/ripe/utils/wandb_utils.py +16 -0
  766. vismatch/third_party/RoMa/demo/demo_3D_effect.py +47 -0
  767. vismatch/third_party/RoMa/demo/demo_fundamental.py +34 -0
  768. vismatch/third_party/RoMa/demo/demo_match.py +50 -0
  769. vismatch/third_party/RoMa/demo/demo_match_opencv_sift.py +43 -0
  770. vismatch/third_party/RoMa/demo/demo_match_tiny.py +77 -0
  771. vismatch/third_party/RoMa/experiments/eval_roma_outdoor.py +57 -0
  772. vismatch/third_party/RoMa/experiments/eval_tiny_roma_v1_outdoor.py +84 -0
  773. vismatch/third_party/RoMa/experiments/roma_indoor.py +320 -0
  774. vismatch/third_party/RoMa/experiments/train_roma_outdoor.py +307 -0
  775. vismatch/third_party/RoMa/experiments/train_tiny_roma_v1_outdoor.py +498 -0
  776. vismatch/third_party/RoMa/romatch/__init__.py +8 -0
  777. vismatch/third_party/RoMa/romatch/benchmarks/__init__.py +6 -0
  778. vismatch/third_party/RoMa/romatch/benchmarks/hpatches_sequences_homog_benchmark.py +113 -0
  779. vismatch/third_party/RoMa/romatch/benchmarks/megadepth_dense_benchmark.py +106 -0
  780. vismatch/third_party/RoMa/romatch/benchmarks/megadepth_pose_estimation_benchmark.py +118 -0
  781. vismatch/third_party/RoMa/romatch/benchmarks/megadepth_pose_estimation_benchmark_poselib.py +119 -0
  782. vismatch/third_party/RoMa/romatch/benchmarks/scannet_benchmark.py +143 -0
  783. vismatch/third_party/RoMa/romatch/checkpointing/__init__.py +1 -0
  784. vismatch/third_party/RoMa/romatch/checkpointing/checkpoint.py +60 -0
  785. vismatch/third_party/RoMa/romatch/datasets/__init__.py +2 -0
  786. vismatch/third_party/RoMa/romatch/datasets/megadepth.py +232 -0
  787. vismatch/third_party/RoMa/romatch/datasets/scannet.py +160 -0
  788. vismatch/third_party/RoMa/romatch/losses/__init__.py +1 -0
  789. vismatch/third_party/RoMa/romatch/losses/robust_loss.py +161 -0
  790. vismatch/third_party/RoMa/romatch/losses/robust_loss_tiny_roma.py +160 -0
  791. vismatch/third_party/RoMa/romatch/models/__init__.py +1 -0
  792. vismatch/third_party/RoMa/romatch/models/encoders.py +122 -0
  793. vismatch/third_party/RoMa/romatch/models/matcher.py +748 -0
  794. vismatch/third_party/RoMa/romatch/models/model_zoo/__init__.py +73 -0
  795. vismatch/third_party/RoMa/romatch/models/model_zoo/roma_models.py +170 -0
  796. vismatch/third_party/RoMa/romatch/models/tiny.py +304 -0
  797. vismatch/third_party/RoMa/romatch/models/transformer/__init__.py +48 -0
  798. vismatch/third_party/RoMa/romatch/models/transformer/dinov2.py +359 -0
  799. vismatch/third_party/RoMa/romatch/models/transformer/layers/__init__.py +12 -0
  800. vismatch/third_party/RoMa/romatch/models/transformer/layers/attention.py +81 -0
  801. vismatch/third_party/RoMa/romatch/models/transformer/layers/block.py +252 -0
  802. vismatch/third_party/RoMa/romatch/models/transformer/layers/dino_head.py +59 -0
  803. vismatch/third_party/RoMa/romatch/models/transformer/layers/drop_path.py +35 -0
  804. vismatch/third_party/RoMa/romatch/models/transformer/layers/layer_scale.py +28 -0
  805. vismatch/third_party/RoMa/romatch/models/transformer/layers/mlp.py +41 -0
  806. vismatch/third_party/RoMa/romatch/models/transformer/layers/patch_embed.py +89 -0
  807. vismatch/third_party/RoMa/romatch/models/transformer/layers/swiglu_ffn.py +63 -0
  808. vismatch/third_party/RoMa/romatch/train/__init__.py +1 -0
  809. vismatch/third_party/RoMa/romatch/train/train.py +102 -0
  810. vismatch/third_party/RoMa/romatch/utils/__init__.py +16 -0
  811. vismatch/third_party/RoMa/romatch/utils/kde.py +13 -0
  812. vismatch/third_party/RoMa/romatch/utils/local_correlation.py +48 -0
  813. vismatch/third_party/RoMa/romatch/utils/transforms.py +118 -0
  814. vismatch/third_party/RoMa/romatch/utils/utils.py +654 -0
  815. vismatch/third_party/RoMa/setup.py +9 -0
  816. vismatch/third_party/RoMaV2/demo/demo_covariance.py +52 -0
  817. vismatch/third_party/RoMaV2/demo/demo_match.py +55 -0
  818. vismatch/third_party/RoMaV2/src/romav2/__init__.py +8 -0
  819. vismatch/third_party/RoMaV2/src/romav2/benchmarks/__init__.py +4 -0
  820. vismatch/third_party/RoMaV2/src/romav2/benchmarks/mega1500.py +115 -0
  821. vismatch/third_party/RoMaV2/src/romav2/benchmarks/satast.py +463 -0
  822. vismatch/third_party/RoMaV2/src/romav2/benchmarks/scannet1500.py +125 -0
  823. vismatch/third_party/RoMaV2/src/romav2/benchmarks/wxbs.py +104 -0
  824. vismatch/third_party/RoMaV2/src/romav2/device.py +9 -0
  825. vismatch/third_party/RoMaV2/src/romav2/dpt.py +516 -0
  826. vismatch/third_party/RoMaV2/src/romav2/features.py +190 -0
  827. vismatch/third_party/RoMaV2/src/romav2/geometry.py +261 -0
  828. vismatch/third_party/RoMaV2/src/romav2/io.py +24 -0
  829. vismatch/third_party/RoMaV2/src/romav2/local_correlation.py +152 -0
  830. vismatch/third_party/RoMaV2/src/romav2/logging.py +97 -0
  831. vismatch/third_party/RoMaV2/src/romav2/matcher.py +207 -0
  832. vismatch/third_party/RoMaV2/src/romav2/normalizers.py +17 -0
  833. vismatch/third_party/RoMaV2/src/romav2/refiner.py +277 -0
  834. vismatch/third_party/RoMaV2/src/romav2/romav2.py +533 -0
  835. vismatch/third_party/RoMaV2/src/romav2/types.py +75 -0
  836. vismatch/third_party/RoMaV2/src/romav2/vis.py +36 -0
  837. vismatch/third_party/RoMaV2/src/romav2/vit/__init__.py +304 -0
  838. vismatch/third_party/RoMaV2/src/romav2/vit/attention.py +181 -0
  839. vismatch/third_party/RoMaV2/src/romav2/vit/block.py +293 -0
  840. vismatch/third_party/RoMaV2/src/romav2/vit/ffn_layers.py +83 -0
  841. vismatch/third_party/RoMaV2/src/romav2/vit/layer_scale.py +29 -0
  842. vismatch/third_party/RoMaV2/src/romav2/vit/patch_embed.py +94 -0
  843. vismatch/third_party/RoMaV2/src/romav2/vit/rms_norm.py +24 -0
  844. vismatch/third_party/RoMaV2/src/romav2/vit/rope.py +133 -0
  845. vismatch/third_party/RoMaV2/src/romav2/vit/rope_mixed.py +111 -0
  846. vismatch/third_party/RoMaV2/src/romav2/vit/utils.py +48 -0
  847. vismatch/third_party/RoMaV2/tests/test_bidirectional.py +93 -0
  848. vismatch/third_party/RoMaV2/tests/test_fps.py +49 -0
  849. vismatch/third_party/RoMaV2/tests/test_mega1500.py +22 -0
  850. vismatch/third_party/RoMaV2/tests/test_scannet1500.py +21 -0
  851. vismatch/third_party/RoMaV2/tests/test_smoke.py +15 -0
  852. vismatch/third_party/Se2_LoFTR/configs/data/__init__.py +0 -0
  853. vismatch/third_party/Se2_LoFTR/configs/data/base.py +35 -0
  854. vismatch/third_party/Se2_LoFTR/configs/data/megadepth_test_1500.py +11 -0
  855. vismatch/third_party/Se2_LoFTR/configs/data/megadepth_trainval_640.py +22 -0
  856. vismatch/third_party/Se2_LoFTR/configs/data/megadepth_trainval_840.py +22 -0
  857. vismatch/third_party/Se2_LoFTR/configs/data/scannet_test_1500.py +11 -0
  858. vismatch/third_party/Se2_LoFTR/configs/data/scannet_trainval.py +17 -0
  859. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ds.py +6 -0
  860. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ds_dense.py +8 -0
  861. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ot.py +6 -0
  862. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/buggy_pos_enc/loftr_ot_dense.py +8 -0
  863. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/loftr_ds.py +5 -0
  864. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/loftr_ds_dense.py +7 -0
  865. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/loftr_ot.py +5 -0
  866. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/loftr_ot_dense.py +7 -0
  867. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/scannet/loftr_ds_eval.py +16 -0
  868. vismatch/third_party/Se2_LoFTR/configs/loftr/indoor/scannet/loftr_ds_eval_new.py +18 -0
  869. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ds.py +16 -0
  870. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ds_dense.py +17 -0
  871. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ot.py +16 -0
  872. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/buggy_pos_enc/loftr_ot_dense.py +17 -0
  873. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ds.py +17 -0
  874. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ds_dense.py +17 -0
  875. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ds_e2.py +20 -0
  876. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ds_e2_dense.py +23 -0
  877. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ds_e2_dense_8rot.py +23 -0
  878. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ds_e2_dense_big.py +22 -0
  879. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ot.py +17 -0
  880. vismatch/third_party/Se2_LoFTR/configs/loftr/outdoor/loftr_ot_dense.py +18 -0
  881. vismatch/third_party/Se2_LoFTR/demo/demo_loftr.py +240 -0
  882. vismatch/third_party/Se2_LoFTR/src/__init__.py +0 -0
  883. vismatch/third_party/Se2_LoFTR/src/config/default.py +173 -0
  884. vismatch/third_party/Se2_LoFTR/src/datasets/megadepth.py +127 -0
  885. vismatch/third_party/Se2_LoFTR/src/datasets/sampler.py +77 -0
  886. vismatch/third_party/Se2_LoFTR/src/datasets/scannet.py +114 -0
  887. vismatch/third_party/Se2_LoFTR/src/lightning/data.py +320 -0
  888. vismatch/third_party/Se2_LoFTR/src/lightning/lightning_loftr.py +249 -0
  889. vismatch/third_party/Se2_LoFTR/src/loftr/__init__.py +2 -0
  890. vismatch/third_party/Se2_LoFTR/src/loftr/backbone/__init__.py +17 -0
  891. vismatch/third_party/Se2_LoFTR/src/loftr/backbone/resnet_e2.py +170 -0
  892. vismatch/third_party/Se2_LoFTR/src/loftr/backbone/resnet_fpn.py +199 -0
  893. vismatch/third_party/Se2_LoFTR/src/loftr/loftr.py +81 -0
  894. vismatch/third_party/Se2_LoFTR/src/loftr/loftr_module/__init__.py +2 -0
  895. vismatch/third_party/Se2_LoFTR/src/loftr/loftr_module/fine_preprocess.py +59 -0
  896. vismatch/third_party/Se2_LoFTR/src/loftr/loftr_module/linear_attention.py +81 -0
  897. vismatch/third_party/Se2_LoFTR/src/loftr/loftr_module/transformer.py +101 -0
  898. vismatch/third_party/Se2_LoFTR/src/loftr/utils/coarse_matching.py +261 -0
  899. vismatch/third_party/Se2_LoFTR/src/loftr/utils/cvpr_ds_config.py +50 -0
  900. vismatch/third_party/Se2_LoFTR/src/loftr/utils/fine_matching.py +74 -0
  901. vismatch/third_party/Se2_LoFTR/src/loftr/utils/geometry.py +54 -0
  902. vismatch/third_party/Se2_LoFTR/src/loftr/utils/position_encoding.py +42 -0
  903. vismatch/third_party/Se2_LoFTR/src/loftr/utils/supervision.py +151 -0
  904. vismatch/third_party/Se2_LoFTR/src/losses/loftr_loss.py +192 -0
  905. vismatch/third_party/Se2_LoFTR/src/optimizers/__init__.py +42 -0
  906. vismatch/third_party/Se2_LoFTR/src/utils/augment.py +55 -0
  907. vismatch/third_party/Se2_LoFTR/src/utils/comm.py +265 -0
  908. vismatch/third_party/Se2_LoFTR/src/utils/dataloader.py +23 -0
  909. vismatch/third_party/Se2_LoFTR/src/utils/dataset.py +185 -0
  910. vismatch/third_party/Se2_LoFTR/src/utils/metrics.py +193 -0
  911. vismatch/third_party/Se2_LoFTR/src/utils/misc.py +104 -0
  912. vismatch/third_party/Se2_LoFTR/src/utils/plotting.py +154 -0
  913. vismatch/third_party/Se2_LoFTR/src/utils/profiler.py +39 -0
  914. vismatch/third_party/Se2_LoFTR/test.py +68 -0
  915. vismatch/third_party/Se2_LoFTR/train.py +123 -0
  916. vismatch/third_party/SphereGlue/demo_SphereGlue.py +141 -0
  917. vismatch/third_party/SphereGlue/model/sphereglue.py +230 -0
  918. vismatch/third_party/SphereGlue/utils/Utils.py +191 -0
  919. vismatch/third_party/SphereGlue/utils/demo_mydataset.py +119 -0
  920. vismatch/third_party/Steerers/rotation_steerers/matchers/dual_softmax_matcher.py +44 -0
  921. vismatch/third_party/Steerers/rotation_steerers/matchers/max_matches.py +205 -0
  922. vismatch/third_party/Steerers/rotation_steerers/matchers/max_similarity.py +115 -0
  923. vismatch/third_party/Steerers/rotation_steerers/steerers.py +37 -0
  924. vismatch/third_party/Steerers/setup.py +14 -0
  925. vismatch/third_party/TopicFM/configs/megadepth_test.py +17 -0
  926. vismatch/third_party/TopicFM/configs/megadepth_test_topicfmfast.py +17 -0
  927. vismatch/third_party/TopicFM/configs/megadepth_test_topicfmplus.py +20 -0
  928. vismatch/third_party/TopicFM/configs/megadepth_train.py +36 -0
  929. vismatch/third_party/TopicFM/configs/megadepth_train_topicfmfast.py +34 -0
  930. vismatch/third_party/TopicFM/configs/megadepth_train_topicfmplus.py +37 -0
  931. vismatch/third_party/TopicFM/configs/scannet_test.py +15 -0
  932. vismatch/third_party/TopicFM/configs/scannet_test_topicfmfast.py +15 -0
  933. vismatch/third_party/TopicFM/configs/scannet_test_topicfmplus.py +19 -0
  934. vismatch/third_party/TopicFM/src/__init__.py +11 -0
  935. vismatch/third_party/TopicFM/src/config/default.py +174 -0
  936. vismatch/third_party/TopicFM/src/datasets/aachen.py +29 -0
  937. vismatch/third_party/TopicFM/src/datasets/custom_dataloader.py +126 -0
  938. vismatch/third_party/TopicFM/src/datasets/inloc.py +29 -0
  939. vismatch/third_party/TopicFM/src/datasets/megadepth.py +170 -0
  940. vismatch/third_party/TopicFM/src/datasets/sampler.py +77 -0
  941. vismatch/third_party/TopicFM/src/datasets/scannet.py +115 -0
  942. vismatch/third_party/TopicFM/src/lightning_trainer/data.py +292 -0
  943. vismatch/third_party/TopicFM/src/lightning_trainer/trainer.py +244 -0
  944. vismatch/third_party/TopicFM/src/losses/loss.py +228 -0
  945. vismatch/third_party/TopicFM/src/models/__init__.py +1 -0
  946. vismatch/third_party/TopicFM/src/models/backbone/__init__.py +12 -0
  947. vismatch/third_party/TopicFM/src/models/backbone/convnext.py +165 -0
  948. vismatch/third_party/TopicFM/src/models/backbone/fpn.py +114 -0
  949. vismatch/third_party/TopicFM/src/models/modules/__init__.py +2 -0
  950. vismatch/third_party/TopicFM/src/models/modules/encoder.py +266 -0
  951. vismatch/third_party/TopicFM/src/models/modules/fine_preprocess.py +59 -0
  952. vismatch/third_party/TopicFM/src/models/modules/linear_attention.py +84 -0
  953. vismatch/third_party/TopicFM/src/models/topic_fm.py +100 -0
  954. vismatch/third_party/TopicFM/src/models/utils/coarse_matching.py +213 -0
  955. vismatch/third_party/TopicFM/src/models/utils/fine_matching.py +172 -0
  956. vismatch/third_party/TopicFM/src/models/utils/geometry.py +54 -0
  957. vismatch/third_party/TopicFM/src/models/utils/supervision.py +167 -0
  958. vismatch/third_party/TopicFM/src/optimizers/__init__.py +42 -0
  959. vismatch/third_party/TopicFM/src/utils/augment.py +55 -0
  960. vismatch/third_party/TopicFM/src/utils/comm.py +265 -0
  961. vismatch/third_party/TopicFM/src/utils/dataloader.py +23 -0
  962. vismatch/third_party/TopicFM/src/utils/dataset.py +206 -0
  963. vismatch/third_party/TopicFM/src/utils/metrics.py +193 -0
  964. vismatch/third_party/TopicFM/src/utils/misc.py +101 -0
  965. vismatch/third_party/TopicFM/src/utils/plotting.py +313 -0
  966. vismatch/third_party/TopicFM/src/utils/profiler.py +39 -0
  967. vismatch/third_party/TopicFM/test.py +70 -0
  968. vismatch/third_party/TopicFM/third_party/__init__.py +0 -0
  969. vismatch/third_party/TopicFM/third_party/aspanformer/configs/aspan/indoor/aspan_test.py +7 -0
  970. vismatch/third_party/TopicFM/third_party/aspanformer/configs/aspan/indoor/aspan_train.py +8 -0
  971. vismatch/third_party/TopicFM/third_party/aspanformer/configs/aspan/outdoor/aspan_test.py +18 -0
  972. vismatch/third_party/TopicFM/third_party/aspanformer/configs/aspan/outdoor/aspan_train.py +17 -0
  973. vismatch/third_party/TopicFM/third_party/aspanformer/configs/data/__init__.py +0 -0
  974. vismatch/third_party/TopicFM/third_party/aspanformer/configs/data/base.py +35 -0
  975. vismatch/third_party/TopicFM/third_party/aspanformer/configs/data/megadepth_test_1500.py +13 -0
  976. vismatch/third_party/TopicFM/third_party/aspanformer/configs/data/megadepth_trainval_832.py +22 -0
  977. vismatch/third_party/TopicFM/third_party/aspanformer/configs/data/scannet_test_1500.py +11 -0
  978. vismatch/third_party/TopicFM/third_party/aspanformer/configs/data/scannet_trainval.py +17 -0
  979. vismatch/third_party/TopicFM/third_party/aspanformer/demo/demo.py +63 -0
  980. vismatch/third_party/TopicFM/third_party/aspanformer/demo/demo_utils.py +44 -0
  981. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/__init__.py +2 -0
  982. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/aspan_module/__init__.py +3 -0
  983. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/aspan_module/attention.py +198 -0
  984. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/aspan_module/fine_preprocess.py +59 -0
  985. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/aspan_module/loftr.py +112 -0
  986. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/aspan_module/transformer.py +244 -0
  987. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/aspanformer.py +133 -0
  988. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/backbone/__init__.py +11 -0
  989. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/backbone/resnet_fpn.py +199 -0
  990. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/utils/coarse_matching.py +331 -0
  991. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/utils/cvpr_ds_config.py +50 -0
  992. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/utils/fine_matching.py +74 -0
  993. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/utils/geometry.py +54 -0
  994. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/utils/position_encoding.py +61 -0
  995. vismatch/third_party/TopicFM/third_party/aspanformer/src/ASpanFormer/utils/supervision.py +151 -0
  996. vismatch/third_party/TopicFM/third_party/aspanformer/src/__init__.py +0 -0
  997. vismatch/third_party/TopicFM/third_party/aspanformer/src/config/default.py +180 -0
  998. vismatch/third_party/TopicFM/third_party/aspanformer/src/datasets/__init__.py +3 -0
  999. vismatch/third_party/TopicFM/third_party/aspanformer/src/datasets/megadepth.py +127 -0
  1000. vismatch/third_party/TopicFM/third_party/aspanformer/src/datasets/sampler.py +77 -0
  1001. vismatch/third_party/TopicFM/third_party/aspanformer/src/datasets/scannet.py +113 -0
  1002. vismatch/third_party/TopicFM/third_party/aspanformer/src/lightning/data.py +326 -0
  1003. vismatch/third_party/TopicFM/third_party/aspanformer/src/lightning/lightning_aspanformer.py +276 -0
  1004. vismatch/third_party/TopicFM/third_party/aspanformer/src/losses/aspan_loss.py +231 -0
  1005. vismatch/third_party/TopicFM/third_party/aspanformer/src/optimizers/__init__.py +42 -0
  1006. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/augment.py +55 -0
  1007. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/comm.py +265 -0
  1008. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/dataloader.py +23 -0
  1009. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/dataset.py +222 -0
  1010. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/metrics.py +260 -0
  1011. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/misc.py +139 -0
  1012. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/plotting.py +219 -0
  1013. vismatch/third_party/TopicFM/third_party/aspanformer/src/utils/profiler.py +39 -0
  1014. vismatch/third_party/TopicFM/third_party/aspanformer/test.py +69 -0
  1015. vismatch/third_party/TopicFM/third_party/aspanformer/tools/SensorData.py +125 -0
  1016. vismatch/third_party/TopicFM/third_party/aspanformer/tools/extract.py +47 -0
  1017. vismatch/third_party/TopicFM/third_party/aspanformer/tools/preprocess_scene.py +242 -0
  1018. vismatch/third_party/TopicFM/third_party/aspanformer/tools/reader.py +39 -0
  1019. vismatch/third_party/TopicFM/third_party/aspanformer/tools/undistort_mega.py +69 -0
  1020. vismatch/third_party/TopicFM/third_party/aspanformer/train.py +134 -0
  1021. vismatch/third_party/TopicFM/third_party/loftr/configs/data/__init__.py +0 -0
  1022. vismatch/third_party/TopicFM/third_party/loftr/configs/data/base.py +35 -0
  1023. vismatch/third_party/TopicFM/third_party/loftr/configs/data/megadepth_test_1500.py +11 -0
  1024. vismatch/third_party/TopicFM/third_party/loftr/configs/data/megadepth_trainval_640.py +22 -0
  1025. vismatch/third_party/TopicFM/third_party/loftr/configs/data/megadepth_trainval_840.py +22 -0
  1026. vismatch/third_party/TopicFM/third_party/loftr/configs/data/scannet_test_1500.py +11 -0
  1027. vismatch/third_party/TopicFM/third_party/loftr/configs/data/scannet_trainval.py +17 -0
  1028. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/buggy_pos_enc/loftr_ds.py +6 -0
  1029. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/buggy_pos_enc/loftr_ds_dense.py +8 -0
  1030. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/buggy_pos_enc/loftr_ot.py +6 -0
  1031. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/buggy_pos_enc/loftr_ot_dense.py +8 -0
  1032. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/loftr_ds.py +5 -0
  1033. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/loftr_ds_dense.py +7 -0
  1034. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/loftr_ot.py +5 -0
  1035. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/loftr_ot_dense.py +7 -0
  1036. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/scannet/loftr_ds_eval.py +16 -0
  1037. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/indoor/scannet/loftr_ds_eval_new.py +18 -0
  1038. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/buggy_pos_enc/loftr_ds.py +16 -0
  1039. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/buggy_pos_enc/loftr_ds_dense.py +17 -0
  1040. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/buggy_pos_enc/loftr_ot.py +16 -0
  1041. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/buggy_pos_enc/loftr_ot_dense.py +17 -0
  1042. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/loftr_ds.py +15 -0
  1043. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/loftr_ds_dense.py +16 -0
  1044. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/loftr_ot.py +15 -0
  1045. vismatch/third_party/TopicFM/third_party/loftr/configs/loftr/outdoor/loftr_ot_dense.py +16 -0
  1046. vismatch/third_party/TopicFM/third_party/loftr/demo/demo_loftr.py +240 -0
  1047. vismatch/third_party/TopicFM/third_party/loftr/src/__init__.py +0 -0
  1048. vismatch/third_party/TopicFM/third_party/loftr/src/config/default.py +171 -0
  1049. vismatch/third_party/TopicFM/third_party/loftr/src/datasets/megadepth.py +127 -0
  1050. vismatch/third_party/TopicFM/third_party/loftr/src/datasets/sampler.py +77 -0
  1051. vismatch/third_party/TopicFM/third_party/loftr/src/datasets/scannet.py +114 -0
  1052. vismatch/third_party/TopicFM/third_party/loftr/src/lightning/data.py +320 -0
  1053. vismatch/third_party/TopicFM/third_party/loftr/src/lightning/lightning_loftr.py +249 -0
  1054. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/__init__.py +2 -0
  1055. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/backbone/__init__.py +11 -0
  1056. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/backbone/resnet_fpn.py +199 -0
  1057. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/loftr.py +81 -0
  1058. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/loftr_module/__init__.py +2 -0
  1059. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/loftr_module/fine_preprocess.py +59 -0
  1060. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/loftr_module/linear_attention.py +81 -0
  1061. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/loftr_module/transformer.py +101 -0
  1062. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/utils/coarse_matching.py +261 -0
  1063. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/utils/cvpr_ds_config.py +50 -0
  1064. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/utils/fine_matching.py +74 -0
  1065. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/utils/geometry.py +54 -0
  1066. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/utils/position_encoding.py +42 -0
  1067. vismatch/third_party/TopicFM/third_party/loftr/src/loftr/utils/supervision.py +151 -0
  1068. vismatch/third_party/TopicFM/third_party/loftr/src/losses/loftr_loss.py +192 -0
  1069. vismatch/third_party/TopicFM/third_party/loftr/src/optimizers/__init__.py +42 -0
  1070. vismatch/third_party/TopicFM/third_party/loftr/src/utils/augment.py +55 -0
  1071. vismatch/third_party/TopicFM/third_party/loftr/src/utils/comm.py +265 -0
  1072. vismatch/third_party/TopicFM/third_party/loftr/src/utils/dataloader.py +23 -0
  1073. vismatch/third_party/TopicFM/third_party/loftr/src/utils/dataset.py +185 -0
  1074. vismatch/third_party/TopicFM/third_party/loftr/src/utils/metrics.py +193 -0
  1075. vismatch/third_party/TopicFM/third_party/loftr/src/utils/misc.py +101 -0
  1076. vismatch/third_party/TopicFM/third_party/loftr/src/utils/plotting.py +154 -0
  1077. vismatch/third_party/TopicFM/third_party/loftr/src/utils/profiler.py +39 -0
  1078. vismatch/third_party/TopicFM/third_party/loftr/test.py +68 -0
  1079. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/demo_superglue.py +259 -0
  1080. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/match_pairs.py +425 -0
  1081. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/models/__init__.py +0 -0
  1082. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/models/matching.py +84 -0
  1083. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/models/superglue.py +283 -0
  1084. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/models/superpoint.py +202 -0
  1085. vismatch/third_party/TopicFM/third_party/loftr/third_party/SuperGluePretrainedNetwork/models/utils.py +555 -0
  1086. vismatch/third_party/TopicFM/third_party/loftr/train.py +123 -0
  1087. vismatch/third_party/TopicFM/third_party/matchformer/config/data/__init__.py +0 -0
  1088. vismatch/third_party/TopicFM/third_party/matchformer/config/data/base.py +35 -0
  1089. vismatch/third_party/TopicFM/third_party/matchformer/config/data/megadepth_test_1500.py +11 -0
  1090. vismatch/third_party/TopicFM/third_party/matchformer/config/data/scannet_test_1500.py +11 -0
  1091. vismatch/third_party/TopicFM/third_party/matchformer/config/defaultmf.py +88 -0
  1092. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/__init__.py +17 -0
  1093. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/coarse_matching.py +228 -0
  1094. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/fine_matching.py +74 -0
  1095. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/fine_preprocess.py +59 -0
  1096. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/match_LA_large.py +254 -0
  1097. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/match_LA_lite.py +254 -0
  1098. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/match_SEA_large.py +291 -0
  1099. vismatch/third_party/TopicFM/third_party/matchformer/model/backbone/match_SEA_lite.py +291 -0
  1100. vismatch/third_party/TopicFM/third_party/matchformer/model/data.py +320 -0
  1101. vismatch/third_party/TopicFM/third_party/matchformer/model/datasets/dataset.py +231 -0
  1102. vismatch/third_party/TopicFM/third_party/matchformer/model/datasets/megadepth.py +126 -0
  1103. vismatch/third_party/TopicFM/third_party/matchformer/model/datasets/sampler.py +77 -0
  1104. vismatch/third_party/TopicFM/third_party/matchformer/model/datasets/scannet.py +113 -0
  1105. vismatch/third_party/TopicFM/third_party/matchformer/model/lightning_loftr.py +102 -0
  1106. vismatch/third_party/TopicFM/third_party/matchformer/model/matchformer.py +54 -0
  1107. vismatch/third_party/TopicFM/third_party/matchformer/model/utils/augment.py +55 -0
  1108. vismatch/third_party/TopicFM/third_party/matchformer/model/utils/comm.py +265 -0
  1109. vismatch/third_party/TopicFM/third_party/matchformer/model/utils/dataloader.py +23 -0
  1110. vismatch/third_party/TopicFM/third_party/matchformer/model/utils/metrics.py +193 -0
  1111. vismatch/third_party/TopicFM/third_party/matchformer/model/utils/misc.py +101 -0
  1112. vismatch/third_party/TopicFM/third_party/matchformer/model/utils/profiler.py +39 -0
  1113. vismatch/third_party/TopicFM/third_party/matchformer/test.py +55 -0
  1114. vismatch/third_party/TopicFM/train.py +123 -0
  1115. vismatch/third_party/TopicFM/visualization.py +123 -0
  1116. vismatch/third_party/TopicFM/viz/__init__.py +1 -0
  1117. vismatch/third_party/TopicFM/viz/configs/__init__.py +0 -0
  1118. vismatch/third_party/TopicFM/viz/methods/__init__.py +0 -0
  1119. vismatch/third_party/TopicFM/viz/methods/base.py +70 -0
  1120. vismatch/third_party/TopicFM/viz/methods/topicfmv2.py +208 -0
  1121. vismatch/third_party/UFM/UniCeption/examples/models/cosmos/autoencoding.py +48 -0
  1122. vismatch/third_party/UFM/UniCeption/examples/models/dust3r/convert_dust3r_weights_to_uniception.py +331 -0
  1123. vismatch/third_party/UFM/UniCeption/examples/models/dust3r/dust3r.py +261 -0
  1124. vismatch/third_party/UFM/UniCeption/examples/models/dust3r/profile_dust3r.py +47 -0
  1125. vismatch/third_party/UFM/UniCeption/scripts/check_dependencies.py +48 -0
  1126. vismatch/third_party/UFM/UniCeption/scripts/download_checkpoints.py +50 -0
  1127. vismatch/third_party/UFM/UniCeption/scripts/install_croco_rope.py +61 -0
  1128. vismatch/third_party/UFM/UniCeption/scripts/prepare_offline_install.py +398 -0
  1129. vismatch/third_party/UFM/UniCeption/scripts/validate_installation.py +212 -0
  1130. vismatch/third_party/UFM/UniCeption/setup.py +185 -0
  1131. vismatch/third_party/UFM/UniCeption/tests/models/encoders/conftest.py +26 -0
  1132. vismatch/third_party/UFM/UniCeption/tests/models/encoders/test_encoders.py +202 -0
  1133. vismatch/third_party/UFM/UniCeption/tests/models/encoders/viz_image_encoders.py +294 -0
  1134. vismatch/third_party/UFM/UniCeption/tests/models/info_sharing/viz_mulit_view_cross_attn_transformers.py +337 -0
  1135. vismatch/third_party/UFM/UniCeption/uniception/__init__.py +0 -0
  1136. vismatch/third_party/UFM/UniCeption/uniception/models/__init__.py +0 -0
  1137. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/__init__.py +225 -0
  1138. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/base.py +157 -0
  1139. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/cosmos.py +137 -0
  1140. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/croco.py +457 -0
  1141. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/dense_rep_encoder.py +344 -0
  1142. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/dinov2.py +333 -0
  1143. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/global_rep_encoder.py +115 -0
  1144. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/image_normalizations.py +35 -0
  1145. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/list.py +10 -0
  1146. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/patch_embedder.py +235 -0
  1147. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/radio.py +367 -0
  1148. vismatch/third_party/UFM/UniCeption/uniception/models/encoders/utils.py +86 -0
  1149. vismatch/third_party/UFM/UniCeption/uniception/models/factory/__init__.py +3 -0
  1150. vismatch/third_party/UFM/UniCeption/uniception/models/factory/dust3r.py +332 -0
  1151. vismatch/third_party/UFM/UniCeption/uniception/models/info_sharing/__init__.py +39 -0
  1152. vismatch/third_party/UFM/UniCeption/uniception/models/info_sharing/alternating_attention_transformer.py +973 -0
  1153. vismatch/third_party/UFM/UniCeption/uniception/models/info_sharing/base.py +116 -0
  1154. vismatch/third_party/UFM/UniCeption/uniception/models/info_sharing/cross_attention_transformer.py +612 -0
  1155. vismatch/third_party/UFM/UniCeption/uniception/models/info_sharing/diff_cross_attention_transformer.py +588 -0
  1156. vismatch/third_party/UFM/UniCeption/uniception/models/info_sharing/global_attention_transformer.py +1154 -0
  1157. vismatch/third_party/UFM/UniCeption/uniception/models/libs/__init__.py +0 -0
  1158. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/__init__.py +14 -0
  1159. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/image_cli.py +175 -0
  1160. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/image_lib.py +123 -0
  1161. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/__init__.py +60 -0
  1162. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/distributions.py +41 -0
  1163. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/layers2d.py +326 -0
  1164. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/layers3d.py +965 -0
  1165. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/patching.py +310 -0
  1166. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/quantizers.py +510 -0
  1167. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/modules/utils.py +115 -0
  1168. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/networks/__init__.py +39 -0
  1169. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/networks/configs.py +146 -0
  1170. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/networks/continuous_image.py +86 -0
  1171. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/networks/continuous_video.py +98 -0
  1172. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/networks/discrete_image.py +113 -0
  1173. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/networks/discrete_video.py +115 -0
  1174. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/utils.py +402 -0
  1175. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/video_cli.py +195 -0
  1176. vismatch/third_party/UFM/UniCeption/uniception/models/libs/cosmos_tokenizer/video_lib.py +145 -0
  1177. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/__init__.py +0 -0
  1178. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/blocks.py +249 -0
  1179. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/curope/__init__.py +4 -0
  1180. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/curope/curope2d.py +39 -0
  1181. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/curope/setup.py +33 -0
  1182. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/dpt_block.py +530 -0
  1183. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/patch_embed.py +127 -0
  1184. vismatch/third_party/UFM/UniCeption/uniception/models/libs/croco/pos_embed.py +155 -0
  1185. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/__init__.py +18 -0
  1186. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/adaptors.py +1765 -0
  1187. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/base.py +210 -0
  1188. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/cosmos.py +211 -0
  1189. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/dpt.py +676 -0
  1190. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/global_head.py +142 -0
  1191. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/linear.py +95 -0
  1192. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/mlp_feature.py +114 -0
  1193. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/mlp_head.py +114 -0
  1194. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/moge_conv.py +342 -0
  1195. vismatch/third_party/UFM/UniCeption/uniception/models/prediction_heads/pose_head.py +181 -0
  1196. vismatch/third_party/UFM/UniCeption/uniception/models/utils/__init__.py +0 -0
  1197. vismatch/third_party/UFM/UniCeption/uniception/models/utils/config.py +34 -0
  1198. vismatch/third_party/UFM/UniCeption/uniception/models/utils/intermediate_feature_return.py +85 -0
  1199. vismatch/third_party/UFM/UniCeption/uniception/models/utils/positional_encoding.py +23 -0
  1200. vismatch/third_party/UFM/UniCeption/uniception/models/utils/transformer_blocks.py +1072 -0
  1201. vismatch/third_party/UFM/UniCeption/uniception/utils/__init__.py +0 -0
  1202. vismatch/third_party/UFM/UniCeption/uniception/utils/profile.py +13 -0
  1203. vismatch/third_party/UFM/UniCeption/uniception/utils/viz.py +99 -0
  1204. vismatch/third_party/UFM/example_inference.py +138 -0
  1205. vismatch/third_party/UFM/gradio_demo.py +238 -0
  1206. vismatch/third_party/UFM/setup.py +86 -0
  1207. vismatch/third_party/UFM/uniflowmatch/__init__.py +16 -0
  1208. vismatch/third_party/UFM/uniflowmatch/cli.py +217 -0
  1209. vismatch/third_party/UFM/uniflowmatch/models/__init__.py +25 -0
  1210. vismatch/third_party/UFM/uniflowmatch/models/base.py +334 -0
  1211. vismatch/third_party/UFM/uniflowmatch/models/ufm.py +1323 -0
  1212. vismatch/third_party/UFM/uniflowmatch/models/unet_encoder.py +90 -0
  1213. vismatch/third_party/UFM/uniflowmatch/models/utils.py +16 -0
  1214. vismatch/third_party/UFM/uniflowmatch/utils/__init__.py +63 -0
  1215. vismatch/third_party/UFM/uniflowmatch/utils/flow_resizing.py +1091 -0
  1216. vismatch/third_party/UFM/uniflowmatch/utils/geometry.py +612 -0
  1217. vismatch/third_party/UFM/uniflowmatch/utils/viz.py +97 -0
  1218. vismatch/third_party/XoFTR/configs/data/__init__.py +0 -0
  1219. vismatch/third_party/XoFTR/configs/data/base.py +35 -0
  1220. vismatch/third_party/XoFTR/configs/data/megadepth_trainval_840.py +22 -0
  1221. vismatch/third_party/XoFTR/configs/data/megadepth_vistir_trainval_640.py +23 -0
  1222. vismatch/third_party/XoFTR/configs/data/pretrain.py +8 -0
  1223. vismatch/third_party/XoFTR/configs/xoftr/outdoor/visible_thermal.py +17 -0
  1224. vismatch/third_party/XoFTR/configs/xoftr/pretrain/pretrain.py +12 -0
  1225. vismatch/third_party/XoFTR/pretrain.py +125 -0
  1226. vismatch/third_party/XoFTR/src/__init__.py +0 -0
  1227. vismatch/third_party/XoFTR/src/config/default.py +203 -0
  1228. vismatch/third_party/XoFTR/src/datasets/megadepth.py +143 -0
  1229. vismatch/third_party/XoFTR/src/datasets/pretrain_dataset.py +156 -0
  1230. vismatch/third_party/XoFTR/src/datasets/sampler.py +77 -0
  1231. vismatch/third_party/XoFTR/src/datasets/scannet.py +114 -0
  1232. vismatch/third_party/XoFTR/src/datasets/vistir.py +109 -0
  1233. vismatch/third_party/XoFTR/src/lightning/data.py +346 -0
  1234. vismatch/third_party/XoFTR/src/lightning/data_pretrain.py +125 -0
  1235. vismatch/third_party/XoFTR/src/lightning/lightning_xoftr.py +334 -0
  1236. vismatch/third_party/XoFTR/src/lightning/lightning_xoftr_pretrain.py +171 -0
  1237. vismatch/third_party/XoFTR/src/losses/xoftr_loss.py +170 -0
  1238. vismatch/third_party/XoFTR/src/losses/xoftr_loss_pretrain.py +37 -0
  1239. vismatch/third_party/XoFTR/src/optimizers/__init__.py +42 -0
  1240. vismatch/third_party/XoFTR/src/utils/augment.py +113 -0
  1241. vismatch/third_party/XoFTR/src/utils/comm.py +265 -0
  1242. vismatch/third_party/XoFTR/src/utils/data_io.py +144 -0
  1243. vismatch/third_party/XoFTR/src/utils/dataloader.py +23 -0
  1244. vismatch/third_party/XoFTR/src/utils/dataset.py +279 -0
  1245. vismatch/third_party/XoFTR/src/utils/metrics.py +211 -0
  1246. vismatch/third_party/XoFTR/src/utils/misc.py +101 -0
  1247. vismatch/third_party/XoFTR/src/utils/plotting.py +227 -0
  1248. vismatch/third_party/XoFTR/src/utils/pretrain_utils.py +83 -0
  1249. vismatch/third_party/XoFTR/src/utils/profiler.py +39 -0
  1250. vismatch/third_party/XoFTR/src/xoftr/__init__.py +2 -0
  1251. vismatch/third_party/XoFTR/src/xoftr/backbone/__init__.py +1 -0
  1252. vismatch/third_party/XoFTR/src/xoftr/backbone/resnet.py +95 -0
  1253. vismatch/third_party/XoFTR/src/xoftr/utils/geometry.py +107 -0
  1254. vismatch/third_party/XoFTR/src/xoftr/utils/position_encoding.py +36 -0
  1255. vismatch/third_party/XoFTR/src/xoftr/utils/supervision.py +290 -0
  1256. vismatch/third_party/XoFTR/src/xoftr/xoftr.py +94 -0
  1257. vismatch/third_party/XoFTR/src/xoftr/xoftr_module/__init__.py +4 -0
  1258. vismatch/third_party/XoFTR/src/xoftr/xoftr_module/coarse_matching.py +305 -0
  1259. vismatch/third_party/XoFTR/src/xoftr/xoftr_module/fine_matching.py +170 -0
  1260. vismatch/third_party/XoFTR/src/xoftr/xoftr_module/fine_process.py +321 -0
  1261. vismatch/third_party/XoFTR/src/xoftr/xoftr_module/linear_attention.py +81 -0
  1262. vismatch/third_party/XoFTR/src/xoftr/xoftr_module/transformer.py +101 -0
  1263. vismatch/third_party/XoFTR/src/xoftr/xoftr_pretrain.py +209 -0
  1264. vismatch/third_party/XoFTR/test.py +68 -0
  1265. vismatch/third_party/XoFTR/test_relative_pose.py +330 -0
  1266. vismatch/third_party/XoFTR/train.py +126 -0
  1267. vismatch/third_party/accelerated_features/hubconf.py +15 -0
  1268. vismatch/third_party/accelerated_features/minimal_example.py +49 -0
  1269. vismatch/third_party/accelerated_features/modules/__init__.py +4 -0
  1270. vismatch/third_party/accelerated_features/modules/dataset/__init__.py +5 -0
  1271. vismatch/third_party/accelerated_features/modules/dataset/augmentation.py +314 -0
  1272. vismatch/third_party/accelerated_features/modules/dataset/megadepth/__init__.py +7 -0
  1273. vismatch/third_party/accelerated_features/modules/dataset/megadepth/megadepth.py +174 -0
  1274. vismatch/third_party/accelerated_features/modules/dataset/megadepth/megadepth_warper.py +170 -0
  1275. vismatch/third_party/accelerated_features/modules/dataset/megadepth/utils.py +160 -0
  1276. vismatch/third_party/accelerated_features/modules/interpolator.py +33 -0
  1277. vismatch/third_party/accelerated_features/modules/lighterglue.py +56 -0
  1278. vismatch/third_party/accelerated_features/modules/model.py +154 -0
  1279. vismatch/third_party/accelerated_features/modules/training/__init__.py +4 -0
  1280. vismatch/third_party/accelerated_features/modules/training/losses.py +224 -0
  1281. vismatch/third_party/accelerated_features/modules/training/train.py +311 -0
  1282. vismatch/third_party/accelerated_features/modules/training/utils.py +200 -0
  1283. vismatch/third_party/accelerated_features/modules/xfeat.py +402 -0
  1284. vismatch/third_party/accelerated_features/realtime_demo.py +295 -0
  1285. vismatch/third_party/accelerated_features/third_party/ALIKE/alike.py +143 -0
  1286. vismatch/third_party/accelerated_features/third_party/ALIKE/alnet.py +164 -0
  1287. vismatch/third_party/accelerated_features/third_party/ALIKE/demo.py +167 -0
  1288. vismatch/third_party/accelerated_features/third_party/ALIKE/hseq/eval.py +162 -0
  1289. vismatch/third_party/accelerated_features/third_party/ALIKE/hseq/extract.py +159 -0
  1290. vismatch/third_party/accelerated_features/third_party/ALIKE/soft_detect.py +194 -0
  1291. vismatch/third_party/accelerated_features/third_party/__init__.py +4 -0
  1292. vismatch/third_party/accelerated_features/third_party/alike_wrapper.py +110 -0
  1293. vismatch/third_party/affine-steerers/affine_steerers/__init__.py +7 -0
  1294. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/__init__.py +5 -0
  1295. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/hpatches.py +92 -0
  1296. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/hpatches_oracle_steer.py +108 -0
  1297. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/mega_pose_est.py +116 -0
  1298. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/mega_pose_est_mnn.py +162 -0
  1299. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/nll_benchmark.py +57 -0
  1300. vismatch/third_party/affine-steerers/affine_steerers/benchmarks/num_inliers.py +76 -0
  1301. vismatch/third_party/affine-steerers/affine_steerers/checkpoint.py +82 -0
  1302. vismatch/third_party/affine-steerers/affine_steerers/datasets/__init__.py +0 -0
  1303. vismatch/third_party/affine-steerers/affine_steerers/datasets/homog.py +284 -0
  1304. vismatch/third_party/affine-steerers/affine_steerers/datasets/megadepth.py +408 -0
  1305. vismatch/third_party/affine-steerers/affine_steerers/decoder.py +90 -0
  1306. vismatch/third_party/affine-steerers/affine_steerers/descriptors/__init__.py +0 -0
  1307. vismatch/third_party/affine-steerers/affine_steerers/descriptors/dedode_descriptor.py +77 -0
  1308. vismatch/third_party/affine-steerers/affine_steerers/descriptors/descriptor_loss.py +358 -0
  1309. vismatch/third_party/affine-steerers/affine_steerers/detectors/__init__.py +0 -0
  1310. vismatch/third_party/affine-steerers/affine_steerers/detectors/dedode_detector.py +75 -0
  1311. vismatch/third_party/affine-steerers/affine_steerers/detectors/keypoint_loss.py +215 -0
  1312. vismatch/third_party/affine-steerers/affine_steerers/encoder.py +87 -0
  1313. vismatch/third_party/affine-steerers/affine_steerers/matchers/__init__.py +0 -0
  1314. vismatch/third_party/affine-steerers/affine_steerers/matchers/dual_softmax_matcher.py +816 -0
  1315. vismatch/third_party/affine-steerers/affine_steerers/model_zoo/__init__.py +3 -0
  1316. vismatch/third_party/affine-steerers/affine_steerers/model_zoo/dedode_models.py +298 -0
  1317. vismatch/third_party/affine-steerers/affine_steerers/steerers.py +732 -0
  1318. vismatch/third_party/affine-steerers/affine_steerers/train.py +90 -0
  1319. vismatch/third_party/affine-steerers/affine_steerers/transformer/__init__.py +8 -0
  1320. vismatch/third_party/affine-steerers/affine_steerers/transformer/dinov2.py +359 -0
  1321. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/__init__.py +12 -0
  1322. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/attention.py +81 -0
  1323. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/block.py +252 -0
  1324. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/dino_head.py +59 -0
  1325. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/drop_path.py +35 -0
  1326. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/layer_scale.py +28 -0
  1327. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/mlp.py +41 -0
  1328. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/patch_embed.py +89 -0
  1329. vismatch/third_party/affine-steerers/affine_steerers/transformer/layers/swiglu_ffn.py +63 -0
  1330. vismatch/third_party/affine-steerers/affine_steerers/utils.py +1422 -0
  1331. vismatch/third_party/affine-steerers/experiments/aff_equi_B.py +182 -0
  1332. vismatch/third_party/affine-steerers/experiments/aff_equi_G.py +193 -0
  1333. vismatch/third_party/affine-steerers/experiments/aff_steer_B.py +213 -0
  1334. vismatch/third_party/affine-steerers/experiments/aff_steer_G.py +223 -0
  1335. vismatch/third_party/affine-steerers/experiments/aff_steer_pretrain_B.py +187 -0
  1336. vismatch/third_party/affine-steerers/experiments/aff_steer_pretrain_G.py +198 -0
  1337. vismatch/third_party/affine-steerers/setup.py +15 -0
  1338. vismatch/third_party/aspanformer/configs/aspan/indoor/aspan_test.py +7 -0
  1339. vismatch/third_party/aspanformer/configs/aspan/indoor/aspan_train.py +8 -0
  1340. vismatch/third_party/aspanformer/configs/aspan/outdoor/aspan_test.py +19 -0
  1341. vismatch/third_party/aspanformer/configs/aspan/outdoor/aspan_train.py +17 -0
  1342. vismatch/third_party/aspanformer/configs/data/__init__.py +0 -0
  1343. vismatch/third_party/aspanformer/configs/data/base.py +35 -0
  1344. vismatch/third_party/aspanformer/configs/data/megadepth_test_1500.py +13 -0
  1345. vismatch/third_party/aspanformer/configs/data/megadepth_trainval_832.py +22 -0
  1346. vismatch/third_party/aspanformer/configs/data/scannet_test_1500.py +11 -0
  1347. vismatch/third_party/aspanformer/configs/data/scannet_trainval.py +17 -0
  1348. vismatch/third_party/aspanformer/demo/demo.py +63 -0
  1349. vismatch/third_party/aspanformer/demo/demo_utils.py +44 -0
  1350. vismatch/third_party/aspanformer/src/ASpanFormer/__init__.py +2 -0
  1351. vismatch/third_party/aspanformer/src/ASpanFormer/aspan_module/__init__.py +3 -0
  1352. vismatch/third_party/aspanformer/src/ASpanFormer/aspan_module/attention.py +198 -0
  1353. vismatch/third_party/aspanformer/src/ASpanFormer/aspan_module/fine_preprocess.py +59 -0
  1354. vismatch/third_party/aspanformer/src/ASpanFormer/aspan_module/loftr.py +112 -0
  1355. vismatch/third_party/aspanformer/src/ASpanFormer/aspan_module/transformer.py +244 -0
  1356. vismatch/third_party/aspanformer/src/ASpanFormer/aspanformer.py +152 -0
  1357. vismatch/third_party/aspanformer/src/ASpanFormer/backbone/__init__.py +11 -0
  1358. vismatch/third_party/aspanformer/src/ASpanFormer/backbone/resnet_fpn.py +199 -0
  1359. vismatch/third_party/aspanformer/src/ASpanFormer/utils/coarse_matching.py +331 -0
  1360. vismatch/third_party/aspanformer/src/ASpanFormer/utils/cvpr_ds_config.py +50 -0
  1361. vismatch/third_party/aspanformer/src/ASpanFormer/utils/fine_matching.py +74 -0
  1362. vismatch/third_party/aspanformer/src/ASpanFormer/utils/geometry.py +54 -0
  1363. vismatch/third_party/aspanformer/src/ASpanFormer/utils/position_encoding.py +61 -0
  1364. vismatch/third_party/aspanformer/src/ASpanFormer/utils/supervision.py +151 -0
  1365. vismatch/third_party/aspanformer/src/__init__.py +0 -0
  1366. vismatch/third_party/aspanformer/src/config/default.py +180 -0
  1367. vismatch/third_party/aspanformer/src/datasets/__init__.py +3 -0
  1368. vismatch/third_party/aspanformer/src/datasets/megadepth.py +127 -0
  1369. vismatch/third_party/aspanformer/src/datasets/sampler.py +77 -0
  1370. vismatch/third_party/aspanformer/src/datasets/scannet.py +113 -0
  1371. vismatch/third_party/aspanformer/src/lightning/data.py +326 -0
  1372. vismatch/third_party/aspanformer/src/lightning/lightning_aspanformer.py +276 -0
  1373. vismatch/third_party/aspanformer/src/losses/aspan_loss.py +231 -0
  1374. vismatch/third_party/aspanformer/src/optimizers/__init__.py +42 -0
  1375. vismatch/third_party/aspanformer/src/utils/augment.py +55 -0
  1376. vismatch/third_party/aspanformer/src/utils/comm.py +265 -0
  1377. vismatch/third_party/aspanformer/src/utils/dataloader.py +23 -0
  1378. vismatch/third_party/aspanformer/src/utils/dataset.py +222 -0
  1379. vismatch/third_party/aspanformer/src/utils/metrics.py +260 -0
  1380. vismatch/third_party/aspanformer/src/utils/misc.py +139 -0
  1381. vismatch/third_party/aspanformer/src/utils/plotting.py +219 -0
  1382. vismatch/third_party/aspanformer/src/utils/profiler.py +39 -0
  1383. vismatch/third_party/aspanformer/test.py +69 -0
  1384. vismatch/third_party/aspanformer/tools/SensorData.py +125 -0
  1385. vismatch/third_party/aspanformer/tools/extract.py +47 -0
  1386. vismatch/third_party/aspanformer/tools/preprocess_scene.py +242 -0
  1387. vismatch/third_party/aspanformer/tools/reader.py +39 -0
  1388. vismatch/third_party/aspanformer/tools/undistort_mega.py +69 -0
  1389. vismatch/third_party/aspanformer/train.py +134 -0
  1390. vismatch/third_party/duster/croco/datasets/__init__.py +0 -0
  1391. vismatch/third_party/duster/croco/datasets/crops/extract_crops_from_images.py +159 -0
  1392. vismatch/third_party/duster/croco/datasets/habitat_sim/__init__.py +0 -0
  1393. vismatch/third_party/duster/croco/datasets/habitat_sim/generate_from_metadata.py +92 -0
  1394. vismatch/third_party/duster/croco/datasets/habitat_sim/generate_from_metadata_files.py +27 -0
  1395. vismatch/third_party/duster/croco/datasets/habitat_sim/generate_multiview_images.py +177 -0
  1396. vismatch/third_party/duster/croco/datasets/habitat_sim/multiview_habitat_sim_generator.py +390 -0
  1397. vismatch/third_party/duster/croco/datasets/habitat_sim/pack_metadata_files.py +69 -0
  1398. vismatch/third_party/duster/croco/datasets/habitat_sim/paths.py +129 -0
  1399. vismatch/third_party/duster/croco/datasets/pairs_dataset.py +109 -0
  1400. vismatch/third_party/duster/croco/datasets/transforms.py +95 -0
  1401. vismatch/third_party/duster/croco/demo.py +55 -0
  1402. vismatch/third_party/duster/croco/models/blocks.py +241 -0
  1403. vismatch/third_party/duster/croco/models/criterion.py +37 -0
  1404. vismatch/third_party/duster/croco/models/croco.py +249 -0
  1405. vismatch/third_party/duster/croco/models/croco_downstream.py +122 -0
  1406. vismatch/third_party/duster/croco/models/curope/__init__.py +4 -0
  1407. vismatch/third_party/duster/croco/models/curope/curope2d.py +40 -0
  1408. vismatch/third_party/duster/croco/models/curope/setup.py +34 -0
  1409. vismatch/third_party/duster/croco/models/dpt_block.py +450 -0
  1410. vismatch/third_party/duster/croco/models/head_downstream.py +58 -0
  1411. vismatch/third_party/duster/croco/models/masking.py +25 -0
  1412. vismatch/third_party/duster/croco/models/pos_embed.py +157 -0
  1413. vismatch/third_party/duster/croco/pretrain.py +254 -0
  1414. vismatch/third_party/duster/croco/stereoflow/augmentor.py +290 -0
  1415. vismatch/third_party/duster/croco/stereoflow/criterion.py +251 -0
  1416. vismatch/third_party/duster/croco/stereoflow/datasets_flow.py +630 -0
  1417. vismatch/third_party/duster/croco/stereoflow/datasets_stereo.py +674 -0
  1418. vismatch/third_party/duster/croco/stereoflow/engine.py +280 -0
  1419. vismatch/third_party/duster/croco/stereoflow/test.py +216 -0
  1420. vismatch/third_party/duster/croco/stereoflow/train.py +253 -0
  1421. vismatch/third_party/duster/croco/utils/misc.py +463 -0
  1422. vismatch/third_party/duster/datasets_preprocess/habitat/find_scenes.py +78 -0
  1423. vismatch/third_party/duster/datasets_preprocess/habitat/habitat_renderer/__init__.py +2 -0
  1424. vismatch/third_party/duster/datasets_preprocess/habitat/habitat_renderer/habitat_sim_envmaps_renderer.py +170 -0
  1425. vismatch/third_party/duster/datasets_preprocess/habitat/habitat_renderer/multiview_crop_generator.py +93 -0
  1426. vismatch/third_party/duster/datasets_preprocess/habitat/habitat_renderer/projections.py +151 -0
  1427. vismatch/third_party/duster/datasets_preprocess/habitat/habitat_renderer/projections_conversions.py +45 -0
  1428. vismatch/third_party/duster/datasets_preprocess/habitat/preprocess_habitat.py +121 -0
  1429. vismatch/third_party/duster/datasets_preprocess/path_to_root.py +13 -0
  1430. vismatch/third_party/duster/datasets_preprocess/preprocess_arkitscenes.py +355 -0
  1431. vismatch/third_party/duster/datasets_preprocess/preprocess_blendedMVS.py +149 -0
  1432. vismatch/third_party/duster/datasets_preprocess/preprocess_co3d.py +295 -0
  1433. vismatch/third_party/duster/datasets_preprocess/preprocess_megadepth.py +198 -0
  1434. vismatch/third_party/duster/datasets_preprocess/preprocess_scannetpp.py +400 -0
  1435. vismatch/third_party/duster/datasets_preprocess/preprocess_staticthings3d.py +130 -0
  1436. vismatch/third_party/duster/datasets_preprocess/preprocess_waymo.py +257 -0
  1437. vismatch/third_party/duster/datasets_preprocess/preprocess_wildrgbd.py +209 -0
  1438. vismatch/third_party/duster/demo.py +45 -0
  1439. vismatch/third_party/duster/dust3r/__init__.py +2 -0
  1440. vismatch/third_party/duster/dust3r/cloud_opt/__init__.py +33 -0
  1441. vismatch/third_party/duster/dust3r/cloud_opt/base_opt.py +405 -0
  1442. vismatch/third_party/duster/dust3r/cloud_opt/commons.py +90 -0
  1443. vismatch/third_party/duster/dust3r/cloud_opt/init_im_poses.py +316 -0
  1444. vismatch/third_party/duster/dust3r/cloud_opt/modular_optimizer.py +145 -0
  1445. vismatch/third_party/duster/dust3r/cloud_opt/optimizer.py +248 -0
  1446. vismatch/third_party/duster/dust3r/cloud_opt/pair_viewer.py +127 -0
  1447. vismatch/third_party/duster/dust3r/datasets/__init__.py +50 -0
  1448. vismatch/third_party/duster/dust3r/datasets/arkitscenes.py +102 -0
  1449. vismatch/third_party/duster/dust3r/datasets/base/__init__.py +2 -0
  1450. vismatch/third_party/duster/dust3r/datasets/base/base_stereo_view_dataset.py +220 -0
  1451. vismatch/third_party/duster/dust3r/datasets/base/batched_sampler.py +74 -0
  1452. vismatch/third_party/duster/dust3r/datasets/base/easy_dataset.py +157 -0
  1453. vismatch/third_party/duster/dust3r/datasets/blendedmvs.py +104 -0
  1454. vismatch/third_party/duster/dust3r/datasets/co3d.py +165 -0
  1455. vismatch/third_party/duster/dust3r/datasets/habitat.py +107 -0
  1456. vismatch/third_party/duster/dust3r/datasets/megadepth.py +123 -0
  1457. vismatch/third_party/duster/dust3r/datasets/scannetpp.py +96 -0
  1458. vismatch/third_party/duster/dust3r/datasets/staticthings3d.py +96 -0
  1459. vismatch/third_party/duster/dust3r/datasets/utils/__init__.py +2 -0
  1460. vismatch/third_party/duster/dust3r/datasets/utils/cropping.py +124 -0
  1461. vismatch/third_party/duster/dust3r/datasets/utils/transforms.py +11 -0
  1462. vismatch/third_party/duster/dust3r/datasets/waymo.py +93 -0
  1463. vismatch/third_party/duster/dust3r/datasets/wildrgbd.py +67 -0
  1464. vismatch/third_party/duster/dust3r/demo.py +287 -0
  1465. vismatch/third_party/duster/dust3r/heads/__init__.py +19 -0
  1466. vismatch/third_party/duster/dust3r/heads/dpt_head.py +115 -0
  1467. vismatch/third_party/duster/dust3r/heads/linear_head.py +41 -0
  1468. vismatch/third_party/duster/dust3r/heads/postprocess.py +58 -0
  1469. vismatch/third_party/duster/dust3r/image_pairs.py +104 -0
  1470. vismatch/third_party/duster/dust3r/inference.py +150 -0
  1471. vismatch/third_party/duster/dust3r/losses.py +299 -0
  1472. vismatch/third_party/duster/dust3r/model.py +211 -0
  1473. vismatch/third_party/duster/dust3r/optim_factory.py +14 -0
  1474. vismatch/third_party/duster/dust3r/patch_embed.py +70 -0
  1475. vismatch/third_party/duster/dust3r/post_process.py +60 -0
  1476. vismatch/third_party/duster/dust3r/training.py +377 -0
  1477. vismatch/third_party/duster/dust3r/utils/__init__.py +2 -0
  1478. vismatch/third_party/duster/dust3r/utils/device.py +76 -0
  1479. vismatch/third_party/duster/dust3r/utils/geometry.py +366 -0
  1480. vismatch/third_party/duster/dust3r/utils/image.py +128 -0
  1481. vismatch/third_party/duster/dust3r/utils/misc.py +121 -0
  1482. vismatch/third_party/duster/dust3r/utils/parallel.py +79 -0
  1483. vismatch/third_party/duster/dust3r/utils/path_to_croco.py +19 -0
  1484. vismatch/third_party/duster/dust3r/viz.py +381 -0
  1485. vismatch/third_party/duster/dust3r_visloc/__init__.py +2 -0
  1486. vismatch/third_party/duster/dust3r_visloc/datasets/__init__.py +6 -0
  1487. vismatch/third_party/duster/dust3r_visloc/datasets/aachen_day_night.py +24 -0
  1488. vismatch/third_party/duster/dust3r_visloc/datasets/base_colmap.py +282 -0
  1489. vismatch/third_party/duster/dust3r_visloc/datasets/base_dataset.py +19 -0
  1490. vismatch/third_party/duster/dust3r_visloc/datasets/cambridge_landmarks.py +19 -0
  1491. vismatch/third_party/duster/dust3r_visloc/datasets/inloc.py +167 -0
  1492. vismatch/third_party/duster/dust3r_visloc/datasets/sevenscenes.py +123 -0
  1493. vismatch/third_party/duster/dust3r_visloc/datasets/utils.py +118 -0
  1494. vismatch/third_party/duster/dust3r_visloc/evaluation.py +65 -0
  1495. vismatch/third_party/duster/dust3r_visloc/localization.py +140 -0
  1496. vismatch/third_party/duster/train.py +13 -0
  1497. vismatch/third_party/duster/visloc.py +193 -0
  1498. vismatch/third_party/gim/demo.py +479 -0
  1499. vismatch/third_party/gim/dkm/__init__.py +4 -0
  1500. vismatch/third_party/gim/dkm/benchmarks/__init__.py +4 -0
  1501. vismatch/third_party/gim/dkm/benchmarks/hpatches_sequences_homog_benchmark.py +114 -0
  1502. vismatch/third_party/gim/dkm/benchmarks/megadepth1500_benchmark.py +124 -0
  1503. vismatch/third_party/gim/dkm/benchmarks/megadepth_dense_benchmark.py +86 -0
  1504. vismatch/third_party/gim/dkm/benchmarks/scannet_benchmark.py +143 -0
  1505. vismatch/third_party/gim/dkm/checkpointing/__init__.py +1 -0
  1506. vismatch/third_party/gim/dkm/checkpointing/checkpoint.py +31 -0
  1507. vismatch/third_party/gim/dkm/datasets/__init__.py +1 -0
  1508. vismatch/third_party/gim/dkm/datasets/megadepth.py +177 -0
  1509. vismatch/third_party/gim/dkm/datasets/scannet.py +151 -0
  1510. vismatch/third_party/gim/dkm/losses/__init__.py +1 -0
  1511. vismatch/third_party/gim/dkm/losses/depth_match_regression_loss.py +128 -0
  1512. vismatch/third_party/gim/dkm/models/__init__.py +4 -0
  1513. vismatch/third_party/gim/dkm/models/dkm.py +745 -0
  1514. vismatch/third_party/gim/dkm/models/encoders.py +148 -0
  1515. vismatch/third_party/gim/dkm/models/model_zoo/DKMv3.py +148 -0
  1516. vismatch/third_party/gim/dkm/models/model_zoo/__init__.py +39 -0
  1517. vismatch/third_party/gim/dkm/train/__init__.py +1 -0
  1518. vismatch/third_party/gim/dkm/train/train.py +67 -0
  1519. vismatch/third_party/gim/dkm/utils/__init__.py +13 -0
  1520. vismatch/third_party/gim/dkm/utils/kde.py +26 -0
  1521. vismatch/third_party/gim/dkm/utils/local_correlation.py +40 -0
  1522. vismatch/third_party/gim/dkm/utils/transforms.py +104 -0
  1523. vismatch/third_party/gim/dkm/utils/utils.py +341 -0
  1524. vismatch/third_party/gim/gluefactory/__init__.py +17 -0
  1525. vismatch/third_party/gim/gluefactory/datasets/__init__.py +25 -0
  1526. vismatch/third_party/gim/gluefactory/datasets/augmentations.py +244 -0
  1527. vismatch/third_party/gim/gluefactory/datasets/base_dataset.py +206 -0
  1528. vismatch/third_party/gim/gluefactory/datasets/eth3d.py +254 -0
  1529. vismatch/third_party/gim/gluefactory/datasets/homographies.py +311 -0
  1530. vismatch/third_party/gim/gluefactory/datasets/hpatches.py +145 -0
  1531. vismatch/third_party/gim/gluefactory/datasets/image_folder.py +59 -0
  1532. vismatch/third_party/gim/gluefactory/datasets/image_pairs.py +100 -0
  1533. vismatch/third_party/gim/gluefactory/datasets/megadepth.py +514 -0
  1534. vismatch/third_party/gim/gluefactory/datasets/utils.py +131 -0
  1535. vismatch/third_party/gim/gluefactory/eval/__init__.py +20 -0
  1536. vismatch/third_party/gim/gluefactory/eval/eth3d.py +202 -0
  1537. vismatch/third_party/gim/gluefactory/eval/eval_pipeline.py +109 -0
  1538. vismatch/third_party/gim/gluefactory/eval/hpatches.py +203 -0
  1539. vismatch/third_party/gim/gluefactory/eval/inspect.py +61 -0
  1540. vismatch/third_party/gim/gluefactory/eval/io.py +109 -0
  1541. vismatch/third_party/gim/gluefactory/eval/megadepth1500.py +189 -0
  1542. vismatch/third_party/gim/gluefactory/eval/utils.py +272 -0
  1543. vismatch/third_party/gim/gluefactory/geometry/depth.py +88 -0
  1544. vismatch/third_party/gim/gluefactory/geometry/epipolar.py +155 -0
  1545. vismatch/third_party/gim/gluefactory/geometry/gt_generation.py +558 -0
  1546. vismatch/third_party/gim/gluefactory/geometry/homography.py +342 -0
  1547. vismatch/third_party/gim/gluefactory/geometry/utils.py +167 -0
  1548. vismatch/third_party/gim/gluefactory/geometry/wrappers.py +425 -0
  1549. vismatch/third_party/gim/gluefactory/models/__init__.py +30 -0
  1550. vismatch/third_party/gim/gluefactory/models/backbones/__init__.py +0 -0
  1551. vismatch/third_party/gim/gluefactory/models/backbones/dinov2.py +30 -0
  1552. vismatch/third_party/gim/gluefactory/models/base_model.py +157 -0
  1553. vismatch/third_party/gim/gluefactory/models/cache_loader.py +139 -0
  1554. vismatch/third_party/gim/gluefactory/models/extractors/__init__.py +0 -0
  1555. vismatch/third_party/gim/gluefactory/models/extractors/aliked.py +786 -0
  1556. vismatch/third_party/gim/gluefactory/models/extractors/disk_kornia.py +108 -0
  1557. vismatch/third_party/gim/gluefactory/models/extractors/grid_extractor.py +60 -0
  1558. vismatch/third_party/gim/gluefactory/models/extractors/keynet_affnet_hardnet.py +74 -0
  1559. vismatch/third_party/gim/gluefactory/models/extractors/mixed.py +76 -0
  1560. vismatch/third_party/gim/gluefactory/models/extractors/sift.py +234 -0
  1561. vismatch/third_party/gim/gluefactory/models/extractors/sift_kornia.py +46 -0
  1562. vismatch/third_party/gim/gluefactory/models/extractors/superpoint_open.py +210 -0
  1563. vismatch/third_party/gim/gluefactory/models/lines/__init__.py +0 -0
  1564. vismatch/third_party/gim/gluefactory/models/lines/deeplsd.py +106 -0
  1565. vismatch/third_party/gim/gluefactory/models/lines/lsd.py +88 -0
  1566. vismatch/third_party/gim/gluefactory/models/lines/wireframe.py +312 -0
  1567. vismatch/third_party/gim/gluefactory/models/matchers/__init__.py +0 -0
  1568. vismatch/third_party/gim/gluefactory/models/matchers/adalam.py +0 -0
  1569. vismatch/third_party/gim/gluefactory/models/matchers/depth_matcher.py +82 -0
  1570. vismatch/third_party/gim/gluefactory/models/matchers/gluestick.py +776 -0
  1571. vismatch/third_party/gim/gluefactory/models/matchers/homography_matcher.py +66 -0
  1572. vismatch/third_party/gim/gluefactory/models/matchers/kornia_loftr.py +66 -0
  1573. vismatch/third_party/gim/gluefactory/models/matchers/lightglue.py +632 -0
  1574. vismatch/third_party/gim/gluefactory/models/matchers/lightglue_pretrained.py +36 -0
  1575. vismatch/third_party/gim/gluefactory/models/matchers/nearest_neighbor_matcher.py +97 -0
  1576. vismatch/third_party/gim/gluefactory/models/triplet_pipeline.py +99 -0
  1577. vismatch/third_party/gim/gluefactory/models/two_view_pipeline.py +114 -0
  1578. vismatch/third_party/gim/gluefactory/models/utils/__init__.py +0 -0
  1579. vismatch/third_party/gim/gluefactory/models/utils/losses.py +73 -0
  1580. vismatch/third_party/gim/gluefactory/models/utils/metrics.py +50 -0
  1581. vismatch/third_party/gim/gluefactory/models/utils/misc.py +70 -0
  1582. vismatch/third_party/gim/gluefactory/robust_estimators/__init__.py +15 -0
  1583. vismatch/third_party/gim/gluefactory/robust_estimators/base_estimator.py +33 -0
  1584. vismatch/third_party/gim/gluefactory/robust_estimators/homography/__init__.py +0 -0
  1585. vismatch/third_party/gim/gluefactory/robust_estimators/homography/homography_est.py +74 -0
  1586. vismatch/third_party/gim/gluefactory/robust_estimators/homography/opencv.py +53 -0
  1587. vismatch/third_party/gim/gluefactory/robust_estimators/homography/poselib.py +40 -0
  1588. vismatch/third_party/gim/gluefactory/robust_estimators/relative_pose/__init__.py +0 -0
  1589. vismatch/third_party/gim/gluefactory/robust_estimators/relative_pose/opencv.py +64 -0
  1590. vismatch/third_party/gim/gluefactory/robust_estimators/relative_pose/poselib.py +44 -0
  1591. vismatch/third_party/gim/gluefactory/robust_estimators/relative_pose/pycolmap.py +52 -0
  1592. vismatch/third_party/gim/gluefactory/scripts/__init__.py +0 -0
  1593. vismatch/third_party/gim/gluefactory/scripts/export_local_features.py +127 -0
  1594. vismatch/third_party/gim/gluefactory/scripts/export_megadepth.py +173 -0
  1595. vismatch/third_party/gim/gluefactory/settings.py +6 -0
  1596. vismatch/third_party/gim/gluefactory/superpoint.py +361 -0
  1597. vismatch/third_party/gim/gluefactory/train.py +691 -0
  1598. vismatch/third_party/gim/gluefactory/utils/__init__.py +0 -0
  1599. vismatch/third_party/gim/gluefactory/utils/benchmark.py +33 -0
  1600. vismatch/third_party/gim/gluefactory/utils/experiments.py +134 -0
  1601. vismatch/third_party/gim/gluefactory/utils/export_predictions.py +81 -0
  1602. vismatch/third_party/gim/gluefactory/utils/image.py +130 -0
  1603. vismatch/third_party/gim/gluefactory/utils/misc.py +44 -0
  1604. vismatch/third_party/gim/gluefactory/utils/patches.py +50 -0
  1605. vismatch/third_party/gim/gluefactory/utils/stdout_capturing.py +134 -0
  1606. vismatch/third_party/gim/gluefactory/utils/tensor.py +48 -0
  1607. vismatch/third_party/gim/gluefactory/utils/tools.py +269 -0
  1608. vismatch/third_party/gim/gluefactory/visualization/global_frame.py +289 -0
  1609. vismatch/third_party/gim/gluefactory/visualization/tools.py +465 -0
  1610. vismatch/third_party/gim/gluefactory/visualization/two_view_frame.py +158 -0
  1611. vismatch/third_party/gim/gluefactory/visualization/visualize_batch.py +57 -0
  1612. vismatch/third_party/gim/gluefactory/visualization/viz2d.py +486 -0
  1613. vismatch/third_party/imatch-toolbox/configs/d2net.yml +26 -0
  1614. vismatch/third_party/imatch-toolbox/configs/dogaffnethardnet.yml +10 -0
  1615. vismatch/third_party/imatch-toolbox/configs/ncnet.yml +7 -0
  1616. vismatch/third_party/imatch-toolbox/configs/patch2pix.yml +56 -0
  1617. vismatch/third_party/imatch-toolbox/configs/patch2pix_superglue.yml +58 -0
  1618. vismatch/third_party/imatch-toolbox/configs/r2d2.yml +31 -0
  1619. vismatch/third_party/imatch-toolbox/configs/sift.yml +27 -0
  1620. vismatch/third_party/imatch-toolbox/configs/superglue.yml +69 -0
  1621. vismatch/third_party/imatch-toolbox/configs/superpoint.yml +21 -0
  1622. vismatch/third_party/imatch-toolbox/environment.yml +14 -0
  1623. vismatch/third_party/imatch-toolbox/immatch/__init__.py +8 -0
  1624. vismatch/third_party/imatch-toolbox/immatch/eval_aachen.py +88 -0
  1625. vismatch/third_party/imatch-toolbox/immatch/eval_hpatches.py +117 -0
  1626. vismatch/third_party/imatch-toolbox/immatch/eval_inloc.py +45 -0
  1627. vismatch/third_party/imatch-toolbox/immatch/eval_relapose.py +231 -0
  1628. vismatch/third_party/imatch-toolbox/immatch/eval_robotcar.py +83 -0
  1629. vismatch/third_party/imatch-toolbox/immatch/modules/__init__.py +0 -0
  1630. vismatch/third_party/imatch-toolbox/immatch/modules/base.py +89 -0
  1631. vismatch/third_party/imatch-toolbox/immatch/modules/d2net.py +69 -0
  1632. vismatch/third_party/imatch-toolbox/immatch/modules/dogaffnethardnet.py +94 -0
  1633. vismatch/third_party/imatch-toolbox/immatch/modules/nn_matching.py +31 -0
  1634. vismatch/third_party/imatch-toolbox/immatch/modules/patch2pix.py +126 -0
  1635. vismatch/third_party/imatch-toolbox/immatch/modules/r2d2.py +64 -0
  1636. vismatch/third_party/imatch-toolbox/immatch/modules/sift.py +67 -0
  1637. vismatch/third_party/imatch-toolbox/immatch/modules/superglue.py +62 -0
  1638. vismatch/third_party/imatch-toolbox/immatch/modules/superpoint.py +56 -0
  1639. vismatch/third_party/imatch-toolbox/immatch/utils/__init__.py +13 -0
  1640. vismatch/third_party/imatch-toolbox/immatch/utils/colmap/data_parsing.py +257 -0
  1641. vismatch/third_party/imatch-toolbox/immatch/utils/colmap/database.py +362 -0
  1642. vismatch/third_party/imatch-toolbox/immatch/utils/colmap/read_write_model.py +506 -0
  1643. vismatch/third_party/imatch-toolbox/immatch/utils/data_io.py +111 -0
  1644. vismatch/third_party/imatch-toolbox/immatch/utils/hpatches_helper.py +242 -0
  1645. vismatch/third_party/imatch-toolbox/immatch/utils/localize_sfm_helper.py +403 -0
  1646. vismatch/third_party/imatch-toolbox/immatch/utils/metrics.py +90 -0
  1647. vismatch/third_party/imatch-toolbox/immatch/utils/model_helper.py +27 -0
  1648. vismatch/third_party/imatch-toolbox/setup.py +36 -0
  1649. vismatch/third_party/imatch-toolbox/third_party/d2net/extract_features.py +156 -0
  1650. vismatch/third_party/imatch-toolbox/third_party/d2net/extract_kapture.py +248 -0
  1651. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/dataset.py +239 -0
  1652. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/exceptions.py +6 -0
  1653. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/loss.py +340 -0
  1654. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/model.py +121 -0
  1655. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/model_test.py +187 -0
  1656. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/pyramid.py +129 -0
  1657. vismatch/third_party/imatch-toolbox/third_party/d2net/lib/utils.py +167 -0
  1658. vismatch/third_party/imatch-toolbox/third_party/d2net/megadepth_utils/preprocess_scene.py +242 -0
  1659. vismatch/third_party/imatch-toolbox/third_party/d2net/megadepth_utils/undistort_reconstructions.py +69 -0
  1660. vismatch/third_party/imatch-toolbox/third_party/d2net/train.py +279 -0
  1661. vismatch/third_party/imatch-toolbox/third_party/patch2pix/data_pairs/precompute_immatch_val_ovs.py +20 -0
  1662. vismatch/third_party/imatch-toolbox/third_party/patch2pix/environment.yml +21 -0
  1663. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/modules.py +167 -0
  1664. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/ncn/conv4d.py +91 -0
  1665. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/ncn/extract_ncmatches.py +158 -0
  1666. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/ncn/model.py +333 -0
  1667. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/patch2pix.py +403 -0
  1668. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/resnet.py +191 -0
  1669. vismatch/third_party/imatch-toolbox/third_party/patch2pix/networks/utils.py +111 -0
  1670. vismatch/third_party/imatch-toolbox/third_party/patch2pix/train_patch2pix.py +374 -0
  1671. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/colmap/data_loading.py +169 -0
  1672. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/colmap/read_database.py +175 -0
  1673. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/colmap/read_write_model.py +483 -0
  1674. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/common/plotting.py +393 -0
  1675. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/common/setup_helper.py +59 -0
  1676. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/common/visdom_helper.py +95 -0
  1677. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/datasets/__init__.py +1 -0
  1678. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/datasets/data_parsing.py +145 -0
  1679. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/datasets/dataset_megadepth.py +141 -0
  1680. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/datasets/preprocess.py +184 -0
  1681. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/eval/geometry.py +90 -0
  1682. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/eval/measure.py +161 -0
  1683. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/eval/model_helper.py +129 -0
  1684. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/train/eval_epoch_immatch.py +99 -0
  1685. vismatch/third_party/imatch-toolbox/third_party/patch2pix/utils/train/helper.py +196 -0
  1686. vismatch/third_party/imatch-toolbox/third_party/r2d2/datasets/__init__.py +33 -0
  1687. vismatch/third_party/imatch-toolbox/third_party/r2d2/datasets/aachen.py +146 -0
  1688. vismatch/third_party/imatch-toolbox/third_party/r2d2/datasets/dataset.py +77 -0
  1689. vismatch/third_party/imatch-toolbox/third_party/r2d2/datasets/imgfolder.py +23 -0
  1690. vismatch/third_party/imatch-toolbox/third_party/r2d2/datasets/pair_dataset.py +287 -0
  1691. vismatch/third_party/imatch-toolbox/third_party/r2d2/datasets/web_images.py +64 -0
  1692. vismatch/third_party/imatch-toolbox/third_party/r2d2/extract.py +183 -0
  1693. vismatch/third_party/imatch-toolbox/third_party/r2d2/extract_kapture.py +194 -0
  1694. vismatch/third_party/imatch-toolbox/third_party/r2d2/nets/ap_loss.py +67 -0
  1695. vismatch/third_party/imatch-toolbox/third_party/r2d2/nets/losses.py +56 -0
  1696. vismatch/third_party/imatch-toolbox/third_party/r2d2/nets/patchnet.py +134 -0
  1697. vismatch/third_party/imatch-toolbox/third_party/r2d2/nets/reliability_loss.py +59 -0
  1698. vismatch/third_party/imatch-toolbox/third_party/r2d2/nets/repeatability_loss.py +66 -0
  1699. vismatch/third_party/imatch-toolbox/third_party/r2d2/nets/sampler.py +390 -0
  1700. vismatch/third_party/imatch-toolbox/third_party/r2d2/tools/common.py +41 -0
  1701. vismatch/third_party/imatch-toolbox/third_party/r2d2/tools/dataloader.py +367 -0
  1702. vismatch/third_party/imatch-toolbox/third_party/r2d2/tools/trainer.py +76 -0
  1703. vismatch/third_party/imatch-toolbox/third_party/r2d2/tools/transforms.py +513 -0
  1704. vismatch/third_party/imatch-toolbox/third_party/r2d2/tools/transforms_tools.py +230 -0
  1705. vismatch/third_party/imatch-toolbox/third_party/r2d2/tools/viz.py +191 -0
  1706. vismatch/third_party/imatch-toolbox/third_party/r2d2/train.py +138 -0
  1707. vismatch/third_party/imatch-toolbox/third_party/r2d2/viz_heatmaps.py +122 -0
  1708. vismatch/third_party/imatch-toolbox/third_party/superglue/demo_superglue.py +259 -0
  1709. vismatch/third_party/imatch-toolbox/third_party/superglue/match_pairs.py +425 -0
  1710. vismatch/third_party/imatch-toolbox/third_party/superglue/models/__init__.py +0 -0
  1711. vismatch/third_party/imatch-toolbox/third_party/superglue/models/matching.py +84 -0
  1712. vismatch/third_party/imatch-toolbox/third_party/superglue/models/superglue.py +283 -0
  1713. vismatch/third_party/imatch-toolbox/third_party/superglue/models/superpoint.py +202 -0
  1714. vismatch/third_party/imatch-toolbox/third_party/superglue/models/utils.py +555 -0
  1715. vismatch/third_party/keypt2subpx/dataprocess/aliked.py +163 -0
  1716. vismatch/third_party/keypt2subpx/dataprocess/dedode.py +215 -0
  1717. vismatch/third_party/keypt2subpx/dataprocess/splg.py +162 -0
  1718. vismatch/third_party/keypt2subpx/dataprocess/spnn.py +157 -0
  1719. vismatch/third_party/keypt2subpx/dataprocess/superpoint_densescore.py +357 -0
  1720. vismatch/third_party/keypt2subpx/dataprocess/xfeat.py +187 -0
  1721. vismatch/third_party/keypt2subpx/dataset.py +145 -0
  1722. vismatch/third_party/keypt2subpx/hubconf.py +38 -0
  1723. vismatch/third_party/keypt2subpx/logger.py +127 -0
  1724. vismatch/third_party/keypt2subpx/model.py +183 -0
  1725. vismatch/third_party/keypt2subpx/settings.py +108 -0
  1726. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/__init__.py +17 -0
  1727. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/__init__.py +25 -0
  1728. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/augmentations.py +244 -0
  1729. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/base_dataset.py +206 -0
  1730. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/eth3d.py +254 -0
  1731. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/homographies.py +311 -0
  1732. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/hpatches.py +145 -0
  1733. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/image_folder.py +59 -0
  1734. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/image_pairs.py +100 -0
  1735. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/megadepth.py +510 -0
  1736. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/datasets/utils.py +131 -0
  1737. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/__init__.py +20 -0
  1738. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/eth3d.py +202 -0
  1739. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/eval_pipeline.py +109 -0
  1740. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/hpatches.py +203 -0
  1741. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/inspect.py +61 -0
  1742. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/io.py +109 -0
  1743. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/megadepth1500.py +189 -0
  1744. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/eval/utils.py +272 -0
  1745. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/__init__.py +0 -0
  1746. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/depth.py +88 -0
  1747. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/epipolar.py +155 -0
  1748. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/gt_generation.py +558 -0
  1749. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/homography.py +342 -0
  1750. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/utils.py +167 -0
  1751. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/geometry/wrappers.py +425 -0
  1752. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/__init__.py +30 -0
  1753. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/backbones/__init__.py +0 -0
  1754. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/backbones/dinov2.py +30 -0
  1755. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/base_model.py +157 -0
  1756. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/cache_loader.py +139 -0
  1757. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/__init__.py +0 -0
  1758. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/aliked.py +786 -0
  1759. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/disk_kornia.py +108 -0
  1760. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/grid_extractor.py +60 -0
  1761. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/keynet_affnet_hardnet.py +74 -0
  1762. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/mixed.py +76 -0
  1763. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/sift.py +234 -0
  1764. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/sift_kornia.py +46 -0
  1765. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/extractors/superpoint_open.py +210 -0
  1766. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/lines/__init__.py +0 -0
  1767. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/lines/deeplsd.py +106 -0
  1768. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/lines/lsd.py +88 -0
  1769. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/lines/wireframe.py +312 -0
  1770. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/__init__.py +0 -0
  1771. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/adalam.py +0 -0
  1772. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/depth_matcher.py +82 -0
  1773. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/gluestick.py +776 -0
  1774. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/homography_matcher.py +66 -0
  1775. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/kornia_loftr.py +66 -0
  1776. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/lightglue.py +612 -0
  1777. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/lightglue_pretrained.py +36 -0
  1778. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/matchers/nearest_neighbor_matcher.py +97 -0
  1779. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/triplet_pipeline.py +99 -0
  1780. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/two_view_pipeline.py +114 -0
  1781. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/utils/__init__.py +0 -0
  1782. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/utils/losses.py +73 -0
  1783. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/utils/metrics.py +50 -0
  1784. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/models/utils/misc.py +70 -0
  1785. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/__init__.py +15 -0
  1786. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/base_estimator.py +33 -0
  1787. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/homography/__init__.py +0 -0
  1788. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/homography/homography_est.py +74 -0
  1789. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/homography/opencv.py +53 -0
  1790. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/homography/poselib.py +40 -0
  1791. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/relative_pose/__init__.py +0 -0
  1792. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/relative_pose/opencv.py +64 -0
  1793. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/relative_pose/poselib.py +44 -0
  1794. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/robust_estimators/relative_pose/pycolmap.py +52 -0
  1795. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/scripts/__init__.py +0 -0
  1796. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/scripts/export_local_features.py +127 -0
  1797. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/scripts/export_megadepth.py +173 -0
  1798. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/settings.py +6 -0
  1799. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/train.py +691 -0
  1800. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/__init__.py +0 -0
  1801. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/benchmark.py +33 -0
  1802. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/experiments.py +134 -0
  1803. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/export_predictions.py +81 -0
  1804. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/image.py +130 -0
  1805. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/misc.py +44 -0
  1806. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/patches.py +50 -0
  1807. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/stdout_capturing.py +134 -0
  1808. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/tensor.py +48 -0
  1809. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/utils/tools.py +269 -0
  1810. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/visualization/global_frame.py +289 -0
  1811. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/visualization/tools.py +465 -0
  1812. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/visualization/two_view_frame.py +158 -0
  1813. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/visualization/visualize_batch.py +57 -0
  1814. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory/visualization/viz2d.py +486 -0
  1815. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory_nonfree/__init__.py +0 -0
  1816. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory_nonfree/superglue.py +342 -0
  1817. vismatch/third_party/keypt2subpx/submodules/glue_factory/gluefactory_nonfree/superpoint.py +356 -0
  1818. vismatch/third_party/keypt2subpx/submodules/glue_factory/tests/__init__.py +0 -0
  1819. vismatch/third_party/keypt2subpx/submodules/glue_factory/tests/test_eval_utils.py +88 -0
  1820. vismatch/third_party/keypt2subpx/submodules/glue_factory/tests/test_integration.py +132 -0
  1821. vismatch/third_party/keypt2subpx/summarize.py +44 -0
  1822. vismatch/third_party/keypt2subpx/test.py +225 -0
  1823. vismatch/third_party/keypt2subpx/train.py +180 -0
  1824. vismatch/third_party/keypt2subpx/utils.py +150 -0
  1825. vismatch/third_party/mast3r/demo.py +51 -0
  1826. vismatch/third_party/mast3r/demo_dust3r_ga.py +99 -0
  1827. vismatch/third_party/mast3r/demo_glomap.py +52 -0
  1828. vismatch/third_party/mast3r/dust3r/croco/datasets/__init__.py +0 -0
  1829. vismatch/third_party/mast3r/dust3r/croco/datasets/crops/extract_crops_from_images.py +159 -0
  1830. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/__init__.py +0 -0
  1831. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/generate_from_metadata.py +92 -0
  1832. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/generate_from_metadata_files.py +27 -0
  1833. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/generate_multiview_images.py +177 -0
  1834. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/multiview_habitat_sim_generator.py +390 -0
  1835. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/pack_metadata_files.py +69 -0
  1836. vismatch/third_party/mast3r/dust3r/croco/datasets/habitat_sim/paths.py +129 -0
  1837. vismatch/third_party/mast3r/dust3r/croco/datasets/pairs_dataset.py +109 -0
  1838. vismatch/third_party/mast3r/dust3r/croco/datasets/transforms.py +95 -0
  1839. vismatch/third_party/mast3r/dust3r/croco/demo.py +55 -0
  1840. vismatch/third_party/mast3r/dust3r/croco/models/blocks.py +241 -0
  1841. vismatch/third_party/mast3r/dust3r/croco/models/criterion.py +37 -0
  1842. vismatch/third_party/mast3r/dust3r/croco/models/croco.py +249 -0
  1843. vismatch/third_party/mast3r/dust3r/croco/models/croco_downstream.py +122 -0
  1844. vismatch/third_party/mast3r/dust3r/croco/models/curope/__init__.py +4 -0
  1845. vismatch/third_party/mast3r/dust3r/croco/models/curope/curope2d.py +40 -0
  1846. vismatch/third_party/mast3r/dust3r/croco/models/curope/setup.py +34 -0
  1847. vismatch/third_party/mast3r/dust3r/croco/models/dpt_block.py +450 -0
  1848. vismatch/third_party/mast3r/dust3r/croco/models/head_downstream.py +58 -0
  1849. vismatch/third_party/mast3r/dust3r/croco/models/masking.py +25 -0
  1850. vismatch/third_party/mast3r/dust3r/croco/models/pos_embed.py +157 -0
  1851. vismatch/third_party/mast3r/dust3r/croco/pretrain.py +254 -0
  1852. vismatch/third_party/mast3r/dust3r/croco/stereoflow/augmentor.py +290 -0
  1853. vismatch/third_party/mast3r/dust3r/croco/stereoflow/criterion.py +251 -0
  1854. vismatch/third_party/mast3r/dust3r/croco/stereoflow/datasets_flow.py +630 -0
  1855. vismatch/third_party/mast3r/dust3r/croco/stereoflow/datasets_stereo.py +674 -0
  1856. vismatch/third_party/mast3r/dust3r/croco/stereoflow/engine.py +280 -0
  1857. vismatch/third_party/mast3r/dust3r/croco/stereoflow/test.py +216 -0
  1858. vismatch/third_party/mast3r/dust3r/croco/stereoflow/train.py +253 -0
  1859. vismatch/third_party/mast3r/dust3r/croco/utils/misc.py +463 -0
  1860. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/find_scenes.py +78 -0
  1861. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/habitat_renderer/__init__.py +2 -0
  1862. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/habitat_renderer/habitat_sim_envmaps_renderer.py +170 -0
  1863. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/habitat_renderer/multiview_crop_generator.py +93 -0
  1864. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/habitat_renderer/projections.py +151 -0
  1865. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/habitat_renderer/projections_conversions.py +45 -0
  1866. vismatch/third_party/mast3r/dust3r/datasets_preprocess/habitat/preprocess_habitat.py +121 -0
  1867. vismatch/third_party/mast3r/dust3r/datasets_preprocess/path_to_root.py +13 -0
  1868. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_arkitscenes.py +355 -0
  1869. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_blendedMVS.py +149 -0
  1870. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_co3d.py +295 -0
  1871. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_megadepth.py +198 -0
  1872. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_scannetpp.py +390 -0
  1873. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_staticthings3d.py +130 -0
  1874. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_waymo.py +257 -0
  1875. vismatch/third_party/mast3r/dust3r/datasets_preprocess/preprocess_wildrgbd.py +209 -0
  1876. vismatch/third_party/mast3r/dust3r/demo.py +45 -0
  1877. vismatch/third_party/mast3r/dust3r/dust3r/__init__.py +2 -0
  1878. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/__init__.py +33 -0
  1879. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/base_opt.py +405 -0
  1880. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/commons.py +90 -0
  1881. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/init_im_poses.py +316 -0
  1882. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/modular_optimizer.py +145 -0
  1883. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/optimizer.py +248 -0
  1884. vismatch/third_party/mast3r/dust3r/dust3r/cloud_opt/pair_viewer.py +127 -0
  1885. vismatch/third_party/mast3r/dust3r/dust3r/datasets/__init__.py +50 -0
  1886. vismatch/third_party/mast3r/dust3r/dust3r/datasets/arkitscenes.py +102 -0
  1887. vismatch/third_party/mast3r/dust3r/dust3r/datasets/base/__init__.py +2 -0
  1888. vismatch/third_party/mast3r/dust3r/dust3r/datasets/base/base_stereo_view_dataset.py +220 -0
  1889. vismatch/third_party/mast3r/dust3r/dust3r/datasets/base/batched_sampler.py +74 -0
  1890. vismatch/third_party/mast3r/dust3r/dust3r/datasets/base/easy_dataset.py +157 -0
  1891. vismatch/third_party/mast3r/dust3r/dust3r/datasets/blendedmvs.py +104 -0
  1892. vismatch/third_party/mast3r/dust3r/dust3r/datasets/co3d.py +165 -0
  1893. vismatch/third_party/mast3r/dust3r/dust3r/datasets/habitat.py +107 -0
  1894. vismatch/third_party/mast3r/dust3r/dust3r/datasets/megadepth.py +123 -0
  1895. vismatch/third_party/mast3r/dust3r/dust3r/datasets/scannetpp.py +96 -0
  1896. vismatch/third_party/mast3r/dust3r/dust3r/datasets/staticthings3d.py +96 -0
  1897. vismatch/third_party/mast3r/dust3r/dust3r/datasets/utils/__init__.py +2 -0
  1898. vismatch/third_party/mast3r/dust3r/dust3r/datasets/utils/cropping.py +124 -0
  1899. vismatch/third_party/mast3r/dust3r/dust3r/datasets/utils/transforms.py +11 -0
  1900. vismatch/third_party/mast3r/dust3r/dust3r/datasets/waymo.py +93 -0
  1901. vismatch/third_party/mast3r/dust3r/dust3r/datasets/wildrgbd.py +67 -0
  1902. vismatch/third_party/mast3r/dust3r/dust3r/demo.py +287 -0
  1903. vismatch/third_party/mast3r/dust3r/dust3r/heads/__init__.py +19 -0
  1904. vismatch/third_party/mast3r/dust3r/dust3r/heads/dpt_head.py +115 -0
  1905. vismatch/third_party/mast3r/dust3r/dust3r/heads/linear_head.py +41 -0
  1906. vismatch/third_party/mast3r/dust3r/dust3r/heads/postprocess.py +58 -0
  1907. vismatch/third_party/mast3r/dust3r/dust3r/image_pairs.py +104 -0
  1908. vismatch/third_party/mast3r/dust3r/dust3r/inference.py +150 -0
  1909. vismatch/third_party/mast3r/dust3r/dust3r/losses.py +299 -0
  1910. vismatch/third_party/mast3r/dust3r/dust3r/model.py +211 -0
  1911. vismatch/third_party/mast3r/dust3r/dust3r/optim_factory.py +14 -0
  1912. vismatch/third_party/mast3r/dust3r/dust3r/patch_embed.py +70 -0
  1913. vismatch/third_party/mast3r/dust3r/dust3r/post_process.py +60 -0
  1914. vismatch/third_party/mast3r/dust3r/dust3r/training.py +377 -0
  1915. vismatch/third_party/mast3r/dust3r/dust3r/utils/__init__.py +2 -0
  1916. vismatch/third_party/mast3r/dust3r/dust3r/utils/device.py +76 -0
  1917. vismatch/third_party/mast3r/dust3r/dust3r/utils/geometry.py +366 -0
  1918. vismatch/third_party/mast3r/dust3r/dust3r/utils/image.py +128 -0
  1919. vismatch/third_party/mast3r/dust3r/dust3r/utils/misc.py +121 -0
  1920. vismatch/third_party/mast3r/dust3r/dust3r/utils/parallel.py +79 -0
  1921. vismatch/third_party/mast3r/dust3r/dust3r/utils/path_to_croco.py +19 -0
  1922. vismatch/third_party/mast3r/dust3r/dust3r/viz.py +381 -0
  1923. vismatch/third_party/mast3r/dust3r/dust3r_visloc/__init__.py +2 -0
  1924. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/__init__.py +6 -0
  1925. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/aachen_day_night.py +24 -0
  1926. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/base_colmap.py +282 -0
  1927. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/base_dataset.py +19 -0
  1928. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/cambridge_landmarks.py +19 -0
  1929. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/inloc.py +167 -0
  1930. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/sevenscenes.py +123 -0
  1931. vismatch/third_party/mast3r/dust3r/dust3r_visloc/datasets/utils.py +118 -0
  1932. vismatch/third_party/mast3r/dust3r/dust3r_visloc/evaluation.py +65 -0
  1933. vismatch/third_party/mast3r/dust3r/dust3r_visloc/localization.py +140 -0
  1934. vismatch/third_party/mast3r/dust3r/train.py +13 -0
  1935. vismatch/third_party/mast3r/dust3r/visloc.py +193 -0
  1936. vismatch/third_party/mast3r/kapture_mast3r_mapping.py +127 -0
  1937. vismatch/third_party/mast3r/make_pairs.py +105 -0
  1938. vismatch/third_party/mast3r/mast3r/__init__.py +2 -0
  1939. vismatch/third_party/mast3r/mast3r/catmlp_dpt_head.py +239 -0
  1940. vismatch/third_party/mast3r/mast3r/cloud_opt/__init__.py +2 -0
  1941. vismatch/third_party/mast3r/mast3r/cloud_opt/sparse_ga.py +1078 -0
  1942. vismatch/third_party/mast3r/mast3r/cloud_opt/triangulation.py +80 -0
  1943. vismatch/third_party/mast3r/mast3r/cloud_opt/tsdf_optimizer.py +273 -0
  1944. vismatch/third_party/mast3r/mast3r/cloud_opt/utils/__init__.py +2 -0
  1945. vismatch/third_party/mast3r/mast3r/cloud_opt/utils/losses.py +32 -0
  1946. vismatch/third_party/mast3r/mast3r/cloud_opt/utils/schedules.py +17 -0
  1947. vismatch/third_party/mast3r/mast3r/colmap/__init__.py +2 -0
  1948. vismatch/third_party/mast3r/mast3r/colmap/database.py +383 -0
  1949. vismatch/third_party/mast3r/mast3r/colmap/mapping.py +196 -0
  1950. vismatch/third_party/mast3r/mast3r/datasets/__init__.py +62 -0
  1951. vismatch/third_party/mast3r/mast3r/datasets/base/__init__.py +2 -0
  1952. vismatch/third_party/mast3r/mast3r/datasets/base/mast3r_base_stereo_view_dataset.py +355 -0
  1953. vismatch/third_party/mast3r/mast3r/datasets/utils/__init__.py +2 -0
  1954. vismatch/third_party/mast3r/mast3r/datasets/utils/cropping.py +219 -0
  1955. vismatch/third_party/mast3r/mast3r/demo.py +381 -0
  1956. vismatch/third_party/mast3r/mast3r/demo_glomap.py +343 -0
  1957. vismatch/third_party/mast3r/mast3r/fast_nn.py +223 -0
  1958. vismatch/third_party/mast3r/mast3r/image_pairs.py +115 -0
  1959. vismatch/third_party/mast3r/mast3r/losses.py +508 -0
  1960. vismatch/third_party/mast3r/mast3r/model.py +213 -0
  1961. vismatch/third_party/mast3r/mast3r/retrieval/graph.py +77 -0
  1962. vismatch/third_party/mast3r/mast3r/retrieval/model.py +271 -0
  1963. vismatch/third_party/mast3r/mast3r/retrieval/processor.py +129 -0
  1964. vismatch/third_party/mast3r/mast3r/utils/__init__.py +2 -0
  1965. vismatch/third_party/mast3r/mast3r/utils/coarse_to_fine.py +214 -0
  1966. vismatch/third_party/mast3r/mast3r/utils/collate.py +62 -0
  1967. vismatch/third_party/mast3r/mast3r/utils/misc.py +17 -0
  1968. vismatch/third_party/mast3r/mast3r/utils/path_to_dust3r.py +19 -0
  1969. vismatch/third_party/mast3r/train.py +48 -0
  1970. vismatch/third_party/mast3r/visloc.py +538 -0
  1971. vismatch/third_party/omniglue/__init__.py +19 -0
  1972. vismatch/third_party/omniglue/demo.py +89 -0
  1973. vismatch/third_party/omniglue/src/omniglue/__init__.py +17 -0
  1974. vismatch/third_party/omniglue/src/omniglue/dino_extract.py +215 -0
  1975. vismatch/third_party/omniglue/src/omniglue/omniglue_extract.py +159 -0
  1976. vismatch/third_party/omniglue/src/omniglue/superpoint_extract.py +214 -0
  1977. vismatch/third_party/omniglue/src/omniglue/utils.py +274 -0
  1978. vismatch/third_party/omniglue/third_party/dinov2/__init__.py +0 -0
  1979. vismatch/third_party/omniglue/third_party/dinov2/dino.py +411 -0
  1980. vismatch/third_party/omniglue/third_party/dinov2/dino_utils.py +341 -0
  1981. vismatch/third_party/rdd/RDD/RDD.py +262 -0
  1982. vismatch/third_party/rdd/RDD/RDD_helper.py +181 -0
  1983. vismatch/third_party/rdd/RDD/dataset/__init__.py +0 -0
  1984. vismatch/third_party/rdd/RDD/dataset/megadepth/__init__.py +2 -0
  1985. vismatch/third_party/rdd/RDD/dataset/megadepth/megadepth.py +313 -0
  1986. vismatch/third_party/rdd/RDD/dataset/megadepth/megadepth_warper.py +75 -0
  1987. vismatch/third_party/rdd/RDD/dataset/megadepth/utils.py +848 -0
  1988. vismatch/third_party/rdd/RDD/matchers/__init__.py +3 -0
  1989. vismatch/third_party/rdd/RDD/matchers/dense_matcher.py +137 -0
  1990. vismatch/third_party/rdd/RDD/matchers/dual_softmax_matcher.py +31 -0
  1991. vismatch/third_party/rdd/RDD/matchers/lightglue.py +667 -0
  1992. vismatch/third_party/rdd/RDD/models/backbone.py +147 -0
  1993. vismatch/third_party/rdd/RDD/models/deformable_transformer.py +270 -0
  1994. vismatch/third_party/rdd/RDD/models/descriptor.py +116 -0
  1995. vismatch/third_party/rdd/RDD/models/detector.py +141 -0
  1996. vismatch/third_party/rdd/RDD/models/interpolator.py +33 -0
  1997. vismatch/third_party/rdd/RDD/models/ops/functions/__init__.py +13 -0
  1998. vismatch/third_party/rdd/RDD/models/ops/functions/ms_deform_attn_func.py +74 -0
  1999. vismatch/third_party/rdd/RDD/models/ops/modules/__init__.py +12 -0
  2000. vismatch/third_party/rdd/RDD/models/ops/modules/ms_deform_attn.py +125 -0
  2001. vismatch/third_party/rdd/RDD/models/ops/setup.py +78 -0
  2002. vismatch/third_party/rdd/RDD/models/ops/test.py +92 -0
  2003. vismatch/third_party/rdd/RDD/models/position_encoding.py +48 -0
  2004. vismatch/third_party/rdd/RDD/models/soft_detect.py +176 -0
  2005. vismatch/third_party/rdd/RDD/utils/__init__.py +1 -0
  2006. vismatch/third_party/rdd/RDD/utils/misc.py +531 -0
  2007. vismatch/third_party/rdd/benchmarks/air_ground.py +250 -0
  2008. vismatch/third_party/rdd/benchmarks/mega_1500.py +259 -0
  2009. vismatch/third_party/rdd/benchmarks/mega_view.py +252 -0
  2010. vismatch/third_party/rdd/benchmarks/scannet_1500.py +251 -0
  2011. vismatch/third_party/rdd/benchmarks/utils.py +112 -0
  2012. vismatch/third_party/rdd/configs/default.yaml +19 -0
  2013. vismatch/third_party/rdd/sfm/extract_rdd.py +145 -0
  2014. vismatch/third_party/rdd/sfm/match_rdd.py +259 -0
  2015. vismatch/third_party/rdd/third_party/LightGlue/.github/workflows/code-quality.yml +24 -0
  2016. vismatch/third_party/rdd/third_party/LightGlue/benchmark.py +255 -0
  2017. vismatch/third_party/rdd/third_party/LightGlue/lightglue/__init__.py +7 -0
  2018. vismatch/third_party/rdd/third_party/LightGlue/lightglue/aliked.py +760 -0
  2019. vismatch/third_party/rdd/third_party/LightGlue/lightglue/disk.py +55 -0
  2020. vismatch/third_party/rdd/third_party/LightGlue/lightglue/dog_hardnet.py +41 -0
  2021. vismatch/third_party/rdd/third_party/LightGlue/lightglue/lightglue.py +662 -0
  2022. vismatch/third_party/rdd/third_party/LightGlue/lightglue/sift.py +216 -0
  2023. vismatch/third_party/rdd/third_party/LightGlue/lightglue/superpoint.py +227 -0
  2024. vismatch/third_party/rdd/third_party/LightGlue/lightglue/utils.py +165 -0
  2025. vismatch/third_party/rdd/third_party/LightGlue/lightglue/viz2d.py +203 -0
  2026. vismatch/third_party/rdd/third_party/__init__.py +1 -0
  2027. vismatch/third_party/rdd/third_party/aliked_wrapper.py +17 -0
  2028. vismatch/third_party/rdd/training/losses/descriptor_loss.py +73 -0
  2029. vismatch/third_party/rdd/training/losses/detector_loss.py +499 -0
  2030. vismatch/third_party/rdd/training/train.py +473 -0
  2031. vismatch/third_party/rdd/training/utils.py +246 -0
  2032. vismatch/utils.py +390 -0
  2033. vismatch/viz.py +222 -0
  2034. vismatch-1.1.1.dist-info/METADATA +265 -0
  2035. vismatch-1.1.1.dist-info/RECORD +2042 -0
  2036. vismatch-1.1.1.dist-info/WHEEL +5 -0
  2037. vismatch-1.1.1.dist-info/entry_points.txt +4 -0
  2038. vismatch-1.1.1.dist-info/licenses/LICENSE +28 -0
  2039. vismatch-1.1.1.dist-info/top_level.txt +4 -0
  2040. vismatch_extract.py +103 -0
  2041. vismatch_match.py +114 -0
  2042. vismatch_test.py +186 -0
@@ -0,0 +1,1072 @@
1
+ """
2
+ Utils for Common Transformer Blocks used in UniCeption
3
+ References:
4
+ HuggingFace PyTorch Image Models (Timm)
5
+ CroCoV2
6
+ """
7
+
8
+ import collections.abc
9
+ import math
10
+ from itertools import repeat
11
+ from typing import Callable, Optional
12
+
13
+ import torch
14
+ import torch.nn as nn
15
+ import torch.nn.functional as F
16
+ from torch.jit import Final
17
+
18
+ from uniception.models.utils.config import use_fused_attn
19
+
20
+ torch.backends.cuda.matmul.allow_tf32 = True
21
+
22
+
23
+ def _ntuple(n):
24
+ "Helper function to create n-tuple."
25
+
26
+ def parse(x):
27
+ if isinstance(x, collections.abc.Iterable) and not isinstance(x, str):
28
+ return x
29
+ return tuple(repeat(x, n))
30
+
31
+ return parse
32
+
33
+
34
+ to_2tuple = _ntuple(2)
35
+
36
+
37
def drop_path(x, drop_prob: float = 0.0, training: bool = False, scale_by_keep: bool = True):
    """Apply stochastic depth: zero whole samples of ``x`` with probability ``drop_prob``.

    Args:
        x: Input tensor; the first dimension is treated as the per-sample axis.
        drop_prob (float): Probability of dropping a sample (default: 0.)
        training (bool): When False the input is returned untouched (default: False)
        scale_by_keep (bool): Divide surviving samples by the keep probability (default: True)

    Returns:
        ``x`` itself when nothing is dropped, otherwise a new tensor of the same shape.
    """
    if not training or drop_prob == 0.0:
        return x

    survival = 1 - drop_prob
    # One Bernoulli draw per sample, broadcast over every remaining dimension.
    mask_shape = (x.shape[0], *([1] * (x.ndim - 1)))
    mask = x.new_empty(mask_shape).bernoulli_(survival)
    if scale_by_keep and survival > 0.0:
        mask.div_(survival)

    return x * mask
48
+
49
+
50
class DropPath(nn.Module):
    """Module wrapper around ``drop_path`` (stochastic depth applied per sample)."""

    def __init__(self, drop_prob: float = 0.0, scale_by_keep: bool = True):
        """Store the drop probability and whether surviving samples are rescaled."""
        super().__init__()
        self.drop_prob = drop_prob
        self.scale_by_keep = scale_by_keep

    def forward(self, x):
        """Apply ``drop_path`` using this module's settings and training flag."""
        return drop_path(x, self.drop_prob, self.training, self.scale_by_keep)

    def extra_repr(self):
        """Return the drop probability, rounded to three decimals, for ``repr``."""
        rounded = round(self.drop_prob, 3)
        return f"drop_prob={rounded:0.3f}"
63
+
64
+
65
class Mlp(nn.Module):
    """Two-layer feed-forward network: linear, activation, dropout, linear, dropout."""

    def __init__(self, in_features, hidden_features=None, out_features=None, act_layer=nn.GELU, bias=True, drop=0.0):
        """
        Initialize the MLP.

        Args:
            in_features: Width of the input features
            hidden_features: Width of the hidden layer (falls back to in_features when falsy)
            out_features: Width of the output (falls back to in_features when falsy)
            act_layer: Callable that builds the activation module (default: nn.GELU)
            bias: Bias setting for the linear layers; a single value is used for both,
                an indexable pair supplies one value per layer (default: True)
            drop: Dropout probability, given once or as one value per layer (default: 0.)
        """
        super().__init__()
        hidden_width = hidden_features or in_features
        output_width = out_features or in_features
        # Expand single settings so each linear/dropout pair has its own entry.
        layer_bias = to_2tuple(bias)
        layer_drop = to_2tuple(drop)

        self.fc1 = nn.Linear(in_features, hidden_width, bias=layer_bias[0])
        self.act = act_layer()
        self.drop1 = nn.Dropout(layer_drop[0])
        self.fc2 = nn.Linear(hidden_width, output_width, bias=layer_bias[1])
        self.drop2 = nn.Dropout(layer_drop[1])

    def forward(self, x):
        """Run the input through fc1, activation, dropout, fc2 and dropout, in that order."""
        hidden = self.drop1(self.act(self.fc1(x)))
        return self.drop2(self.fc2(hidden))
89
+
90
+
91
class Attention(nn.Module):
    """Multi-head self-attention with optional latent width, QK normalization and query rescaling."""

    fused_attn: Final[bool]

    def __init__(
        self,
        dim: int,
        latent_attn_dim: Optional[int] = None,
        num_heads: int = 8,
        qkv_bias: bool = False,
        qk_norm: bool = False,
        attn_drop: float = 0.0,
        proj_drop: float = 0.0,
        norm_layer: nn.Module = nn.LayerNorm,
        custom_positional_encoding: Callable = None,
        use_scalable_softmax: bool = False,
        use_entropy_scaling: bool = False,
        base_token_count_for_entropy_scaling: int = 444,
        entropy_scaling_growth_factor: float = 1.4,
    ):
        """
        Initialize the Attention layer.

        Args:
            dim (int): Dimension of input features
            latent_attn_dim (int): Width of the attention space; when given, q/k/v are projected
                to this width instead of ``dim`` and projected back afterwards (default: None)
            num_heads (int): Number of attention heads (default: 8)
            qkv_bias (bool): Whether to include bias in qkv projection (default: False)
            qk_norm (bool): Whether to normalize q and k per head (default: False)
            attn_drop (float): Dropout rate for attention weights (default: 0.)
            proj_drop (float): Dropout rate for output (default: 0.)
            norm_layer (nn.Module): Normalization layer used for q/k norm (default: nn.LayerNorm)
            custom_positional_encoding (Callable): Called as ``fn(tensor, positions)`` on q and k (default: None)
            use_scalable_softmax (bool): Multiply q by log(token count) (default: False)
            use_entropy_scaling (bool): Multiply q by the entropy scaling factor (default: False)
            base_token_count_for_entropy_scaling (int): Base token count for entropy scaling (default: 444)
                Computed using (518, 168) as base resolution with 14 patch size
            entropy_scaling_growth_factor (float): Growth factor for entropy scaling (default: 1.4)
        """
        super().__init__()

        self.latent_attn = latent_attn_dim is not None
        if self.latent_attn:
            assert latent_attn_dim % num_heads == 0, "latent_attn_dim should be divisible by num_heads"
            self.latent_attn_dim = latent_attn_dim
        else:
            assert dim % num_heads == 0, "dim should be divisible by num_heads"

        # Width in which attention is computed: the latent width if given, else the input width.
        attn_width = latent_attn_dim if self.latent_attn else dim

        self.num_heads = num_heads
        self.head_dim = attn_width // num_heads
        self.scale = self.head_dim**-0.5
        self.fused_attn = use_fused_attn()

        self.qkv = nn.Linear(dim, attn_width * 3, bias=qkv_bias)
        if qk_norm:
            self.q_norm = norm_layer(self.head_dim)
            self.k_norm = norm_layer(self.head_dim)
        else:
            self.q_norm = nn.Identity()
            self.k_norm = nn.Identity()
        self.attn_drop = nn.Dropout(attn_drop)
        self.proj = nn.Linear(attn_width, dim)
        self.proj_drop = nn.Dropout(proj_drop)

        self.custom_positional_encoding = custom_positional_encoding
        self.use_scalable_softmax = use_scalable_softmax
        self.use_entropy_scaling = use_entropy_scaling
        self.base_token_count_for_entropy_scaling = base_token_count_for_entropy_scaling
        self.entropy_scaling_growth_factor = entropy_scaling_growth_factor

    def forward(self, x: torch.Tensor, xpos: torch.Tensor = None) -> torch.Tensor:
        """
        Forward pass of the Attention layer.

        Args:
            x (torch.Tensor): Input features, unpacked as (batch, tokens, channels)
            xpos (torch.Tensor): Positions of tokens (required when using custom positional encoding)

        Returns:
            torch.Tensor: Output of the final projection, one row per input token
        """
        batch, tokens, _ = x.shape
        packed = self.qkv(x).reshape(batch, tokens, 3, self.num_heads, self.head_dim)
        # Bring the q/k/v axis to the front, then heads ahead of tokens.
        q, k, v = packed.permute(2, 0, 3, 1, 4).unbind(0)
        q = self.q_norm(q)
        k = self.k_norm(k)

        if self.custom_positional_encoding is not None:
            assert (
                xpos is not None
            ), "Positions of tokens (xpos) are a required input when using custom positional encoding"
            q = self.custom_positional_encoding(q, xpos)
            k = self.custom_positional_encoding(k, xpos)

        if self.use_scalable_softmax:
            # Scales the exponential base using the number of tokens (https://arxiv.org/pdf/2501.19399)
            q = q * torch.log(torch.tensor(tokens, device=q.device))

        if self.use_entropy_scaling:
            # Scales the exponential base using the number of tokens (https://arxiv.org/pdf/2502.07785#page=7.35)
            log_tokens = torch.log(torch.tensor(tokens, device=q.device))
            log_base = torch.log(torch.tensor(self.base_token_count_for_entropy_scaling, device=q.device))
            q = q * torch.sqrt((self.entropy_scaling_growth_factor * log_tokens) / log_base)

        if not self.fused_attn:
            # Explicit path: scaled dot product, softmax over the last axis, dropout, weighted sum.
            weights = (q * self.scale) @ k.transpose(-2, -1)
            weights = self.attn_drop(weights.softmax(dim=-1))
            x = weights @ v
        else:
            # Fused kernel; dropout is only active in training mode.
            x = F.scaled_dot_product_attention(
                q, k, v, dropout_p=(self.attn_drop.p if self.training else 0.0), scale=self.scale
            )

        # Merge the heads back into a single feature axis before the output projection.
        x = x.transpose(1, 2).reshape(batch, tokens, -1)
        return self.proj_drop(self.proj(x))
213
+
214
+
215
class CrossAttention(nn.Module):
    """Multi-head cross-attention with separate query, key and value projections."""

    fused_attn: Final[bool]

    def __init__(
        self,
        dim: int,
        num_heads: int = 8,
        qkv_bias: bool = False,
        qk_norm: bool = False,
        attn_drop: float = 0.0,
        proj_drop: float = 0.0,
        norm_layer: nn.Module = nn.LayerNorm,
        custom_positional_encoding: Callable = None,
        use_scalable_softmax: bool = False,
        use_entropy_scaling: bool = False,
        base_token_count_for_entropy_scaling: int = 444,
        entropy_scaling_growth_factor: float = 1.4,
    ):
        """
        Initialize the Cross-Attention layer.

        Args:
            dim (int): Dimension of input features
            num_heads (int): Number of attention heads (default: 8)
            qkv_bias (bool): Whether to include bias in the q, k and v projections (default: False)
            qk_norm (bool): Whether to normalize q and k per head (default: False)
            attn_drop (float): Dropout rate for attention weights (default: 0.)
            proj_drop (float): Dropout rate for output (default: 0.)
            norm_layer (nn.Module): Normalization layer used for q/k norm (default: nn.LayerNorm)
            custom_positional_encoding (Callable): Called as ``fn(tensor, positions)`` on q and k (default: None)
            use_scalable_softmax (bool): Multiply q by log(query count) (default: False)
            use_entropy_scaling (bool): Multiply q by the entropy scaling factor (default: False)
            base_token_count_for_entropy_scaling (int): Base token count for entropy scaling (default: 444)
                Computed using (518, 168) as base resolution with 14 patch size
            entropy_scaling_growth_factor (float): Growth factor for entropy scaling (default: 1.4)
        """
        super().__init__()
        assert dim % num_heads == 0, "dim should be divisible by num_heads"
        per_head = dim // num_heads
        self.num_heads = num_heads
        self.head_dim = per_head
        self.scale = per_head**-0.5
        self.fused_attn = use_fused_attn()

        self.projq = nn.Linear(dim, dim, bias=qkv_bias)
        self.projk = nn.Linear(dim, dim, bias=qkv_bias)
        self.projv = nn.Linear(dim, dim, bias=qkv_bias)
        if qk_norm:
            self.q_norm = norm_layer(per_head)
            self.k_norm = norm_layer(per_head)
        else:
            self.q_norm = nn.Identity()
            self.k_norm = nn.Identity()
        self.attn_drop = nn.Dropout(attn_drop)
        self.proj = nn.Linear(dim, dim)
        self.proj_drop = nn.Dropout(proj_drop)

        self.custom_positional_encoding = custom_positional_encoding
        self.use_scalable_softmax = use_scalable_softmax
        self.use_entropy_scaling = use_entropy_scaling
        self.base_token_count_for_entropy_scaling = base_token_count_for_entropy_scaling
        self.entropy_scaling_growth_factor = entropy_scaling_growth_factor

    def forward(
        self,
        query: torch.Tensor,
        key: torch.Tensor,
        value: torch.Tensor,
        qpos: torch.Tensor = None,
        kpos: torch.Tensor = None,
    ) -> torch.Tensor:
        """
        Forward pass of the Cross-Attention layer.

        Args:
            query (torch.Tensor): Query features, unpacked as (batch, queries, channels)
            key (torch.Tensor): Key features
            value (torch.Tensor): Value features
            qpos (torch.Tensor): Positions of queries (required when using custom positional encoding)
            kpos (torch.Tensor): Positions of keys (required when using custom positional encoding)

        Returns:
            torch.Tensor: Output features with the same shape as ``query``
        """
        batch, num_queries, channels = query.shape

        def split_heads(projected: torch.Tensor, length: int) -> torch.Tensor:
            # (batch, length, channels) -> (batch, heads, length, head_dim)
            return projected.reshape(batch, length, self.num_heads, self.head_dim).permute(0, 2, 1, 3)

        q = split_heads(self.projq(query), num_queries)
        k = split_heads(self.projk(key), key.shape[1])
        v = split_heads(self.projv(value), value.shape[1])
        q = self.q_norm(q)
        k = self.k_norm(k)

        if self.custom_positional_encoding is not None:
            assert (
                qpos is not None
            ), "Positions of queries (qpos) are a required input when using custom positional encoding"
            assert (
                kpos is not None
            ), "Positions of keys (kpos) are a required input when using custom positional encoding"
            q = self.custom_positional_encoding(q, qpos)
            k = self.custom_positional_encoding(k, kpos)

        # NOTE(review): both rescalings below use the number of queries, while the softmax
        # normalizes over the key axis - confirm that this is the intended token count.
        if self.use_scalable_softmax:
            # Scales the exponential base using the number of tokens (https://arxiv.org/pdf/2501.19399)
            q = q * torch.log(torch.tensor(num_queries, device=q.device))

        if self.use_entropy_scaling:
            # Scales the exponential base using the number of tokens (https://arxiv.org/pdf/2502.07785#page=7.35)
            log_tokens = torch.log(torch.tensor(num_queries, device=q.device))
            log_base = torch.log(torch.tensor(self.base_token_count_for_entropy_scaling, device=q.device))
            q = q * torch.sqrt((self.entropy_scaling_growth_factor * log_tokens) / log_base)

        if not self.fused_attn:
            # Explicit path: scaled dot product, softmax over the last axis, dropout, weighted sum.
            weights = (q * self.scale) @ k.transpose(-2, -1)
            weights = self.attn_drop(weights.softmax(dim=-1))
            x = weights @ v
        else:
            # Fused kernel; dropout is only active in training mode.
            x = F.scaled_dot_product_attention(
                q, k, v, dropout_p=(self.attn_drop.p if self.training else 0.0), scale=self.scale
            )

        # Merge the heads back into the channel axis before the output projection.
        x = x.transpose(1, 2).reshape(batch, num_queries, channels)
        return self.proj_drop(self.proj(x))
342
+
343
+
344
class LayerScale(nn.Module):
    """Learnable per-channel scaling of the input features."""

    def __init__(
        self,
        dim: int,
        init_values: float = 1e-5,
        inplace: bool = False,
    ):
        """
        Initialize the Layer Scale layer

        Args:
            dim (int): Dimension of input features
            init_values (float): Initial value for every entry of gamma (default: 1e-5)
            inplace (bool): Whether to scale the input tensor in place (default: False)
        """
        super().__init__()
        self.inplace = inplace
        self.gamma = nn.Parameter(init_values * torch.ones(dim))

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Multiply ``x`` by gamma, overwriting ``x`` itself when ``inplace`` is set."""
        if self.inplace:
            return x.mul_(self.gamma)
        return x * self.gamma
368
+
369
+
370
class SelfAttentionBlock(nn.Module):
    """Pre-norm transformer block: a self-attention residual branch followed by an MLP residual branch."""

    def __init__(
        self,
        dim: int,
        num_heads: int,
        latent_attn_dim: Optional[int] = None,
        mlp_ratio: float = 4.0,
        qkv_bias: bool = False,
        qk_norm: bool = False,
        proj_drop: float = 0.0,
        attn_drop: float = 0.0,
        init_values: Optional[float] = None,
        drop_path: float = 0.0,
        act_layer: nn.Module = nn.GELU,
        norm_layer: nn.Module = nn.LayerNorm,
        mlp_layer: nn.Module = Mlp,
        custom_positional_encoding: Callable = None,
        use_scalable_softmax: bool = False,
        use_entropy_scaling: bool = False,
        base_token_count_for_entropy_scaling: int = 444,
        entropy_scaling_growth_factor: float = 1.4,
    ):
        """
        Initialize the Self-Attention Block.

        Args:
            dim (int): Dimension of input features
            num_heads (int): Number of attention heads
            latent_attn_dim (int): Latent attention width forwarded to the attention layer (default: None)
            mlp_ratio (float): Ratio of hidden to input dimension in MLP (default: 4.)
            qkv_bias (bool): Whether to include bias in qkv projection (default: False)
            qk_norm (bool): Whether to normalize q and k (default: False)
            proj_drop (float): Dropout rate for the attention output and inside the MLP (default: 0.)
            attn_drop (float): Dropout rate for attention weights (default: 0.)
            init_values (float): Initial value for LayerScale gamma; a falsy value disables
                LayerScale (default: None)
            drop_path (float): Dropout rate for stochastic depth (default: 0.)
            act_layer (nn.Module): Activation layer (default: nn.GELU)
            norm_layer (nn.Module): Normalization layer (default: nn.LayerNorm)
            mlp_layer (nn.Module): MLP layer (default: Mlp)
            custom_positional_encoding (Callable): Custom positional encoding function (default: None)
            use_scalable_softmax (bool): Whether to use scalable softmax (default: False)
            use_entropy_scaling (bool): Whether to use entropy scaling (default: False)
            base_token_count_for_entropy_scaling (int): Base token count for entropy scaling (default: 444)
                Computed using (518, 168) as base resolution with 14 patch size
            entropy_scaling_growth_factor (float): Growth factor for entropy scaling (default: 1.4)
        """
        super().__init__()

        def build_layer_scale():
            # LayerScale is only inserted when a truthy initial value is supplied.
            return LayerScale(dim, init_values=init_values) if init_values else nn.Identity()

        def build_drop_path():
            # Stochastic depth is only inserted for a positive drop rate.
            return DropPath(drop_path) if drop_path > 0.0 else nn.Identity()

        # Attention branch.
        self.norm1 = norm_layer(dim)
        self.attn = Attention(
            dim,
            latent_attn_dim=latent_attn_dim,
            num_heads=num_heads,
            qkv_bias=qkv_bias,
            qk_norm=qk_norm,
            attn_drop=attn_drop,
            proj_drop=proj_drop,
            norm_layer=norm_layer,
            custom_positional_encoding=custom_positional_encoding,
            use_scalable_softmax=use_scalable_softmax,
            use_entropy_scaling=use_entropy_scaling,
            base_token_count_for_entropy_scaling=base_token_count_for_entropy_scaling,
            entropy_scaling_growth_factor=entropy_scaling_growth_factor,
        )
        self.ls1 = build_layer_scale()
        self.drop_path1 = build_drop_path()

        # Feed-forward branch.
        self.norm2 = norm_layer(dim)
        self.mlp = mlp_layer(
            in_features=dim,
            hidden_features=int(dim * mlp_ratio),
            act_layer=act_layer,
            drop=proj_drop,
        )
        self.ls2 = build_layer_scale()
        self.drop_path2 = build_drop_path()

        self.custom_positional_encoding = custom_positional_encoding

    def forward(self, x: torch.Tensor, xpos: torch.Tensor = None) -> torch.Tensor:
        """
        Forward pass of the Self-Attention Block.

        Args:
            x (torch.Tensor): Input features
            xpos (torch.Tensor): Positions of tokens (required when using custom positional encoding)

        Returns:
            torch.Tensor: Output features of same shape as input
        """
        if self.custom_positional_encoding is not None:
            assert (
                xpos is not None
            ), "Positions of tokens (xpos) are a required input when using custom positional encoding"

        # Residual attention branch on the normalized input.
        attended = self.attn(self.norm1(x), xpos)
        x = x + self.drop_path1(self.ls1(attended))

        # Residual feed-forward branch on the normalized result.
        transformed = self.mlp(self.norm2(x))
        return x + self.drop_path2(self.ls2(transformed))
470
+
471
+
472
+ class CrossAttentionBlock(nn.Module):
473
+ "Cross-Attention Block"
474
+
475
+ def __init__(
476
+ self,
477
+ dim: int,
478
+ num_heads: int,
479
+ mlp_ratio: float = 4.0,
480
+ qkv_bias: bool = False,
481
+ qk_norm: bool = False,
482
+ proj_drop: float = 0.0,
483
+ attn_drop: float = 0.0,
484
+ init_values: Optional[float] = None,
485
+ drop_path: float = 0.0,
486
+ act_layer: nn.Module = nn.GELU,
487
+ norm_layer: nn.Module = nn.LayerNorm,
488
+ mlp_layer: nn.Module = Mlp,
489
+ custom_positional_encoding: Callable = None,
490
+ norm_cross_tokens: bool = True,
491
+ use_scalable_softmax: bool = False,
492
+ use_entropy_scaling: bool = False,
493
+ base_token_count_for_entropy_scaling: int = 444,
494
+ entropy_scaling_growth_factor: float = 1.4,
495
+ ):
496
+ """
497
+ Initialize the Cross-Attention Block.
498
+
499
+ Args:
500
+ dim (int): Dimension of input features
501
+ num_heads (int): Number of attention heads
502
+ mlp_ratio (float): Ratio of hidden to input dimension in MLP (default: 4.)
503
+ qkv_bias (bool): Whether to include bias in qkv projection (default: False)
504
+ qk_norm (bool): Whether to normalize q and k (default: False)
505
+ proj_drop (float): Dropout rate for output (default: 0.)
506
+ attn_drop (float): Dropout rate for attention weights (default: 0.)
507
+ init_values (float): Initial value for LayerScale gamma (default: None)
508
+ drop_path (float): Dropout rate for stochastic depth (default: 0.)
509
+ act_layer (nn.Module): Activation layer (default: nn.GELU)
510
+ norm_layer (nn.Module): Normalization layer (default: nn.LayerNorm)
511
+ mlp_layer (nn.Module): MLP layer (default: Mlp)
512
+ custom_positional_encoding (Callable): Custom positional encoding function (default: None)
513
+ norm_cross_tokens (bool): Whether to normalize cross tokens (default: True)
514
+ use_scalable_softmax (bool): Whether to use scalable softmax (default: False)
515
+ use_entropy_scaling (bool): Whether to use entropy scaling (default: False)
516
+ base_token_count_for_entropy_scaling (int): Base token count for entropy scaling (default: 444)
517
+ Computed using (518, 168) as base resolution with 14 patch size
518
+ entropy_scaling_growth_factor (float): Growth factor for entropy scaling (default: 1.4)
519
+
520
+ Returns:
521
+ torch.Tensor: Output features of same shape as input
522
+ """
523
+ super().__init__()
524
+ self.norm1 = norm_layer(dim)
525
+ self.attn = Attention(
526
+ dim,
527
+ num_heads=num_heads,
528
+ qkv_bias=qkv_bias,
529
+ qk_norm=qk_norm,
530
+ attn_drop=attn_drop,
531
+ proj_drop=proj_drop,
532
+ norm_layer=norm_layer,
533
+ custom_positional_encoding=custom_positional_encoding,
534
+ use_scalable_softmax=use_scalable_softmax,
535
+ use_entropy_scaling=use_entropy_scaling,
536
+ base_token_count_for_entropy_scaling=base_token_count_for_entropy_scaling,
537
+ entropy_scaling_growth_factor=entropy_scaling_growth_factor,
538
+ )
539
+ self.ls1 = LayerScale(dim, init_values=init_values) if init_values else nn.Identity()
540
+ self.drop_path1 = DropPath(drop_path) if drop_path > 0.0 else nn.Identity()
541
+
542
+ self.norm_y = norm_layer(dim) if norm_cross_tokens else nn.Identity()
543
+ self.custom_positional_encoding = custom_positional_encoding
544
+ self.norm2 = norm_layer(dim)
545
+ self.cross_attn = CrossAttention(
546
+ dim,
547
+ num_heads=num_heads,
548
+ qkv_bias=qkv_bias,
549
+ qk_norm=qk_norm,
550
+ attn_drop=attn_drop,
551
+ proj_drop=proj_drop,
552
+ norm_layer=norm_layer,
553
+ custom_positional_encoding=custom_positional_encoding,
554
+ use_scalable_softmax=use_scalable_softmax,
555
+ use_entropy_scaling=use_entropy_scaling,
556
+ base_token_count_for_entropy_scaling=base_token_count_for_entropy_scaling,
557
+ entropy_scaling_growth_factor=entropy_scaling_growth_factor,
558
+ )
559
+ self.ls2 = LayerScale(dim, init_values=init_values) if init_values else nn.Identity()
560
+ self.drop_path2 = DropPath(drop_path) if drop_path > 0.0 else nn.Identity()
561
+
562
+ self.norm3 = norm_layer(dim)
563
+ self.mlp = mlp_layer(
564
+ in_features=dim,
565
+ hidden_features=int(dim * mlp_ratio),
566
+ act_layer=act_layer,
567
+ drop=proj_drop,
568
+ )
569
+ self.ls3 = LayerScale(dim, init_values=init_values) if init_values else nn.Identity()
570
+ self.drop_path3 = DropPath(drop_path) if drop_path > 0.0 else nn.Identity()
571
+
572
def forward(
    self,
    x: torch.Tensor,
    y: torch.Tensor,
    xpos: torch.Tensor = None,
    ypos: torch.Tensor = None,
) -> torch.Tensor:
    """
    Apply self-attention, cross-attention and the MLP, each as a residual update of x.

    Args:
        x (torch.Tensor): Input features
        y (torch.Tensor): Cross features; after norm_y they serve as both key and value
        xpos (torch.Tensor): Positions of tokens (required when using custom positional encoding)
        ypos (torch.Tensor): Positions of cross tokens (required when using custom positional encoding)

    Returns:
        torch.Tensor: x after the three residual updates

    Raises:
        AssertionError: If a custom positional encoding is configured and xpos or ypos is None
    """
    needs_positions = self.custom_positional_encoding is not None
    if needs_positions:
        assert (
            xpos is not None
        ), "Positions of tokens (xpos) are a required input when using custom positional encoding"
        assert (
            ypos is not None
        ), "Positions of cross tokens (ypos) are a required input when using custom positional encoding"

    # 1) Self-attention over the tokens of x.
    self_attended = self.attn(self.norm1(x), xpos)
    x = x + self.drop_path1(self.ls1(self_attended))

    # 2) Cross-attention: queries from x, keys and values from the normalized cross tokens.
    cross_tokens = self.norm_y(y)
    cross_attended = self.cross_attn(self.norm2(x), cross_tokens, cross_tokens, xpos, ypos)
    x = x + self.drop_path2(self.ls2(cross_attended))

    # 3) Token-wise MLP.
    mlp_out = self.mlp(self.norm3(x))
    x = x + self.drop_path3(self.ls3(mlp_out))
    return x
603
+
604
+
605
def dummy_positional_encoding(x, xpos):
    """Placeholder positional encoding: return x unchanged and ignore xpos.

    It has the same (features, positions) call signature that the attention
    layers use for custom_positional_encoding, so it can stand in for a real
    encoding in smoke tests.
    """
    return x
610
+
611
+
612
+ # Copied from DiffTransformer
613
class RMSNorm(nn.Module):
    """Root-mean-square normalization over the last dimension.

    Args:
        dim (int): Size of the learnable per-feature scale
        eps (float): Constant added to the mean square before the reciprocal square root
        elementwise_affine (bool): If True, learn a scale initialised to ones; otherwise
            `weight` is registered as None and no scale is applied
        memory_efficient (bool): Accepted but not used by this implementation
    """

    def __init__(self, dim: int, eps: float = 1e-6, elementwise_affine=True, memory_efficient=False):
        super().__init__()
        self.dim = dim
        self.eps = eps
        self.elementwise_affine = elementwise_affine
        # Register "weight" either way so `self.weight` always exists (possibly as None).
        scale = nn.Parameter(torch.ones(dim)) if elementwise_affine else None
        self.register_parameter("weight", scale)

    def _norm(self, x):
        """Divide x by the root of its mean square along the last dimension."""
        mean_square = x.pow(2).mean(-1, keepdim=True)
        return x * torch.rsqrt(mean_square + self.eps)

    def forward(self, x):
        """Normalize in float32, cast back to the dtype of x, then apply the optional scale."""
        normalized = self._norm(x.float()).type_as(x)
        if self.weight is None:
            return normalized
        return normalized * self.weight

    def extra_repr(self) -> str:
        return f"dim={self.dim}, eps={self.eps}, elementwise_affine={self.elementwise_affine}"
635
+
636
+
637
def lambda_init_fn(depth):
    """Return the depth-dependent lambda initial value, 0.8 - 0.6 * exp(-0.3 * depth).

    Copied from DiffTransformer. The value is 0.2 (up to float rounding) at
    depth 0 and approaches 0.8 as depth grows.
    """
    decay = math.exp(-0.3 * depth)
    return 0.8 - 0.6 * decay
639
+
640
+
641
class DiffAttention(nn.Module):
    """Differential Self-Attention Layer, following https://arxiv.org/abs/2410.05258.

    Queries and keys are split into two groups of `num_heads` heads of size
    `head_dim` each; both groups attend over the same values (heads of size
    `2 * head_dim`). The layer outputs the first attention result minus a
    learned scalar lambda times the second, normalized per head with RMSNorm.
    """

    fused_attn: Final[bool]

    def __init__(
        self,
        dim: int,
        depth: int,
        num_heads: int = 8,
        qkv_bias: bool = False,
        qk_norm: bool = False,
        attn_drop: float = 0.0,
        proj_drop: float = 0.0,
        norm_layer: nn.Module = nn.LayerNorm,
        custom_positional_encoding: Callable = None,
    ):
        """
        Initialize the DiffAttention layer.

        Args:
            dim (int): Dimension of input features; must be divisible by 2 * num_heads
            depth (int): Depth of the current layer, used in lambda initialization
            num_heads (int): Number of attention heads (default: 8)
            qkv_bias (bool): Whether to include bias in qkv projection (default: False)
            qk_norm (bool): Whether to normalize q and k (default: False)
            attn_drop (float): Dropout rate for attention weights (default: 0.)
            proj_drop (float): Dropout rate for output (default: 0.)
            norm_layer (nn.Module): Normalization layer (default: nn.LayerNorm)
            custom_positional_encoding (Callable): Custom positional encoding function (default: None)
        """
        super().__init__()
        assert dim % num_heads == 0, "dim should be divisible by num_heads"
        # head_dim is half of dim // num_heads; an odd per-head width would make the
        # (B, N, 3, num_heads, 2 * head_dim) reshape in forward() impossible, so fail early.
        assert dim % (2 * num_heads) == 0, "dim should be divisible by 2 * num_heads for differential attention"
        self.num_heads = num_heads
        self.head_dim = dim // num_heads // 2
        self.scale = self.head_dim**-0.5
        self.fused_attn = use_fused_attn()

        self.qkv = nn.Linear(dim, dim * 3, bias=qkv_bias)
        self.q_norm = norm_layer(self.head_dim) if qk_norm else nn.Identity()
        self.k_norm = norm_layer(self.head_dim) if qk_norm else nn.Identity()
        self.attn_drop = nn.Dropout(attn_drop)
        self.proj = nn.Linear(dim, dim)
        self.proj_drop = nn.Dropout(proj_drop)

        self.custom_positional_encoding = custom_positional_encoding

        # DiffTransformer specific: lambda is re-parameterized through four learned vectors.
        self.lambda_init = lambda_init_fn(depth)
        self.lambda_q1 = nn.Parameter(torch.zeros(self.head_dim, dtype=torch.float32).normal_(mean=0, std=0.1))
        self.lambda_k1 = nn.Parameter(torch.zeros(self.head_dim, dtype=torch.float32).normal_(mean=0, std=0.1))
        self.lambda_q2 = nn.Parameter(torch.zeros(self.head_dim, dtype=torch.float32).normal_(mean=0, std=0.1))
        self.lambda_k2 = nn.Parameter(torch.zeros(self.head_dim, dtype=torch.float32).normal_(mean=0, std=0.1))

        self.subln = RMSNorm(2 * self.head_dim, eps=1e-5, elementwise_affine=True)

    def forward(self, x: torch.Tensor, xpos: torch.Tensor = None) -> torch.Tensor:
        """
        Forward pass of the differential self-attention layer.

        Args:
            x (torch.Tensor): Input features of shape (B, N, C)
            xpos (torch.Tensor): Positions of tokens (required when using custom positional encoding)

        Returns:
            torch.Tensor: Output features of same shape as input

        Note:
            The per-head outputs are transposed to (B, N, heads, 2 * head_dim) before being
            flattened, matching DiffCrossAttention. Earlier revisions flattened the
            (B, heads, N, 2 * head_dim) tensor directly, which mixed features across tokens;
            weights trained against that layout will not reproduce their old outputs.
        """
        B, N, _ = x.shape
        qkv = self.qkv(x).reshape(B, N, 3, self.num_heads, self.head_dim * 2)
        q, k, v = torch.chunk(qkv, 3, dim=2)  # each: B, N, 1, Nh, 2 * Dh

        # q/k: 2 * Nh heads of width Dh; v: Nh heads of width 2 * Dh. All become (B, heads, N, width).
        q = q.view(B, N, 2 * self.num_heads, self.head_dim).permute(0, 2, 1, 3)
        k = k.view(B, N, 2 * self.num_heads, self.head_dim).permute(0, 2, 1, 3)
        v = v.view(B, N, self.num_heads, 2 * self.head_dim).permute(0, 2, 1, 3)

        q, k = self.q_norm(q), self.k_norm(k)

        if self.custom_positional_encoding is not None:
            assert (
                xpos is not None
            ), "Positions of tokens (xpos) are a required input when using custom positional encoding"
            q = self.custom_positional_encoding(q, xpos)
            k = self.custom_positional_encoding(k, xpos)

        q1, q2 = q.chunk(2, dim=1)  # split heads dimension into two
        k1, k2 = k.chunk(2, dim=1)  # split heads dimension into two

        if self.fused_attn:
            attn1 = F.scaled_dot_product_attention(
                q1, k1, v, dropout_p=(self.attn_drop.p if self.training else 0.0), scale=self.scale
            )
            attn2 = F.scaled_dot_product_attention(
                q2, k2, v, dropout_p=(self.attn_drop.p if self.training else 0.0), scale=self.scale
            )
        else:
            q1 = q1 * self.scale
            attn = q1 @ k1.transpose(-2, -1)
            attn = attn.softmax(dim=-1)
            attn = self.attn_drop(attn)
            attn1 = attn @ v

            q2 = q2 * self.scale
            attn = q2 @ k2.transpose(-2, -1)
            attn = attn.softmax(dim=-1)
            attn = self.attn_drop(attn)
            attn2 = attn @ v

        # (B, Nh, N, 2 * Dh) -> (B, N, Nh, 2 * Dh): put tokens before heads so that the
        # final reshape concatenates the heads of each token instead of interleaving tokens.
        attn1 = attn1.transpose(1, 2)
        attn2 = attn2.transpose(1, 2)

        lambda_1 = torch.exp(torch.sum(self.lambda_q1 * self.lambda_k1, dim=-1).float()).type_as(q)
        lambda_2 = torch.exp(torch.sum(self.lambda_q2 * self.lambda_k2, dim=-1).float()).type_as(q)
        lambda_full = lambda_1 - lambda_2 + self.lambda_init
        attn = attn1 - lambda_full * attn2

        # Per-head RMSNorm over the 2 * Dh features, then the fixed (1 - lambda_init) rescale.
        attn = self.subln(attn)
        attn = attn * (1 - self.lambda_init)
        attn = attn.reshape(B, N, self.num_heads * 2 * self.head_dim)

        x = self.proj(attn)
        x = self.proj_drop(x)
        return x
760
+
761
+
762
class DiffCrossAttention(nn.Module):
    """Differential Cross-Attention Layer, following https://arxiv.org/abs/2410.05258.

    Queries and keys are projected into two groups of `num_heads` heads of size
    `head_dim`; both groups attend over the same values (heads of size
    `2 * head_dim`). The output is the first attention result minus a learned
    scalar lambda times the second, normalized per head with RMSNorm.
    """

    fused_attn: Final[bool]

    def __init__(
        self,
        dim: int,
        depth: int,
        num_heads: int = 8,
        qkv_bias: bool = False,
        qk_norm: bool = False,
        attn_drop: float = 0.0,
        proj_drop: float = 0.0,
        norm_layer: nn.Module = nn.LayerNorm,
        custom_positional_encoding: Callable = None,
    ):
        """
        Initialize the differential Cross-Attention layer.

        Args:
            dim (int): Dimension of input features
            depth (int): Depth of the current layer, used in lambda initialization
            num_heads (int): Number of attention heads (default: 8)
            qkv_bias (bool): Whether to include bias in the q/k/v projections (default: False)
            qk_norm (bool): Whether to normalize q and k (default: False)
            attn_drop (float): Dropout rate for attention weights (default: 0.)
            proj_drop (float): Dropout rate for output (default: 0.)
            norm_layer (nn.Module): Normalization layer (default: nn.LayerNorm)
            custom_positional_encoding (Callable): Custom positional encoding function (default: None)
        """
        super().__init__()
        assert dim % num_heads == 0, "dim should be divisible by num_heads"
        self.num_heads = num_heads
        self.head_dim = dim // num_heads // 2
        self.scale = self.head_dim**-0.5
        self.fused_attn = use_fused_attn()

        # Separate projections because queries and keys/values come from different inputs.
        self.projq = nn.Linear(dim, dim, bias=qkv_bias)
        self.projk = nn.Linear(dim, dim, bias=qkv_bias)
        self.projv = nn.Linear(dim, dim, bias=qkv_bias)
        if qk_norm:
            self.q_norm = norm_layer(self.head_dim)
            self.k_norm = norm_layer(self.head_dim)
        else:
            self.q_norm = nn.Identity()
            self.k_norm = nn.Identity()
        self.attn_drop = nn.Dropout(attn_drop)
        self.proj = nn.Linear(dim, dim)
        self.proj_drop = nn.Dropout(proj_drop)

        # DiffTransformer specific: lambda is re-parameterized through four learned vectors.
        # This uses the module-level lambda_init_fn, not the method of the same name below.
        self.lambda_init = lambda_init_fn(depth)
        for param_name in ("lambda_q1", "lambda_k1", "lambda_q2", "lambda_k2"):
            initial = torch.zeros(self.head_dim, dtype=torch.float32).normal_(mean=0, std=0.1)
            setattr(self, param_name, nn.Parameter(initial))

        self.subln = RMSNorm(2 * self.head_dim, eps=1e-5, elementwise_affine=True)

        self.custom_positional_encoding = custom_positional_encoding

    def lambda_init_fn(self, depth):
        """Return 0.8 - 0.6 * exp(-0.3 * depth) (copied from DiffTransformer)."""
        return 0.8 - 0.6 * math.exp(-0.3 * depth)

    def _attend(self, q: torch.Tensor, k: torch.Tensor, v: torch.Tensor) -> torch.Tensor:
        """Scaled dot-product attention for one query/key group, fused when available."""
        if self.fused_attn:
            return F.scaled_dot_product_attention(
                q, k, v, dropout_p=(self.attn_drop.p if self.training else 0.0), scale=self.scale
            )
        weights = (q * self.scale) @ k.transpose(-2, -1)
        weights = self.attn_drop(weights.softmax(dim=-1))
        return weights @ v

    def forward(
        self,
        query: torch.Tensor,
        key: torch.Tensor,
        value: torch.Tensor,
        qpos: torch.Tensor = None,
        kpos: torch.Tensor = None,
    ) -> torch.Tensor:
        """
        Forward pass of the differential Cross-Attention layer.

        Args:
            query (torch.Tensor): Query features of shape (B, Nq, C)
            key (torch.Tensor): Key features
            value (torch.Tensor): Value features
            qpos (torch.Tensor): Positions of queries (required when using custom positional encoding)
            kpos (torch.Tensor): Positions of keys (required when using custom positional encoding)

        Returns:
            torch.Tensor: Output features of same shape as the query input
        """
        batch, n_query, _ = query.shape
        n_key = key.shape[1]
        n_value = value.shape[1]
        heads, width = self.num_heads, self.head_dim

        # q/k: 2 * heads of size `width`; v: `heads` of size 2 * width. All become (B, heads, N, size).
        q = self.projq(query).reshape(batch, n_query, 2 * heads, width).permute(0, 2, 1, 3)
        k = self.projk(key).reshape(batch, n_key, 2 * heads, width).permute(0, 2, 1, 3)
        v = self.projv(value).reshape(batch, n_value, heads, 2 * width).permute(0, 2, 1, 3)
        q = self.q_norm(q)
        k = self.k_norm(k)

        if self.custom_positional_encoding is not None:
            assert (
                qpos is not None
            ), "Positions of queries (qpos) are a required input when using custom positional encoding"
            assert (
                kpos is not None
            ), "Positions of keys (kpos) are a required input when using custom positional encoding"
            q = self.custom_positional_encoding(q, qpos)
            k = self.custom_positional_encoding(k, kpos)

        # Split the doubled head dimension into the two attention groups.
        q_first, q_second = q.chunk(2, dim=1)
        k_first, k_second = k.chunk(2, dim=1)

        # The first group is evaluated before the second, so dropout draws happen in a fixed order.
        out_first = self._attend(q_first, k_first, v)
        out_second = self._attend(q_second, k_second, v)

        out_first = out_first.transpose(1, 2)  # B, Nq, Nh, 2 * Dh
        out_second = out_second.transpose(1, 2)

        lambda_1 = torch.exp(torch.sum(self.lambda_q1 * self.lambda_k1, dim=-1).float()).type_as(q)
        lambda_2 = torch.exp(torch.sum(self.lambda_q2 * self.lambda_k2, dim=-1).float()).type_as(q)
        lambda_full = lambda_1 - lambda_2 + self.lambda_init
        diff = out_first - lambda_full * out_second

        # Per-head RMSNorm over the 2 * Dh features, then the fixed (1 - lambda_init) rescale.
        diff = self.subln(diff)
        diff = diff * (1 - self.lambda_init)
        diff = diff.reshape(batch, n_query, heads * 2 * width)

        return self.proj_drop(self.proj(diff))
901
+
902
+
903
class DiffSelfAttentionBlock(SelfAttentionBlock):
    """Differential Self-Attention Block.

    Builds a regular SelfAttentionBlock and then replaces its `attn` attribute
    with a DiffAttention layer configured from the same arguments plus `depth`.
    """

    def __init__(
        self,
        dim: int,
        depth: int,
        num_heads: int,
        mlp_ratio: float = 4.0,
        qkv_bias: bool = False,
        qk_norm: bool = False,
        proj_drop: float = 0.0,
        attn_drop: float = 0.0,
        init_values: Optional[float] = None,
        drop_path: float = 0.0,
        act_layer: nn.Module = nn.GELU,
        norm_layer: nn.Module = nn.LayerNorm,
        mlp_layer: nn.Module = Mlp,
        custom_positional_encoding: Callable = None,
    ):
        """
        Initialize the block.

        Args:
            dim (int): Dimension of input features
            depth (int): Depth of the current layer, forwarded to DiffAttention
            num_heads (int): Number of attention heads

        All remaining arguments are forwarded unchanged to SelfAttentionBlock; the
        attention-related ones are also forwarded to DiffAttention.
        """
        # Arguments consumed by both the parent constructor and the differential attention layer.
        attention_kwargs = dict(
            num_heads=num_heads,
            qkv_bias=qkv_bias,
            qk_norm=qk_norm,
            attn_drop=attn_drop,
            proj_drop=proj_drop,
            norm_layer=norm_layer,
            custom_positional_encoding=custom_positional_encoding,
        )
        super().__init__(
            dim=dim,
            mlp_ratio=mlp_ratio,
            init_values=init_values,
            drop_path=drop_path,
            act_layer=act_layer,
            mlp_layer=mlp_layer,
            **attention_kwargs,
        )

        # Swap in the differential variant after the parent has finished its setup.
        self.attn = DiffAttention(dim, depth, **attention_kwargs)
950
+
951
+
952
class DiffCrossAttentionBlock(CrossAttentionBlock):
    """Differential Cross-Attention Block.

    Builds a regular CrossAttentionBlock and then replaces its `cross_attn`
    attribute with a DiffCrossAttention layer. Only `cross_attn` is replaced
    here; every other sub-module is left as the parent constructor created it.
    """

    def __init__(
        self,
        dim: int,
        depth: int,
        num_heads: int,
        mlp_ratio: float = 4.0,
        qkv_bias: bool = False,
        qk_norm: bool = False,
        proj_drop: float = 0.0,
        attn_drop: float = 0.0,
        init_values: Optional[float] = None,
        drop_path: float = 0.0,
        act_layer: nn.Module = nn.GELU,
        norm_layer: nn.Module = nn.LayerNorm,
        mlp_layer: nn.Module = Mlp,
        custom_positional_encoding: Callable = None,
        norm_cross_tokens: bool = True,
    ):
        """
        Initialize the block.

        Args:
            dim (int): Dimension of input features
            depth (int): Depth of the current layer, forwarded to DiffCrossAttention
            num_heads (int): Number of attention heads

        All remaining arguments are forwarded unchanged to CrossAttentionBlock; the
        attention-related ones are also forwarded to DiffCrossAttention.
        """
        # Arguments consumed by both the parent constructor and the differential attention layer.
        attention_kwargs = dict(
            num_heads=num_heads,
            qkv_bias=qkv_bias,
            qk_norm=qk_norm,
            attn_drop=attn_drop,
            proj_drop=proj_drop,
            norm_layer=norm_layer,
            custom_positional_encoding=custom_positional_encoding,
        )
        super().__init__(
            dim=dim,
            mlp_ratio=mlp_ratio,
            init_values=init_values,
            drop_path=drop_path,
            act_layer=act_layer,
            mlp_layer=mlp_layer,
            norm_cross_tokens=norm_cross_tokens,
            **attention_kwargs,
        )

        # Swap in the differential variant after the parent has finished its setup.
        self.cross_attn = DiffCrossAttention(dim, depth, **attention_kwargs)
1001
+
1002
+
1003
if __name__ == "__main__":
    # Smoke test: build every attention layer/block in this module with the dummy
    # positional encoding and push one random batch through it. Nothing is checked
    # beyond "construction and forward pass do not raise".
    pos_enc = dummy_positional_encoding

    # Init Attention & CrossAttention classes
    self_attn = Attention(dim=768, custom_positional_encoding=pos_enc)
    cross_attn = CrossAttention(dim=768, custom_positional_encoding=pos_enc)

    # One batch of 256 tokens with 768 features, plus (row, col) positions on a 16 x 16 grid
    tokens = torch.randn((1, 256, 768))
    grid_cols = torch.arange(16)
    grid_rows = torch.arange(16)
    positions = torch.cartesian_prod(grid_rows, grid_cols).view(1, 256, 2).expand(1, -1, 2).clone()

    # Perform dummy inference with the Attention classes
    self_attn_output = self_attn(tokens, positions)
    cross_attn_output = cross_attn(tokens, tokens, tokens, positions, positions)
    print("Init of Attention & CrossAttention classes is successful!")

    # Init SelfAttentionBlock & CrossAttentionBlock and run them
    self_attn_block = SelfAttentionBlock(dim=768, num_heads=16, custom_positional_encoding=pos_enc)
    cross_attn_block = CrossAttentionBlock(dim=768, num_heads=16, custom_positional_encoding=pos_enc)
    self_attn_block_output = self_attn_block(tokens, positions)
    cross_attn_block_output = cross_attn_block(tokens, tokens, positions, positions)
    print("Init of SelfAttentionBlock & CrossAttentionBlock is successful!")

    # Init DiffAttention & DiffCrossAttention classes and run them
    diff_self_attn = DiffAttention(dim=768, depth=0, custom_positional_encoding=pos_enc)
    diff_cross_attn = DiffCrossAttention(dim=768, depth=0, custom_positional_encoding=pos_enc)
    diff_self_attn_output = diff_self_attn(tokens, positions)
    diff_cross_attn_output = diff_cross_attn(tokens, tokens, tokens, positions, positions)
    print("Init of DiffAttention & DiffCrossAttention classes is successful!")

    # Init DiffSelfAttentionBlock & DiffCrossAttentionBlock and run them
    diff_self_attn_block = DiffSelfAttentionBlock(
        dim=768, depth=0, num_heads=8, custom_positional_encoding=pos_enc
    )
    diff_cross_attn_block = DiffCrossAttentionBlock(
        dim=768, depth=0, num_heads=8, custom_positional_encoding=pos_enc
    )
    diff_self_attn_block_output = diff_self_attn_block(tokens, positions)
    diff_cross_attn_block_output = diff_cross_attn_block(tokens, tokens, positions, positions)
    print("Init of DiffSelfAttentionBlock & DiffCrossAttentionBlock is successful!")

    # Repeat the plain block test once per optional softmax variant.
    softmax_variants = (
        (
            {"use_scalable_softmax": True},
            "Init of SelfAttentionBlock & CrossAttentionBlock with scalable softmax is successful!",
        ),
        (
            {"use_entropy_scaling": True},
            "Init of SelfAttentionBlock & CrossAttentionBlock with entropy scaling is successful!",
        ),
    )
    for variant_kwargs, success_message in softmax_variants:
        self_attn_block = SelfAttentionBlock(
            dim=768, num_heads=16, custom_positional_encoding=pos_enc, **variant_kwargs
        )
        cross_attn_block = CrossAttentionBlock(
            dim=768, num_heads=16, custom_positional_encoding=pos_enc, **variant_kwargs
        )
        self_attn_block_output = self_attn_block(tokens, positions)
        cross_attn_block_output = cross_attn_block(tokens, tokens, positions, positions)
        print(success_message)