fusion-bench 0.2.21__tar.gz → 0.2.22__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (940) hide show
  1. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/PKG-INFO +1 -23
  2. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/__init__.py +21 -2
  3. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/constants/__init__.py +1 -0
  4. fusion_bench-0.2.22/fusion_bench/constants/runtime.py +57 -0
  5. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/__init__.py +8 -2
  6. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/bitdelta/__init__.py +1 -0
  7. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/classification/clip_finetune.py +1 -1
  8. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/fisher_merging/clip_fisher_merging.py +0 -4
  9. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/fisher_merging/gpt2_fisher_merging.py +2 -2
  10. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/linear/simple_average_for_llama.py +16 -11
  11. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/simple_average.py +7 -7
  12. fusion_bench-0.2.22/fusion_bench/method/smile_upscaling/causal_lm_upscaling.py +371 -0
  13. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/smile_upscaling/projected_energy.py +1 -2
  14. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/smile_upscaling/smile_mistral_upscaling.py +5 -1
  15. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/smile_upscaling/smile_qwen2_upscaling.py +40 -31
  16. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/we_moe/__init__.py +1 -0
  17. fusion_bench-0.2.22/fusion_bench/method/we_moe/entropy_loss.py +25 -0
  18. fusion_bench-0.2.22/fusion_bench/method/we_moe/flan_t5_we_moe.py +331 -0
  19. fusion_bench-0.2.22/fusion_bench/method/we_moe/utils.py +15 -0
  20. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/mixins/clip_classification.py +11 -42
  21. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/mixins/serialization.py +18 -8
  22. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/causal_lm/causal_lm.py +32 -33
  23. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/__init__.py +5 -0
  24. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/hf_utils.py +65 -87
  25. fusion_bench-0.2.22/fusion_bench/models/model_card_templates/default.md +46 -0
  26. fusion_bench-0.2.22/fusion_bench/models/modeling_smile_llama/__init__.py +7 -0
  27. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_llama/modeling_smile_llama.py +1 -8
  28. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_qwen2/modeling_smile_qwen2.py +1 -5
  29. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/programs/fabric_fusion_program.py +29 -60
  30. fusion_bench-0.2.22/fusion_bench/scripts/cli.py +76 -0
  31. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/clip_vision/taskpool.py +9 -4
  32. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/__init__.py +1 -0
  33. fusion_bench-0.2.22/fusion_bench/utils/cache_utils.py +158 -0
  34. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/fabric.py +2 -2
  35. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/lazy_imports.py +23 -0
  36. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/lazy_state_dict.py +38 -3
  37. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/modelscope.py +3 -3
  38. fusion_bench-0.2.22/fusion_bench/utils/path.py +78 -0
  39. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/pylogger.py +1 -1
  40. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench.egg-info/PKG-INFO +1 -23
  41. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench.egg-info/SOURCES.txt +8 -0
  42. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/fisher_merging/clip_fisher_merging.yaml +0 -1
  43. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/linear/simple_average_for_llama.yaml +3 -2
  44. fusion_bench-0.2.22/fusion_bench_config/method/smile_upscaling/causal_lm_upscaling.yaml +21 -0
  45. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/smile_upscaling/smile_qwen2_upscaling.yaml +1 -1
  46. fusion_bench-0.2.22/fusion_bench_config/method/wemoe/flan_t5_weight_ensembling_moe.yaml +20 -0
  47. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/Qwen2.5-1.5B_math_and_coder.yaml +1 -1
  48. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/pyproject.toml +6 -3
  49. fusion_bench-0.2.21/fusion_bench/scripts/cli.py +0 -43
  50. fusion_bench-0.2.21/fusion_bench/utils/cache_utils.py +0 -58
  51. fusion_bench-0.2.21/fusion_bench/utils/path.py +0 -22
  52. fusion_bench-0.2.21/fusion_bench/utils/plot/__init__.py +0 -0
  53. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/LICENSE +0 -0
  54. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/README.md +0 -0
  55. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/__main__.py +0 -0
  56. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/_get_started/__init__.py +0 -0
  57. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/_get_started/greeting_program.py +0 -0
  58. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/compat/__init__.py +0 -0
  59. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/compat/method/__init__.py +0 -0
  60. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/compat/method/base_algorithm.py +0 -0
  61. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/compat/modelpool/AutoModelForSeq2SeqLM.py +0 -0
  62. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/compat/modelpool/__init__.py +0 -0
  63. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/compat/modelpool/base_pool.py +0 -0
  64. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/compat/modelpool/huggingface_clip_vision.py +0 -0
  65. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/compat/taskpool/__init__.py +0 -0
  66. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/compat/taskpool/base_pool.py +0 -0
  67. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/compat/taskpool/clip_image_classification.py +0 -0
  68. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/compat/taskpool/flan_t5_glue_text_generation.py +0 -0
  69. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/constants/banner.py +0 -0
  70. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/constants/clip_vision.py +0 -0
  71. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/constants/paths.py +0 -0
  72. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/__init__.py +0 -0
  73. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/arc_agi/__init__.py +0 -0
  74. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/arc_agi/arc.py +0 -0
  75. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/arc_agi/arc_agi.py +0 -0
  76. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/arc_agi/augmenters.py +0 -0
  77. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/arc_agi/messagers.py +0 -0
  78. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/arc_agi/np_cache.py +0 -0
  79. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/arc_agi/preprocess.py +0 -0
  80. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/arc_agi/representers.py +0 -0
  81. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/clip_dataset.py +0 -0
  82. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/fer2013.py +0 -0
  83. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/gpt2_glue.py +0 -0
  84. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/gsm8k.py +0 -0
  85. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/image_corruption/__init__.py +0 -0
  86. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/image_corruption/make_corruption.py +0 -0
  87. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/image_dataset.py +0 -0
  88. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/imdb.py +0 -0
  89. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/llama/__init__.py +0 -0
  90. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/llama/alpaca.py +0 -0
  91. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/llama/collate.py +0 -0
  92. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/llama/metamathqa.py +0 -0
  93. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/llama/openai.py +0 -0
  94. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/llama/preference_700k.py +0 -0
  95. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/llama/sharegpt.py +0 -0
  96. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/llama/squad.py +0 -0
  97. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/llama/stanford_shp.py +0 -0
  98. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/llama/ultrachat.py +0 -0
  99. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/llama/utils/__init__.py +0 -0
  100. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/llama/wikitext.py +0 -0
  101. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/dataset/nyuv2.py +0 -0
  102. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/ada_svd/__init__.py +0 -0
  103. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/ada_svd/clip_vision.py +0 -0
  104. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/adamerging/__init__.py +0 -0
  105. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/adamerging/clip_layer_wise_adamerging.py +0 -0
  106. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/adamerging/clip_task_wise_adamerging.py +0 -0
  107. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/adamerging/entropy_loss.py +0 -0
  108. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/adamerging/flan_t5_layer_wise_adamerging.py +0 -0
  109. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/adamerging/gpt2_layer_wise_adamerging.py +0 -0
  110. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/adamerging/layer_wise_adamerging.py +0 -0
  111. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/adamerging/llama_adamerging.py +0 -0
  112. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/adamerging/min_norm_solvers.py +0 -0
  113. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/adamerging/task_wise_adamerging.py +0 -0
  114. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/adamerging/utils.py +0 -0
  115. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/analysis/__init__.py +0 -0
  116. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/analysis/task_vector_cos_similarity.py +0 -0
  117. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/analysis/task_vector_violin_plot.py +0 -0
  118. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/base_algorithm.py +0 -0
  119. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/bitdelta/bitdelta.py +0 -0
  120. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/bitdelta/bitdelta_utils/__init__.py +0 -0
  121. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/bitdelta/bitdelta_utils/binary_gemm_kernel.py +0 -0
  122. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/bitdelta/bitdelta_utils/data.py +0 -0
  123. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/bitdelta/bitdelta_utils/diff.py +0 -0
  124. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/classification/__init__.py +0 -0
  125. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/classification/continual_clip_finetune.py +0 -0
  126. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/concrete_subspace/__init__.py +0 -0
  127. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/concrete_subspace/clip_concrete_adamerging.py +0 -0
  128. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/concrete_subspace/clip_concrete_task_arithmetic.py +0 -0
  129. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/concrete_subspace/clip_post_defense.py +0 -0
  130. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/concrete_subspace/clip_safe_concrete_adamerging.py +0 -0
  131. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/dare/__init__.py +0 -0
  132. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/dare/simple_average.py +0 -0
  133. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/dare/task_arithmetic.py +0 -0
  134. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/dare/ties_merging.py +0 -0
  135. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/dare/utils.py +0 -0
  136. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/dawe/__init__.py +0 -0
  137. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/dawe/dawe_for_clip.py +0 -0
  138. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/dawe/warppers/__init__.py +0 -0
  139. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/dawe/warppers/dawe_model.py +0 -0
  140. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/depth_upscaling/__init__.py +0 -0
  141. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/depth_upscaling/depth_upscaling.py +0 -0
  142. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/depth_upscaling/depth_upscaling_for_llama.py +0 -0
  143. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/doge_ta/__init__.py +0 -0
  144. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/doge_ta/clip_layer_wise_adamerging.py +0 -0
  145. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/doge_ta/doge_ta.py +0 -0
  146. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/doge_ta/layer_wise_adamerging.py +0 -0
  147. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/dummy.py +0 -0
  148. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/ensemble.py +0 -0
  149. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/expert_sparsity/__init__.py +0 -0
  150. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/expert_sparsity/mixtral/__init__.py +0 -0
  151. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/expert_sparsity/mixtral/dynamic_skipping.py +0 -0
  152. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/expert_sparsity/mixtral/layer_wise_pruning.py +0 -0
  153. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/expert_sparsity/mixtral/progressive_pruning.py +0 -0
  154. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/expert_sparsity/utils/calibration_data.py +0 -0
  155. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/fisher_merging/__init__.py +0 -0
  156. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/fisher_merging/fisher_merging.py +0 -0
  157. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/fw_merging/__init__.py +0 -0
  158. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/fw_merging/fw_hard.py +0 -0
  159. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/fw_merging/fw_soft.py +0 -0
  160. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/fw_merging/utils.py +0 -0
  161. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/gossip/__init__.py +0 -0
  162. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/gossip/clip_layer_wise_gossip.py +0 -0
  163. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/gossip/clip_task_wise_gossip.py +0 -0
  164. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/gossip/entropy_loss.py +0 -0
  165. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/gossip/flan_t5_layer_wise_gossip.py +0 -0
  166. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/gossip/layer_wise_gossip.py +0 -0
  167. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/gossip/min_norm_solvers.py +0 -0
  168. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/gossip/task_wise_gossip.py +0 -0
  169. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/gossip/utils.py +0 -0
  170. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/isotropic_merging/__init__.py +0 -0
  171. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/isotropic_merging/iso.py +0 -0
  172. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/isotropic_merging/iso_utils.py +0 -0
  173. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/knots/__init__.py +0 -0
  174. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/knots/knots_utils.py +0 -0
  175. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/linear/__init__.py +0 -0
  176. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/linear/expo.py +0 -0
  177. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/linear/linear_interpolation.py +0 -0
  178. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/linear/llama_expo.py +0 -0
  179. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/linear/task_arithmetic_for_llama.py +0 -0
  180. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/lm_finetune/__init__.py +0 -0
  181. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/lm_finetune/bradley_terry_rm.py +0 -0
  182. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/lm_finetune/causal_lm_pretrain.py +0 -0
  183. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/lm_finetune/fullfinetune_sft.py +0 -0
  184. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/lm_finetune/peftfinetune_sft.py +0 -0
  185. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/mixture_of_experts/__init__.py +0 -0
  186. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/mixture_of_experts/mixtral_merging.py +0 -0
  187. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/mixture_of_experts/mixtral_upcycling.py +0 -0
  188. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/model_recombination.py +0 -0
  189. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/moe_pruner/__init__.py +0 -0
  190. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/moe_pruner/hooks/__init__.py +0 -0
  191. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/moe_pruner/hooks/deepseek_v2.py +0 -0
  192. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/moe_pruner/hooks/hook.py +0 -0
  193. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/moe_pruner/hooks/mixtral.py +0 -0
  194. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/moe_pruner/moe_pruner.py +0 -0
  195. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/moe_pruner/utils/__init__.py +0 -0
  196. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/moe_pruner/utils/data.py +0 -0
  197. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/moe_pruner/utils/layerwrapper.py +0 -0
  198. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/moe_pruner/utils/prune.py +0 -0
  199. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/moe_pruner/utils/score.py +0 -0
  200. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/opcm/__init__.py +0 -0
  201. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/opcm/opcm.py +0 -0
  202. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/opcm/task_arithmetic.py +0 -0
  203. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/opcm/ties_merging.py +0 -0
  204. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/opcm/utils.py +0 -0
  205. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/opcm/weight_average.py +0 -0
  206. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/__init__.py +0 -0
  207. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/llama_magnitude_prune.py +0 -0
  208. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/llama_random_prune.py +0 -0
  209. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/llama_sparsegpt_prune.py +0 -0
  210. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/llama_wanda_prune.py +0 -0
  211. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/magnitude_diff_pruning.py +0 -0
  212. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/prune_utils.py +0 -0
  213. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/sparsegpt_utils/__init__.py +0 -0
  214. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/sparsegpt_utils/sparsegpt.py +0 -0
  215. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/wanda_utils/__init__.py +0 -0
  216. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/wanda_utils/ablate.py +0 -0
  217. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/wanda_utils/data.py +0 -0
  218. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/wanda_utils/eval.py +0 -0
  219. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/wanda_utils/layerwrapper.py +0 -0
  220. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/wanda_utils/prune.py +0 -0
  221. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/wanda_utils/prune_opt.py +0 -0
  222. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pruning/wanda_utils/sparsegpt.py +0 -0
  223. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pwe_moe/__init__.py +0 -0
  224. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pwe_moe/clip_pwe_moe.py +0 -0
  225. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pwe_moe/module.py +0 -0
  226. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pwe_moe/openclip_pwe_moe.py +0 -0
  227. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pwe_moe/phn/__init__.py +0 -0
  228. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pwe_moe/phn/solvers.py +0 -0
  229. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/pwe_moe/utils.py +0 -0
  230. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/randes/__init__.py +0 -0
  231. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/randes/base_algorithm.py +0 -0
  232. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/randes/modelsoup.py +0 -0
  233. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/randes/task_arithmetic.py +0 -0
  234. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/rankone_moe/__init__.py +0 -0
  235. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/rankone_moe/clip_rankone_moe.py +0 -0
  236. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/rankone_moe/rankone_moe.py +0 -0
  237. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/regmean/__init__.py +0 -0
  238. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/regmean/clip_regmean.py +0 -0
  239. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/regmean/gpt2_regmean.py +0 -0
  240. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/regmean/regmean.py +0 -0
  241. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/regmean_plusplus/__init__.py +0 -0
  242. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/regmean_plusplus/clip_regmean_plusplus.py +0 -0
  243. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/regmean_plusplus/regmean_plusplus.py +0 -0
  244. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/slerp/__init__.py +0 -0
  245. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/slerp/slerp.py +0 -0
  246. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/slerp/slerp_utils.py +0 -0
  247. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/smile_upscaling/__init__.py +0 -0
  248. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/smile_upscaling/error_accumulation.py +0 -0
  249. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/smile_upscaling/singular_projection_merging.py +0 -0
  250. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/smile_upscaling/smile_upscaling.py +1 -1
  251. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/sparse_we_moe/__init__.py +0 -0
  252. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/sparse_we_moe/sparse_clip_we_moe.py +0 -0
  253. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/sparse_we_moe/sparse_we_moe.py +0 -0
  254. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/sparselo/__init__.py +0 -0
  255. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/sparselo/sparselo.py +0 -0
  256. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/surgery/__init__.py +0 -0
  257. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/surgery/clip_layer_wise_adamerging_surgery.py +0 -0
  258. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/tall_mask/__init__.py +0 -0
  259. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/tall_mask/task_arithmetic.py +0 -0
  260. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/tall_mask/utils.py +0 -0
  261. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/task_arithmetic/__init__.py +0 -0
  262. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/task_arithmetic/task_arithmetic.py +0 -0
  263. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/task_singular_vector/TSVC.py +0 -0
  264. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/task_singular_vector/TSVM.py +0 -0
  265. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/task_singular_vector/__init__.py +0 -0
  266. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/task_singular_vector/utils/TSVC_utils.py +0 -0
  267. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/task_singular_vector/utils/TSVM_utils.py +0 -0
  268. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/task_singular_vector/utils/__init__.py +0 -0
  269. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/task_singular_vector/utils/task_singular_interference.py +0 -0
  270. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/ties_merging/__init__.py +0 -0
  271. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/ties_merging/ties_merging.py +0 -0
  272. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/ties_merging/ties_merging_utils.py +0 -0
  273. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/trust_region/__init__.py +0 -0
  274. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/trust_region/clip_task_arithmetic.py +0 -0
  275. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/trust_region/utils.py +0 -0
  276. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/we_moe/clip_we_moe.py +0 -0
  277. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/we_moe/we_moe.py +0 -0
  278. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/weighted_average/__init__.py +0 -0
  279. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/weighted_average/llama.py +1 -1
  280. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/method/weighted_average/weighted_average.py +0 -0
  281. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/metrics/__init__.py +0 -0
  282. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/metrics/continual_learning/__init__.py +0 -0
  283. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/metrics/continual_learning/backward_transfer.py +0 -0
  284. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/metrics/nyuv2/__init__.py +0 -0
  285. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/metrics/nyuv2/depth.py +0 -0
  286. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/metrics/nyuv2/loss.py +0 -0
  287. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/metrics/nyuv2/noise.py +0 -0
  288. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/metrics/nyuv2/normal.py +0 -0
  289. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/metrics/nyuv2/segmentation.py +0 -0
  290. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/metrics/text_to_image_generation/__init__.py +0 -0
  291. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/metrics/text_to_image_generation/aesthetic_scorer.py +0 -0
  292. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/metrics/text_to_image_generation/compressibility.py +0 -0
  293. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/metrics/text_to_image_generation/pickscore_scorer.py +0 -0
  294. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/mixins/__init__.py +0 -0
  295. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/mixins/fabric_training.py +0 -0
  296. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/mixins/hydra_config.py +0 -0
  297. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/mixins/lightning_fabric.py +0 -0
  298. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/mixins/openclip_classification.py +0 -0
  299. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/mixins/optim/__init__.py +0 -0
  300. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/mixins/optim/adamw_with_warmup.py +0 -0
  301. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/mixins/rich_live.py +0 -0
  302. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/mixins/simple_profiler.py +0 -0
  303. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/PeftModelForSeq2SeqLM.py +0 -0
  304. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/__init__.py +0 -0
  305. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/base_pool.py +0 -0
  306. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/causal_lm/__init__.py +0 -0
  307. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/clip_vision/__init__.py +0 -0
  308. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/clip_vision/modelpool.py +0 -0
  309. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/huggingface_automodel.py +0 -0
  310. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/huggingface_gpt2_classification.py +0 -0
  311. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/lazy_state_dict_pool.py +0 -0
  312. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/nyuv2_modelpool.py +0 -0
  313. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/openclip_vision/__init__.py +0 -0
  314. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/openclip_vision/modelpool.py +0 -0
  315. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/seq2seq_lm/__init__.py +0 -0
  316. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/seq2seq_lm/modelpool.py +0 -0
  317. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/seq_classification_lm/__init__.py +0 -0
  318. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/seq_classification_lm/reward_model.py +0 -0
  319. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/modelpool/seq_classification_lm/seq_classification_lm.py +0 -0
  320. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/chat_templates/__init__.py +0 -0
  321. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/chat_templates/llama_3_Instruct.py +0 -0
  322. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/chat_templates/load_tokenizer.py +0 -0
  323. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/expert_sparsity/__init__.py +0 -0
  324. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/expert_sparsity/mixtral/__init__.py +0 -0
  325. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/expert_sparsity/mixtral/dataset.py +0 -0
  326. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/expert_sparsity/mixtral/modeling_mixtral.py +0 -0
  327. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/expert_sparsity/mixtral/wrapper.py +0 -0
  328. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/hf_clip.py +0 -0
  329. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/linearized/__init__.py +0 -0
  330. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/linearized/linearized_model_utils.py +0 -0
  331. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/linearized/vision_model.py +0 -0
  332. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/llama/__init__.py +0 -0
  333. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/llama/model_utils/__init__.py +0 -0
  334. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/llama/model_utils/embedding.py +0 -0
  335. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/llama/model_utils/liger_kernel.py +0 -0
  336. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/llama/model_utils/misc.py +0 -0
  337. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/llama/model_utils/mod.py +0 -0
  338. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/llama/model_utils/visual.py +0 -0
  339. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/llama/patcher.py +0 -0
  340. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/llama/tokenizer_loader.py +0 -0
  341. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/masks/__init__.py +0 -0
  342. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/masks/mask_model.py +0 -0
  343. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_deepseek_v2/__init__.py +0 -0
  344. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_deepseek_v2/configuration_deepseek.py +0 -0
  345. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_deepseek_v2/modeling_deepseek.py +0 -0
  346. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_deepseek_v2/tokenization_deepseek_fast.py +0 -0
  347. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_losparse_llama/__init__.py +0 -0
  348. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_losparse_llama/configuration_losparse_llama.py +0 -0
  349. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_losparse_llama/losparse_linear.py +0 -0
  350. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_losparse_llama/modeling_losparse_llama.py +0 -0
  351. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_losparse_llama/register.py +0 -0
  352. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_losparse_llama/utils.py +0 -0
  353. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_gemma2/__init__.py +0 -0
  354. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_gemma2/configuration_smile_gemma2.py +0 -0
  355. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_gemma2/modeling_smile_gemma2.py +0 -0
  356. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_gemma2/register.py +0 -0
  357. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_llama/configuration_smile_llama.py +0 -0
  358. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_llama/register.py +0 -0
  359. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_mistral/__init__.py +1 -1
  360. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_mistral/configuration_smile_mistral.py +0 -0
  361. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_mistral/modeling_smile_mistral.py +0 -0
  362. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_mistral/register.py +0 -0
  363. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_qwen2/__init__.py +0 -0
  364. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_qwen2/configuration_smile_qwen2.py +0 -0
  365. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/modeling_smile_qwen2/register.py +0 -0
  366. {fusion_bench-0.2.21/fusion_bench/models/modeling_smile_llama → fusion_bench-0.2.22/fusion_bench/models/nyuv2}/__init__.py +0 -0
  367. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/nyuv2/aspp.py +0 -0
  368. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/nyuv2/lightning_module.py +0 -0
  369. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/nyuv2/resnet.py +0 -0
  370. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/nyuv2/resnet_dilated.py +0 -0
  371. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/open_clip/__init__.py +0 -0
  372. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/open_clip/modeling.py +0 -0
  373. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/open_clip/utils.py +0 -0
  374. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/open_clip/variables_and_paths.py +0 -0
  375. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/parameter_dict.py +0 -0
  376. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/rankone_moe.py +0 -0
  377. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/separate_io.py +0 -0
  378. {fusion_bench-0.2.21/fusion_bench/models/nyuv2 → fusion_bench-0.2.22/fusion_bench/models/smile_moe}/__init__.py +0 -0
  379. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/smile_moe/linear_from_hf_config.py +0 -0
  380. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/smile_moe/linear_from_module.py +0 -0
  381. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/smile_moe/utils/__init__.py +0 -0
  382. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/smile_moe/utils/svd_utils.py +0 -0
  383. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/sparse_we_moe.py +0 -0
  384. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/surgery/__init__.py +0 -0
  385. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/surgery/surgerymodelwrapper.py +0 -0
  386. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/utils.py +0 -0
  387. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/we_moe.py +0 -0
  388. {fusion_bench-0.2.21/fusion_bench/models/smile_moe → fusion_bench-0.2.22/fusion_bench/models/wrappers}/__init__.py +0 -0
  389. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/wrappers/ensemble.py +0 -0
  390. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/wrappers/layer_wise_fusion.py +0 -0
  391. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/wrappers/layer_wise_fusion_doge_ta.py +0 -0
  392. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/models/wrappers/task_wise_fusion.py +0 -0
  393. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/optim/__init__.py +0 -0
  394. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/optim/exception.py +0 -0
  395. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/optim/lr_scheduler/__init__.py +0 -0
  396. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/optim/lr_scheduler/linear_warmup.py +0 -0
  397. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/optim/lr_scheduler/utils/__init__.py +0 -0
  398. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/optim/lr_scheduler/utils/visualization.py +0 -0
  399. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/optim/mezo.py +0 -0
  400. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/programs/__init__.py +0 -0
  401. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/programs/base_program.py +0 -0
  402. {fusion_bench-0.2.21/fusion_bench/models/wrappers → fusion_bench-0.2.22/fusion_bench/scripts}/__init__.py +0 -0
  403. {fusion_bench-0.2.21/fusion_bench/scripts → fusion_bench-0.2.22/fusion_bench/scripts/clip}/__init__.py +0 -0
  404. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/scripts/clip/convert_checkpoint.py +0 -0
  405. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/scripts/imgui.py +0 -0
  406. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/scripts/nyuv2_mtl_train.py +0 -0
  407. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/scripts/webui.py +0 -0
  408. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/__init__.py +0 -0
  409. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/base_pool.py +0 -0
  410. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/clip_vision/__init__.py +0 -0
  411. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/clip_vision/clip_rankone_moe_taskpool.py +0 -0
  412. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/clip_vision/clip_smile_taskpool.py +0 -0
  413. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/clip_vision/clip_sparse_wemoe_taskpool.py +0 -0
  414. {fusion_bench-0.2.21/fusion_bench/scripts/clip → fusion_bench-0.2.22/fusion_bench/taskpool/clip_vision/utils}/__init__.py +0 -0
  415. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/clip_vision/utils/routing_analysis_utils.py +0 -0
  416. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/dummy.py +0 -0
  417. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/gpt2_text_classification.py +0 -0
  418. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/llama/__init__.py +0 -0
  419. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/llama/reward_model.py +0 -0
  420. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/llama/test_generation.py +0 -0
  421. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/lm_eval_harness/__init__.py +0 -0
  422. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/lm_eval_harness/taskpool.py +0 -0
  423. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/nyuv2_taskpool.py +0 -0
  424. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/openclip_vision/__init__.py +0 -0
  425. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/taskpool/openclip_vision/openclip_taskpool.py +0 -0
  426. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/__init__.py +0 -0
  427. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/base_task.py +0 -0
  428. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/classification.py +0 -0
  429. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/__init__.py +0 -0
  430. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/cifar10.py +0 -0
  431. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/cifar100.py +0 -0
  432. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/clip_dataset.py +0 -0
  433. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/cub_200_2011.py +0 -0
  434. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/dtd.py +0 -0
  435. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/emnist_letters.py +0 -0
  436. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/emnist_mnist.py +0 -0
  437. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/eurosat.py +0 -0
  438. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/fashion_mnist.py +0 -0
  439. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/fer2013.py +0 -0
  440. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/flower102.py +0 -0
  441. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/food101.py +0 -0
  442. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/gtsrb.py +0 -0
  443. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/imagenet.py +0 -0
  444. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/kmnist.py +0 -0
  445. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/mnist.py +0 -0
  446. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/mongo_leaf_disease.py +0 -0
  447. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/oxford_iiit_pet.py +0 -0
  448. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/pcam.py +0 -0
  449. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/rendered_sst2.py +0 -0
  450. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/resisc45.py +0 -0
  451. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/stanford_cars.py +0 -0
  452. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/stl10.py +0 -0
  453. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/sun397.py +0 -0
  454. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/svhn.py +0 -0
  455. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/clip_classification/tiny_imagenet.py +0 -0
  456. {fusion_bench-0.2.21/fusion_bench/taskpool/clip_vision/utils → fusion_bench-0.2.22/fusion_bench/tasks/flan_t5_text_generation}/__init__.py +0 -0
  457. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/flan_t5_text_generation/datasets_preprocess.py +0 -0
  458. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/flan_t5_text_generation/glue_evaluation.py +0 -0
  459. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/flan_t5_text_generation/glue_load_dataset.py +0 -0
  460. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/flan_t5_text_generation/glue_preprocessors.py +0 -0
  461. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/tasks/flan_t5_text_generation/glue_prompt_templates.py +0 -0
  462. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/auto.py +0 -0
  463. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/data.py +0 -0
  464. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/devices.py +0 -0
  465. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/dict.py +0 -0
  466. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/dtype.py +0 -0
  467. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/expr.py +0 -0
  468. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/functools.py +0 -0
  469. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/hydra_utils.py +0 -0
  470. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/instantiate_utils.py +0 -0
  471. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/json.py +0 -0
  472. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/misc.py +0 -0
  473. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/packages.py +0 -0
  474. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/parameters.py +0 -0
  475. {fusion_bench-0.2.21/fusion_bench/tasks/flan_t5_text_generation → fusion_bench-0.2.22/fusion_bench/utils/plot}/__init__.py +0 -0
  476. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/plot/color_data.py +0 -0
  477. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/plot/token.py +0 -0
  478. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/plot/token_notebook.py +0 -0
  479. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/rich_utils.py +0 -0
  480. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/set.py +0 -0
  481. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/state_dict_arithmetic.py +0 -0
  482. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/strenum/__init__.py +0 -0
  483. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/strenum/_name_mangler.py +0 -0
  484. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/strenum/_version.py +0 -0
  485. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/tensorboard.py +0 -0
  486. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/timer.py +0 -0
  487. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench/utils/type.py +0 -0
  488. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench.egg-info/dependency_links.txt +0 -0
  489. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench.egg-info/entry_points.txt +0 -0
  490. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench.egg-info/requires.txt +0 -0
  491. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench.egg-info/top_level.txt +0 -0
  492. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/README.md +0 -0
  493. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/_get_started/clip_evaluate_single_model.yaml +0 -0
  494. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/_get_started/clip_simple_average.yaml +0 -0
  495. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/_get_started/clip_task_arithmetic.yaml +0 -0
  496. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/_get_started/greeting_program.yaml +0 -0
  497. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/clip-vit-base-patch32_robustness_corrupted.yaml +0 -0
  498. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/README.md +0 -0
  499. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/TALL10.yaml +0 -0
  500. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/TALL12.yaml +0 -0
  501. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/TALL14.yaml +0 -0
  502. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/TALL16.yaml +0 -0
  503. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/TALL18.yaml +0 -0
  504. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/TALL20.yaml +0 -0
  505. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/cifar10.yaml +0 -0
  506. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/cifar100.yaml +0 -0
  507. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/cub-200-2011.yaml +0 -0
  508. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/dtd.yaml +0 -0
  509. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/emnist_letters.yaml +0 -0
  510. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/emnist_mnist.yaml +0 -0
  511. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/eurosat.yaml +0 -0
  512. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/fashion_mnist.yaml +0 -0
  513. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/fer2013.yaml +0 -0
  514. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/food101.yaml +0 -0
  515. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/gtsrb.yaml +0 -0
  516. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/kmnist.yaml +0 -0
  517. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/mango-leaf-disease.yaml +0 -0
  518. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/mnist.yaml +0 -0
  519. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/oxford-iiit-pet.yaml +0 -0
  520. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/oxford_flowers102.yaml +0 -0
  521. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/pcam.yaml +0 -0
  522. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/rendered-sst2.yaml +0 -0
  523. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/resisc45.yaml +0 -0
  524. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/stanford-cars.yaml +0 -0
  525. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/stl10.yaml +0 -0
  526. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/sun397.yaml +0 -0
  527. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/svhn.yaml +0 -0
  528. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/the_eight_tasks.yaml +0 -0
  529. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/test/tiny-imagenet.yaml +0 -0
  530. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/TALL10.yaml +0 -0
  531. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/TALL12.yaml +0 -0
  532. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/TALL14.yaml +0 -0
  533. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/TALL16.yaml +0 -0
  534. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/TALL18.yaml +0 -0
  535. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/TALL20.yaml +0 -0
  536. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/cifar10.yaml +0 -0
  537. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/cifar100.yaml +0 -0
  538. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/cub-200-2011.yaml +0 -0
  539. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/dtd.yaml +0 -0
  540. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/emnist_letters.yaml +0 -0
  541. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/emnist_mnist.yaml +0 -0
  542. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/eurosat.yaml +0 -0
  543. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/fashion_mnist.yaml +0 -0
  544. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/fer2013.yaml +0 -0
  545. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/food101.yaml +0 -0
  546. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/gtsrb.yaml +0 -0
  547. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/kmnist.yaml +0 -0
  548. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/mango-leaf-disease.yaml +0 -0
  549. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/mnist.yaml +0 -0
  550. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/oxford-iiit-pet.yaml +0 -0
  551. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/oxford_flowers102.yaml +0 -0
  552. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/pcam.yaml +0 -0
  553. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/rendered-sst2.yaml +0 -0
  554. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/resisc45.yaml +0 -0
  555. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/stanford-cars.yaml +0 -0
  556. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/stl10.yaml +0 -0
  557. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/sun397.yaml +0 -0
  558. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/svhn.yaml +0 -0
  559. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/the_eight_tasks.yaml +0 -0
  560. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/train/tiny-imagenet.yaml +0 -0
  561. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/val/dtd.yaml +0 -0
  562. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/val/eurosat.yaml +0 -0
  563. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/val/gtsrb.yaml +0 -0
  564. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/val/mnist.yaml +0 -0
  565. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/val/resisc45.yaml +0 -0
  566. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/val/stanford-cars.yaml +0 -0
  567. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/val/sun397.yaml +0 -0
  568. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/val/svhn.yaml +0 -0
  569. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/image_classification/val/the_eight_tasks.yaml +0 -0
  570. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/llm_sft/alpaca_cleaned.yaml +0 -0
  571. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/llm_sft/ultrachat_200k.yaml +0 -0
  572. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/question_answering/search_qa.yaml +0 -0
  573. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/question_answering/test/search_qa.yaml +0 -0
  574. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/question_answering/train/MetaMathQA.yaml +0 -0
  575. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/question_answering/train/search_qa.yaml +0 -0
  576. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/question_answering/val/search_qa.yaml +0 -0
  577. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/summarization/test/xsum.yaml +0 -0
  578. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/summarization/train/xsum.yaml +0 -0
  579. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/summarization/val/xsum.yaml +0 -0
  580. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/summarization/xsum.yaml +0 -0
  581. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/text_generation/test/gsm-hard.yaml +0 -0
  582. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/text_generation/test/gsm8k.yaml +0 -0
  583. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/text_generation/test/gsm8k_question_label.yaml +0 -0
  584. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/text_generation/train/CodeAlpaca-20k.yaml +0 -0
  585. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/text_generation/train/gsm8k.yaml +0 -0
  586. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/dataset/text_generation/train/gsm8k_question_label.yaml +0 -0
  587. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/fabric/auto.yaml +0 -0
  588. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/fabric/llama_ddp.yaml +0 -0
  589. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/fabric/llama_fsdp.yaml +0 -0
  590. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/fabric/llama_peft_fsdp.yaml +0 -0
  591. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/fabric/loggers/csv_logger.yaml +0 -0
  592. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/fabric/loggers/mlflow_logger.yaml +0 -0
  593. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/fabric/loggers/tensorboard_logger.yaml +0 -0
  594. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/fabric/loggers/wandb_logger.yaml +0 -0
  595. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/fabric/strategy/deepspeed.yaml +0 -0
  596. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/fabric/strategy/llama_fsdp.yaml +0 -0
  597. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/fabric/strategy/llama_peft_fsdp.yaml +0 -0
  598. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/fabric_model_fusion.yaml +0 -0
  599. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/hydra/default.yaml +0 -0
  600. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/hydra/help/fusion_bench_help.yaml +0 -0
  601. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/hydra/job_logging/rich_logging.yaml +0 -0
  602. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/llama_full_finetune.yaml +0 -0
  603. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/llama_magnitude_pruning.yaml +0 -0
  604. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/llama_model_fusion.yaml +0 -0
  605. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/ada_svd/clip_vision.yaml +0 -0
  606. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/adamerging/clip.yaml +0 -0
  607. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/adamerging/layer_wise_flan_t5.yaml +0 -0
  608. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/adamerging/layer_wise_gpt2.yaml +0 -0
  609. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/adamerging/llama_sft.yaml +0 -0
  610. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/analysis/task_vector_cos_similarity.yaml +0 -0
  611. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/analysis/task_vector_violin_plot.yaml +0 -0
  612. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/bitdelta/bitdelta.yaml +0 -0
  613. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/classification/clip_continual_finetune.yaml +0 -0
  614. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/classification/clip_finetune.yaml +0 -0
  615. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/clip_finetune.yaml +0 -0
  616. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/concrete_subspace/clip_concrete_layer_wise_adamerging.yaml +0 -0
  617. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/concrete_subspace/clip_concrete_task_arithmetic.yaml +0 -0
  618. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/concrete_subspace/clip_concrete_task_wise_adamerging.yaml +0 -0
  619. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/concrete_subspace/clip_post_defense_AWM.yaml +0 -0
  620. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/concrete_subspace/clip_post_defense_SAU.yaml +0 -0
  621. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/concrete_subspace/clip_safe_concrete_layer_wise_adamerging.yaml +0 -0
  622. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/concrete_subspace/clip_safe_concrete_task_arithmetic.yaml +0 -0
  623. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/dare/simple_average.yaml +0 -0
  624. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/dare/task_arithmetic.yaml +0 -0
  625. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/dare/ties_merging.yaml +0 -0
  626. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/dawe/dawe_for_clip.yaml +0 -0
  627. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/depth_upscaling.yaml +0 -0
  628. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/doge_ta/doge_ta.yaml +0 -0
  629. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/dummy.yaml +0 -0
  630. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/ensemble/max_model_predictor.yaml +0 -0
  631. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/ensemble/simple_ensemble.yaml +0 -0
  632. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/ensemble/weighted_ensemble.yaml +0 -0
  633. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/expert_sparsity/README.md +0 -0
  634. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/expert_sparsity/mixtral.yaml +0 -0
  635. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/fisher_merging/fisher_merging.yaml +0 -0
  636. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/fisher_merging/gpt2_fisher_merging.yaml +0 -0
  637. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/fw_merging/fw_hard.yaml +0 -0
  638. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/fw_merging/fw_soft.yaml +0 -0
  639. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/gossip/layer_wise_clip.yaml +0 -0
  640. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/gossip/layer_wise_flan_t5.yaml +0 -0
  641. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/isotropic_merging/iso_c.yaml +0 -0
  642. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/isotropic_merging/iso_cts.yaml +0 -0
  643. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/linear/expo.yaml +0 -0
  644. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/linear/linear_interpolation.yaml +0 -0
  645. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/linear/llama_expo.yaml +0 -0
  646. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/linear/llama_expo_with_dare.yaml +0 -0
  647. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/linear/task_arithmetic_for_llama.yaml +0 -0
  648. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/linear/weighted_average.yaml +0 -0
  649. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/linear/weighted_average_for_llama.yaml +0 -0
  650. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/lm_finetune/bradley_terry_rm.yaml +0 -0
  651. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/lm_finetune/fullfinetune_sft.yaml +0 -0
  652. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/lm_finetune/peftfinetune_sft.yaml +0 -0
  653. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/mixtral_moe_merging.yaml +0 -0
  654. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/mixtral_moe_upscaling.yaml +0 -0
  655. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/model_recombination.yaml +0 -0
  656. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/moe_pruner/moe_pruner.yaml +0 -0
  657. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/opcm/opcm.yaml +0 -0
  658. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/opcm/task_arithmetic.yaml +0 -0
  659. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/opcm/ties_merging.yaml +0 -0
  660. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/opcm/weight_average.yaml +0 -0
  661. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/pruning/llama_magnitude_pruning.yaml +0 -0
  662. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/pruning/llama_random_pruning.yaml +0 -0
  663. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/pruning/llama_sparsegpt_pruning.yaml +0 -0
  664. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/pruning/llama_wanda_pruning.yaml +0 -0
  665. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/pruning/magnitude_diff_pruning.yaml +0 -0
  666. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/pwe_moe/epo_for_openclip.yaml +0 -0
  667. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/pwe_moe/ls_for_openclip.yaml +0 -0
  668. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/pwe_moe/pwe_moe_ls_for_clip.yaml +0 -0
  669. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/randes/superposed_model_soup.yaml +0 -0
  670. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/randes/superposed_task_arithmetic.yaml +0 -0
  671. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/randes/superposed_task_arithmetic_lora.yaml +0 -0
  672. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/rankone_moe/rankone_moe.yaml +0 -0
  673. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/regmean/clip_regmean.yaml +0 -0
  674. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/regmean/gpt2_regmean.yaml +0 -0
  675. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/regmean/regmean.yaml +0 -0
  676. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/regmean_plusplus/clip_regmean_plusplus.yaml +0 -0
  677. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/simple_average.yaml +0 -0
  678. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/slerp/slerp.yaml +0 -0
  679. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/smile_upscaling/error_accumulation.yaml +0 -0
  680. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/smile_upscaling/projected_energy.yaml +0 -0
  681. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/smile_upscaling/singular_projection_merging.yaml +0 -0
  682. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/smile_upscaling/smile_mistral_upscaling.yaml +0 -0
  683. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/smile_upscaling/smile_upscaling.yaml +0 -0
  684. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/sparselo_pruning/llama_iterative_sparselo.yaml +0 -0
  685. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/sparselo_pruning/llama_pcp_sparselo.yaml +0 -0
  686. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/sparselo_pruning/llama_sparselo.yaml +0 -0
  687. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/surgery/adamerging_surgery.yaml +0 -0
  688. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/tall_mask/task_arithmetic.yaml +0 -0
  689. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/task_arithmetic.yaml +0 -0
  690. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/task_singular_vector/TaskSingularVectorMerging.yaml +0 -0
  691. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/ties_merging.yaml +0 -0
  692. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/trust_region/clip_task_arithmetic.yaml +0 -0
  693. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/wemoe/sparse_weight_ensembling_moe.yaml +0 -0
  694. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/method/wemoe/weight_ensembling_moe.yaml +0 -0
  695. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/README.md +0 -0
  696. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16.yaml +0 -0
  697. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_TALL14.yaml +0 -0
  698. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_TALL20.yaml +0 -0
  699. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_cifar10.yaml +0 -0
  700. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_cifar100.yaml +0 -0
  701. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_dtd.yaml +0 -0
  702. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_eight_tasks.yaml +0 -0
  703. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_emnist_letters.yaml +0 -0
  704. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_eurosat.yaml +0 -0
  705. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_fashion_mnist.yaml +0 -0
  706. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_fer2013.yaml +0 -0
  707. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_food101.yaml +0 -0
  708. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_gtsrb.yaml +0 -0
  709. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_kmnist.yaml +0 -0
  710. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_mnist.yaml +0 -0
  711. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_oxford-iiit-pet.yaml +0 -0
  712. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_oxford_flowers102.yaml +0 -0
  713. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_pcam.yaml +0 -0
  714. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_rendered-sst2.yaml +0 -0
  715. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_resisc45.yaml +0 -0
  716. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_stanford-cars.yaml +0 -0
  717. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_stl10.yaml +0 -0
  718. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_sun397.yaml +0 -0
  719. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch16_svhn.yaml +0 -0
  720. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32.yaml +0 -0
  721. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_TALL10.yaml +0 -0
  722. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_TALL12.yaml +0 -0
  723. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_TALL14.yaml +0 -0
  724. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_TALL16.yaml +0 -0
  725. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_TALL18.yaml +0 -0
  726. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_TALL20.yaml +0 -0
  727. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_cifar10.yaml +0 -0
  728. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_cifar100.yaml +0 -0
  729. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_dtd.yaml +0 -0
  730. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_eight_tasks.yaml +0 -0
  731. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_emnist_letters.yaml +0 -0
  732. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_eurosat.yaml +0 -0
  733. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_fashion_mnist.yaml +0 -0
  734. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_fer2013.yaml +0 -0
  735. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_food101.yaml +0 -0
  736. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_gtsrb.yaml +0 -0
  737. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_kmnist.yaml +0 -0
  738. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_mnist.yaml +0 -0
  739. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_oxford-iiit-pet.yaml +0 -0
  740. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_oxford_flowers102.yaml +0 -0
  741. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_pcam.yaml +0 -0
  742. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_rendered-sst2.yaml +0 -0
  743. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_resisc45.yaml +0 -0
  744. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_stanford-cars.yaml +0 -0
  745. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_stl10.yaml +0 -0
  746. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_sun397.yaml +0 -0
  747. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-base-patch32_svhn.yaml +0 -0
  748. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14.yaml +0 -0
  749. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_TALL14.yaml +0 -0
  750. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_TALL20.yaml +0 -0
  751. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_cifar10.yaml +0 -0
  752. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_cifar100.yaml +0 -0
  753. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_dtd.yaml +0 -0
  754. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_eight_tasks.yaml +0 -0
  755. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_emnist_letters.yaml +0 -0
  756. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_eurosat.yaml +0 -0
  757. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_fashion_mnist.yaml +0 -0
  758. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_fer2013.yaml +0 -0
  759. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_food101.yaml +0 -0
  760. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_gtsrb.yaml +0 -0
  761. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_kmnist.yaml +0 -0
  762. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_mnist.yaml +0 -0
  763. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_oxford-iiit-pet.yaml +0 -0
  764. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_oxford_flowers102.yaml +0 -0
  765. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_pcam.yaml +0 -0
  766. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_rendered-sst2.yaml +0 -0
  767. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_resisc45.yaml +0 -0
  768. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_stanford-cars.yaml +0 -0
  769. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_stl10.yaml +0 -0
  770. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_sun397.yaml +0 -0
  771. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/clip-vit-large-patch14_svhn.yaml +0 -0
  772. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/download_TALL20_models.sh +0 -0
  773. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/clip-vit/generate_vit_model_config.sh +0 -0
  774. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base.yaml +0 -0
  775. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-cola.yaml +0 -0
  776. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-cola_lora-16.yaml +0 -0
  777. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-mnli.yaml +0 -0
  778. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-mnli_lora-16.yaml +0 -0
  779. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-mrpc.yaml +0 -0
  780. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-mrpc_lora-16.yaml +0 -0
  781. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-qnli.yaml +0 -0
  782. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-qnli_lora-16.yaml +0 -0
  783. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-qqp.yaml +0 -0
  784. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-qqp_lora-16.yaml +0 -0
  785. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-rte.yaml +0 -0
  786. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-rte_lora-16.yaml +0 -0
  787. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-sst2.yaml +0 -0
  788. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-sst2_lora-16.yaml +0 -0
  789. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-stsb.yaml +0 -0
  790. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-base_glue-stsb_lora-16.yaml +0 -0
  791. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-large.yaml +0 -0
  792. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-large_glue-cola_lora-16.yaml +0 -0
  793. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-large_glue-mnli_lora-16.yaml +0 -0
  794. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-large_glue-mrpc_lora-16.yaml +0 -0
  795. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-large_glue-qnli_lora-16.yaml +0 -0
  796. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-large_glue-qqp_lora-16.yaml +0 -0
  797. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-large_glue-rte_lora-16.yaml +0 -0
  798. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-large_glue-sst2_lora-16.yaml +0 -0
  799. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/flan-t5-large_glue-stsb_lora-16.yaml +0 -0
  800. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/model/flan-t5/generate_flan-t5.sh +0 -0
  801. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/_template.yaml +0 -0
  802. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch16_TA8.yaml +0 -0
  803. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch16_TA8_lora.yaml +0 -0
  804. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch16_TA8_model_only.yaml +0 -0
  805. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch16_TALL14.yaml +0 -0
  806. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch16_TALL14_model_only.yaml +0 -0
  807. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch16_TALL20.yaml +0 -0
  808. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch16_TALL20_model_only.yaml +0 -0
  809. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch16_individual.yaml +0 -0
  810. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch16_individual_lora.yaml +0 -0
  811. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TA8.yaml +0 -0
  812. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TA8_control_task.yaml +0 -0
  813. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TA8_model_only.yaml +0 -0
  814. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL10.yaml +0 -0
  815. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL12.yaml +0 -0
  816. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL14.yaml +0 -0
  817. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL14_model_only.yaml +0 -0
  818. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL16.yaml +0 -0
  819. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL18.yaml +0 -0
  820. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL20.yaml +0 -0
  821. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL20_model_only.yaml +0 -0
  822. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_cars_and_dtd.yaml +0 -0
  823. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_generalization_exp1.yaml +0 -0
  824. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_generalization_exp2.yaml +0 -0
  825. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_individual.yaml +0 -0
  826. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_mtl.yaml +0 -0
  827. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_robustness_clean.yaml +0 -0
  828. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_robustness_corrupted.yaml +0 -0
  829. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_single_finetuned.yaml +0 -0
  830. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_single_task_projection.yaml +0 -0
  831. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_sun397_and_cars.yaml +0 -0
  832. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_sun397_and_dtd.yaml +0 -0
  833. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_sun397_cars_and_dtd.yaml +0 -0
  834. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_svhn_and_mnist.yaml +0 -0
  835. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_two_tasks_control_task.yaml +0 -0
  836. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-large-patch14_TA8.yaml +0 -0
  837. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-large-patch14_TA8_model_only.yaml +0 -0
  838. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-large-patch14_TALL14.yaml +0 -0
  839. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-large-patch14_TALL14_model_only.yaml +0 -0
  840. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-large-patch14_TALL20.yaml +0 -0
  841. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-large-patch14_TALL20_model_only.yaml +0 -0
  842. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-large-patch14_individual.yaml +0 -0
  843. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/Qwen2.5-7B-math_and_coder.yaml +0 -0
  844. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/deepseek-v2-lite.yaml +0 -0
  845. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/llama_alpaca_cleaned.yaml +0 -0
  846. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/llama_codealpaca.yaml +0 -0
  847. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/llama_for_causallm.yaml +0 -0
  848. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/llama_metamathqa.yaml +0 -0
  849. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/llama_ultrachat.yaml +0 -0
  850. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/mergebench/Llama-3.1-8B-Instruct.yaml +0 -0
  851. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/mergebench/Llama-3.1-8B.yaml +0 -0
  852. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/mergebench/Llama-3.2-3B-Instruct.yaml +0 -0
  853. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/mergebench/Llama-3.2-3B.yaml +0 -0
  854. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/mergebench/gemma-2-2b-it.yaml +0 -0
  855. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/mergebench/gemma-2-2b.yaml +0 -0
  856. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/mergebench/gemma-2-9b-it.yaml +0 -0
  857. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/mergebench/gemma-2-9b.yaml +0 -0
  858. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/mistral-7b.yaml +0 -0
  859. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/mixtral-8x7b.yaml +0 -0
  860. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/mixtral_moe_merging.yaml +0 -0
  861. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/qwen2_math_1.5B_and_R1.yaml +0 -0
  862. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/simle_mixtral_exp_v4.yaml +0 -0
  863. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/single_llama_model.yaml +0 -0
  864. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/CausalLMPool/vicuna-7b-v1.5.yaml +0 -0
  865. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/OpenCLIPVisionModelPool/README.md +0 -0
  866. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/OpenCLIPVisionModelPool/ViT-B-16_TA8.yaml +0 -0
  867. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/OpenCLIPVisionModelPool/ViT-B-32_TA8.yaml +0 -0
  868. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/OpenCLIPVisionModelPool/ViT-B-32_TA_cars_dtd.yaml +0 -0
  869. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/OpenCLIPVisionModelPool/ViT-B-32_TA_sun397_cars.yaml +0 -0
  870. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/OpenCLIPVisionModelPool/ViT-B-32_TA_sun397_dtd.yaml +0 -0
  871. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/OpenCLIPVisionModelPool/ViT-B-32_individual.yaml +0 -0
  872. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/OpenCLIPVisionModelPool/ViT-L-14_TA8.yaml +0 -0
  873. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/Seq2SeqLMPool/_template.yaml +0 -0
  874. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/Seq2SeqLMPool/flan-t5-base_glue.yaml +0 -0
  875. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/Seq2SeqLMPool/flan-t5-base_glue_lora16.yaml +0 -0
  876. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/Seq2SeqLMPool/flan-t5-base_glue_lora16_tta.yaml +0 -0
  877. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/Seq2SeqLMPool/flan-t5-base_glue_tta.yaml +0 -0
  878. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/Seq2SeqLMPool/flan-t5-base_individual.yaml +0 -0
  879. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/Seq2SeqLMPool/flan-t5-large_glue_lora16.yaml +0 -0
  880. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/SequenceClassificationModelPool/llama_preference700k.yaml +0 -0
  881. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/SequenceClassificationModelPool/roberta-base_glue.yaml +0 -0
  882. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/SequenceClassificationModelPool/single_reward_model.yaml +0 -0
  883. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/automodelpool.yaml +0 -0
  884. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/gpt-2_glue.yaml +0 -0
  885. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/nyuv2_modelpool.yaml +0 -0
  886. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/smile_mistral_exp_v1.yaml +0 -0
  887. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/smile_mistral_exp_v2.yaml +0 -0
  888. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/smile_mistral_exp_v3.yaml +0 -0
  889. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/modelpool/smile_mistral_exp_v4.yaml +0 -0
  890. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/nyuv2_config.yaml +0 -0
  891. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/nyuv2_mtl_train.yaml +0 -0
  892. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/path/default.yaml +0 -0
  893. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/_template.yaml +0 -0
  894. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-base-patch32_robustness_corrupted.yaml +0 -0
  895. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-base-patch32_svhn_and_mnist.yaml +0 -0
  896. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-classification_TA8.yaml +0 -0
  897. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-classification_TA8_B16.yaml +0 -0
  898. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-classification_TA8_L14.yaml +0 -0
  899. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-classification_TA8_val.yaml +0 -0
  900. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-classification_TA8_with_control_task.yaml +0 -0
  901. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-classification_TALL14.yaml +0 -0
  902. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-classification_TALL20.yaml +0 -0
  903. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_cifar10.yaml +0 -0
  904. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_cifar100.yaml +0 -0
  905. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_dtd.yaml +0 -0
  906. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_emnist_letters.yaml +0 -0
  907. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_eurosat.yaml +0 -0
  908. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_fashion_mnist.yaml +0 -0
  909. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_fer2013.yaml +0 -0
  910. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_food101.yaml +0 -0
  911. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_gtsrb.yaml +0 -0
  912. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_kmnist.yaml +0 -0
  913. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_mnist.yaml +0 -0
  914. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_oxford-iiit-pet.yaml +0 -0
  915. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_oxford_flowers102.yaml +0 -0
  916. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_oxford_flowers102_val.yaml +0 -0
  917. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_pcam.yaml +0 -0
  918. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_rendered-sst2.yaml +0 -0
  919. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_resisc45.yaml +0 -0
  920. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_stanford-cars.yaml +0 -0
  921. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_stl10.yaml +0 -0
  922. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_sun397.yaml +0 -0
  923. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-single-task_svhn.yaml +0 -0
  924. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip_rankone_wemoe_clip-vit-classification_TA8.yaml +0 -0
  925. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip_sparse_wemoe_clip-vit-classification_TA8.yaml +0 -0
  926. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/LMEvalHarnessTaskPool/lm_eval.yaml +0 -0
  927. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/OpenCLIPVisionModelTaskPool/ViT-B-16_TA8.yaml +0 -0
  928. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/OpenCLIPVisionModelTaskPool/ViT-B-32_TA8.yaml +0 -0
  929. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/OpenCLIPVisionModelTaskPool/ViT-L-14_TA8.yaml +0 -0
  930. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/clip-vit-base-patch32_robustness_clean.yaml +0 -0
  931. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/clip-vit-base-patch32_robustness_corrupted.yaml +0 -0
  932. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/dummy.yaml +0 -0
  933. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/flan-t5_glue_text_generation.yaml +0 -0
  934. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/gpt-2_glue.yaml +0 -0
  935. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/nyuv2_taskpool.yaml +0 -0
  936. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/fusion_bench_config/taskpool/reward_model_evaluation.yaml +0 -0
  937. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/setup.cfg +0 -0
  938. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/tests/test_depth_upscaling.py +0 -0
  939. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/tests/test_simple_average.py +0 -0
  940. {fusion_bench-0.2.21 → fusion_bench-0.2.22}/tests/test_weighed_ensemble.py +0 -0
@@ -1,30 +1,8 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: fusion_bench
3
- Version: 0.2.21
3
+ Version: 0.2.22
4
4
  Summary: A Comprehensive Benchmark of Deep Model Fusion
5
5
  Author-email: Anke Tang <tang.anke@foxmail.com>
6
- License: MIT License
7
-
8
- Copyright (c) 2024 Anke Tang
9
-
10
- Permission is hereby granted, free of charge, to any person obtaining a copy
11
- of this software and associated documentation files (the "Software"), to deal
12
- in the Software without restriction, including without limitation the rights
13
- to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
14
- copies of the Software, and to permit persons to whom the Software is
15
- furnished to do so, subject to the following conditions:
16
-
17
- The above copyright notice and this permission notice shall be included in all
18
- copies or substantial portions of the Software.
19
-
20
- THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
21
- IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
22
- FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
23
- AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
24
- LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
25
- OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
26
- SOFTWARE.
27
-
28
6
  Project-URL: Repository, https://github.com/tanganke/fusion_bench
29
7
  Project-URL: Homepage, https://github.com/tanganke/fusion_bench
30
8
  Project-URL: Issues, https://github.com/tanganke/fusion_bench/issues
@@ -19,9 +19,28 @@ from . import (
19
19
  tasks,
20
20
  utils,
21
21
  )
22
+ from .constants import RuntimeConstants
22
23
  from .method import BaseAlgorithm, BaseModelFusionAlgorithm
23
24
  from .mixins import auto_register_config
24
25
  from .modelpool import BaseModelPool
25
- from .models import separate_io
26
+ from .models import (
27
+ create_default_model_card,
28
+ load_model_card_template,
29
+ save_pretrained_with_remote_code,
30
+ separate_io,
31
+ )
32
+ from .programs import BaseHydraProgram
26
33
  from .taskpool import BaseTaskPool
27
- from .utils import parse_dtype, print_parameters, timeit_context
34
+ from .utils import (
35
+ cache_with_joblib,
36
+ get_rankzero_logger,
37
+ import_object,
38
+ instantiate,
39
+ parse_dtype,
40
+ print_parameters,
41
+ seed_everything_by_time,
42
+ set_default_cache_dir,
43
+ set_print_function_call,
44
+ set_print_function_call_permeanent,
45
+ timeit_context,
46
+ )
@@ -2,6 +2,7 @@
2
2
  import importlib.metadata
3
3
 
4
4
  from .paths import *
5
+ from .runtime import RuntimeConstants
5
6
 
6
7
  # fusionbench version
7
8
  FUSION_BENCH_VERSION = importlib.metadata.version("fusion-bench")
@@ -0,0 +1,57 @@
1
+ import threading
2
+ from pathlib import Path
3
+ from typing import Optional, Union
4
+
5
+
6
+ class RuntimeConstants:
7
+ """
8
+ This class holds constants related to the runtime environment of the Fusion Bench framework.
9
+ It includes default values for cache directories and other runtime configurations.
10
+
11
+ Implemented as a thread-safe singleton to ensure consistent runtime configuration
12
+ across the entire application.
13
+ """
14
+
15
+ _instance: Optional["RuntimeConstants"] = None
16
+ _lock = threading.Lock()
17
+
18
+ def __new__(cls) -> "RuntimeConstants":
19
+ """Create a new instance using singleton pattern with thread safety."""
20
+ with cls._lock:
21
+ # Double-check locking pattern
22
+ if cls._instance is None:
23
+ cls._instance = super(RuntimeConstants, cls).__new__(cls)
24
+ cls._instance._initialized = False
25
+ return cls._instance
26
+
27
+ def __init__(self):
28
+ """Initialize the singleton instance only once."""
29
+ if not self._initialized:
30
+ # Add your runtime constants here
31
+ self._initialized = True
32
+
33
+ debug = False
34
+
35
+ @property
36
+ def cache_dir(self) -> Path:
37
+ from fusion_bench.utils.cache_utils import DEFAULT_CACHE_DIR
38
+
39
+ return DEFAULT_CACHE_DIR
40
+
41
+ @cache_dir.setter
42
+ def cache_dir(self, path: Union[str, Path]) -> None:
43
+ from fusion_bench.utils.cache_utils import set_default_cache_dir
44
+
45
+ set_default_cache_dir(path)
46
+
47
+ @property
48
+ def print_function_call(self) -> bool:
49
+ from fusion_bench.utils.instantiate_utils import PRINT_FUNCTION_CALL
50
+
51
+ return PRINT_FUNCTION_CALL
52
+
53
+ @print_function_call.setter
54
+ def print_function_call(self, enable: bool) -> None:
55
+ from fusion_bench.utils.instantiate_utils import set_print_function_call
56
+
57
+ set_print_function_call(enable)
@@ -90,7 +90,10 @@ _import_structure = {
90
90
  "MixtralForCausalLMMergingAlgorithm",
91
91
  ],
92
92
  "dawe": ["DataAdaptiveWeightEnsemblingForCLIP"],
93
- "we_moe": ["CLIPWeightEnsemblingMoEAlgorithm"],
93
+ "we_moe": [
94
+ "CLIPWeightEnsemblingMoEAlgorithm",
95
+ "FlanT5WeightEnsemblingMoEAlgorithm",
96
+ ],
94
97
  "rankone_moe": ["CLIPRankOneMoEAlgorithm", "RankOneMoEAlgorithm"],
95
98
  "sparse_we_moe": [
96
99
  "SparseWeightEnsemblingMoEAlgorithm",
@@ -228,7 +231,10 @@ if TYPE_CHECKING:
228
231
  from .task_arithmetic import TaskArithmeticAlgorithm
229
232
  from .task_singular_vector import TaskSingularVectorMerging
230
233
  from .ties_merging import TiesMergingAlgorithm
231
- from .we_moe import CLIPWeightEnsemblingMoEAlgorithm
234
+ from .we_moe import (
235
+ CLIPWeightEnsemblingMoEAlgorithm,
236
+ FlanT5WeightEnsemblingMoEAlgorithm,
237
+ )
232
238
  from .weighted_average import WeightedAverageAlgorithm, WeightedAverageForLLama
233
239
 
234
240
  else:
@@ -1,4 +1,5 @@
1
1
  """
2
2
  Adapted from https://github.com/FasterDecoding/BitDelta
3
3
  """
4
+
4
5
  from .bitdelta import BitDeltaAlgorithm
@@ -393,7 +393,7 @@ def convert_l_lora_state_dict_to_hf(
393
393
  base_model_name: Optional[str] = None,
394
394
  ):
395
395
  """
396
- Convert a linearized Lora model's checkpoint to Hugggingface's format.
396
+ Convert a linearized Lora model's checkpoint to huggingface's format.
397
397
 
398
398
  Args:
399
399
  pretrained_path (str): The path to the pretrained model.
@@ -32,7 +32,6 @@ class FisherMergingForCLIPVisionModel(
32
32
  zeroshot_weights = {}
33
33
 
34
34
  _config_mapping = FisherMergingAlgorithm._config_mapping | {
35
- "zeroshot_weights_cache_dir": "zeroshot_weights_cache_dir",
36
35
  "_dataloader_kwargs": "dataloader_kwargs",
37
36
  }
38
37
 
@@ -44,7 +43,6 @@ class FisherMergingForCLIPVisionModel(
44
43
  minimal_fisher_weight,
45
44
  num_fisher_examples,
46
45
  dataloader_kwargs: DictConfig,
47
- zeroshot_weights_cache_dir=None,
48
46
  **kwargs,
49
47
  ):
50
48
  """
@@ -56,7 +54,6 @@ class FisherMergingForCLIPVisionModel(
56
54
  minimal_fisher_weight (float): Minimal value for Fisher weights to avoid numerical issues.
57
55
  num_fisher_examples (int): Number of examples to compute Fisher weights.
58
56
  dataloader_kwargs (DictConfig): Configuration for the dataloader.
59
- zeroshot_weights_cache_dir (str, optional): Directory to cache zero-shot weights. Defaults to None.
60
57
  **kwargs: Additional keyword arguments.
61
58
  """
62
59
  super().__init__(
@@ -66,7 +63,6 @@ class FisherMergingForCLIPVisionModel(
66
63
  num_fisher_examples=num_fisher_examples,
67
64
  )
68
65
  self.dataloader_kwargs = dataloader_kwargs
69
- self.zeroshot_weights_cache_dir = zeroshot_weights_cache_dir
70
66
  for key, value in kwargs.items():
71
67
  log.warning(f"Unused argument: {key}={value}")
72
68
  setattr(self, key, value)
@@ -15,10 +15,10 @@ from transformers import GPT2ForSequenceClassification, GPT2Model
15
15
  from transformers.data import default_data_collator
16
16
  from transformers.models.gpt2.modeling_gpt2 import Conv1D
17
17
 
18
- from fusion_bench.mixins import LightningFabricMixin
18
+ from fusion_bench.mixins import LightningFabricMixin, auto_register_config
19
19
  from fusion_bench.modelpool import GPT2ForSequenceClassificationPool
20
20
  from fusion_bench.utils import timeit_context
21
- from fusion_bench.mixins import auto_register_config
21
+
22
22
  from .fisher_merging import FisherMergingAlgorithm, get_param_squared_gradients
23
23
 
24
24
 
@@ -1,3 +1,4 @@
1
+ import os
1
2
  from copy import deepcopy
2
3
  from typing import TYPE_CHECKING, Optional
3
4
 
@@ -7,13 +8,16 @@ from typing_extensions import override
7
8
  from fusion_bench import timeit_context
8
9
  from fusion_bench.method.base_algorithm import BaseAlgorithm
9
10
  from fusion_bench.method.simple_average import SimpleAverageAlgorithm
11
+ from fusion_bench.mixins import auto_register_config
10
12
  from fusion_bench.modelpool import CausalLMBackbonePool, CausalLMPool
13
+ from fusion_bench.models.hf_utils import create_default_model_card
11
14
  from fusion_bench.utils import instantiate
12
- from fusion_bench.utils.pylogger import getRankZeroLogger
15
+ from fusion_bench.utils.pylogger import get_rankzero_logger
13
16
 
14
- log = getRankZeroLogger(__name__)
17
+ log = get_rankzero_logger(__name__)
15
18
 
16
19
 
20
+ @auto_register_config
17
21
  class SimpleAverageForLlama(BaseAlgorithm):
18
22
  R"""
19
23
  A simple averaging algorithm for LLama models. If `merge_backbone` is set to `True`, the backbone of the model will be averaged and the rest of the model will be loaded from the pre-trained model.
@@ -29,21 +33,14 @@ class SimpleAverageForLlama(BaseAlgorithm):
29
33
  ```
30
34
  """
31
35
 
32
- _config_mapping = BaseAlgorithm._config_mapping | {
33
- "merge_backbone": "merge_backbone",
34
- "show_pbar": "show_pbar",
35
- }
36
-
37
36
  def __init__(
38
37
  self,
39
38
  merge_backbone: bool,
40
39
  model_save_path: Optional[str] = None,
41
40
  show_pbar: bool = False,
41
+ **kwargs,
42
42
  ):
43
- super().__init__()
44
- self.merge_backbone = merge_backbone
45
- self.model_save_path = model_save_path
46
- self.show_pbar = show_pbar
43
+ super().__init__(**kwargs)
47
44
 
48
45
  @override
49
46
  def run(self, modelpool: CausalLMPool):
@@ -75,4 +72,12 @@ class SimpleAverageForLlama(BaseAlgorithm):
75
72
  with timeit_context(f"Saving the model to {self.model_save_path}"):
76
73
  tokenizer.save_pretrained(self.model_save_path)
77
74
  model.save_pretrained(self.model_save_path)
75
+ model_card_str = create_default_model_card(
76
+ models=[modelpool.get_model_path(m) for m in modelpool.model_names],
77
+ description="Merged model using simple averaging.",
78
+ algorithm_config=self.config,
79
+ modelpool_config=modelpool.config,
80
+ )
81
+ with open(os.path.join(self.model_save_path, "README.md"), "w") as f:
82
+ f.write(model_card_str)
78
83
  return model
@@ -61,8 +61,8 @@ def simple_average(
61
61
 
62
62
  @auto_register_config
63
63
  class SimpleAverageAlgorithm(
64
- BaseAlgorithm,
65
64
  SimpleProfilerMixin,
65
+ BaseAlgorithm,
66
66
  ):
67
67
  def __init__(self, show_pbar: bool = False, **kwargs):
68
68
  """
@@ -120,13 +120,13 @@ class SimpleAverageAlgorithm(
120
120
  if isinstance(forward_model, LazyStateDict):
121
121
  # if the model is a LazyStateDict, convert it to an empty module
122
122
  forward_model = forward_model.meta_module.to_empty(
123
- device=(
124
- "cpu"
125
- if forward_model._torch_dtype is None
126
- else forward_model._torch_dtype
127
- )
123
+ device=forward_model._device
128
124
  )
129
- forward_model.load_state_dict(sd)
125
+ result = forward_model.load_state_dict(sd, strict=False)
126
+ if result.unexpected_keys:
127
+ raise ValueError(f"Unexpected keys in state dict: {result.unexpected_keys}")
128
+ if result.missing_keys:
129
+ log.warning(f"Missing keys in state dict: {result.missing_keys}")
130
130
  # print profile report and log the merged models
131
131
  self.print_profile_summary()
132
132
  log.info(f"merged {len(merged_model_names)} models:")
@@ -0,0 +1,371 @@
1
+ import logging
2
+ import os
3
+ from copy import deepcopy
4
+ from typing import TYPE_CHECKING, Any, Dict, List, Tuple, Type, Union
5
+
6
+ import torch
7
+ from accelerate import init_empty_weights
8
+ from tqdm.auto import tqdm
9
+ from transformers import (
10
+ AutoConfig,
11
+ AutoModelForCausalLM,
12
+ AutoTokenizer,
13
+ LlamaForCausalLM,
14
+ MistralForCausalLM,
15
+ PretrainedConfig,
16
+ PreTrainedModel,
17
+ Qwen2ForCausalLM,
18
+ )
19
+ from transformers.models.llama.modeling_llama import LlamaDecoderLayer
20
+ from transformers.models.mistral.modeling_mistral import MistralDecoderLayer
21
+ from transformers.models.qwen2.modeling_qwen2 import Qwen2DecoderLayer
22
+
23
+ from fusion_bench import BaseAlgorithm, BaseModelPool
24
+ from fusion_bench.compat.modelpool import to_modelpool
25
+ from fusion_bench.constants import RuntimeConstants
26
+ from fusion_bench.mixins import SimpleProfilerMixin, auto_register_config
27
+ from fusion_bench.modelpool import CausalLMPool
28
+ from fusion_bench.models.hf_utils import (
29
+ create_default_model_card,
30
+ save_pretrained_with_remote_code,
31
+ )
32
+ from fusion_bench.models.modeling_smile_llama import (
33
+ SmileLlamaConfig,
34
+ SmileLlamaForCausalLM,
35
+ SmileLlamaModel,
36
+ )
37
+ from fusion_bench.models.modeling_smile_llama.modeling_smile_llama import (
38
+ SmileLlamaDecoderLayer,
39
+ )
40
+ from fusion_bench.models.modeling_smile_mistral import (
41
+ SmileMistralConfig,
42
+ SmileMistralForCausalLM,
43
+ SmileMistralModel,
44
+ )
45
+ from fusion_bench.models.modeling_smile_mistral.modeling_smile_mistral import (
46
+ SmileMistralDecoderLayer,
47
+ )
48
+
49
+ # Import all SMILE configurations and models
50
+ from fusion_bench.models.modeling_smile_qwen2 import (
51
+ SmileQwen2Config,
52
+ SmileQwen2ForCausalLM,
53
+ SmileQwen2Model,
54
+ )
55
+ from fusion_bench.models.modeling_smile_qwen2.modeling_smile_qwen2 import (
56
+ SmileQwen2DecoderLayer,
57
+ )
58
+ from fusion_bench.models.smile_moe.linear_from_hf_config import (
59
+ ExpertNotTrainedError,
60
+ upscale_to_smile_linear,
61
+ )
62
+ from fusion_bench.utils.dtype import parse_dtype
63
+ from fusion_bench.utils.parameters import print_parameters
64
+
65
+ log = logging.getLogger(__name__)
66
+
67
+ # Model type mappings
68
+ MODEL_TYPE_MAPPINGS = {
69
+ "qwen2": {
70
+ "base_model_cls": Qwen2ForCausalLM,
71
+ "base_decoder_layer_cls": Qwen2DecoderLayer,
72
+ "smile_config_cls": SmileQwen2Config,
73
+ "smile_model_cls": SmileQwen2ForCausalLM,
74
+ "smile_base_model_cls": SmileQwen2Model,
75
+ "smile_decoder_layer_cls": SmileQwen2DecoderLayer,
76
+ "description": "Qwen2",
77
+ },
78
+ "llama": {
79
+ "base_model_cls": LlamaForCausalLM,
80
+ "base_decoder_layer_cls": LlamaDecoderLayer,
81
+ "smile_config_cls": SmileLlamaConfig,
82
+ "smile_model_cls": SmileLlamaForCausalLM,
83
+ "smile_base_model_cls": SmileLlamaModel,
84
+ "smile_decoder_layer_cls": SmileLlamaDecoderLayer,
85
+ "description": "Llama",
86
+ },
87
+ "mistral": {
88
+ "base_model_cls": MistralForCausalLM,
89
+ "base_decoder_layer_cls": MistralDecoderLayer,
90
+ "smile_config_cls": SmileMistralConfig,
91
+ "smile_model_cls": SmileMistralForCausalLM,
92
+ "smile_base_model_cls": SmileMistralModel,
93
+ "smile_decoder_layer_cls": SmileMistralDecoderLayer,
94
+ "description": "Mistral",
95
+ },
96
+ }
97
+
98
+
99
+ def detect_model_type(
100
+ model_or_config: Union[PreTrainedModel, PretrainedConfig, str],
101
+ ) -> str:
102
+ """
103
+ Detect the model type from a model, config, or model name/path.
104
+
105
+ Args:
106
+ model_or_config: Model, config, or model name/path to detect type from
107
+
108
+ Returns:
109
+ str: The detected model type ("qwen2", "llama", "mistral")
110
+
111
+ Raises:
112
+ ValueError: If model type cannot be detected or is not supported
113
+ """
114
+ if isinstance(model_or_config, str):
115
+ # Load config from path/name
116
+ config = AutoConfig.from_pretrained(model_or_config)
117
+ elif isinstance(model_or_config, PreTrainedModel):
118
+ config = model_or_config.config
119
+ elif isinstance(model_or_config, PretrainedConfig):
120
+ config = model_or_config
121
+ else:
122
+ raise ValueError(
123
+ f"Unsupported type for model type detection: {type(model_or_config)}"
124
+ )
125
+
126
+ model_type = getattr(config, "model_type", "").lower()
127
+
128
+ # Handle various model type variations
129
+ if model_type in MODEL_TYPE_MAPPINGS:
130
+ return model_type
131
+ else:
132
+ raise ValueError(
133
+ f"Unsupported model type: {model_type}. Supported types: {list(MODEL_TYPE_MAPPINGS.keys())}"
134
+ )
135
+
136
+
137
+ @auto_register_config
138
+ class SmileCausalLMUpscalingAlgorithm(
139
+ SimpleProfilerMixin,
140
+ BaseAlgorithm,
141
+ ):
142
+ R"""
143
+ SmileCausalLMUpscalingAlgorithm is a generic model fusion algorithm designed to upscale
144
+ a pretrained CausalLM model using a set of fine-tuned expert models. The algorithm
145
+ supports Qwen2, Llama, and Mistral model architectures and leverages Singular Value
146
+ Decomposition (SVD) to merge the weights of the pretrained model and the expert models
147
+ into a new upscaled model.
148
+
149
+ The algorithm automatically detects the model type and uses the appropriate SMILE
150
+ configuration and model classes.
151
+
152
+ Methods:
153
+ run(modelpool: BaseModelPool) -> Union[SmileQwen2ForCausalLM, SmileLlamaForCausalLM, SmileMistralForCausalLM]:
154
+ Executes the upscaling process and returns the upscaled model.
155
+
156
+ merge(pretrained_model: PreTrainedModel, finetuned_models: List[PreTrainedModel]) -> PreTrainedModel:
157
+ Merges the pretrained model with the fine-tuned models to create an upscaled model.
158
+ """
159
+
160
+ modelpool: CausalLMPool
161
+
162
+ def __init__(
163
+ self,
164
+ device,
165
+ accelerator,
166
+ model_save_path,
167
+ model_dtype,
168
+ num_experts_per_tok,
169
+ rank_of_router,
170
+ rank_of_expert,
171
+ save_with_remote_code: bool = True,
172
+ model_type: str = None, # Optional: explicitly specify model type
173
+ **kwargs,
174
+ ):
175
+ super().__init__(**kwargs)
176
+ self.model_mappings = None # Will be set during run()
177
+
178
+ if not torch.cuda.is_available():
179
+ if "cuda" in self.device:
180
+ self.device = "cpu"
181
+ if "cuda" in self.accelerator:
182
+ self.accelerator = "cpu"
183
+
184
+ @torch.no_grad()
185
+ def run(self, modelpool) -> PreTrainedModel:
186
+ """
187
+ Executes the upscaling process.
188
+
189
+ Args:
190
+ modelpool (ModelPool): The pool of models to be used for upscaling.
191
+
192
+ Returns:
193
+ PreTrainedModel: The upscaled model (specific type depends on detected model architecture).
194
+ """
195
+ self.modelpool = modelpool = to_modelpool(modelpool)
196
+ config = self.config
197
+
198
+ # Auto-detect model type if not specified
199
+ if self.model_type is None:
200
+ self.model_type = detect_model_type(
201
+ modelpool.get_model_path("_pretrained_")
202
+ )
203
+ log.info(f"Auto-detected model type: {self.model_type}")
204
+
205
+ # Get the appropriate model mappings
206
+ if self.model_type not in MODEL_TYPE_MAPPINGS:
207
+ raise ValueError(
208
+ f"Unsupported model type: {self.model_type}. Supported: {list(MODEL_TYPE_MAPPINGS.keys())}"
209
+ )
210
+
211
+ self.model_mappings = MODEL_TYPE_MAPPINGS[self.model_type]
212
+ log.info(f"Using {self.model_mappings['description']} model architecture")
213
+
214
+ with self.profile("load pretrained model"):
215
+ pretrained_model = modelpool.load_pretrained_model()
216
+
217
+ with self.profile("load fine-tuned model"):
218
+ finetuned_models = [
219
+ m for m in tqdm(modelpool.models(), total=len(modelpool.model_names))
220
+ ]
221
+
222
+ if self.device == "cuda" and torch.cuda.is_available():
223
+ pretrained_model = pretrained_model.cuda()
224
+ print("parameter count of pretrained model:")
225
+ print_parameters(pretrained_model)
226
+ finetuned_models = [m.cuda() for m in finetuned_models]
227
+
228
+ with self.profile("merge model"):
229
+ model = self.merge(pretrained_model, finetuned_models)
230
+
231
+ self.print_profile_summary()
232
+ print("parameter count of upscaled MoE model:")
233
+ print_parameters(model)
234
+ print(model)
235
+
236
+ if self.model_dtype is not None:
237
+ model.to(dtype=parse_dtype(self.model_dtype))
238
+
239
+ if self.model_save_path is not None:
240
+ if os.path.dirname(self.model_save_path):
241
+ os.makedirs(os.path.dirname(self.model_save_path), exist_ok=True)
242
+ log.info(f"Saving model to {self.model_save_path}")
243
+ tokenizer = self.modelpool.load_tokenizer()
244
+ tokenizer.save_pretrained(self.model_save_path)
245
+ if not self.save_with_remote_code:
246
+ model.save_pretrained(self.model_save_path)
247
+ else:
248
+ # Use the appropriate auto_map for the detected model type
249
+ auto_map = {
250
+ "AutoConfig": self.model_mappings["smile_config_cls"],
251
+ "AutoModel": self.model_mappings["smile_base_model_cls"],
252
+ "AutoModelForCausalLM": self.model_mappings["smile_model_cls"],
253
+ }
254
+ save_pretrained_with_remote_code(
255
+ model,
256
+ auto_map=auto_map,
257
+ save_directory=self.model_save_path,
258
+ )
259
+
260
+ # save readme
261
+ model_card_str = create_default_model_card(
262
+ models=[modelpool.get_model_path(m) for m in modelpool.all_model_names],
263
+ description=f"Merged {self.model_mappings['description']} model using SMILE Upscaling",
264
+ algorithm_config=self.config,
265
+ modelpool_config=modelpool.config,
266
+ )
267
+ with open(os.path.join(self.model_save_path, "README.md"), "w") as f:
268
+ f.write(model_card_str)
269
+
270
+ return model
271
+
272
def merge(
    self,
    pretrained_model: PreTrainedModel,
    finetuned_models: List[PreTrainedModel],
) -> PreTrainedModel:
    """
    Merges the pretrained model with the fine-tuned models to create an upscaled model.

    The method proceeds in three steps:

    1. Build the SMILE config/model classes selected in ``self.model_mappings``
       from the base config of the ``"_pretrained_"`` entry of the model pool.
       The model is instantiated under ``init_empty_weights()``, cast to the
       dtype of ``pretrained_model`` and materialized on CPU via ``to_empty``.
    2. Copy every pretrained weight whose key also exists in the new model
       (``load_state_dict(..., strict=False)``).
    3. For each decoder layer, call ``upscale_to_smile_linear`` on the attention
       projections (``q_proj``, ``k_proj``, ``v_proj``, ``o_proj``) and the MLP
       projections (``gate_proj``, ``up_proj``, ``down_proj``). When that call
       raises ``ExpertNotTrainedError`` the pretrained module is placed on the
       target layer instead.

    When ``RuntimeConstants.debug`` is truthy only the first decoder layer is
    processed.

    Args:
        pretrained_model (PreTrainedModel): The pretrained model.
        finetuned_models (List[PreTrainedModel]): A list of fine-tuned models.

    Returns:
        PreTrainedModel: The upscaled model (specific type depends on model architecture).
    """
    with init_empty_weights():
        pretrained_model_config = self.modelpool.get_model_config("_pretrained_")
        if isinstance(pretrained_model_config, str):
            pretrained_path = pretrained_model_config
        else:
            # Look up the fallback key lazily: passing it as the ``default``
            # argument of ``.get`` would evaluate it eagerly and fail for
            # configs that only define "path".
            pretrained_path = pretrained_model_config.get("path")
            if pretrained_path is None:
                pretrained_path = pretrained_model_config[
                    "pretrained_model_name_or_path"
                ]
        base_config = AutoConfig.from_pretrained(pretrained_path)

        # Create the appropriate SMILE config for the detected model type
        SmileConfigClass = self.model_mappings["smile_config_cls"]
        model_config = SmileConfigClass(
            num_experts_per_tok=self.num_experts_per_tok,
            rank_of_router=self.rank_of_router,
            rank_of_expert=self.rank_of_expert,
            num_local_experts=len(finetuned_models),
            **base_config.to_dict(),
        )

        # Create the appropriate SMILE model for the detected model type
        SmileModelClass = self.model_mappings["smile_model_cls"]
        model = SmileModelClass(model_config)

    model.to(dtype=pretrained_model.dtype).to_empty(device="cpu")

    # copy pretrained model weights (only the keys the upscaled model also has)
    state_dict = model.state_dict()
    shared_state_dict = {
        key: value
        for key, value in pretrained_model.state_dict().items()
        if key in state_dict
    }
    model.load_state_dict(shared_state_dict, strict=False)

    # upscale model: (sub-module of a decoder layer, projections inside it)
    projection_groups = (
        ("self_attn", ("q_proj", "k_proj", "v_proj", "o_proj")),
        ("mlp", ("gate_proj", "up_proj", "down_proj")),
    )

    for layer_idx in tqdm(
        range(len(pretrained_model.model.layers)),
        "Upscaling Modules (layer)",
        dynamic_ncols=True,
    ):
        if RuntimeConstants.debug and layer_idx > 0:
            log.info(
                "Debug mode enabled: processing only the first layer, skipping remaining layers"
            )
            break

        pretrained_layer = pretrained_model.model.layers[layer_idx]
        finetuned_layers = [m.model.layers[layer_idx] for m in finetuned_models]
        target_layer = model.model.layers[layer_idx]

        for submodule_name, projection_names in projection_groups:
            base_module = getattr(pretrained_layer, submodule_name)
            expert_modules = [
                getattr(layer, submodule_name) for layer in finetuned_layers
            ]
            target_module = getattr(target_layer, submodule_name)

            for n in projection_names:
                try:
                    upscale_to_smile_linear(
                        base=getattr(base_module, n),
                        experts=[getattr(m, n) for m in expert_modules],
                        target=getattr(target_module, n),
                        accelerator=self.accelerator,
                    )
                except ExpertNotTrainedError:
                    # Fall back to the pretrained projection for this slot.
                    setattr(target_module, n, getattr(base_module, n))

    return model