fusion-bench 0.2.19__py3-none-any.whl → 0.2.21__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- fusion_bench/__init__.py +1 -0
- fusion_bench/_get_started/__init__.py +3 -0
- fusion_bench/_get_started/greeting_program.py +49 -0
- fusion_bench/compat/method/base_algorithm.py +14 -0
- fusion_bench/constants/__init__.py +5 -0
- fusion_bench/constants/clip_vision.py +26 -2
- fusion_bench/constants/paths.py +4 -0
- fusion_bench/dataset/clip_dataset.py +2 -1
- fusion_bench/dataset/gpt2_glue.py +9 -9
- fusion_bench/dataset/image_corruption/__init__.py +0 -0
- fusion_bench/dataset/image_corruption/make_corruption.py +179 -0
- fusion_bench/dataset/image_dataset.py +1 -1
- fusion_bench/dataset/nyuv2.py +2 -2
- fusion_bench/method/__init__.py +16 -1
- fusion_bench/method/adamerging/clip_layer_wise_adamerging.py +1 -1
- fusion_bench/method/adamerging/clip_task_wise_adamerging.py +11 -7
- fusion_bench/method/adamerging/layer_wise_adamerging.py +11 -5
- fusion_bench/method/base_algorithm.py +195 -12
- fusion_bench/method/bitdelta/__init__.py +4 -0
- fusion_bench/method/bitdelta/bitdelta.py +156 -0
- fusion_bench/method/bitdelta/bitdelta_utils/__init__.py +0 -0
- fusion_bench/method/bitdelta/bitdelta_utils/binary_gemm_kernel.py +462 -0
- fusion_bench/method/bitdelta/bitdelta_utils/data.py +35 -0
- fusion_bench/method/bitdelta/bitdelta_utils/diff.py +129 -0
- fusion_bench/method/concrete_subspace/clip_concrete_adamerging.py +0 -1
- fusion_bench/method/depth_upscaling/depth_upscaling.py +4 -9
- fusion_bench/method/doge_ta/clip_layer_wise_adamerging.py +4 -5
- fusion_bench/method/doge_ta/doge_ta.py +1 -1
- fusion_bench/method/ensemble.py +12 -12
- fusion_bench/method/expert_sparsity/utils/calibration_data.py +1 -1
- fusion_bench/method/fisher_merging/clip_fisher_merging.py +2 -2
- fusion_bench/method/fisher_merging/fisher_merging.py +6 -15
- fusion_bench/method/fisher_merging/gpt2_fisher_merging.py +3 -10
- fusion_bench/method/fw_merging/fw_hard.py +1 -1
- fusion_bench/method/fw_merging/fw_soft.py +1 -1
- fusion_bench/method/gossip/clip_layer_wise_gossip.py +4 -5
- fusion_bench/method/linear/expo.py +2 -1
- fusion_bench/method/linear/linear_interpolation.py +6 -4
- fusion_bench/method/linear/simple_average_for_llama.py +16 -6
- fusion_bench/method/lm_finetune/bradley_terry_rm.py +2 -2
- fusion_bench/method/mixture_of_experts/mixtral_upcycling.py +9 -26
- fusion_bench/method/model_recombination.py +2 -5
- fusion_bench/method/moe_pruner/hooks/__init__.py +1 -2
- fusion_bench/method/moe_pruner/utils/data.py +2 -1
- fusion_bench/method/moe_pruner/utils/prune.py +6 -1
- fusion_bench/method/pruning/llama_magnitude_prune.py +1 -1
- fusion_bench/method/pruning/wanda_utils/data.py +1 -2
- fusion_bench/method/pwe_moe/clip_pwe_moe.py +12 -34
- fusion_bench/method/randes/modelsoup.py +1 -3
- fusion_bench/method/regmean/clip_regmean.py +2 -2
- fusion_bench/method/regmean/gpt2_regmean.py +3 -10
- fusion_bench/method/regmean/regmean.py +2 -11
- fusion_bench/method/regmean_plusplus/__init__.py +3 -0
- fusion_bench/method/regmean_plusplus/clip_regmean_plusplus.py +199 -0
- fusion_bench/method/regmean_plusplus/regmean_plusplus.py +383 -0
- fusion_bench/method/simple_average.py +16 -4
- fusion_bench/method/slerp/slerp.py +5 -2
- fusion_bench/method/smile_upscaling/error_accumulation.py +177 -0
- fusion_bench/method/smile_upscaling/projected_energy.py +145 -0
- fusion_bench/method/smile_upscaling/smile_qwen2_upscaling.py +39 -28
- fusion_bench/method/smile_upscaling/smile_upscaling.py +12 -5
- fusion_bench/method/tall_mask/task_arithmetic.py +3 -11
- fusion_bench/method/task_arithmetic/task_arithmetic.py +6 -10
- fusion_bench/method/ties_merging/ties_merging.py +13 -26
- fusion_bench/method/we_moe/clip_we_moe.py +5 -4
- fusion_bench/method/we_moe/we_moe.py +6 -6
- fusion_bench/method/weighted_average/llama.py +4 -16
- fusion_bench/metrics/continual_learning/__init__.py +1 -0
- fusion_bench/metrics/continual_learning/backward_transfer.py +1 -1
- fusion_bench/metrics/nyuv2/__init__.py +2 -2
- fusion_bench/metrics/nyuv2/segmentation.py +1 -1
- fusion_bench/mixins/__init__.py +10 -2
- fusion_bench/mixins/clip_classification.py +4 -3
- fusion_bench/mixins/hydra_config.py +105 -7
- fusion_bench/mixins/lightning_fabric.py +2 -0
- fusion_bench/mixins/serialization.py +265 -48
- fusion_bench/modelpool/__init__.py +2 -2
- fusion_bench/modelpool/base_pool.py +29 -9
- fusion_bench/modelpool/causal_lm/causal_lm.py +9 -0
- fusion_bench/modelpool/clip_vision/modelpool.py +43 -12
- fusion_bench/modelpool/seq_classification_lm/__init__.py +1 -1
- fusion_bench/modelpool/seq_classification_lm/seq_classification_lm.py +1 -1
- fusion_bench/models/__init__.py +2 -1
- fusion_bench/models/expert_sparsity/mixtral/__init__.py +1 -1
- fusion_bench/models/hf_utils.py +182 -0
- fusion_bench/models/linearized/linearized_model_utils.py +4 -4
- fusion_bench/models/linearized/vision_model.py +1 -1
- fusion_bench/models/modeling_deepseek_v2/__init__.py +1 -1
- fusion_bench/models/modeling_deepseek_v2/modeling_deepseek.py +4 -4
- fusion_bench/models/modeling_deepseek_v2/tokenization_deepseek_fast.py +0 -1
- fusion_bench/models/modeling_smile_gemma2/__init__.py +9 -0
- fusion_bench/models/modeling_smile_gemma2/configuration_smile_gemma2.py +20 -0
- fusion_bench/models/modeling_smile_gemma2/modeling_smile_gemma2.py +986 -0
- fusion_bench/models/modeling_smile_gemma2/register.py +26 -0
- fusion_bench/models/modeling_smile_llama/__init__.py +0 -0
- fusion_bench/models/modeling_smile_llama/configuration_smile_llama.py +20 -0
- fusion_bench/models/modeling_smile_llama/modeling_smile_llama.py +705 -0
- fusion_bench/models/modeling_smile_llama/register.py +8 -0
- fusion_bench/models/modeling_smile_mistral/__init__.py +5 -47
- fusion_bench/models/modeling_smile_qwen2/__init__.py +1 -1
- fusion_bench/models/modeling_smile_qwen2/modeling_smile_qwen2.py +6 -7
- fusion_bench/models/modeling_smile_qwen2/register.py +1 -4
- fusion_bench/models/parameter_dict.py +1 -1
- fusion_bench/models/sparse_we_moe.py +1 -53
- fusion_bench/models/utils.py +26 -0
- fusion_bench/models/we_moe.py +1 -53
- fusion_bench/models/wrappers/ensemble.py +6 -4
- fusion_bench/models/wrappers/layer_wise_fusion.py +1 -1
- fusion_bench/models/wrappers/task_wise_fusion.py +250 -72
- fusion_bench/programs/base_program.py +81 -2
- fusion_bench/programs/fabric_fusion_program.py +24 -8
- fusion_bench/scripts/cli.py +6 -6
- fusion_bench/taskpool/base_pool.py +4 -3
- fusion_bench/taskpool/clip_vision/taskpool.py +34 -18
- fusion_bench/taskpool/dummy.py +1 -1
- fusion_bench/taskpool/lm_eval_harness/taskpool.py +1 -2
- fusion_bench/tasks/clip_classification/__init__.py +6 -4
- fusion_bench/utils/__init__.py +6 -1
- fusion_bench/utils/devices.py +14 -4
- fusion_bench/utils/instantiate_utils.py +3 -1
- fusion_bench/utils/misc.py +48 -2
- fusion_bench/utils/modelscope.py +265 -0
- fusion_bench/utils/parameters.py +2 -2
- fusion_bench/utils/rich_utils.py +3 -0
- fusion_bench/utils/state_dict_arithmetic.py +34 -27
- {fusion_bench-0.2.19.dist-info → fusion_bench-0.2.21.dist-info}/METADATA +31 -24
- {fusion_bench-0.2.19.dist-info → fusion_bench-0.2.21.dist-info}/RECORD +189 -153
- fusion_bench_config/_get_started/clip_evaluate_single_model.yaml +21 -0
- fusion_bench_config/_get_started/clip_simple_average.yaml +23 -0
- fusion_bench_config/_get_started/clip_task_arithmetic.yaml +24 -0
- fusion_bench_config/_get_started/greeting_program.yaml +4 -0
- fusion_bench_config/fabric/loggers/csv_logger.yaml +3 -3
- fusion_bench_config/fabric/loggers/tensorboard_logger.yaml +3 -3
- fusion_bench_config/fabric_model_fusion.yaml +45 -17
- fusion_bench_config/hydra/default.yaml +6 -2
- fusion_bench_config/llama_full_finetune.yaml +1 -0
- fusion_bench_config/method/adamerging/clip.yaml +1 -1
- fusion_bench_config/method/bitdelta/bitdelta.yaml +12 -0
- fusion_bench_config/method/depth_upscaling.yaml +4 -1
- fusion_bench_config/method/regmean/clip_regmean.yaml +1 -1
- fusion_bench_config/method/regmean_plusplus/clip_regmean_plusplus.yaml +11 -0
- fusion_bench_config/method/smile_upscaling/error_accumulation.yaml +5 -0
- fusion_bench_config/method/smile_upscaling/projected_energy.yaml +2 -0
- fusion_bench_config/method/smile_upscaling/smile_qwen2_upscaling.yaml +1 -0
- fusion_bench_config/modelpool/CLIPVisionModelPool/_template.yaml +1 -4
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch16_TALL20.yaml +73 -8
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch16_TALL20_model_only.yaml +27 -7
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TA8.yaml +34 -4
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TA8_control_task.yaml +14 -17
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TA8_model_only.yaml +14 -3
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL10.yaml +39 -5
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL12.yaml +49 -5
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL14.yaml +55 -5
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL14_model_only.yaml +21 -4
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL16.yaml +61 -5
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL18.yaml +67 -5
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL20.yaml +73 -5
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL20_model_only.yaml +26 -3
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_individual.yaml +4 -9
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_single_finetuned.yaml +7 -5
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_single_task_projection.yaml +6 -10
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_sun397_and_cars.yaml +6 -7
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_sun397_and_dtd.yaml +6 -7
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_sun397_cars_and_dtd.yaml +7 -8
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_svhn_and_mnist.yaml +8 -6
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_two_tasks_control_task.yaml +4 -6
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-large-patch14_TA8.yaml +32 -7
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-large-patch14_TA8_model_only.yaml +14 -6
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-large-patch14_TALL20.yaml +73 -8
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-large-patch14_TALL20_model_only.yaml +27 -7
- fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-large-patch14_individual.yaml +6 -10
- fusion_bench_config/modelpool/CausalLMPool/Qwen2.5-1.5B_math_and_coder.yaml +2 -2
- fusion_bench_config/modelpool/CausalLMPool/Qwen2.5-7B-math_and_coder.yaml +9 -0
- fusion_bench_config/modelpool/CausalLMPool/mistral-7b.yaml +6 -0
- fusion_bench_config/modelpool/CausalLMPool/mixtral_moe_merging.yaml +10 -0
- fusion_bench_config/modelpool/CausalLMPool/qwen2_math_1.5B_and_R1.yaml +4 -12
- fusion_bench_config/modelpool/CausalLMPool/simle_mixtral_exp_v4.yaml +6 -16
- fusion_bench_config/modelpool/CausalLMPool/vicuna-7b-v1.5.yaml +8 -0
- fusion_bench_config/modelpool/{SeqenceClassificationModelPool → SequenceClassificationModelPool}/llama_preference700k.yaml +1 -1
- fusion_bench_config/modelpool/{SeqenceClassificationModelPool → SequenceClassificationModelPool}/single_reward_model.yaml +1 -1
- fusion_bench_config/nyuv2_config.yaml +3 -1
- fusion_bench_config/nyuv2_mtl_train.yaml +1 -0
- fusion_bench_config/path/default.yaml +28 -0
- fusion_bench_config/taskpool/CLIPVisionModelTaskPool/clip-vit-base-patch32_svhn_and_mnist.yaml +24 -0
- fusion_bench_config/method/adamerging.yaml +0 -23
- fusion_bench_config/modelpool/mixtral_moe_merging.yaml +0 -14
- fusion_bench_config/modelpool/mixtral_moe_upscaling.yaml +0 -6
- fusion_bench_config/taskpool/clip-vit-base-patch32_svhn_and_mnist.yaml +0 -22
- {fusion_bench-0.2.19.dist-info → fusion_bench-0.2.21.dist-info}/WHEEL +0 -0
- {fusion_bench-0.2.19.dist-info → fusion_bench-0.2.21.dist-info}/entry_points.txt +0 -0
- {fusion_bench-0.2.19.dist-info → fusion_bench-0.2.21.dist-info}/licenses/LICENSE +0 -0
- {fusion_bench-0.2.19.dist-info → fusion_bench-0.2.21.dist-info}/top_level.txt +0 -0
- /fusion_bench_config/modelpool/{SeqenceClassificationModelPool → SequenceClassificationModelPool}/roberta-base_glue.yaml +0 -0
|
@@ -1,8 +1,58 @@
|
|
|
1
|
-
# The 14 task used in the paper:
|
|
1
|
+
# The 14 task used in the paper (TALL mask):
|
|
2
2
|
# Wang et al. Localizing Task Information for Improved Model Merging and Compression
|
|
3
3
|
# http://arxiv.org/abs/2405.07813
|
|
4
4
|
defaults:
|
|
5
|
-
-
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
5
|
+
- /dataset/image_classification/train@train_datasets:
|
|
6
|
+
# -- begin of eight tasks in the task arithmetic paper ---
|
|
7
|
+
- sun397
|
|
8
|
+
- stanford-cars
|
|
9
|
+
- resisc45
|
|
10
|
+
- eurosat
|
|
11
|
+
- svhn
|
|
12
|
+
- gtsrb
|
|
13
|
+
- mnist
|
|
14
|
+
- dtd
|
|
15
|
+
# -- end of eight tasks in the task arithmetic paper ---
|
|
16
|
+
- oxford_flowers102
|
|
17
|
+
- pcam
|
|
18
|
+
- fer2013
|
|
19
|
+
- oxford-iiit-pet
|
|
20
|
+
- stl10
|
|
21
|
+
- cifar100
|
|
22
|
+
- /dataset/image_classification/test@test_datasets:
|
|
23
|
+
# -- begin of eight tasks in the task arithmetic paper ---
|
|
24
|
+
- sun397
|
|
25
|
+
- stanford-cars
|
|
26
|
+
- resisc45
|
|
27
|
+
- eurosat
|
|
28
|
+
- svhn
|
|
29
|
+
- gtsrb
|
|
30
|
+
- mnist
|
|
31
|
+
- dtd
|
|
32
|
+
# -- end of eight tasks in the task arithmetic paper ---
|
|
33
|
+
- oxford_flowers102
|
|
34
|
+
- pcam
|
|
35
|
+
- fer2013
|
|
36
|
+
- oxford-iiit-pet
|
|
37
|
+
- stl10
|
|
38
|
+
- cifar100
|
|
39
|
+
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
40
|
+
_recursive_: False
|
|
41
|
+
processor: openai/clip-vit-base-patch32
|
|
42
|
+
models:
|
|
43
|
+
_pretrained_: openai/clip-vit-base-patch32
|
|
44
|
+
sun397: tanganke/clip-vit-base-patch32_sun397
|
|
45
|
+
stanford-cars: tanganke/clip-vit-base-patch32_stanford-cars
|
|
46
|
+
resisc45: tanganke/clip-vit-base-patch32_resisc45
|
|
47
|
+
eurosat: tanganke/clip-vit-base-patch32_eurosat
|
|
48
|
+
svhn: tanganke/clip-vit-base-patch32_svhn
|
|
49
|
+
gtsrb: tanganke/clip-vit-base-patch32_gtsrb
|
|
50
|
+
mnist: tanganke/clip-vit-base-patch32_mnist
|
|
51
|
+
dtd: tanganke/clip-vit-base-patch32_dtd
|
|
52
|
+
oxford_flowers102: tanganke/clip-vit-base-patch32_oxford_flowers102
|
|
53
|
+
pcam: tanganke/clip-vit-base-patch32_pcam
|
|
54
|
+
fer2013: tanganke/clip-vit-base-patch32_fer2013
|
|
55
|
+
oxford-iiit-pet: tanganke/clip-vit-base-patch32_oxford-iiit-pet
|
|
56
|
+
stl10: tanganke/clip-vit-base-patch32_stl10
|
|
57
|
+
cifar100: tanganke/clip-vit-base-patch32_cifar100
|
|
58
|
+
platform: hf
|
fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL14_model_only.yaml
CHANGED
|
@@ -1,6 +1,23 @@
|
|
|
1
|
-
# The 14 task used in the paper:
|
|
1
|
+
# The 14 task used in the paper:
|
|
2
2
|
# Wang et al. Localizing Task Information for Improved Model Merging and Compression
|
|
3
3
|
# http://arxiv.org/abs/2405.07813
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
|
|
4
|
+
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
5
|
+
_recursive_: False
|
|
6
|
+
processor: openai/clip-vit-base-patch32
|
|
7
|
+
models:
|
|
8
|
+
_pretrained_: openai/clip-vit-base-patch32
|
|
9
|
+
sun397: tanganke/clip-vit-base-patch32_sun397
|
|
10
|
+
stanford-cars: tanganke/clip-vit-base-patch32_stanford-cars
|
|
11
|
+
resisc45: tanganke/clip-vit-base-patch32_resisc45
|
|
12
|
+
eurosat: tanganke/clip-vit-base-patch32_eurosat
|
|
13
|
+
svhn: tanganke/clip-vit-base-patch32_svhn
|
|
14
|
+
gtsrb: tanganke/clip-vit-base-patch32_gtsrb
|
|
15
|
+
mnist: tanganke/clip-vit-base-patch32_mnist
|
|
16
|
+
dtd: tanganke/clip-vit-base-patch32_dtd
|
|
17
|
+
oxford_flowers102: tanganke/clip-vit-base-patch32_oxford_flowers102
|
|
18
|
+
pcam: tanganke/clip-vit-base-patch32_pcam
|
|
19
|
+
fer2013: tanganke/clip-vit-base-patch32_fer2013
|
|
20
|
+
oxford-iiit-pet: tanganke/clip-vit-base-patch32_oxford-iiit-pet
|
|
21
|
+
stl10: tanganke/clip-vit-base-patch32_stl10
|
|
22
|
+
cifar100: tanganke/clip-vit-base-patch32_cifar100
|
|
23
|
+
platform: hf
|
|
@@ -1,8 +1,64 @@
|
|
|
1
|
-
# The
|
|
1
|
+
# The 16 task used in the paper (TALL mask):
|
|
2
2
|
# Wang et al. Localizing Task Information for Improved Model Merging and Compression
|
|
3
3
|
# http://arxiv.org/abs/2405.07813
|
|
4
4
|
defaults:
|
|
5
|
-
-
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
5
|
+
- /dataset/image_classification/train@train_datasets:
|
|
6
|
+
# -- begin of eight tasks in the task arithmetic paper ---
|
|
7
|
+
- sun397
|
|
8
|
+
- stanford-cars
|
|
9
|
+
- resisc45
|
|
10
|
+
- eurosat
|
|
11
|
+
- svhn
|
|
12
|
+
- gtsrb
|
|
13
|
+
- mnist
|
|
14
|
+
- dtd
|
|
15
|
+
# -- end of eight tasks in the task arithmetic paper ---
|
|
16
|
+
- oxford_flowers102
|
|
17
|
+
- pcam
|
|
18
|
+
- fer2013
|
|
19
|
+
- oxford-iiit-pet
|
|
20
|
+
- stl10
|
|
21
|
+
- cifar100
|
|
22
|
+
- cifar10
|
|
23
|
+
- food101
|
|
24
|
+
- /dataset/image_classification/test@test_datasets:
|
|
25
|
+
# -- begin of eight tasks in the task arithmetic paper ---
|
|
26
|
+
- sun397
|
|
27
|
+
- stanford-cars
|
|
28
|
+
- resisc45
|
|
29
|
+
- eurosat
|
|
30
|
+
- svhn
|
|
31
|
+
- gtsrb
|
|
32
|
+
- mnist
|
|
33
|
+
- dtd
|
|
34
|
+
# -- end of eight tasks in the task arithmetic paper ---
|
|
35
|
+
- oxford_flowers102
|
|
36
|
+
- pcam
|
|
37
|
+
- fer2013
|
|
38
|
+
- oxford-iiit-pet
|
|
39
|
+
- stl10
|
|
40
|
+
- cifar100
|
|
41
|
+
- cifar10
|
|
42
|
+
- food101
|
|
43
|
+
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
44
|
+
_recursive_: False
|
|
45
|
+
processor: openai/clip-vit-base-patch32
|
|
46
|
+
models:
|
|
47
|
+
_pretrained_: openai/clip-vit-base-patch32
|
|
48
|
+
sun397: tanganke/clip-vit-base-patch32_sun397
|
|
49
|
+
stanford-cars: tanganke/clip-vit-base-patch32_stanford-cars
|
|
50
|
+
resisc45: tanganke/clip-vit-base-patch32_resisc45
|
|
51
|
+
eurosat: tanganke/clip-vit-base-patch32_eurosat
|
|
52
|
+
svhn: tanganke/clip-vit-base-patch32_svhn
|
|
53
|
+
gtsrb: tanganke/clip-vit-base-patch32_gtsrb
|
|
54
|
+
mnist: tanganke/clip-vit-base-patch32_mnist
|
|
55
|
+
dtd: tanganke/clip-vit-base-patch32_dtd
|
|
56
|
+
oxford_flowers102: tanganke/clip-vit-base-patch32_oxford_flowers102
|
|
57
|
+
pcam: tanganke/clip-vit-base-patch32_pcam
|
|
58
|
+
fer2013: tanganke/clip-vit-base-patch32_fer2013
|
|
59
|
+
oxford-iiit-pet: tanganke/clip-vit-base-patch32_oxford-iiit-pet
|
|
60
|
+
stl10: tanganke/clip-vit-base-patch32_stl10
|
|
61
|
+
cifar100: tanganke/clip-vit-base-patch32_cifar100
|
|
62
|
+
cifar10: tanganke/clip-vit-base-patch32_cifar10
|
|
63
|
+
food101: tanganke/clip-vit-base-patch32_food101
|
|
64
|
+
platform: hf
|
|
@@ -1,8 +1,70 @@
|
|
|
1
|
-
# The
|
|
1
|
+
# The 18 task used in the paper:
|
|
2
2
|
# Wang et al. Localizing Task Information for Improved Model Merging and Compression
|
|
3
3
|
# http://arxiv.org/abs/2405.07813
|
|
4
4
|
defaults:
|
|
5
|
-
-
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
5
|
+
- /dataset/image_classification/train@train_datasets:
|
|
6
|
+
# -- begin of eight tasks in the task arithmetic paper ---
|
|
7
|
+
- sun397
|
|
8
|
+
- stanford-cars
|
|
9
|
+
- resisc45
|
|
10
|
+
- eurosat
|
|
11
|
+
- svhn
|
|
12
|
+
- gtsrb
|
|
13
|
+
- mnist
|
|
14
|
+
- dtd
|
|
15
|
+
# -- end of eight tasks in the task arithmetic paper ---
|
|
16
|
+
- oxford_flowers102
|
|
17
|
+
- pcam
|
|
18
|
+
- fer2013
|
|
19
|
+
- oxford-iiit-pet
|
|
20
|
+
- stl10
|
|
21
|
+
- cifar100
|
|
22
|
+
- cifar10
|
|
23
|
+
- food101
|
|
24
|
+
- fashion_mnist
|
|
25
|
+
- emnist_letters
|
|
26
|
+
- /dataset/image_classification/test@test_datasets:
|
|
27
|
+
# -- begin of eight tasks in the task arithmetic paper ---
|
|
28
|
+
- sun397
|
|
29
|
+
- stanford-cars
|
|
30
|
+
- resisc45
|
|
31
|
+
- eurosat
|
|
32
|
+
- svhn
|
|
33
|
+
- gtsrb
|
|
34
|
+
- mnist
|
|
35
|
+
- dtd
|
|
36
|
+
# -- end of eight tasks in the task arithmetic paper ---
|
|
37
|
+
- oxford_flowers102
|
|
38
|
+
- pcam
|
|
39
|
+
- fer2013
|
|
40
|
+
- oxford-iiit-pet
|
|
41
|
+
- stl10
|
|
42
|
+
- cifar100
|
|
43
|
+
- cifar10
|
|
44
|
+
- food101
|
|
45
|
+
- fashion_mnist
|
|
46
|
+
- emnist_letters
|
|
47
|
+
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
48
|
+
_recursive_: False
|
|
49
|
+
processor: openai/clip-vit-base-patch32
|
|
50
|
+
models:
|
|
51
|
+
_pretrained_: openai/clip-vit-base-patch32
|
|
52
|
+
sun397: tanganke/clip-vit-base-patch32_sun397
|
|
53
|
+
stanford-cars: tanganke/clip-vit-base-patch32_stanford-cars
|
|
54
|
+
resisc45: tanganke/clip-vit-base-patch32_resisc45
|
|
55
|
+
eurosat: tanganke/clip-vit-base-patch32_eurosat
|
|
56
|
+
svhn: tanganke/clip-vit-base-patch32_svhn
|
|
57
|
+
gtsrb: tanganke/clip-vit-base-patch32_gtsrb
|
|
58
|
+
mnist: tanganke/clip-vit-base-patch32_mnist
|
|
59
|
+
dtd: tanganke/clip-vit-base-patch32_dtd
|
|
60
|
+
oxford_flowers102: tanganke/clip-vit-base-patch32_oxford_flowers102
|
|
61
|
+
pcam: tanganke/clip-vit-base-patch32_pcam
|
|
62
|
+
fer2013: tanganke/clip-vit-base-patch32_fer2013
|
|
63
|
+
oxford-iiit-pet: tanganke/clip-vit-base-patch32_oxford-iiit-pet
|
|
64
|
+
stl10: tanganke/clip-vit-base-patch32_stl10
|
|
65
|
+
cifar100: tanganke/clip-vit-base-patch32_cifar100
|
|
66
|
+
cifar10: tanganke/clip-vit-base-patch32_cifar10
|
|
67
|
+
food101: tanganke/clip-vit-base-patch32_food101
|
|
68
|
+
fashion_mnist: tanganke/clip-vit-base-patch32_fashion_mnist
|
|
69
|
+
emnist_letters: tanganke/clip-vit-base-patch32_emnist_letters
|
|
70
|
+
platform: hf
|
|
@@ -1,8 +1,76 @@
|
|
|
1
|
-
# The 20 task used in the paper:
|
|
1
|
+
# The 20 task used in the paper:
|
|
2
2
|
# Wang et al. Localizing Task Information for Improved Model Merging and Compression
|
|
3
3
|
# http://arxiv.org/abs/2405.07813
|
|
4
4
|
defaults:
|
|
5
|
-
-
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
5
|
+
- /dataset/image_classification/train@train_datasets:
|
|
6
|
+
# -- begin of eight tasks in the task arithmetic paper ---
|
|
7
|
+
- sun397
|
|
8
|
+
- stanford-cars
|
|
9
|
+
- resisc45
|
|
10
|
+
- eurosat
|
|
11
|
+
- svhn
|
|
12
|
+
- gtsrb
|
|
13
|
+
- mnist
|
|
14
|
+
- dtd
|
|
15
|
+
# -- end of eight tasks in the task arithmetic paper ---
|
|
16
|
+
- oxford_flowers102
|
|
17
|
+
- pcam
|
|
18
|
+
- fer2013
|
|
19
|
+
- oxford-iiit-pet
|
|
20
|
+
- stl10
|
|
21
|
+
- cifar100
|
|
22
|
+
- cifar10
|
|
23
|
+
- food101
|
|
24
|
+
- fashion_mnist
|
|
25
|
+
- emnist_letters
|
|
26
|
+
- kmnist
|
|
27
|
+
- rendered-sst2
|
|
28
|
+
- /dataset/image_classification/test@test_datasets:
|
|
29
|
+
# -- begin of eight tasks in the task arithmetic paper ---
|
|
30
|
+
- sun397
|
|
31
|
+
- stanford-cars
|
|
32
|
+
- resisc45
|
|
33
|
+
- eurosat
|
|
34
|
+
- svhn
|
|
35
|
+
- gtsrb
|
|
36
|
+
- mnist
|
|
37
|
+
- dtd
|
|
38
|
+
# -- end of eight tasks in the task arithmetic paper ---
|
|
39
|
+
- oxford_flowers102
|
|
40
|
+
- pcam
|
|
41
|
+
- fer2013
|
|
42
|
+
- oxford-iiit-pet
|
|
43
|
+
- stl10
|
|
44
|
+
- cifar100
|
|
45
|
+
- cifar10
|
|
46
|
+
- food101
|
|
47
|
+
- fashion_mnist
|
|
48
|
+
- emnist_letters
|
|
49
|
+
- kmnist
|
|
50
|
+
- rendered-sst2
|
|
51
|
+
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
52
|
+
_recursive_: False
|
|
53
|
+
processor: openai/clip-vit-base-patch32
|
|
54
|
+
models:
|
|
55
|
+
_pretrained_: openai/clip-vit-base-patch32
|
|
56
|
+
sun397: tanganke/clip-vit-base-patch32_sun397
|
|
57
|
+
stanford-cars: tanganke/clip-vit-base-patch32_stanford-cars
|
|
58
|
+
resisc45: tanganke/clip-vit-base-patch32_resisc45
|
|
59
|
+
eurosat: tanganke/clip-vit-base-patch32_eurosat
|
|
60
|
+
svhn: tanganke/clip-vit-base-patch32_svhn
|
|
61
|
+
gtsrb: tanganke/clip-vit-base-patch32_gtsrb
|
|
62
|
+
mnist: tanganke/clip-vit-base-patch32_mnist
|
|
63
|
+
dtd: tanganke/clip-vit-base-patch32_dtd
|
|
64
|
+
oxford_flowers102: tanganke/clip-vit-base-patch32_oxford_flowers102
|
|
65
|
+
pcam: tanganke/clip-vit-base-patch32_pcam
|
|
66
|
+
fer2013: tanganke/clip-vit-base-patch32_fer2013
|
|
67
|
+
oxford-iiit-pet: tanganke/clip-vit-base-patch32_oxford-iiit-pet
|
|
68
|
+
stl10: tanganke/clip-vit-base-patch32_stl10
|
|
69
|
+
cifar100: tanganke/clip-vit-base-patch32_cifar100
|
|
70
|
+
cifar10: tanganke/clip-vit-base-patch32_cifar10
|
|
71
|
+
food101: tanganke/clip-vit-base-patch32_food101
|
|
72
|
+
fashion_mnist: tanganke/clip-vit-base-patch32_fashion_mnist
|
|
73
|
+
emnist_letters: tanganke/clip-vit-base-patch32_emnist_letters
|
|
74
|
+
kmnist: tanganke/clip-vit-base-patch32_kmnist
|
|
75
|
+
rendered-sst2: tanganke/clip-vit-base-patch32_rendered-sst2
|
|
76
|
+
platform: hf
|
fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_TALL20_model_only.yaml
CHANGED
|
@@ -1,6 +1,29 @@
|
|
|
1
1
|
# The 20 task used in the paper:
|
|
2
2
|
# Wang et al. Localizing Task Information for Improved Model Merging and Compression
|
|
3
3
|
# http://arxiv.org/abs/2405.07813
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
|
|
4
|
+
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
5
|
+
_recursive_: False
|
|
6
|
+
processor: openai/clip-vit-base-patch32
|
|
7
|
+
models:
|
|
8
|
+
_pretrained_: openai/clip-vit-base-patch32
|
|
9
|
+
sun397: tanganke/clip-vit-base-patch32_sun397
|
|
10
|
+
stanford-cars: tanganke/clip-vit-base-patch32_stanford-cars
|
|
11
|
+
resisc45: tanganke/clip-vit-base-patch32_resisc45
|
|
12
|
+
eurosat: tanganke/clip-vit-base-patch32_eurosat
|
|
13
|
+
svhn: tanganke/clip-vit-base-patch32_svhn
|
|
14
|
+
gtsrb: tanganke/clip-vit-base-patch32_gtsrb
|
|
15
|
+
mnist: tanganke/clip-vit-base-patch32_mnist
|
|
16
|
+
dtd: tanganke/clip-vit-base-patch32_dtd
|
|
17
|
+
oxford_flowers102: tanganke/clip-vit-base-patch32_oxford_flowers102
|
|
18
|
+
pcam: tanganke/clip-vit-base-patch32_pcam
|
|
19
|
+
fer2013: tanganke/clip-vit-base-patch32_fer2013
|
|
20
|
+
oxford-iiit-pet: tanganke/clip-vit-base-patch32_oxford-iiit-pet
|
|
21
|
+
stl10: tanganke/clip-vit-base-patch32_stl10
|
|
22
|
+
cifar100: tanganke/clip-vit-base-patch32_cifar100
|
|
23
|
+
cifar10: tanganke/clip-vit-base-patch32_cifar10
|
|
24
|
+
food101: tanganke/clip-vit-base-patch32_food101
|
|
25
|
+
fashion_mnist: tanganke/clip-vit-base-patch32_fashion_mnist
|
|
26
|
+
emnist_letters: tanganke/clip-vit-base-patch32_emnist_letters
|
|
27
|
+
kmnist: tanganke/clip-vit-base-patch32_kmnist
|
|
28
|
+
rendered-sst2: tanganke/clip-vit-base-patch32_rendered-sst2
|
|
29
|
+
platform: hf
|
|
@@ -1,10 +1,5 @@
|
|
|
1
|
-
|
|
2
|
-
|
|
1
|
+
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
2
|
+
_recursive_: False
|
|
3
3
|
models:
|
|
4
|
-
_pretrained_:
|
|
5
|
-
|
|
6
|
-
pretrained_model_name_or_path: ${...base_model}
|
|
7
|
-
processor:
|
|
8
|
-
_target_: transformers.CLIPProcessor.from_pretrained
|
|
9
|
-
pretrained_model_name_or_path: ${..base_model}
|
|
10
|
-
base_model: openai/clip-vit-base-patch32
|
|
4
|
+
_pretrained_: openai/clip-vit-base-patch32
|
|
5
|
+
processor: ${.models._pretrained_}
|
fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_single_finetuned.yaml
CHANGED
|
@@ -1,5 +1,7 @@
|
|
|
1
|
-
|
|
2
|
-
|
|
3
|
-
|
|
4
|
-
|
|
5
|
-
|
|
1
|
+
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
2
|
+
_recursive_: False
|
|
3
|
+
processor: openai/clip-vit-base-patch32
|
|
4
|
+
models:
|
|
5
|
+
_pretrained_: openai/clip-vit-base-patch32
|
|
6
|
+
finetuned: tanganke/clip-vit-base-patch32_stanford-cars
|
|
7
|
+
platform: hf
|
fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_single_task_projection.yaml
CHANGED
|
@@ -1,12 +1,8 @@
|
|
|
1
|
-
defaults:
|
|
2
|
-
- /model/clip-vit@models:
|
|
3
|
-
- clip-vit-base-patch32
|
|
4
|
-
- clip-vit-base-patch32_sun397
|
|
5
|
-
- clip-vit-base-patch32_stanford-cars
|
|
6
1
|
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
7
2
|
_recursive_: false
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
3
|
+
processor: openai/clip-vit-base-patch32
|
|
4
|
+
models:
|
|
5
|
+
_pretrained_: openai/clip-vit-base-patch32
|
|
6
|
+
sun397: tanganke/clip-vit-base-patch32_sun397
|
|
7
|
+
stanford-cars: tanganke/clip-vit-base-patch32_stanford-cars
|
|
8
|
+
platform: hf
|
fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_sun397_and_cars.yaml
CHANGED
|
@@ -1,8 +1,4 @@
|
|
|
1
1
|
defaults:
|
|
2
|
-
- /model/clip-vit@models:
|
|
3
|
-
- clip-vit-base-patch32
|
|
4
|
-
- clip-vit-base-patch32_sun397
|
|
5
|
-
- clip-vit-base-patch32_stanford-cars
|
|
6
2
|
- /dataset/image_classification/train@train_datasets:
|
|
7
3
|
- sun397
|
|
8
4
|
- stanford-cars
|
|
@@ -11,6 +7,9 @@ defaults:
|
|
|
11
7
|
- stanford-cars
|
|
12
8
|
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
13
9
|
_recursive_: False
|
|
14
|
-
processor:
|
|
15
|
-
|
|
16
|
-
|
|
10
|
+
processor: openai/clip-vit-base-patch32
|
|
11
|
+
models:
|
|
12
|
+
_pretrained_: openai/clip-vit-base-patch32
|
|
13
|
+
sun397: tanganke/clip-vit-base-patch32_sun397
|
|
14
|
+
stanford-cars: tanganke/clip-vit-base-patch32_stanford-cars
|
|
15
|
+
platform: hf
|
|
@@ -1,8 +1,4 @@
|
|
|
1
1
|
defaults:
|
|
2
|
-
- /model/clip-vit@models:
|
|
3
|
-
- clip-vit-base-patch32
|
|
4
|
-
- clip-vit-base-patch32_sun397
|
|
5
|
-
- clip-vit-base-patch32_dtd
|
|
6
2
|
- /dataset/image_classification/train@train_datasets:
|
|
7
3
|
- sun397
|
|
8
4
|
- dtd
|
|
@@ -11,6 +7,9 @@ defaults:
|
|
|
11
7
|
- dtd
|
|
12
8
|
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
13
9
|
_recursive_: False
|
|
14
|
-
processor:
|
|
15
|
-
|
|
16
|
-
|
|
10
|
+
processor: openai/clip-vit-base-patch32
|
|
11
|
+
models:
|
|
12
|
+
_pretrained_: openai/clip-vit-base-patch32
|
|
13
|
+
sun397: tanganke/clip-vit-base-patch32_sun397
|
|
14
|
+
dtd: tanganke/clip-vit-base-patch32_dtd
|
|
15
|
+
platform: hf
|
fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_sun397_cars_and_dtd.yaml
CHANGED
|
@@ -1,9 +1,4 @@
|
|
|
1
1
|
defaults:
|
|
2
|
-
- /model/clip-vit@models:
|
|
3
|
-
- clip-vit-base-patch32
|
|
4
|
-
- clip-vit-base-patch32_sun397
|
|
5
|
-
- clip-vit-base-patch32_stanford-cars
|
|
6
|
-
- clip-vit-base-patch32_dtd
|
|
7
2
|
- /dataset/image_classification/train@train_datasets:
|
|
8
3
|
- sun397
|
|
9
4
|
- stanford-cars
|
|
@@ -14,6 +9,10 @@ defaults:
|
|
|
14
9
|
- dtd
|
|
15
10
|
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
16
11
|
_recursive_: False
|
|
17
|
-
processor:
|
|
18
|
-
|
|
19
|
-
|
|
12
|
+
processor: openai/clip-vit-base-patch32
|
|
13
|
+
models:
|
|
14
|
+
_pretrained_: openai/clip-vit-base-patch32
|
|
15
|
+
sun397: tanganke/clip-vit-base-patch32_sun397
|
|
16
|
+
stanford-cars: tanganke/clip-vit-base-patch32_stanford-cars
|
|
17
|
+
dtd: tanganke/clip-vit-base-patch32_dtd
|
|
18
|
+
platform: hf
|
|
@@ -1,6 +1,8 @@
|
|
|
1
|
-
|
|
2
|
-
|
|
3
|
-
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
|
|
1
|
+
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
2
|
+
_recursive_: False
|
|
3
|
+
processor: openai/clip-vit-base-patch32
|
|
4
|
+
models:
|
|
5
|
+
_pretrained_: openai/clip-vit-base-patch32
|
|
6
|
+
svhn: tanganke/clip-vit-base-patch32_svhn
|
|
7
|
+
mnist: tanganke/clip-vit-base-patch32_mnist
|
|
8
|
+
platform: hf
|
fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-base-patch32_two_tasks_control_task.yaml
CHANGED
|
@@ -1,14 +1,12 @@
|
|
|
1
1
|
defaults:
|
|
2
|
-
- _self_
|
|
3
2
|
- /dataset/image_classification/train@train_datasets:
|
|
4
3
|
- tiny-imagenet
|
|
4
|
+
- _self_
|
|
5
5
|
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
6
|
-
_recursive_:
|
|
6
|
+
_recursive_: False
|
|
7
7
|
models:
|
|
8
8
|
_pretrained_: openai/clip-vit-base-patch32
|
|
9
9
|
model_1: tanganke/clip-vit-base-patch32_sun397
|
|
10
10
|
model_2: tanganke/clip-vit-base-patch32_stanford-cars
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
_target_: transformers.CLIPProcessor.from_pretrained
|
|
14
|
-
pretrained_model_name_or_path: openai/clip-vit-base-patch32
|
|
11
|
+
processor: openai/clip-vit-base-patch32
|
|
12
|
+
platform: hf
|
|
@@ -1,8 +1,33 @@
|
|
|
1
1
|
defaults:
|
|
2
|
-
-
|
|
3
|
-
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
2
|
+
- /dataset/image_classification/train@train_datasets:
|
|
3
|
+
- sun397
|
|
4
|
+
- stanford-cars
|
|
5
|
+
- resisc45
|
|
6
|
+
- eurosat
|
|
7
|
+
- svhn
|
|
8
|
+
- gtsrb
|
|
9
|
+
- mnist
|
|
10
|
+
- dtd
|
|
11
|
+
- /dataset/image_classification/test@test_datasets:
|
|
12
|
+
- sun397
|
|
13
|
+
- stanford-cars
|
|
14
|
+
- resisc45
|
|
15
|
+
- eurosat
|
|
16
|
+
- svhn
|
|
17
|
+
- gtsrb
|
|
18
|
+
- mnist
|
|
19
|
+
- dtd
|
|
20
|
+
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
21
|
+
_recursive_: False
|
|
22
|
+
processor: openai/clip-vit-large-patch14
|
|
23
|
+
models:
|
|
24
|
+
_pretrained_: openai/clip-vit-large-patch14
|
|
25
|
+
sun397: tanganke/clip-vit-large-patch14_sun397
|
|
26
|
+
stanford-cars: tanganke/clip-vit-large-patch14_stanford-cars
|
|
27
|
+
resisc45: tanganke/clip-vit-large-patch14_resisc45
|
|
28
|
+
eurosat: tanganke/clip-vit-large-patch14_eurosat
|
|
29
|
+
svhn: tanganke/clip-vit-large-patch14_svhn
|
|
30
|
+
gtsrb: tanganke/clip-vit-large-patch14_gtsrb
|
|
31
|
+
mnist: tanganke/clip-vit-large-patch14_mnist
|
|
32
|
+
dtd: tanganke/clip-vit-large-patch14_dtd
|
|
33
|
+
platform: hf
|
fusion_bench_config/modelpool/CLIPVisionModelPool/clip-vit-large-patch14_TA8_model_only.yaml
CHANGED
|
@@ -1,6 +1,14 @@
|
|
|
1
|
-
|
|
2
|
-
|
|
3
|
-
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
|
|
1
|
+
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
2
|
+
_recursive_: False
|
|
3
|
+
processor: openai/clip-vit-large-patch14
|
|
4
|
+
models:
|
|
5
|
+
_pretrained_: openai/clip-vit-large-patch14
|
|
6
|
+
sun397: tanganke/clip-vit-large-patch14_sun397
|
|
7
|
+
stanford-cars: tanganke/clip-vit-large-patch14_stanford-cars
|
|
8
|
+
resisc45: tanganke/clip-vit-large-patch14_resisc45
|
|
9
|
+
eurosat: tanganke/clip-vit-large-patch14_eurosat
|
|
10
|
+
svhn: tanganke/clip-vit-large-patch14_svhn
|
|
11
|
+
gtsrb: tanganke/clip-vit-large-patch14_gtsrb
|
|
12
|
+
mnist: tanganke/clip-vit-large-patch14_mnist
|
|
13
|
+
dtd: tanganke/clip-vit-large-patch14_dtd
|
|
14
|
+
platform: hf
|
|
@@ -1,11 +1,76 @@
|
|
|
1
|
-
# The 20 task used in the paper:
|
|
1
|
+
# The 20 task used in the paper:
|
|
2
2
|
# Wang et al. Localizing Task Information for Improved Model Merging and Compression
|
|
3
3
|
# http://arxiv.org/abs/2405.07813
|
|
4
4
|
defaults:
|
|
5
|
-
-
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
5
|
+
- /dataset/image_classification/train@train_datasets:
|
|
6
|
+
# -- begin of eight tasks in the task arithmetic paper ---
|
|
7
|
+
- sun397
|
|
8
|
+
- stanford-cars
|
|
9
|
+
- resisc45
|
|
10
|
+
- eurosat
|
|
11
|
+
- svhn
|
|
12
|
+
- gtsrb
|
|
13
|
+
- mnist
|
|
14
|
+
- dtd
|
|
15
|
+
# -- end of eight tasks in the task arithmetic paper ---
|
|
16
|
+
- oxford_flowers102
|
|
17
|
+
- pcam
|
|
18
|
+
- fer2013
|
|
19
|
+
- oxford-iiit-pet
|
|
20
|
+
- stl10
|
|
21
|
+
- cifar100
|
|
22
|
+
- cifar10
|
|
23
|
+
- food101
|
|
24
|
+
- fashion_mnist
|
|
25
|
+
- emnist_letters
|
|
26
|
+
- kmnist
|
|
27
|
+
- rendered-sst2
|
|
28
|
+
- /dataset/image_classification/test@test_datasets:
|
|
29
|
+
# -- begin of eight tasks in the task arithmetic paper ---
|
|
30
|
+
- sun397
|
|
31
|
+
- stanford-cars
|
|
32
|
+
- resisc45
|
|
33
|
+
- eurosat
|
|
34
|
+
- svhn
|
|
35
|
+
- gtsrb
|
|
36
|
+
- mnist
|
|
37
|
+
- dtd
|
|
38
|
+
# -- end of eight tasks in the task arithmetic paper ---
|
|
39
|
+
- oxford_flowers102
|
|
40
|
+
- pcam
|
|
41
|
+
- fer2013
|
|
42
|
+
- oxford-iiit-pet
|
|
43
|
+
- stl10
|
|
44
|
+
- cifar100
|
|
45
|
+
- cifar10
|
|
46
|
+
- food101
|
|
47
|
+
- fashion_mnist
|
|
48
|
+
- emnist_letters
|
|
49
|
+
- kmnist
|
|
50
|
+
- rendered-sst2
|
|
51
|
+
_target_: fusion_bench.modelpool.CLIPVisionModelPool
|
|
52
|
+
_recursive_: False
|
|
53
|
+
processor: openai/clip-vit-large-patch14
|
|
54
|
+
models:
|
|
55
|
+
_pretrained_: openai/clip-vit-large-patch14
|
|
56
|
+
sun397: tanganke/clip-vit-large-patch14_sun397
|
|
57
|
+
stanford-cars: tanganke/clip-vit-large-patch14_stanford-cars
|
|
58
|
+
resisc45: tanganke/clip-vit-large-patch14_resisc45
|
|
59
|
+
eurosat: tanganke/clip-vit-large-patch14_eurosat
|
|
60
|
+
svhn: tanganke/clip-vit-large-patch14_svhn
|
|
61
|
+
gtsrb: tanganke/clip-vit-large-patch14_gtsrb
|
|
62
|
+
mnist: tanganke/clip-vit-large-patch14_mnist
|
|
63
|
+
dtd: tanganke/clip-vit-large-patch14_dtd
|
|
64
|
+
oxford_flowers102: tanganke/clip-vit-large-patch14_oxford_flowers102
|
|
65
|
+
pcam: tanganke/clip-vit-large-patch14_pcam
|
|
66
|
+
fer2013: tanganke/clip-vit-large-patch14_fer2013
|
|
67
|
+
oxford-iiit-pet: tanganke/clip-vit-large-patch14_oxford-iiit-pet
|
|
68
|
+
stl10: tanganke/clip-vit-large-patch14_stl10
|
|
69
|
+
cifar100: tanganke/clip-vit-large-patch14_cifar100
|
|
70
|
+
cifar10: tanganke/clip-vit-large-patch14_cifar10
|
|
71
|
+
food101: tanganke/clip-vit-large-patch14_food101
|
|
72
|
+
fashion_mnist: tanganke/clip-vit-large-patch14_fashion_mnist
|
|
73
|
+
emnist_letters: tanganke/clip-vit-large-patch14_emnist_letters
|
|
74
|
+
kmnist: tanganke/clip-vit-large-patch14_kmnist
|
|
75
|
+
rendered-sst2: tanganke/clip-vit-large-patch14_rendered-sst2
|
|
76
|
+
platform: hf
|