PyPI - fusion-bench - Versions diffs - 0.2.30__py3-none-any.whl → 0.2.32__py3-none-any.whl - Mend

fusion-bench 0.2.30__py3-none-any.whl → 0.2.32__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (70) hide show

fusion_bench/__init__.py +6 -0
fusion_bench/__main__.py +2 -2
fusion_bench/constants/runtime.py +4 -1
fusion_bench/dataset/__init__.py +2 -0
fusion_bench/dataset/clip_dataset.py +4 -72
fusion_bench/dataset/image_dataset.py +44 -18
fusion_bench/method/base_algorithm.py +4 -0
fusion_bench/method/classification/image_classification_finetune.py +1 -0
fusion_bench/method/concrete_subspace/clip_concrete_tsvm.py +285 -0
fusion_bench/method/dop/dop.py +0 -22
fusion_bench/method/dop/dop_general.py +489 -0
fusion_bench/method/dop/utils.py +24 -4
fusion_bench/method/emr_merging/__init__.py +1 -0
fusion_bench/method/emr_merging/emr_merging.py +53 -0
fusion_bench/method/emr_merging/utils.py +162 -0
fusion_bench/method/opcm/opcm.py +6 -2
fusion_bench/method/opcm/opcm_general.py +356 -0
fusion_bench/method/opcm/utils.py +1 -4
fusion_bench/method/simple_average.py +52 -18
fusion_bench/method/task_arithmetic/task_arithmetic.py +1 -1
fusion_bench/method/task_singular_vector/TSVM.py +7 -6
fusion_bench/method/task_singular_vector/utils/TSVM_utils.py +0 -1
fusion_bench/mixins/lightning_fabric.py +110 -11
fusion_bench/mixins/openclip_classification.py +155 -1
fusion_bench/mixins/serialization.py +1 -1
fusion_bench/modelpool/base_pool.py +37 -0
fusion_bench/modelpool/convnext_for_image_classification.py +5 -2
fusion_bench/modelpool/openclip_vision/modelpool.py +12 -3
fusion_bench/models/hf_clip.py +20 -0
fusion_bench/models/modulator/__init__.py +1 -0
fusion_bench/models/modulator/base.py +123 -0
fusion_bench/models/open_clip/modeling.py +61 -5
fusion_bench/models/open_clip/utils.py +13 -2
fusion_bench/models/parameter_dict.py +119 -29
fusion_bench/models/utils.py +190 -2
fusion_bench/models/wrappers/switch.py +90 -0
fusion_bench/programs/base_program.py +6 -0
fusion_bench/programs/fabric_fusion_program.py +4 -0
fusion_bench/py.typed +1 -0
fusion_bench/scripts/cli.py +25 -23
fusion_bench/scripts/imgui.py +2 -2
fusion_bench/scripts/webui.py +2 -2
fusion_bench/taskpool/image_classification.py +270 -0
fusion_bench/utils/__init__.py +20 -1
fusion_bench/utils/data.py +1 -1
fusion_bench/utils/dict.py +19 -0
fusion_bench/utils/dtype.py +19 -0
fusion_bench/utils/hydra_utils.py +75 -0
fusion_bench/utils/misc.py +1 -0
fusion_bench/utils/packages.py +4 -0
fusion_bench/utils/parameters.py +33 -0
fusion_bench/utils/rich_utils.py +42 -19
fusion_bench/utils/state_dict_arithmetic.py +183 -1
fusion_bench/utils/tensorboard.py +21 -3
{fusion_bench-0.2.30.dist-info → fusion_bench-0.2.32.dist-info}/METADATA +3 -1
{fusion_bench-0.2.30.dist-info → fusion_bench-0.2.32.dist-info}/RECORD +70 -53
{fusion_bench-0.2.30.dist-info → fusion_bench-0.2.32.dist-info}/WHEEL +1 -1
{fusion_bench-0.2.30.dist-info → fusion_bench-0.2.32.dist-info}/entry_points.txt +1 -1
fusion_bench_config/README.md +9 -0
fusion_bench_config/fabric/auto.yaml +1 -0
fusion_bench_config/fabric/loggers/mlflow_logger.yaml +4 -0
fusion_bench_config/hydra/default.yaml +3 -1
fusion_bench_config/method/concrete_subspace/clip_concrete_tsvm.yaml +38 -0
fusion_bench_config/method/dop/dop_general.yaml +33 -0
fusion_bench_config/method/emr_merging/emr_merging.yaml +1 -0
fusion_bench_config/method/opcm/opcm_general.yaml +18 -0
fusion_bench_config/modelpool/ConvNextForImageClassification/convnext-base-224_8-tasks.yaml +15 -0
fusion_bench_config/taskpool/ImageClassificationTaskPool/convnext-base-224_8-tasks.yaml +17 -0
{fusion_bench-0.2.30.dist-info → fusion_bench-0.2.32.dist-info}/licenses/LICENSE +0 -0
{fusion_bench-0.2.30.dist-info → fusion_bench-0.2.32.dist-info}/top_level.txt +0 -0

fusion_bench_config/fabric/auto.yaml CHANGED Viewed

@@ -13,3 +13,4 @@ strategy: auto
 # ``"cpu"``, ``"cuda"``, ``"mps"``, ``"gpu"``, ``"tpu"``, ``"auto"``.
 # for example: fabric.accelerator=cpu
 accelerator: auto
+precision: null

fusion_bench_config/fabric/loggers/mlflow_logger.yaml CHANGED Viewed

@@ -1,2 +1,6 @@
 # https://mlflow.org/
 _target_: lightning.pytorch.loggers.MLFlowLogger
+tracking_uri: "sqlite:///${path.output_dir}/mlflow.db"
+experiment_name: ${hydra:job.config_name}
+run_name: ${now:%Y-%m-%d_%H-%M-%S}
+save_dir: ${path.log_dir}

fusion_bench_config/hydra/default.yaml CHANGED Viewed

@@ -4,7 +4,9 @@ defaults:
 run:
   dir: ${path.log_dir}
 sweep:
-  dir: ${path.log_dir}
+  # the directory where all multirun outputs are stored
+  # cannot refer to ${path.log_dir} because this is evaluated before constructing the separate run configs
+  dir: ${oc.env:FUSION_BENCH_PROJECT_ROOT,"."}/outputs/multirun/${hydra.job.config_name}/${now:%Y-%m-%d_%H-%M-%S}
   subdir: ${hydra.job.num}
 job:
   env_set:

fusion_bench_config/method/concrete_subspace/clip_concrete_tsvm.yaml ADDED Viewed

@@ -0,0 +1,38 @@
+_target_: fusion_bench.method.concrete_subspace.clip_concrete_tsvm.ConcreteTSVMForOpenCLIP
+# === Concrete Subspace parameters ===
+# batch size per gpu
+# if you have multiple gpus, the total batch size will be `batch_size * num_gpus`
+dataloader_kwargs:
+  batch_size: 16
+  num_workers: 8
+optimizer:
+  _target_: torch.optim.AdamW
+  lr: 1e-3
+  weight_decay: 0.01
+  fused: null
+lr_scheduler: null
+merge_dtype: null
+max_steps: 2000
+save_interval: 500
+initial_logits: 0
+temperature: 0.5
+# "discrete" or "continuous", this is the mask applied for evaluation, not during training
+# the performance of the final model is expected to be similar
+eval_mask_type: continuous
+mask_checkpoint: null
+# if `clamp_weights` is true, the weights will be clamped to [0, 1]
+clamp_weights: false
+# arguments of `functional_call`
+tie_weights: true
+strict: false
+# directory to cache zero-shot classification heads
+cache_dir: outputs
+skip_training: false
+# === TSVM parameters ===
+exclude_keys: null
+# alpha (also known as scaling factor) is a float or a list of floats
+# example:
+# alpha: 1
+# alpha: [1, 0.5, 0.25]
+alpha: 1
+return_single_task_models: false

fusion_bench_config/method/dop/dop_general.yaml ADDED Viewed

@@ -0,0 +1,33 @@
+_target_: fusion_bench.method.dop.dop_general.DOPMerging
+# the random seed to use
+seed: null
+# shuffle the order of the models
+shuffle_order: true
+# save the merged model on every step
+save_on_every_step: false
+# evaluate the merged model on every step
+evaluate_on_every_step: true
+# optimizer (learning rate)
+lr: 1e-4
+# optimizer (num_steps)
+num_steps: 200
+# weighted loss
+# if mgda is true, use mgda to optimize the loss weights
+mgda: true
+# if mgda is false, this is the weight for the loss of the first task
+alpha: 0.8
+# if mgda is true and ema is true, using exponential moving average (ema), alpha is the initial value
+ema: true
+# if mgda is true and ema is true, using exponential moving average (ema), beta is the decay rate
+ema_beta: 0.999
+# epsilon for svd (the proportion of energy retained)
+svd_epsilon: 0.99999
+# the space to project the delta w (left singular vectors, right singular vectors, or both)
+svd_proj_space: uv # u or v or uv
+# the number of ray actors to use for parallel merging (0 means no ray)
+num_ray_actors: 0

fusion_bench_config/method/emr_merging/emr_merging.yaml ADDED Viewed

@@ -0,0 +1 @@
+_target_: fusion_bench.method.emr_merging.EMRMerging

fusion_bench_config/method/opcm/opcm_general.yaml ADDED Viewed

@@ -0,0 +1,18 @@
+# =============================================================================
+# FusionBench Method Configuration: OPCM
+# =============================================================================
+# Incrementally merges models via SVD projection and evaluation per step.
+# =============================================================================
+_target_: fusion_bench.method.opcm.opcm_general.OPCM
+# shuffle the order of the models
+shuffle_order: true
+# the scaling factor for the SVD projection
+alpha: 0.5
+# the random seed to use
+seed: null
+# save the merged model on every step
+save_on_every_step: true
+# evaluate the merged model on every step
+evaluate_on_every_step: true
+# the number of ray actors to use for distributed merging
+num_ray_actors: 0

fusion_bench_config/modelpool/ConvNextForImageClassification/convnext-base-224_8-tasks.yaml ADDED Viewed

@@ -0,0 +1,15 @@
+_target_: fusion_bench.modelpool.ConvNextForImageClassificationPool
+_recursive_: False
+models:
+  _pretrained_: facebook/convnext-base-224
+  sun397: tanganke/convnext-base-224_sun397_sgd_batch-size-64_lr-0.01_steps-4000
+  stanford-cars: tanganke/convnext-base-224_stanford-cars_sgd_batch-size-64_lr-0.01_steps-4000
+  resisc45: tanganke/convnext-base-224_resisc45_sgd_batch-size-64_lr-0.01_steps-4000
+  eurosat: tanganke/convnext-base-224_eurosat_sgd_batch-size-64_lr-0.01_steps-4000
+  svhn: tanganke/convnext-base-224_svhn_sgd_batch-size-64_lr-0.01_steps-4000
+  gtsrb: tanganke/convnext-base-224_gtsrb_sgd_batch-size-64_lr-0.01_steps-4000
+  mnist: tanganke/convnext-base-224_mnist_sgd_batch-size-64_lr-0.01_steps-4000
+  dtd: tanganke/convnext-base-224_dtd_sgd_batch-size-64_lr-0.01_steps-4000
+train_datasets: null
+val_datasets: null
+test_datasets: null

fusion_bench_config/taskpool/ImageClassificationTaskPool/convnext-base-224_8-tasks.yaml ADDED Viewed

@@ -0,0 +1,17 @@
+defaults:
+  - /dataset/image_classification/test@test_datasets:
+      - sun397
+      - stanford-cars
+      - resisc45
+      - eurosat
+      - svhn
+      - gtsrb
+      - mnist
+      - dtd
+  - _self_
+_target_: fusion_bench.taskpool.image_classification.ImageClassificationTaskPool
+_recursive_: False
+processor: facebook/convnext-base-224
+dataloader_kwargs:
+  batch_size: 32
+  num_workers: 0

{fusion_bench-0.2.30.dist-info → fusion_bench-0.2.32.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{fusion_bench-0.2.30.dist-info → fusion_bench-0.2.32.dist-info}/top_level.txt RENAMED Viewed

File without changes

fusion-bench 0.2.30__py3-none-any.whl → 0.2.32__py3-none-any.whl

fusion-bench 0.2.30__py3-none-any.whl → 0.2.32__py3-none-any.whl