Skip to content

Commit 8c8dd48

Browse files
authored
updated composer and streaming versions (#1857)
1 parent 316a63b commit 8c8dd48

File tree

2 files changed

+22
-6
lines changed

2 files changed

+22
-6
lines changed

llmfoundry/callbacks/hf_checkpointer.py

Lines changed: 18 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -673,17 +673,33 @@ def tensor_hook(
673673
# initialization cost.
674674
with init_empty_weights():
675675
if self.using_peft:
676+
import peft
676677
from peft import PeftModel
677678
assert isinstance(original_model, PeftModel)
678679
active_adapter = original_model.active_adapter # type: ignore
679680
base_model: PreTrainedModel = original_model.get_base_model( # type: ignore
680681
)
681682
new_base_model_instance = type(base_model)(new_config)
682683

684+
# TODO: Deprecate this when we no longer support peft 0.16.0 from upstream
685+
if peft.__version__ == '0.16.0':
686+
# due to https://github.com/huggingface/peft/issues/2634, we need to change
687+
# the peft type to an enum. Should be fixed in 0.17.0 by
688+
# https://github.com/huggingface/peft/pull/2635
689+
peft_config = copy.copy(
690+
original_model.
691+
peft_config[active_adapter], # type: ignore
692+
)
693+
peft_config.peft_type = peft.PeftType( # type: ignore
694+
peft_config.peft_type, # type: ignore
695+
)
696+
else:
697+
peft_config = original_model.peft_config[ # type: ignore
698+
active_adapter] # type: ignore
699+
683700
new_model_instance = type(original_model)(
684701
new_base_model_instance, # type: ignore
685-
original_model.
686-
peft_config[active_adapter], # type: ignore
702+
peft_config, # type: ignore
687703
)
688704
del new_base_model_instance
689705
else:

setup.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -51,7 +51,7 @@
5151
]
5252

5353
install_requires = [
54-
'mosaicml[libcloud,wandb,oci,gcs,mlflow]>=0.31.0,<0.33',
54+
'mosaicml[libcloud,wandb,oci,gcs,mlflow]>=0.32.0,<0.33',
5555
'mlflow>=2.14.1,<3.2',
5656
'accelerate>=0.25,<1.9', # for HF inference `device_map`
5757
'transformers>=v4.51.0,<4.52',
@@ -91,15 +91,15 @@
9191
]
9292

9393
extra_deps['databricks'] = [
94-
'mosaicml[databricks]>=0.31.0,<0.32',
94+
'mosaicml[databricks]>=0.32.0,<0.33',
9595
'numpy<2',
9696
'databricks-sql-connector>=3,<4',
9797
'databricks-connect==14.1.0',
9898
'lz4>=4,<5',
9999
]
100100

101101
extra_deps['tensorboard'] = [
102-
'mosaicml[tensorboard]>=0.31.0,<0.32',
102+
'mosaicml[tensorboard]>=0.32.0,<0.33',
103103
]
104104

105105
# Flash 2 group kept for backwards compatibility
@@ -110,7 +110,7 @@
110110
extra_deps['gpu'] = copy.deepcopy(extra_deps['gpu-flash2'])
111111

112112
extra_deps['peft'] = [
113-
'mosaicml[peft]>=0.31.0,<0.32',
113+
'mosaicml[peft]>=0.32.0,<0.33',
114114
]
115115

116116
extra_deps['openai'] = [

0 commit comments

Comments (0)