From 9496f2f5ebb7cd8c88fbcfd2efd31bbb48d9bef3 Mon Sep 17 00:00:00 2001
From: Yu Chin Fabian Lim
Date: Sun, 30 Jun 2024 15:46:07 +0000
Subject: [PATCH 1/3] revert some changes in #219

Signed-off-by: Yu Chin Fabian Lim
---
 README.md                                                 | 4 ++--
 pyproject.toml                                            | 2 ++
 .../acceleration_configs/acceleration_framework_config.py | 8 ++++----
 3 files changed, 8 insertions(+), 6 deletions(-)

diff --git a/README.md b/README.md
index 7a6bbd7d..43fa9c21 100644
--- a/README.md
+++ b/README.md
@@ -25,7 +25,7 @@ pip install fms-hf-tuning[aim]
 If you wish to use [fms-acceleration](https://github.com/foundation-model-stack/fms-acceleration), you need to install it.
 
 ```
-pip install git+https://github.com/foundation-model-stack/fms-acceleration.git#subdirectory=plugins/framework
+pip install fms-hf-tuning[fms-accel]
 ```
 
 `fms-acceleration` is a collection of plugins that accelerate fine-tuning / training of large models, as part of the `fms-hf-tuning` suite. For more details, see [this section below](#fms-acceleration).
@@ -389,7 +389,7 @@ Equally you can pass in a JSON configuration for running tuning. See [build doc]
 To access `fms-acceleration` features, the `[fms-accel]` dependency must first be installed:
 
 ```
-  $ pip install https://github.com/foundation-model-stack/fms-acceleration.git#subdirectory=plugins/framework
+  $ pip install fms-hf-tuning[fms-accel]
 ```
 
 Furthermore, the required `fms-acceleration` plugin must be installed. This is done via the command line utility `fms_acceleration.cli`. To show available plugins:
diff --git a/pyproject.toml b/pyproject.toml
index 1a8c7ba7..a869fc9f 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -44,6 +44,8 @@ dependencies = [
 dev = ["wheel>=0.42.0,<1.0", "packaging>=23.2,<24", "ninja>=1.11.1.1,<2.0", "scikit-learn>=1.0, <2.0", "boto3>=1.34, <2.0"]
 flash-attn = ["flash-attn>=2.5.3,<3.0"]
 aim = ["aim>=3.19.0,<4.0"]
+fms-accel = ["fms-acceleration>=0.1"]
+
 
 [tool.setuptools.packages.find]
 exclude = ["tests", "tests.*"]
diff --git a/tuning/config/acceleration_configs/acceleration_framework_config.py b/tuning/config/acceleration_configs/acceleration_framework_config.py
index 2d666a0b..c93ea9e5 100644
--- a/tuning/config/acceleration_configs/acceleration_framework_config.py
+++ b/tuning/config/acceleration_configs/acceleration_framework_config.py
@@ -178,10 +178,10 @@ def get_framework(self):
         else:
             if not self.is_empty():
                 raise ValueError(
-                    "No acceleration framework package found. To use, first ensure that "
-                    "'pip install git+https://github.com/foundation-model-stack/fms-acceleration.git#subdirectory=plugins/framework' "  # pylint: disable=line-too-long
-                    "is done first to obtain the acceleration framework dependency. Additional "
-                    "acceleration plugins make be required depending on the requested "
+                    "No acceleration framework package found. To use, first "
+                    "ensure that 'pip install fms-hf-tuning[fms-accel]' is done to "
+                    "obtain the acceleration framework dependency. Additional "
+                    "acceleration plugins may be required depending on the requested "
                     "acceleration. See README.md for instructions."
                 )

From c859361995442b7f1e3cd6a7bb4aedd70412dae9 Mon Sep 17 00:00:00 2001
From: Yu Chin Fabian Lim
Date: Sun, 30 Jun 2024 15:51:24 +0000
Subject: [PATCH 2/3] minor fixes

Signed-off-by: Yu Chin Fabian Lim
---
 .../acceleration_framework_config.py | 19 ++++++++++---------
 .../fused_ops_and_kernels.py         | 18 +-----------------
 .../quantized_lora_config.py         | 12 +-----------
 3 files changed, 12 insertions(+), 37 deletions(-)

diff --git a/tuning/config/acceleration_configs/acceleration_framework_config.py b/tuning/config/acceleration_configs/acceleration_framework_config.py
index c93ea9e5..7dc5737b 100644
--- a/tuning/config/acceleration_configs/acceleration_framework_config.py
+++ b/tuning/config/acceleration_configs/acceleration_framework_config.py
@@ -162,6 +162,8 @@ def from_dataclasses(*dataclasses: Type):
         return config
 
     def get_framework(self):
+        if self.is_empty():
+            return
 
         if is_fms_accelerate_available():
 
@@ -176,14 +178,13 @@ def get_framework(self):
                 self.to_yaml(f.name)
                 return AccelerationFramework(f.name)
         else:
-            if not self.is_empty():
-                raise ValueError(
-                    "No acceleration framework package found. To use, first "
-                    "ensure that 'pip install fms-hf-tuning[fms-accel]' is done to "
-                    "obtain the acceleration framework dependency. Additional "
-                    "acceleration plugins may be required depending on the requested "
-                    "acceleration. See README.md for instructions."
-                )
+            raise ValueError(
+                "No acceleration framework package found. To use, first "
+                "ensure that 'pip install fms-hf-tuning[fms-accel]' is done to "
+                "obtain the acceleration framework dependency. Additional "
+                "acceleration plugins may be required depending on the requested "
+                "acceleration. See README.md for instructions."
+            )
 
     def is_empty(self):
         "check if the configuration is empty"
@@ -244,7 +245,7 @@ def _descend_and_set(path: List[str], d: Dict):
                 "to be installed. Please do:\n"
                 + "\n".join(
                     [
-                        "- python -m fms_acceleration install "
+                        "- python -m fms_acceleration.cli install "
                         f"{AccelerationFrameworkConfig.PACKAGE_PREFIX + x}"
                         for x in annotate.required_packages
                     ]
diff --git a/tuning/config/acceleration_configs/fused_ops_and_kernels.py b/tuning/config/acceleration_configs/fused_ops_and_kernels.py
index 91df8c9d..ded51415 100644
--- a/tuning/config/acceleration_configs/fused_ops_and_kernels.py
+++ b/tuning/config/acceleration_configs/fused_ops_and_kernels.py
@@ -18,20 +18,13 @@
 from typing import List
 
 # Local
-from .utils import (
-    EnsureTypes,
-    ensure_nested_dataclasses_initialized,
-    parsable_dataclass,
-)
+from .utils import ensure_nested_dataclasses_initialized, parsable_dataclass
 
 
 @parsable_dataclass
 @dataclass
 class FusedLoraConfig(List):
 
-    # to help the HfArgumentParser arrive at correct types
-    __args__ = [EnsureTypes(str, bool)]
-
     # load unsloth optimizations for these 4bit base layer weights.
     # currently only support "auto_gptq" and "bitsandbytes"
     base_layer: str = None
 
@@ -41,9 +34,6 @@ class FusedLoraConfig(List):
 
     def __post_init__(self):
 
-        # reset for another parse
-        self.__args__[0].reset()
-
         if self.base_layer is not None and self.base_layer not in {
             "auto_gptq",
             "bitsandbytes",
@@ -60,9 +50,6 @@
 @dataclass
 class FastKernelsConfig(List):
 
-    # to help the HfArgumentParser arrive at correct types
-    __args__ = [EnsureTypes(bool, bool, bool)]
-
     # fast loss triton kernels
     fast_loss: bool = False
 
@@ -74,9 +61,6 @@ class FastKernelsConfig(List):
 
     def __post_init__(self):
 
-        # reset for another parse
-        self.__args__[0].reset()
-
         if not self.fast_loss == self.fast_rsm_layernorm == self.fast_rope_embeddings:
             raise ValueError(
                 "fast_loss, fast_rms_layernorm and fast_rope_embedding must be enabled "
diff --git a/tuning/config/acceleration_configs/quantized_lora_config.py b/tuning/config/acceleration_configs/quantized_lora_config.py
index d8174438..a55ac55d 100644
--- a/tuning/config/acceleration_configs/quantized_lora_config.py
+++ b/tuning/config/acceleration_configs/quantized_lora_config.py
@@ -18,11 +18,7 @@
 from typing import List
 
 # Local
-from .utils import (
-    EnsureTypes,
-    ensure_nested_dataclasses_initialized,
-    parsable_dataclass,
-)
+from .utils import ensure_nested_dataclasses_initialized, parsable_dataclass
 
 
 @parsable_dataclass
@@ -49,9 +45,6 @@ def __post_init__(self):
 @dataclass
 class BNBQLoraConfig(List):
 
-    # to help the HfArgumentParser arrive at correct types
-    __args__ = [EnsureTypes(str, bool)]
-
     # type of quantization applied
     quant_type: str = "nf4"
 
@@ -61,9 +54,6 @@ class BNBQLoraConfig(List):
 
     def __post_init__(self):
 
-        # reset for another parse
-        self.__args__[0].reset()
-
         if self.quant_type not in ["nf4", "fp4"]:
             raise ValueError("quant_type can only be either 'nf4' or 'fp4'.")
 

From 3ef14a20bec4944ce11c381647cae0d493b8af20 Mon Sep 17 00:00:00 2001
From: Yu Chin Fabian Lim
Date: Tue, 9 Jul 2024 02:57:55 +0000
Subject: [PATCH 3/3] fix the is_empty logic

Signed-off-by: Yu Chin Fabian Lim
---
 .../acceleration_framework_config.py | 36 ++++++++++++-------
 1 file changed, 24 insertions(+), 12 deletions(-)

diff --git a/tuning/config/acceleration_configs/acceleration_framework_config.py b/tuning/config/acceleration_configs/acceleration_framework_config.py
index 7dc5737b..ed0f54d1 100644
--- a/tuning/config/acceleration_configs/acceleration_framework_config.py
+++ b/tuning/config/acceleration_configs/acceleration_framework_config.py
@@ -162,8 +162,6 @@ def from_dataclasses(*dataclasses: Type):
         return config
 
     def get_framework(self):
-        if self.is_empty():
-            return
 
         if is_fms_accelerate_available():
 
@@ -174,17 +172,31 @@ def get_framework(self):
                 NamedTemporaryFile,
             )
 
-            with NamedTemporaryFile("w") as f:
-                self.to_yaml(f.name)
-                return AccelerationFramework(f.name)
+            try:
+                with NamedTemporaryFile("w") as f:
+                    self.to_yaml(f.name)
+                    return AccelerationFramework(f.name)
+            except ValueError as e:
+                (msg,) = e.args
+
+                # AccelerationFramework raises ValueError if it
+                # fails to configure any plugin
+                if self.is_empty() and msg.startswith("No plugins could be configured"):
+                    # when the error was raised while the
+                    # acceleration framework config was empty,
+                    # this is expected, so do not re-raise
+                    return None
+
+                raise e
         else:
-            raise ValueError(
-                "No acceleration framework package found. To use, first "
-                "ensure that 'pip install fms-hf-tuning[fms-accel]' is done to "
-                "obtain the acceleration framework dependency. Additional "
-                "acceleration plugins may be required depending on the requested "
-                "acceleration. See README.md for instructions."
-            )
+            if not self.is_empty():
+                raise ValueError(
+                    "No acceleration framework package found. To use, first "
+                    "ensure that 'pip install fms-hf-tuning[fms-accel]' is done to "
+                    "obtain the acceleration framework dependency. Additional "
+                    "acceleration plugins may be required depending on the requested "
+                    "acceleration. See README.md for instructions."
+                )
 
     def is_empty(self):
         "check if the configuration is empty"