neuralmagic · bfineran · Jan 10, 2024 · Nov 28, 2023 · Dec 4, 2023 · Dec 11, 2023
diff --git a/.github/workflows/test-check.yaml b/.github/workflows/test-check.yaml
@@ -18,6 +18,7 @@ jobs:
       deepsparse: ${{ steps.deepsparse-check.outputs.output }}
       onnx: ${{ steps.onnx-check.outputs.output }}
       pytorch: ${{ steps.pytorch-check.outputs.output }}
+      export: ${{ steps.export-check.outputs.output }}
     steps:
       - uses: actions/checkout@v2
         with:
@@ -53,6 +54,12 @@ jobs:
           ((git diff --name-only origin/main HEAD | grep -E "[src|tests]/sparseml/pytorch|setup.py|.github")
           || (echo $GITHUB_REF | grep -E "refs/heads/[release/|main]"))
           && echo "::set-output name=output::1" || echo "::set-output name=output::0"
+      - name: "Checking if sparseml.export was changed"
+        id: export-check  # output=1 if export src/tests, setup.py or .github changed, or on main/release/*
+        run: >
+          ((git diff --name-only origin/main HEAD | grep -E "(src|tests)/sparseml/export|setup\.py|\.github")
+          || (echo $GITHUB_REF | grep -E "refs/heads/(release/|main$)"))
+          && echo "::set-output name=output::1" || echo "::set-output name=output::0"
   base-tests:
     runs-on: ubuntu-22.04
     env:
@@ -221,3 +228,28 @@ jobs:
         run: pip3 install .[dev,torch,transformers]
       - name: "🔬 Running transformers tests"
         run: make test TARGETS=transformers
+  export-tests:  # runs `make test TARGETS=export` when the export check fired
+    runs-on: ubuntu-22.04
+    env:
+      SPARSEZOO_TEST_MODE: "true"
+    needs: test-setup  # consumes the test-setup job outputs referenced below
+    if: ${{needs.test-setup.outputs.export == 1}}  # skip unless the export check output is 1
+    steps:
+      - uses: actions/setup-python@v4
+        with:
+          python-version: '3.11'  # quoted so the version stays a string
+      - uses: actions/checkout@v2  # this repository
+      - uses: actions/checkout@v2  # second checkout: sparsezoo sources into ./sparsezoo
+        with:
+          repository: "neuralmagic/sparsezoo"
+          path: "sparsezoo"
+          ref: ${{needs.test-setup.outputs.branch}}
+      - name: "⚙️ Install sparsezoo dependencies"
+        run: pip3 install -U pip && pip3 install setuptools sparsezoo/
+      - name: "Clean sparsezoo directory"  # remove the checkout after it has been pip-installed
+        run: rm -r sparsezoo/
+      - name: "⚙️ Install dependencies"
+        run: pip3 install .[dev,torch,transformers,torchvision]
+      - name: "🔬 Running export tests"
+        run: make test TARGETS=export
+
diff --git a/Makefile b/Makefile
@@ -9,7 +9,7 @@ MDCHECKFILES := CODE_OF_CONDUCT.md CONTRIBUTING.md DEVELOPING.md README.md
 SPARSEZOO_TEST_MODE := "true"
 
 BUILD_ARGS :=  # set nightly to build nightly release
-TARGETS := ""  # targets for running pytests: deepsparse,keras,onnx,pytorch,pytorch_models,pytorch_datasets,tensorflow_v1,tensorflow_v1_models,tensorflow_v1_datasets
+TARGETS := ""  # targets for running pytests: deepsparse,keras,onnx,pytorch,pytorch_models,export,pytorch_datasets,tensorflow_v1,tensorflow_v1_models,tensorflow_v1_datasets,transformers
 PYTEST_ARGS ?= ""
 PYTEST_INTEG_ARGS ?= ""
 ifneq ($(findstring deepsparse,$(TARGETS)),deepsparse)
@@ -18,6 +18,9 @@ endif
 ifneq ($(findstring transformers,$(TARGETS)),transformers)
     PYTEST_ARGS := $(PYTEST_ARGS) --ignore tests/sparseml/transformers
 endif
+ifneq ($(findstring export,$(TARGETS)),export)  # "export" not in TARGETS: skip the export tests
+    PYTEST_ARGS := $(PYTEST_ARGS) --ignore tests/sparseml/export
+endif
 ifneq ($(findstring keras,$(TARGETS)),keras)
     PYTEST_ARGS := $(PYTEST_ARGS) --ignore tests/sparseml/keras
 endif

diff --git a/src/sparseml/pytorch/image_classification/utils/helpers.py b/src/sparseml/pytorch/image_classification/utils/helpers.py
@@ -673,11 +673,18 @@ def is_image_classification_model(source_path: Union[Path, str]) -> bool:
     else:
         checkpoint_path = source_path
     try:
-        checkpoint = torch.load(checkpoint_path)
+        if torch.cuda.is_available():
+            checkpoint = torch.load(checkpoint_path)
+        else:
+            checkpoint = torch.load(checkpoint_path, map_location=torch.device("cpu"))
+
         arch_key = checkpoint.get("arch_key")
         if arch_key:
             return True
-    except Exception:
+    except Exception as e:
+        _LOGGER.warning(
+            f"Model: {checkpoint_path} not an image classification model: {e}"
+        )
         return False
 
 

diff --git a/src/sparseml/transformers/sparsification/obcq/obcq.py b/src/sparseml/transformers/sparsification/obcq/obcq.py
@@ -25,8 +25,6 @@
 from sparseml.core.framework import Framework
 from sparseml.modifiers.obcq.utils.helpers import ppl_eval_general
 from sparseml.pytorch.model_load.helpers import (
-    RECIPE_FILE_NAME,
-    apply_recipe_structure_to_model,
     fallback_to_cpu,
     parse_dtype,
     save_model_and_recipe,
@@ -36,7 +34,7 @@
     llama_forward,
     opt_forward,
 )
-from sparseml.transformers.utils.sparse_model import SparseAutoModel
+from sparseml.transformers.utils.initializers import initialize_sparse_model
 
 
 __all__ = ["one_shot"]
@@ -90,25 +88,28 @@ def one_shot(
     config = AutoConfig.from_pretrained(model_path)
     model_type = config.model_type.lower()
 
-    model_loader_fn = None
-    forward_fn = None
     if "opt" in model_type:
-        model_loader_fn = SparseAutoModel.text_classification_from_pretrained
         forward_fn = opt_forward
     elif "llama" in model_type or "mistral" in model_type:
-        model_loader_fn = SparseAutoModel.text_classification_from_pretrained
         forward_fn = llama_forward
     else:
         _LOGGER.warning(
             f"A supported model type({SUPPORTED_MODELS}) could not be "
             f"parsed from model_path={model_path}. Defaulting to "
             "SparseAutoModel loading. "
         )
-        model_loader_fn = SparseAutoModel.text_classification_from_pretrained
         forward_fn = llama_forward
+
     torch_dtype = parse_dtype(precision)
-    model = model_loader_fn(
-        model_path, sequence_length=sequence_length, torch_dtype=torch_dtype
+    # create session and initialize a sparse model
+    session_manager.create_session()
+    model = initialize_sparse_model(
+        model_path=model_path,
+        task="text-generation",
+        sequence_length=sequence_length,
+        torch_dtype=torch_dtype,
+        config=config,
+        device=device,
     )
 
     if dataset_name not in SUPPORTED_DATASETS:
@@ -126,16 +127,8 @@ def one_shot(
     calibration_data = dataset.loader
     tokenizer = dataset.tokenizer
 
-    # create session and initialize any structure from input model recipe
-    session_manager.create_session()
-    session = session_manager.active_session()
-    input_recipe_path = os.path.join(model_path, RECIPE_FILE_NAME)
-    if os.path.exists(input_recipe_path):
-        apply_recipe_structure_to_model(
-            model=model, recipe_path=input_recipe_path, model_path=model_path
-        )
-
     # launch one shot
+    session = session_manager.active_session()
     session.apply(
         framework=Framework.pytorch,
         recipe=recipe_file,

diff --git a/src/sparseml/transformers/utils/helpers.py b/src/sparseml/transformers/utils/helpers.py
@@ -26,7 +26,6 @@
 from transformers import AutoConfig, AutoModel
 from transformers.trainer_utils import get_last_checkpoint
 
-import sparseml.core.session as session_manager
 from sparseml.export.helpers import ONNX_MODEL_NAME
 from sparseml.pytorch.model_load.helpers import apply_recipe_structure_to_model
 from sparsezoo import setup_model
@@ -70,18 +69,17 @@ class TaskNames(Enum):
 
 
 def apply_structure_to_transformers(
-    model: AutoModel, model_directory: Union[str, Path], recipe_path: Union[Path, str]
+    model: AutoModel, model_directory: Union[str, Path], recipe: Union[Path, str]
 ) -> None:
     """
     Apply the structure (dictated by the recipe) to the model.
     If no recipe is found, the model is returned as is (a warning is logged).
     :param model: the model to apply the structure to
     :param model_directory: the directory where the model is stored
-    :param recipe_path: a valid path to the recipe to apply
+    :param recipe: a valid path to the recipe to apply or a recipe string
     """
-    session_manager.create_session()
     apply_recipe_structure_to_model(
-        model=model, recipe_path=recipe_path, model_path=model_directory
+        model=model, recipe_path=recipe, model_path=model_directory
     )
 
 

diff --git a/src/sparseml/transformers/utils/initializers.py b/src/sparseml/transformers/utils/initializers.py
@@ -206,20 +206,53 @@ def resolve_recipe_application(
 ) -> Union[str, Path, None]:
     """
     Resolve the recipe to apply to the model.
-    If the recipe is None, will look for a recipe in the model_path
-
     :param recipe: the recipe to apply to the model.
-        If None, will look for a recipe in the model_path
+        It can be one of the following:
+        - None (no recipe will be applied or the
+            default recipe will be applied if exists. Default recipe
+            is assumed to be stored in the model_path and named RECIPE_NAME)
+        - a path to the recipe file
+        - name of the recipe file (e.g. "recipe.yaml")
+            (assumed to be stored in the model_path instead
+            of RECIPE_NAME)
+        - a string containing the recipe
     :param model_path: the path to the model to load
     :return: the resolved recipe
     """
-    default_recipe = os.path.join(model_path, RECIPE_NAME)
-    requested_recipe = None
-    if recipe:
-        requested_recipe = (
-            recipe if os.path.isfile(recipe) else os.path.join(model_path, recipe)
+
+    if recipe is None:
+        # if recipe is None -> still look for recipe.yaml in the model_path
+        recipe = os.path.join(model_path, RECIPE_NAME)
+        if os.path.isfile(recipe):
+            return recipe
+
+    elif os.path.isfile(recipe):
+        # recipe is a path to a recipe file
+        return _resolve_recipe_file(recipe, model_path)
+
+    elif os.path.isfile(os.path.join(model_path, recipe)):
+        # recipe is a name of a recipe file
+        recipe = os.path.join(model_path, recipe)
+        return _resolve_recipe_file(recipe, model_path)
+    elif isinstance(recipe, str):
+        # recipe is a string containing the recipe
+        _LOGGER.debug(
+            "Applying the recipe string directly to the model, without "
+            "checking for a potential existing recipe in the model_path."
         )
+        return recipe
+
+    _LOGGER.info(
+        "No recipe requested and no default recipe "
+        f"found in {model_path}. Skipping recipe application."
+    )
+    return None
 
+
+def _resolve_recipe_file(
+    requested_recipe: Union[str, Path], model_path: Union[str, Path]
+) -> Union[str, Path, None]:
+    default_recipe = os.path.join(model_path, RECIPE_NAME)
     default_recipe_exists = os.path.isfile(default_recipe)
     default_and_request_recipes_identical = default_recipe == requested_recipe
 
@@ -253,15 +286,9 @@ def resolve_recipe_application(
         return requested_recipe
 
     elif default_recipe_exists:
-        _LOGGER.info(f"Applying the default recip: {default_recipe}")
+        _LOGGER.info(f"Applying the default recipe: {default_recipe}")
         return default_recipe
 
-    _LOGGER.info(
-        "No recipe requested and no default recipe "
-        f"found in {model_path}. Skipping recipe application."
-    )
-    return None
-
 
 def _parse_data_args(data_args):
     try:

diff --git a/src/sparseml/transformers/utils/load_task_model.py b/src/sparseml/transformers/utils/load_task_model.py
@@ -65,16 +65,19 @@ def load_task_model(
         )
 
     if task in TaskNames.text_generation.value:
+        torch_dtype = kwargs.get("torch_dtype")
         sequence_length = kwargs.get("sequence_length")
         if sequence_length is None:
             sequence_length = resolve_sequence_length(config)
+
         return SparseAutoModel.text_generation_from_pretrained(
             model_name_or_path=model_path,
             sequence_length=sequence_length,
             config=config,
             model_type="model",
             recipe=recipe,
             trust_remote_code=trust_remote_code,
+            torch_dtype=torch_dtype,
         )
 
     raise ValueError(f"unrecognized task given of {task}")
diff --git a/src/sparseml/transformers/utils/sparse_model.py b/src/sparseml/transformers/utils/sparse_model.py
@@ -181,7 +181,7 @@ def question_answering_from_pretrained_distil(
     @staticmethod
     def text_classification_from_pretrained(
         model_name_or_path: str,
-        model_type: str,
+        model_type: str = "model",
         **kwargs,
     ) -> Module:
         """
@@ -243,9 +243,9 @@ def text_classification_from_pretrained_distil(
     @staticmethod
     def text_generation_from_pretrained(
         model_name_or_path: str,
-        model_type: str,
         sequence_length: int,
         config: AutoConfig,
+        model_type: str = "model",
         recipe: Optional[Union[str, Path]] = None,
         trust_remote_code: bool = False,
         torch_dtype: Union[str, torch.dtype] = "auto",

diff --git a/...tion/test_integration_helper_functions.py → tests/sparseml/pytorch/conftest.py b/...tion/test_integration_helper_functions.py → tests/sparseml/pytorch/conftest.py
@@ -11,15 +11,16 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-from src.sparseml.integration_helper_functions import (
-    IntegrationHelperFunctions,
-    Integrations,
-)
+import pytest
 
 
-def test_integration_helper_functions():
+def _test_image_classification_integration_helper_functions():
     # import needed to register the object on the fly
     import sparseml.pytorch.image_classification.integration_helper_functions  # noqa F401
+    from src.sparseml.integration_helper_functions import (
+        IntegrationHelperFunctions,
+        Integrations,
+    )
 
     image_classification = IntegrationHelperFunctions.load_from_registry(
         Integrations.image_classification.value
@@ -31,3 +32,11 @@ def test_integration_helper_functions():
     assert image_classification.create_data_samples
     assert image_classification.deployment_directory_files_mandatory == ["model.onnx"]
     assert image_classification.deployment_directory_files_optional is None
+
+
+@pytest.fixture(scope="session", autouse=True)
+def setup_and_teardown():
+    # setup: nothing to prepare; autouse + session scope wraps the whole test session
+    yield
+    # teardown: after the session's tests, run the integration helper registry check
+    _test_image_classification_integration_helper_functions()
diff --git a/tests/sparseml/pytorch/image_classification/utils/test_helpers.py b/tests/sparseml/pytorch/image_classification/utils/test_helpers.py
@@ -51,7 +51,8 @@ def test_save_zoo_directory(stub, tmp_path_factory):
     "stub, is_image_classification",
     [("zoo:efficientnet_v2-s-imagenet-base_quantized", True)],
 )
-def test_is_image_classification_model(stub, is_image_classification):
-    path_to_model = Model(stub).training.path
+def test_is_image_classification_model(tmp_path, stub, is_image_classification):
+    path_to_model = Model(stub, tmp_path).training.path
     assert is_image_classification_model(path_to_model)
     assert is_image_classification_model(Path(path_to_model))
+    shutil.rmtree(tmp_path)
diff --git a/tests/sparseml/transformers/obcq/test_obcq.py b/tests/sparseml/transformers/obcq/test_obcq.py
@@ -25,7 +25,10 @@
 from sparseml.transformers.data import TransformersDataset
 from sparseml.transformers.sparsification.obcq.obcq import one_shot
 from sparseml.transformers.sparsification.obcq.utils.helpers import llama_forward
-from sparseml.transformers.utils.sparse_model import SparseAutoModel
+from sparseml.transformers.utils.initializers import (
+    initialize_config,
+    initialize_sparse_model,
+)
 
 
 @pytest.mark.parametrize(
@@ -75,7 +78,13 @@ def test_lm_head_target():
     if not torch.cuda.is_available():
         device = "cpu"
 
-    model = SparseAutoModel.text_classification_from_pretrained(tiny_model_path)
+    config = initialize_config(model_path=tiny_model_path)
+    model = initialize_sparse_model(
+        model_path=tiny_model_path,
+        device=device,
+        task="text-generation",
+        config=config,
+    )
 
     kwargs = {
         "sparsity": 0.5,