diff --git a/integrations/torchvision/modifiers_refactor_example/e2e_test.py b/integrations/torchvision/modifiers_refactor_example/e2e_test.py
index 27fd697b50c..0cf7fd1b95a 100644
--- a/integrations/torchvision/modifiers_refactor_example/e2e_test.py
+++ b/integrations/torchvision/modifiers_refactor_example/e2e_test.py
@@ -24,7 +24,7 @@ def main():
     from torch.utils.data import DataLoader
     from torchvision import transforms
 
-    import sparseml.core.session as sml
+    import sparseml.core.session as session_manager
     from sparseml.core.event import EventType
     from sparseml.core.framework import Framework
     from sparseml.pytorch.utils import (
@@ -40,8 +40,8 @@ def main():
     device = "cuda:0"
 
     # set up SparseML session
-    sml.create_session()
-    session = sml.active_session()
+    session_manager.create_session()
+    session = session_manager.active_session()
 
     # download model
     model = torchvision.models.mobilenet_v2(
diff --git a/setup.py b/setup.py
index cae8c87358c..047ae7f0faa 100644
--- a/setup.py
+++ b/setup.py
@@ -187,8 +187,11 @@ def _setup_entry_points() -> Dict:
         ]
     )
 
-    entry_points["console_scripts"].append(
-        "sparseml.transformers.export_onnx=sparseml.transformers.export:main"
+    entry_points["console_scripts"].extend(
+        [
+            "sparseml.transformers.export_onnx=sparseml.transformers.export:main",
+            "sparseml.transformers.export_onnx_refactor=sparseml.transformers.sparsification.obcq.export:main",  # noqa: E501
+        ]
     )
 
     # image classification integration
diff --git a/src/sparseml/modifiers/quantization/base.py b/src/sparseml/modifiers/quantization/base.py
index 88f973beccc..e66f5b9ea72 100644
--- a/src/sparseml/modifiers/quantization/base.py
+++ b/src/sparseml/modifiers/quantization/base.py
@@ -14,7 +14,7 @@
 
 from typing import Any, Dict, List, Optional
 
-from sparseml.core import Event, Modifier, State
+from sparseml.core import Event, Modifier
 
 
 __all__ = ["QuantizationModifier"]
@@ -136,6 +136,3 @@ def check_should_disable_observer(self, event: Event) -> bool:
             if event.current_index >= disable_epoch:
                 return True
         return False
-
-    def on_initialize_structure(self, state: State, **kwargs):
-        pass  # nothing needed for this modifier
diff --git a/src/sparseml/modifiers/quantization/pytorch.py b/src/sparseml/modifiers/quantization/pytorch.py
index 8a77bcb2eea..dfa352e1378 100644
--- a/src/sparseml/modifiers/quantization/pytorch.py
+++ b/src/sparseml/modifiers/quantization/pytorch.py
@@ -71,6 +71,11 @@ def __init__(self, **kwargs):
             self.scheme_overrides, self.scheme
         )
 
+    def on_initialize_structure(self, state: State, **kwargs):
+        module = state.model.model
+        self._enable_module_qat(module)
+        state.model.model.apply(torch.quantization.disable_observer)
+
     def on_initialize(self, state: State, **kwargs) -> bool:
         raise_if_torch_quantization_not_available()
         if self.end and self.end != -1:
@@ -84,6 +89,7 @@ def on_initialize(self, state: State, **kwargs) -> bool:
 
         if self.calculate_start() == -1:  # one-shot
             self._enable_module_qat(module)
+            self._calibrate_if_possible(module)
             self._disable_quantization_observer(module)
             return True
 
@@ -122,30 +128,31 @@ def _disable_quantization_observer(self, model: Module):
         self.quantization_observer_disabled_ = True
 
     def _enable_module_qat(self, module: Module):
-        # fuse conv-bn-relu blocks prior to quantization emulation
-        self._fuse(module)
-
-        # add quantization_schemes to target submodules
-        set_quantization_schemes(
-            module,
-            scheme=self.scheme,
-            scheme_overrides=self.scheme_overrides,
-            ignore=self.ignore,
-            strict=self.strict,
-        )
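+        # on_initialize_structure (above) disables observers after setting up
+        # QAT, so re-enable them here before any calibration runs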
+        module.apply(torch.quantization.enable_observer)
 
-        # fix for freezing batchnorm statistics when not fusing BN with convs.
-        # pytorch only supports freezing batchnorm statistics for fused modules.
-        # this fix wraps BN modules adding with a new module class that supports
-        # methods related to freezing/unfreezing BN statistics.
-        configure_module_bn_wrappers(module)
+        if not self.qat_enabled_:
+            # fuse conv-bn-relu blocks prior to quantization emulation
+            self._fuse(module)
+
+            # add quantization_schemes to target submodules
+            set_quantization_schemes(
+                module,
+                scheme=self.scheme,
+                scheme_overrides=self.scheme_overrides,
+                ignore=self.ignore,
+                strict=self.strict,
+            )
 
-        # convert target qconfig layers to QAT modules with FakeQuantize
-        convert_module_qat_from_schemes(module)
+            # fix for freezing batchnorm statistics when not fusing BN with convs.
+            # pytorch only supports freezing batchnorm statistics for fused modules.
+            # this fix wraps BN modules adding with a new module class that supports
+            # methods related to freezing/unfreezing BN statistics.
+            configure_module_bn_wrappers(module)
 
-        self.qat_enabled_ = True
+            # convert target qconfig layers to QAT modules with FakeQuantize
+            convert_module_qat_from_schemes(module)
 
-        self._calibrate_if_possible(module)
+            self.qat_enabled_ = True
 
     def _fuse(self, module: Module):
         if self.model_fuse_fn_name in [None, "conv_bn_relus"]:
diff --git a/src/sparseml/transformers/sparsification/obcq/export.py b/src/sparseml/transformers/sparsification/obcq/export.py
new file mode 100644
index 00000000000..ad29b3c5056
--- /dev/null
+++ b/src/sparseml/transformers/sparsification/obcq/export.py
@@ -0,0 +1,634 @@
+# Copyright (c) 2021 - present / Neuralmagic, Inc. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""
+Helper functions and script for exporting inference artifacts
+to be used by inference engines such as DeepSparse.
+The export incorporates:
+- creating the deployment directory (the direct input to the DeepSparse
+  inference pipeline)
+- creating an ONNX file representing a trained transformers model
+
+script accessible from sparseml.transformers.export_onnx_refactor
+
+command help:
+usage: sparseml.transformers.export_onnx_refactor [-h] --task TASK --model_path
+                                        MODEL_PATH
+                                        [--sequence_length SEQUENCE_LENGTH]
+                                        [--no_convert_qat]
+                                        [--onnx_file_name ONNX_FILE_NAME]
+                                        [--num_export_samples NUM_EXPORT_SAMPLES]
+                                        [--data_args DATA_ARGS]
+
+Export a trained transformers model to an ONNX file
+
+optional arguments:
+  -h, --help            show this help message and exit
+  --task TASK           Task to create the model for. i.e. mlm, qa, glue, ner
+  --model_path MODEL_PATH
+                        Path to directory where model files for weights,
+                        config, and tokenizer are stored
+  --sequence_length SEQUENCE_LENGTH
+                        Sequence length to use. Default is 384. Can be
+                        overwritten later
+  --no_convert_qat      Set flag to not perform QAT to fully quantized
+                        conversion after export
+  --onnx_file_name ONNX_FILE_NAME
+                        Name for exported ONNX file in the model directory.
+                        Default and recommended value for pipeline
+                        compatibility is model.onnx
+  --num_export_samples NUM_EXPORT_SAMPLES
+                        Number of samples (inputs/outputs) to export
+  --data_args DATA_ARGS
+                        Valid json loadable args used to instantiate a
+                        `DataTrainingArguments` instance while exporting
+                        samples
+
+example usage:
+sparseml.transformers.export_onnx_refactor \
+    --task text_generation \
+    --model_path /PATH/TO/SPARSIFIED/MODEL/DIRECTORY \
+    --sequence_length 128
+"""
+
+import argparse
+import collections
+import copy
+import inspect
+import logging
+import os
+import shutil
+from typing import Any, Dict, List, Optional, Union
+
+import torch
+from torch.nn import Module
+from transformers import AutoConfig, AutoTokenizer
+from transformers.tokenization_utils_base import PaddingStrategy
+
+import sparseml.core.session as session_manager
+from sparseml.core.framework import Framework
+from sparseml.optim import parse_recipe_variables
+from sparseml.pytorch.sparsification.quantization.helpers import (
+    initialize_channel_wise_scale_zp,
+)
+from sparseml.pytorch.utils import export_onnx
+from sparseml.transformers.utils import SparseAutoModel
+from sparseml.transformers.utils.helpers import RECIPE_NAME
+from sparsezoo.utils.onnx import EXTERNAL_ONNX_DATA_NAME
+
+
+__all__ = ["export_transformer_to_onnx", "load_task_model"]
+
+MODEL_ONNX_NAME = "model.onnx"
+MANDATORY_DEPLOYMENT_FILES = [
+    MODEL_ONNX_NAME,
+    "tokenizer_config.json",
+    "config.json",
+]
+OPT_TOKENIZER_FILES = ["special_tokens_map.json", "vocab.json", "merges.txt"]
+
+OPTIONAL_DEPLOYMENT_FILES: List[str] = ["tokenizer.json"]
+OPTIONAL_DEPLOYMENT_FILES.append(EXTERNAL_ONNX_DATA_NAME)
+OPTIONAL_DEPLOYMENT_FILES.extend(OPT_TOKENIZER_FILES)
+
+
+_LOGGER = logging.getLogger(__name__)
+
+
+def _reload_model_state(model, load_path: str, orig_state_dict: Dict[str, Any]):
+    """
+    Reload the weights after model arch changes due to recipe application.
+    Return True if weights are successfully reloaded; False otherwise.
+    """
+    invalid_load_path = not load_path or not os.path.isdir(load_path)
+    files = os.listdir(load_path) if not invalid_load_path else []
+    weight_files = [
+        os.path.join(load_path, f)
+        for f in files
+        if f.startswith("pytorch_model") and f.endswith("bin")
+    ]
+    if not weight_files:
+        _LOGGER.warning(
+            "Model state was not reloaded for SparseML: "
+            f"could not find model weights for {load_path}"
+        )
+        return False
+
+    # PerChannel quantization observers initialize variables
+    # to dummy shapes that do not match the ones saved in
+    # state_dict.
+    # Need to reshape these variables in order to load state_dict
+    # properly.
+    initialize_channel_wise_scale_zp(model)
+
+    current_state_dict = model.state_dict()
+
+    if set(orig_state_dict.keys()) == set(current_state_dict):
+        # no change in keys, ignore reload
+        return False
+
+    # change in keys due to architecture changes, reload statedict
+    loaded_state_dict = {}
+    for f in weight_files:
+        dd = torch.load(os.path.join(load_path, f), map_location="cpu")
+        loaded_state_dict.update(dd)
+
+    _, missing, unexpected, mismatched, _, _ = model._load_pretrained_model(
+        model=model,
+        state_dict=loaded_state_dict,
+        loaded_keys=list(loaded_state_dict.keys()),
+        resolved_archive_file=None,
+        pretrained_model_name_or_path=load_path,
+        _fast_init=False,
+    )
+
+    if missing:
+        _LOGGER.warning(
+            "Missing keys found when reloading model state for SparseML recipe: "
+            f"{missing}"
+        )
+
+    if unexpected:
+        _LOGGER.warning(
+            "Unexpected keys found when reloading model state for SparseML recipe: "
+            f"{unexpected}"
+        )
+
+    if mismatched:
+        _LOGGER.warning(
+            "Mismatched keys found when reloading model state for SparseML recipe: "
+            f"{mismatched}"
+        )
+
+    total_loaded = len(current_state_dict) - len(missing)
+    _LOGGER.info(
+        f"Reloaded {total_loaded} model params for SparseML Recipe from {load_path}"
+    )
+    SparseAutoModel.log_model_load(
+        model,
+        load_path,
+        model_type="student",
+        delayed_load=False,
+    )
+    return True
+
+
+def load_task_model(
+    task: str, model_path: str, config: Any, trust_remote_code: bool = False
+) -> Module:
+    if task == "masked-language-modeling" or task == "mlm":
+        return SparseAutoModel.masked_language_modeling_from_pretrained(
+            model_name_or_path=model_path,
+            config=config,
+            model_type="model",
+            trust_remote_code=trust_remote_code,
+        )
+
+    if task == "question-answering" or task == "qa":
+        return SparseAutoModel.question_answering_from_pretrained(
+            model_name_or_path=model_path,
+            config=config,
+            model_type="model",
+            trust_remote_code=trust_remote_code,
+        )
+
+    if (
+        task == "sequence-classification"
+        or task == "glue"
+        or task == "sentiment-analysis"
+        or task == "text-classification"
+    ):
+        return SparseAutoModel.text_classification_from_pretrained(
+            model_name_or_path=model_path,
+            config=config,
+            model_type="model",
+            trust_remote_code=trust_remote_code,
+        )
+
+    if task == "token-classification" or task == "ner":
+        return SparseAutoModel.token_classification_from_pretrained(
+            model_name_or_path=model_path,
+            config=config,
+            model_type="model",
+            trust_remote_code=trust_remote_code,
+        )
+
+    if task == "text-generation":
+        return SparseAutoModel.text_generation_from_pretrained(
+            model_name_or_path=model_path,
+            config=config,
+            model_type="model",
+            trust_remote_code=trust_remote_code,
+        )
+
+    raise ValueError(f"unrecognized task given: {task}")
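+
+
+# minimal usage sketch for load_task_model (the path below is hypothetical);
+# it mirrors the call made by export_transformer_to_onnx further down:
+#
+#   config = AutoConfig.from_pretrained("/path/to/model")
+#   model = load_task_model("text-generation", "/path/to/model", config)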
+
+
+def load_task_dataset(
+    task: str, tokenizer, data_args: Dict[str, Any], model: Module, config=None
+):
+    """
+    :param task: the task the dataset is being loaded for
+    :param tokenizer: the tokenizer to use for the dataset
+    :param data_args: additional data args used to create a `DataTrainingArguments`
+        instance for fetching the dataset
+    :param model: the model the dataset is being loaded for
+    :param config: optional model config, used by some tasks to help load the dataset
+    """
+
+    if task == "masked-language-modeling" or task == "mlm":
+        from sparseml.transformers.masked_language_modeling import (
+            DataTrainingArguments,
+            get_tokenized_mlm_dataset,
+        )
+
+        data_training_args = DataTrainingArguments(**data_args)
+        return get_tokenized_mlm_dataset(
+            data_args=data_training_args, tokenizer=tokenizer
+        )
+
+    if task == "question-answering" or task == "qa":
+        from sparseml.transformers.question_answering import (
+            DataTrainingArguments,
+            get_tokenized_qa_dataset,
+        )
+
+        data_training_args = DataTrainingArguments(**data_args)
+        return get_tokenized_qa_dataset(
+            data_args=data_training_args, tokenizer=tokenizer
+        )
+
+    if task == "token-classification" or task == "ner":
+        from sparseml.transformers.token_classification import (
+            DataTrainingArguments,
+            get_tokenized_token_classification_dataset,
+        )
+
+        data_training_args = DataTrainingArguments(**data_args)
+        return get_tokenized_token_classification_dataset(
+            data_args=data_training_args, tokenizer=tokenizer, model=model or config
+        )
+
+    if (
+        task == "sequence-classification"
+        or task == "glue"
+        or task == "sentiment-analysis"
+        or task == "text-classification"
+    ):
+        from sparseml.transformers.text_classification import (
+            DataTrainingArguments,
+            get_tokenized_text_classification_dataset,
+        )
+
+        data_training_args = DataTrainingArguments(**data_args)
+
+        return get_tokenized_text_classification_dataset(
+            data_args=data_training_args,
+            tokenizer=tokenizer,
+            model=model,
+            config=config,
+        )
+
+    raise ValueError(f"unrecognized task given: {task}")
+
+
+def export_transformer_to_onnx(
+    task: str,
+    model_path: str,
+    sequence_length: int = 384,
+    convert_qat: bool = True,
+    onnx_file_name: str = MODEL_ONNX_NAME,
+    num_export_samples: int = 0,
+    trust_remote_code: bool = False,
+    data_args: Optional[Union[Dict[str, Any], str]] = None,
+) -> str:
+    """
+    Exports the saved transformers file to ONNX at batch size 1 using
+    the given model path weights, config, and tokenizer
+
+    :param task: task to create the model for. i.e. mlm, qa, glue, ner
+    :param model_path: path to directory where model files, tokenizers,
+        and configs are saved. ONNX export will also be written here
+    :param sequence_length: model sequence length to use for export
+    :param convert_qat: set True to convert a QAT model to fully quantized
+        ONNX model. Default is True
+    :param onnx_file_name: name to save the exported ONNX file as. Default
+        is model.onnx. Note that when loading a model directory to a deepsparse
+        pipeline, it will look only for 'model.onnx'
+    :param num_export_samples: number of samples (inputs/outputs) to export
+    :param trust_remote_code: set True to allow custom models in HF-transformers
+    :param data_args: additional args to instantiate a `DataTrainingArguments`
+        instance for exporting samples
+    :return: path to the exported ONNX file
+    """
+    task = task.replace("_", "-").replace(" ", "-")
+
+    if not os.path.exists(model_path) or not os.path.isdir(model_path):
+        raise ValueError(
+            "model_path must be a directory that contains the trained transformer "
+            f"files. {model_path} is not a directory or does not exist"
+        )
+
+    if num_export_samples > 0 and data_args is None:
+        _LOGGER.info(
+            f"--data_args is needed for exporting {num_export_samples} "
+            "real samples but got None, synthetic data samples will be "
+            "generated based on model input/output shapes"
+        )
+    data_args: Dict[str, Any] = _parse_data_args(data_args)
+
+    _LOGGER.info(f"Attempting onnx export for model at {model_path} for task {task}")
+    config_args = {}
+    config = AutoConfig.from_pretrained(
+        model_path,
+        trust_remote_code=trust_remote_code,
+        **config_args,
+    )
+    tokenizer = AutoTokenizer.from_pretrained(
+        model_path, model_max_length=sequence_length
+    )
+    if task == "text-generation":
+        tokenizer.pad_token = tokenizer.eos_token
+
+    model = load_task_model(task, model_path, config, trust_remote_code)
+    _LOGGER.info(f"loaded model, config, and tokenizer from {model_path}")
+
+    model = model.train()
+
+    recipe_path = os.path.join(model_path, RECIPE_NAME)
+    if not os.path.exists(recipe_path):
+        _LOGGER.warning(
+            f"No recipes were applied for {model_path}, "
+            "check to make sure recipe(s) are stored in the model_path"
+        )
+        recipe_path = None
+
+    orig_state_dict = model.state_dict()
+
+    session_manager.create_session()
+    session_manager.pre_initialize_structure(
+        model=model, recipe=recipe_path, framework=Framework.pytorch
+    )
+
+    if recipe_path:
+        session = session_manager.active_session()
+        num_stages = len(session.lifecycle.recipe_container.compiled_recipe.stages)
+        msg = (
+            "an unstaged recipe"
+            if num_stages == 1
+            else f"a staged recipe with {num_stages} stages"
+        )
+        _LOGGER.info(f"Applied {msg} to the model at {model_path}")
+
+    # reload the state dict for the model now that architecture matches expected
+    if _reload_model_state(model, model_path, orig_state_dict):
+        _LOGGER.info(
+            "Reloaded model state after SparseML recipe structure modifications "
+            f"from {model_path}"
+        )
+
+    # create fake model input
+    inputs = tokenizer(
+        "", return_tensors="pt", padding=PaddingStrategy.MAX_LENGTH.value
+    ).data  # Dict[Tensor]
+
+    # Rearrange inputs' keys to match those defined by the model forward func,
+    # which seems to define how the order of inputs is determined in the
+    # exported model
+    forward_args_spec = inspect.getfullargspec(model.__class__.forward)
+    dropped = [
+        input_key
+        for input_key in inputs.keys()
+        if input_key not in forward_args_spec.args
+    ]
+    inputs = collections.OrderedDict(
+        [
+            (func_input_arg_name, inputs[func_input_arg_name][0].reshape(1, -1))
+            for func_input_arg_name in forward_args_spec.args
+            if func_input_arg_name in inputs
+        ]
+    )
+    if dropped:
+        _LOGGER.warning(
+            "The following inputs were not present in the model forward function "
+            f"and therefore dropped from ONNX export: {dropped}"
+        )
+
+    inputs_shapes = {
+        key: (
+            f"{val.dtype if hasattr(val, 'dtype') else 'unknown'}: "
+            f"{list(val.shape) if hasattr(val, 'shape') else 'unknown'}"
+        )
+        for key, val in inputs.items()
+    }
+
+    _LOGGER.info(f"Created sample inputs for the ONNX export process: {inputs_shapes}")
+
+    # run export
+    model = model.eval()
+    onnx_file_path = os.path.join(model_path, onnx_file_name)
+    kwargs = {"input_names": list(inputs.keys())} if task == "text-generation" else {}
+
+    export_onnx(
+        model,
+        inputs,
+        onnx_file_path,
+        convert_qat=convert_qat,
+        **kwargs,
+    )
+    _LOGGER.info(f"ONNX exported to {onnx_file_path}")
+    return onnx_file_path
+
+
+def _parse_data_args(data_args):
+    try:
+        return parse_recipe_variables(data_args)
+    except ValueError as parse_error:
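+        # parse_recipe_variables is shared with recipe parsing, so its error
+        # text refers to recipe args; reword it so users see --data_args instead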
+        message = str(parse_error).replace("recipe_args", "data_args")
+        if "recipe variables" in message:
+            message = message.replace("recipe variables", "data_args")
+        raise ValueError(message)
+
+
+def create_deployment_folder(
+    training_directory: str,
+    onnx_file_name: str = MODEL_ONNX_NAME,
+    deployment_files: Optional[List[str]] = None,
+):
+    """
+    Sets up the deployment directory i.e. copies over the complete set of files
+    that are required to run the transformer model in the inference engine
+
+    :param training_directory: path to directory where model files, tokenizers,
+        and configs are saved. Exported ONNX model is also expected to be there
+    :param onnx_file_name: Name for exported ONNX file in the model directory.
+    :param deployment_files: optional list of deployment file names to override
+        default file names with.
+    :return: path to the valid deployment directory
+    """
+
+    if deployment_files is None:
+        # set deployment files to default values
+        deployment_files = copy.deepcopy(
+            MANDATORY_DEPLOYMENT_FILES + OPTIONAL_DEPLOYMENT_FILES
+        )
+        if onnx_file_name != MODEL_ONNX_NAME:
+            # replace the default onnx model name with the custom one
+            deployment_files[deployment_files.index(MODEL_ONNX_NAME)] = onnx_file_name
+
+    model_root_dir = os.path.dirname(training_directory)
+    deployment_folder_dir = os.path.join(model_root_dir, "deployment")
+    if os.path.isdir(deployment_folder_dir):
+        shutil.rmtree(deployment_folder_dir)
+    os.makedirs(deployment_folder_dir)
+
+    for file_name in deployment_files:
+        expected_file_path = os.path.join(training_directory, file_name)
+        deployment_file_path = os.path.join(deployment_folder_dir, file_name)
+        if not os.path.exists(expected_file_path):
+            if file_name in OPTIONAL_DEPLOYMENT_FILES:
+                _LOGGER.warning(
+                    f"Optional file {file_name} not found in {training_directory}. "
+                    f"Skipping copying to deployment folder."
+                )
+                continue
+            raise ValueError(
+                f"Attempting to copy {file_name} file from {expected_file_path}, "
+                f"but the file does not exist. Make sure that {training_directory} "
+                f"contains the following files: {deployment_files}"
+            )
+        if file_name == MODEL_ONNX_NAME:
+            # moving onnx file from training to deployment directory
+            shutil.move(expected_file_path, deployment_file_path)
+        elif file_name == EXTERNAL_ONNX_DATA_NAME:
+            # moving external onnx tensors from training to deployment directory
+            shutil.move(expected_file_path, deployment_file_path)
+        else:
+            # copying remaining `deployment_files` from training to deployment
+            # directory
+            shutil.copyfile(expected_file_path, deployment_file_path)
+        _LOGGER.info(
+            f"Saved {file_name} in the deployment folder at {deployment_file_path}"
+        )
+    return deployment_folder_dir
+
+
+def _parse_args() -> argparse.Namespace:
+    parser = argparse.ArgumentParser(
+        description="Export a trained transformers model to an ONNX file"
+    )
+
+    parser.add_argument(
+        "--task",
+        type=str,
+        required=True,
+        help="Task to create the model for. i.e. mlm, qa, glue, ner",
+    )
+    parser.add_argument(
+        "--model_path",
+        required=True,
+        type=str,
+        help=(
+            "Path to directory where model files for weights, config, and "
+            "tokenizer are stored"
+        ),
+    )
+    parser.add_argument(
+        "--sequence_length",
+        type=int,
+        default=384,
+        help="Sequence length to use. Default is 384. Can be overwritten later",
+    )
+    parser.add_argument(
+        "--no_convert_qat",
+        action="store_true",
+        help=("Set flag to not perform QAT to fully quantized conversion after export"),
+    )
+    parser.add_argument(
+        "--onnx_file_name",
+        type=str,
+        default=MODEL_ONNX_NAME,
+        help=(
+            "Name for exported ONNX file in the model directory. "
+            "Default and recommended value for pipeline "
+            f"compatibility is {MODEL_ONNX_NAME}"
+        ),
+    )
+    parser.add_argument(
+        "--num_export_samples",
+        type=int,
+        default=0,
+        help="Number of samples (inputs/outputs) to export",
+    )
+    parser.add_argument(
+        "--data_args",
+        type=str,
+        default=None,
+        help="Valid json loadable args used to instantiate a `DataTrainingArguments`"
+        " instance while exporting samples",
+    )
+    parser.add_argument(
+        "--trust_remote_code",
+        action="store_true",
+        help=("Set flag to allow custom models in HF-transformers"),
+    )
+
+    return parser.parse_args()
+
+
+def export(
+    task: str,
+    model_path: str,
+    sequence_length: int,
+    no_convert_qat: bool,
+    onnx_file_name: str,
+    num_export_samples: int = 0,
+    trust_remote_code: bool = False,
+    data_args: Optional[str] = None,
+):
+    if os.path.exists(model_path):
+        # expand to absolute path to support downstream logic
+        model_path = os.path.abspath(model_path)
+    export_transformer_to_onnx(
+        task=task,
+        model_path=model_path,
+        sequence_length=sequence_length,
+        convert_qat=(not no_convert_qat),  # False if flagged
+        onnx_file_name=onnx_file_name,
+        num_export_samples=num_export_samples,
+        trust_remote_code=trust_remote_code,
+        data_args=data_args,
+    )
+
+    deployment_folder_dir = create_deployment_folder(
+        training_directory=model_path, onnx_file_name=onnx_file_name
+    )
+    _LOGGER.info(
+        f"Created deployment folder at {deployment_folder_dir} "
+        f"with files: {os.listdir(deployment_folder_dir)}"
+    )
+
+
+def main():
+    args = _parse_args()
+    export(
+        task=args.task,
+        model_path=args.model_path,
+        sequence_length=args.sequence_length,
+        no_convert_qat=args.no_convert_qat,  # True if flagged
+        onnx_file_name=args.onnx_file_name,
+        num_export_samples=args.num_export_samples,
+        trust_remote_code=args.trust_remote_code,
+        data_args=args.data_args,
+    )
+
+
+if __name__ == "__main__":
+    main()
diff --git a/src/sparseml/transformers/sparsification/obcq/obcq.py b/src/sparseml/transformers/sparsification/obcq/obcq.py
index f7ddf595602..7a60b14a5b8 100644
--- a/src/sparseml/transformers/sparsification/obcq/obcq.py
+++ b/src/sparseml/transformers/sparsification/obcq/obcq.py
@@ -20,7 +20,7 @@
 
 from torch.nn import Module
 
-import sparseml.core.session as sml
+import sparseml.core.session as session_manager
 from sparseml.core.framework import Framework
 from sparseml.modifiers.obcq.utils.helpers import ppl_eval_general
 from sparseml.optim.helpers import load_recipe_yaml_str
@@ -97,8 +97,8 @@ def one_shot(
     calibration_data = dataset.loader
     tokenizer = dataset.tokenizer
 
-    sml.create_session()
-    session = sml.active_session()
+    session_manager.create_session()
+    session = session_manager.active_session()
     session.apply(
         framework=Framework.pytorch,
         recipe=recipe_file,