Commit: update fp8 handler
zigzagcai committed Nov 5, 2024
1 parent 92e40ab commit c6ddc54
Showing 1 changed file with 7 additions and 0 deletions.
internlm/train/pipeline.py
@@ -45,6 +45,7 @@
     TensorParallelCommunicator,
 )
 from internlm.core.parallel.comm.zero import ParamAsyncBcastHandler
+from internlm.core.quantization.fp8handler import Float8Handler
 from internlm.core.trainer import TrainState
 from internlm.data.utils import unpack_type_ids
 from internlm.model.builder import create_model
@@ -278,6 +279,12 @@ def inject_model(model):
     if hasattr(model, IS_INJECTED) and getattr(model, IS_INJECTED):
         return model
 
+    # FP8 Linear and compile model
+    if hasattr(gpc.config, "use_fp8") and gpc.config.get("use_fp8", False):
+        float8_handler = Float8Handler()
+        float8_handler.convert_to_float8_training(model)
+        model = torch.compile(model)
+
     inject_model_helper(model, inject_info=gpc.config.model.get("inject_info", None))
 
     # should be set before NaiveAMPModel
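For context, below is a minimal, self-contained sketch of the general pattern behind a Float8Handler-style convert_to_float8_training call: walk the model and swap nn.Linear submodules for FP8-aware replacements before handing the model to torch.compile. This is an illustration only, not the repository's Float8Handler; the SimulatedFloat8Linear and convert_to_float8_training_sketch names are hypothetical, the FP8 effect is simulated with per-tensor quantize/dequantize of weights rather than real scaled FP8 matmul kernels, and it assumes a PyTorch build that ships the float8_e4m3fn dtype (>= 2.1).

import torch
import torch.nn as nn
import torch.nn.functional as F


class SimulatedFloat8Linear(nn.Module):
    """Wraps an nn.Linear and fake-quantizes its weight to float8_e4m3fn."""

    def __init__(self, linear: nn.Linear):
        super().__init__()
        self.inner = linear

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        w = self.inner.weight
        # Per-tensor scale so the largest weight magnitude maps near the FP8 max.
        fp8_max = torch.finfo(torch.float8_e4m3fn).max
        scale = w.abs().max().clamp(min=1e-12) / fp8_max
        w_fp8 = (w / scale).to(torch.float8_e4m3fn)  # quantize to FP8
        w_deq = w_fp8.to(w.dtype) * scale            # dequantize for compute
        return F.linear(x, w_deq, self.inner.bias)


def convert_to_float8_training_sketch(model: nn.Module) -> nn.Module:
    """Recursively replace nn.Linear submodules with the simulated FP8 wrapper."""
    for name, child in model.named_children():
        if isinstance(child, nn.Linear):
            setattr(model, name, SimulatedFloat8Linear(child))
        else:
            convert_to_float8_training_sketch(child)
    return model


if __name__ == "__main__":
    mlp = nn.Sequential(nn.Linear(16, 32), nn.GELU(), nn.Linear(32, 16))
    convert_to_float8_training_sketch(mlp)
    print(mlp(torch.randn(4, 16)).shape)  # torch.Size([4, 16])

With gpc.config.use_fp8 set to True, the new branch in inject_model performs an analogous module conversion via Float8Handler and then compiles the converted model with torch.compile.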
