[eval_llama] Add option to save checkpoint after eager transforms.

Differential Revision: D62150021 Pull Request resolved: #5045
pytorch · Sep 7, 2024 · 3268da2 · 3268da2
1 parent 32d83b0
commit 3268da2
Showing 1 changed file with 15 additions and 0 deletions.
diff --git a/examples/models/llama2/eval_llama_lib.py b/examples/models/llama2/eval_llama_lib.py
@@ -158,6 +158,15 @@ def gen_eval_wrapper(
             else manager.model.eval().to(device="cpu")
         )
 
+    # Save the checkpoint after the eager model preparation is done.
+    # The reason for this option is that the checkpoint can be used
+    # to do evaluations in other evaluation platforms, or with data
+    # that is not available in this eval_llama. We save the checkpoint
+    # here for consistency with eval_llama. The accuracy results we
+    # get from eval_llama can be used as a reference to other evaluations.
+    if args.output_eager_checkpoint_file is not None:
+        torch.save(model, args.output_eager_checkpoint_file)
+
     return EagerEvalWrapper(
         model=model,
         tokenizer=tokenizer,
@@ -196,6 +205,12 @@ def build_args_parser() -> argparse.ArgumentParser:
         default=None,
         help="[For ExecuTorch] Path to the Tokenizer binary for evaluating ExecuTorch models via runtime",
     )
+    parser.add_argument(
+        "--output_eager_checkpoint_file",
+        type=str,
+        default=None,
+        help="Save the checkpoint after source transformations, for other evaluation platform to run the same checkpoint.",
+    )
 
     return parser