Support for sdxl pipeline (testing) #152
Before this sort of change lands, let's think a bit about what we actually want coverage for. I'm skeptical about having benchmarks built into the same testing flow... though the suite that Stella set up has these:
Just because we care so much about sdxl perf, I think it would be great to have it included in this flow. I didn't look into adding a whole separate flow for it or making it very scalable, because I doubt we will be adding benchmarks for anything else. That's why I also just went with hardcoded commands (also, the flags have to live in conftest.py because some flag values are path names relative to other directories that we resolve there). I was thinking we can evaluate and iterate if this becomes a bigger utility, but for now I just went for the easiest/simplest way to add benchmarking. Here is an example log with everything running: https://github.com/nod-ai/SHARK-TestSuite/actions/runs/8543035287/job/23405926540
The value of continuous benchmarks is clear, but I want to be careful about how we integrate them. For this PR, can you leave the benchmarks off and focus on just adding the sdxl models? A follow-up PR can then add benchmarking.
I'd at least like to take some time to work through the specific requirements before jumping straight to an implementation. For example:
I'm also wondering if we want to use pytest as the benchmark runner (either with the existing conftest.py or a forked one), or if we would want to use another runner (we could start with a pile of scripts, just reusing the same test suite source files).
It might be reasonable to start with `pytest -k benchmark` or `pytest iree_tests/benchmarks` that just runs `iree-benchmark-module` instead of `iree-run-module`, and then let developers dig through the GitHub Actions logs to see results, but I'm worried about going down the path of building an entirely new benchmark "framework" when we already have https://github.com/openxla/iree-comparative-benchmark and https://github.com/openxla/iree/tree/main/build_tools/benchmarks (building something new is likely going to make sense, at least in the short term, but this stuff gets complicated very quickly).
For example: https://github.com/openxla/community/blob/main/rfcs/20230505-benchmarking-strategy.md
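As a rough sketch of what that minimal `pytest -k benchmark` starting point could look like (the test name, module path, and flag values below are placeholders, not the suite's actual configuration):

```python
import subprocess

import pytest


@pytest.mark.benchmark  # mark would be registered in conftest.py/pytest.ini
def test_benchmark_sdxl_unet():
    # Same artifacts a correctness test would use, but run through
    # iree-benchmark-module instead of iree-run-module.
    result = subprocess.run(
        [
            "iree-benchmark-module",
            "--module=sdxl_unet.vmfb",    # placeholder artifact name
            "--device=local-task",        # placeholder device
            "--function=main",
            "--benchmark_repetitions=3",
        ],
        capture_output=True,
        text=True,
    )
    # Fail if benchmarking itself errored; the timings land in the CI logs.
    assert result.returncode == 0, result.stderr
```

Selectable via `pytest -k benchmark` (name match) or `pytest -m benchmark` (marker match).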
I believe that can be done with a matrix too: https://docs.github.com/en/actions/using-jobs/using-a-matrix-for-your-jobs#example-using-a-multi-dimension-matrix
Could then check other matrix parameters to choose which steps to run... maybe like this:
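(Hedged sketch below; the `suite`/`device` dimensions, runner, and commands are illustrative placeholders, not the actual workflow.)

```yaml
jobs:
  test:
    strategy:
      matrix:
        suite: [onnx, models]
        device: [cpu, gpu]
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4
      - name: Run tests
        run: pytest iree_tests/${{ matrix.suite }} -k ${{ matrix.device }}
      - name: Run benchmarks
        # Check another matrix parameter to decide whether a step runs at all.
        if: matrix.suite == 'models' && matrix.device == 'gpu'
        run: pytest iree_tests/benchmarks
```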
I'm also referencing https://github.com/openxla/iree/blob/573ff1ff02347266ed747dd316cefaeb4c710396/.github/workflows/ci.yml#L749-L784 (probably tons of other files to reference across GitHub, but that's what I know already...)
If we wanted to plug into the in-tree benchmark infrastructure that IREE has, we'd want a PR like iree-org/iree#16965. That would feed into https://perf.iree.dev/ and PR comments, but it doesn't also test correctness out of the box, can be tricky to update (multiple Python files, coupled with GitHub Actions), and puts input files/parameters behind a few levels of abstraction that make it harder to run locally.
Yeah, I also wonder how that would work, because we need to essentially compile multiple submodels and then use their vmfbs for the pipeline's vmfb. Not sure if it is set up for a pipeline structure.
Also, I've placed the onnx and model tests in different jobs. I think that's best for this suite. Because they don't depend on each other and run independently on different machines, I don't think we need the sequential steps. This way we get parallel execution, which can help with scalability in the future. Once we get more machines, splitting on models would also be great :)
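Roughly this shape, as a sketch (runner labels and test paths are placeholders):

```yaml
jobs:
  test_onnx:
    runs-on: ubuntu-latest            # placeholder runner
    steps:
      - uses: actions/checkout@v4
      - run: pytest iree_tests/onnx
  test_models:
    # Independent job: no `needs:`, so it runs in parallel on its own machine.
    runs-on: [self-hosted, gpu]       # placeholder labels
    steps:
      - uses: actions/checkout@v4
      - run: pytest iree_tests/pytorch/models
```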
Here is the PR for benchmarking that should be landed after this one: #155. Feel free to add notes there for future reference.
Seeing more of these files, I'm still thinking about how to keep them easy to update. Might refactor to separate JSON files like
`test_case_splats.json`:
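A guess at the shape such a file could take (every field name here is hypothetical, not the suite's actual schema):

```json
{
  "//": "Hedged sketch; all field names are hypothetical.",
  "name": "sdxl_unet_splats",
  "compile_flagfile": "splats_compile_flags.txt",
  "runtime_flagfile": "splats_run_flags.txt",
  "remote_files": []
}
```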
`test_case_real_weights.json`:
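And the real-weight variant, with the same hypothetical fields:

```json
{
  "//": "Hedged sketch; all field names are hypothetical.",
  "name": "sdxl_unet_real_weights",
  "compile_flagfile": "real_weights_compile_flags.txt",
  "runtime_flagfile": "real_weights_run_flags.txt",
  "remote_files": [
    "https://example.com/sdxl/real_weights.irpa"
  ]
}
```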
Hmm yeah, this is probably easier to decode/update.