diff --git a/iree_tests/download_remote_files.py b/iree_tests/download_remote_files.py index 87f06c6c6..ec0de6053 100644 --- a/iree_tests/download_remote_files.py +++ b/iree_tests/download_remote_files.py @@ -172,7 +172,9 @@ def download_huggingface_remote_file( # repo_id: SlyEcho/open_llama_3b_v2_gguf # revision: main # filename: open-llama-3b-v2-q4_0.gguf - result = re.search(r"https://huggingface.co/(.+)/resolve/(.+)/(.+)", remote_file) + result = re.search( + r"https://huggingface.co/(.+)/resolve/([^\/]+)/(.+)", remote_file + ) repo_id = result.groups()[0] revision = result.groups()[1] filename = result.groups()[2] diff --git a/iree_tests/sharktank/punet/.gitignore b/iree_tests/sharktank/punet/.gitignore new file mode 100644 index 000000000..3764e435e --- /dev/null +++ b/iree_tests/sharktank/punet/.gitignore @@ -0,0 +1,4 @@ +# Model source files are downloaded from +# https://huggingface.co/amd-shark/sdxl-quant-models, not stored in Git LFS. +*.mlirbc +*.mlir diff --git a/iree_tests/sharktank/punet/fp16/real_weights_data_flags.txt b/iree_tests/sharktank/punet/fp16/real_weights_data_flags.txt index 04dd7b238..bbd2374b6 100644 --- a/iree_tests/sharktank/punet/fp16/real_weights_data_flags.txt +++ b/iree_tests/sharktank/punet/fp16/real_weights_data_flags.txt @@ -1,4 +1,4 @@ ---parameters=model=sdxl_fp16_dataset.irpa +--parameters=model=sdxl_unet_fp16_dataset.irpa --input=1x4x128x128xf16 --input=1xi32 --input=2x64x2048xf16 diff --git a/iree_tests/sharktank/punet/fp16/sdxl_fp16_export_mlir.mlirbc b/iree_tests/sharktank/punet/fp16/sdxl_fp16_export_mlir.mlirbc deleted file mode 100644 index 7329a46d2..000000000 --- a/iree_tests/sharktank/punet/fp16/sdxl_fp16_export_mlir.mlirbc +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f0987d40ba5caf980871c72e243314341ef607f3063ccccb090d01fa430898e8 -size 873009 diff --git a/iree_tests/sharktank/punet/fp16/test_cases.json b/iree_tests/sharktank/punet/fp16/test_cases.json index 85674b51c..aad17842a 100644 --- a/iree_tests/sharktank/punet/fp16/test_cases.json +++ b/iree_tests/sharktank/punet/fp16/test_cases.json @@ -5,7 +5,8 @@ "name": "real_weights", "runtime_flagfile": "real_weights_data_flags.txt", "remote_files": [ - "https://sharkpublic.blob.core.windows.net/sharkpublic/scotttodd/iree_tests/2024_07_02/sdxl_fp16_dataset.irpa", + "https://huggingface.co/amd-shark/sdxl-quant-models/resolve/fe57fe12eeb6eac83f469793984f6ad4c06a478c/unet/fp16/export/sdxl_unet_fp16_dataset.irpa", + "https://huggingface.co/amd-shark/sdxl-quant-models/resolve/fe57fe12eeb6eac83f469793984f6ad4c06a478c/unet/fp16/export/sdxl_unet_fp16_export.mlir" // TODO: files for real inputs and real expected outputs ] } diff --git a/iree_tests/sharktank/punet/int8/real_weights_data_flags.txt b/iree_tests/sharktank/punet/int8/real_weights_data_flags.txt index 7f60304b9..a208248a7 100644 --- a/iree_tests/sharktank/punet/int8/real_weights_data_flags.txt +++ b/iree_tests/sharktank/punet/int8/real_weights_data_flags.txt @@ -1,4 +1,4 @@ ---parameters=model=sdxl_int8_dataset.irpa +--parameters=model=sdxl_unet_int8_dataset.irpa --input=1x4x128x128xf16 --input=1xi32 --input=2x64x2048xf16 diff --git a/iree_tests/sharktank/punet/int8/sdxl_int8_export_mlir.mlirbc b/iree_tests/sharktank/punet/int8/sdxl_int8_export_mlir.mlirbc deleted file mode 100644 index 750c9c1d3..000000000 --- a/iree_tests/sharktank/punet/int8/sdxl_int8_export_mlir.mlirbc +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:180d88507c1b75e3e80e65cdd192de8af6e9c70961717d45ceb33194de4d3ad7 -size 2362168 diff --git a/iree_tests/sharktank/punet/int8/test_cases.json b/iree_tests/sharktank/punet/int8/test_cases.json index a4ebd7440..48abb1b76 100644 --- a/iree_tests/sharktank/punet/int8/test_cases.json +++ b/iree_tests/sharktank/punet/int8/test_cases.json @@ -5,7 +5,8 @@ "name": "real_weights", "runtime_flagfile": "real_weights_data_flags.txt", "remote_files": [ - "https://sharkpublic.blob.core.windows.net/sharkpublic/scotttodd/iree_tests/2024_07_02/sdxl_int8_dataset.irpa", + "https://huggingface.co/amd-shark/sdxl-quant-models/resolve/fe57fe12eeb6eac83f469793984f6ad4c06a478c/unet/int8/export/sdxl_unet_int8_dataset.irpa", + "https://huggingface.co/amd-shark/sdxl-quant-models/resolve/fe57fe12eeb6eac83f469793984f6ad4c06a478c/unet/int8/export/sdxl_unet_int8_export.mlir" // TODO: files for real inputs and real expected outputs ] }