Bump test suite to include punet tests and fix xfail script. (#17897)

Highlights from this update:

* https://github.com/nod-ai/SHARK-TestSuite/commit/fc9fd6224f8ecf35159c0984c418b2e5c4781e35
  Fixing the `update_config_xfails.py` script
* https://github.com/nod-ai/SHARK-TestSuite/commit/2c0a31242ba977f3f16952090a1de757f5a54f98 (and follow-ups)
  Adding the [Partitioned UNet (punet)](https://github.com/nod-ai/sharktank/tree/main/sharktank/sharktank/models/punet) model to the test suite, using data from https://huggingface.co/amd-shark/sdxl-quant-models

This also changes the 'models' pytest command (`-rpfE` → `-rA`) to include all output, even for xfail'd tests. This will let us see the latest compile/run errors for these programs using the tested flags.

ci-exactly: build_packages,regression_test

commit: 59434263c0dde40d8108d8e12502629164e9ee02 [log] [tgz]
author: Scott Todd <scott.todd0@gmail.com> Mon Jul 15 08:05:54 2024 -0700
committer: GitHub <noreply@github.com> Mon Jul 15 08:05:54 2024 -0700
tree: 1bded94b9fa448d11699c8c1c08da440c463cff9
parent: 9d6b425c81254d6fc8e18057188c26609320fab4 [diff]
diff --git a/.github/workflows/pkgci_regression_test.yml b/.github/workflows/pkgci_regression_test.yml
index 1a61c76..d2d7c0f 100644
--- a/.github/workflows/pkgci_regression_test.yml
+++ b/.github/workflows/pkgci_regression_test.yml

@@ -90,7 +90,7 @@
         uses: actions/checkout@v4.1.7
         with:
           repository: nod-ai/SHARK-TestSuite
-          ref: a06e730ce325c12db40bb89b43e8e6e897052e96
+          ref: 1da89a12a8b00dc77506d702f61300803b6240b7
           path: SHARK-TestSuite
           submodules: false
           lfs: false
@@ -198,7 +198,7 @@
         uses: actions/checkout@v4.1.7
         with:
           repository: nod-ai/SHARK-TestSuite
-          ref: a06e730ce325c12db40bb89b43e8e6e897052e96
+          ref: 1da89a12a8b00dc77506d702f61300803b6240b7
           path: SHARK-TestSuite
           submodules: false
           lfs: true
@@ -220,7 +220,7 @@
           pytest \
             SHARK-TestSuite/iree_tests/pytorch/models \
             SHARK-TestSuite/iree_tests/sharktank \
-            -rpfE \
+            -rA \
             -k real_weights \
             --no-skip-tests-missing-files \
             --capture=no \

diff --git a/build_tools/pkgci/external_test_suite/models_gpu_rocm_gfx90a.json b/build_tools/pkgci/external_test_suite/models_gpu_rocm_gfx90a.json
index 8b7f59c..1b15430 100644
--- a/build_tools/pkgci/external_test_suite/models_gpu_rocm_gfx90a.json
+++ b/build_tools/pkgci/external_test_suite/models_gpu_rocm_gfx90a.json

@@ -20,9 +20,11 @@
     "pytorch/models/resnet50",
     "pytorch/models/sdxl-vae-decode-tank",
 
-    // error: 'builtin.module' op failed to run transform dialect passes
-    // (transform spec file is specific to SDXL?)
-    "sharktank/llama/open-llama-3b-v2-f16"
+    // TODO(#17874): error: a handle passed as operand #0 and consumed by this operation points to a payload entity more than once
+    "sharktank/llama/open-llama-3b-v2-f16",
+
+    "sharktank/punet/fp16",
+    "sharktank/punet/int8"
   ],
   "expected_run_failures": []
 }

diff --git a/build_tools/pkgci/external_test_suite/models_gpu_rocm_gfx942.json b/build_tools/pkgci/external_test_suite/models_gpu_rocm_gfx942.json
index 5d451f0..0cf808b 100644
--- a/build_tools/pkgci/external_test_suite/models_gpu_rocm_gfx942.json
+++ b/build_tools/pkgci/external_test_suite/models_gpu_rocm_gfx942.json

@@ -20,9 +20,11 @@
     "pytorch/models/resnet50",
     "pytorch/models/sdxl-vae-decode-tank",
 
-    // error: 'builtin.module' op failed to run transform dialect passes
-    // (transform spec file is specific to SDXL?)
-    "sharktank/llama/open-llama-3b-v2-f16"
+      // TODO(#17874): error: a handle passed as operand #0 and consumed by this operation points to a payload entity more than once
+    "sharktank/llama/open-llama-3b-v2-f16",
+
+    "sharktank/punet/fp16",
+    "sharktank/punet/int8"
   ],
   "expected_run_failures": []
 }

diff --git a/build_tools/pkgci/external_test_suite/models_gpu_vulkan.json b/build_tools/pkgci/external_test_suite/models_gpu_vulkan.json
index d8af23a..7b40397 100644
--- a/build_tools/pkgci/external_test_suite/models_gpu_vulkan.json
+++ b/build_tools/pkgci/external_test_suite/models_gpu_vulkan.json

@@ -12,13 +12,16 @@
     // TODO(#17344): need to regenerate .mlirbc
     "pytorch/models/opt-125M",
     "pytorch/models/resnet50",
+
     "pytorch/models/sdxl-prompt-encoder-tank",
     "pytorch/models/sdxl-scheduled-unet-3-tank",
     "pytorch/models/sdxl-vae-decode-tank",
 
-    // error: 'builtin.module' op failed to run transform dialect passes
-    // (transform spec file is specific to SDXL?)
-    "sharktank/llama/open-llama-3b-v2-f16"
+    // TODO(#17874): error: a handle passed as operand #0 and consumed by this operation points to a payload entity more than once
+    "sharktank/llama/open-llama-3b-v2-f16",
+
+    "sharktank/punet/fp16",
+    "sharktank/punet/int8"
   ],
   "expected_run_failures": []
 }
commit	59434263c0dde40d8108d8e12502629164e9ee02	[log] [tgz]
author	Scott Todd <scott.todd0@gmail.com>	Mon Jul 15 08:05:54 2024 -0700
committer	GitHub <noreply@github.com>	Mon Jul 15 08:05:54 2024 -0700
tree	1bded94b9fa448d11699c8c1c08da440c463cff9
parent	9d6b425c81254d6fc8e18057188c26609320fab4 [diff]