Addition of 4 pytorch onnx-export models. #278
base: main
Changes from all commits: a45c418, 9b9f7b1, 10d44e7, a5c0f77, a088614, a0d2d52, 7501f7b, 8411a4a, bb90c56, 3d9bd2c, 34aff57
@@ -2,20 +2,19 @@
   "config_name": "cpu_llvm_task",
   "iree_compile_flags" : [
     "--iree-hal-target-backends=llvm-cpu",
-    "--iree-llvmcpu-target-cpu-features=host"
+    "--iree-llvmcpu-target-cpu-features=host",
+    "--iree-input-demote-i64-to-i32"
   ],
   "iree_run_module_flags": [
     "--device=local-task"
   ],
-  "skip_compile_tests": [
-    "pytorch/models/sdxl-scheduled-unet-3-tank",
-    "pytorch/models/sdxl-vae-decode-tank",
-    "pytorch/models/sdxl-prompt-encoder-tank"
-  ],
+  "skip_compile_tests": [],
   "skip_run_tests": [],
   "expected_compile_failures": [
-    "pytorch/models/opt-125M", // TODO(#17344): need to regenerate .mlirbc
-    "pytorch/models/resnet50", // TODO(#17344): need to regenerate .mlirbc
+    "pytorch/models/direct/opt-125M", // TODO(#17344): need to regenerate .mlirbc
+    "pytorch/models/direct/resnet50", // TODO(#17344): need to regenerate .mlirbc
   ],
-  "expected_run_failures": []
+  "expected_run_failures": [
+    "pytorch/models/onnx-export/mobilebert-uncased",
+  ]
 }

Comment on lines +17 to +19:
Can we add models that we think are stable too? :) I'd like to prefetch all models from e2eshark and get them running here if possible, rather than cherrypick a few after we notice issues.
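For readers unfamiliar with these config files: the lists above drive which tests are skipped or expected to fail. Below is a minimal sketch of that logic, not the test suite's actual harness code; the real config files also allow // comments and trailing commas, so a real loader needs a lenient parser, which is why the dict is written inline here and the helper name is hypothetical.

```python
# Minimal sketch of how the skip/XFAIL lists above might drive test selection.
config = {
    "expected_compile_failures": [
        "pytorch/models/direct/opt-125M",
        "pytorch/models/direct/resnet50",
    ],
    "expected_run_failures": [
        "pytorch/models/onnx-export/mobilebert-uncased",
    ],
}

def classify(test_name: str) -> str:
    """Map a test path to the treatment a runner might apply (hypothetical helper)."""
    if test_name in config["expected_compile_failures"]:
        return "xfail-compile"
    if test_name in config["expected_run_failures"]:
        return "xfail-run"
    return "expect-pass"

print(classify("pytorch/models/onnx-export/mobilebert-uncased"))  # xfail-run
```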
@@ -2,25 +2,23 @@ | |
"config_name": "gpu_rocm", | ||
"iree_compile_flags" : [ | ||
"--iree-hal-target-backends=rocm", | ||
"--iree-rocm-target-chip=gfx90a", | ||
"--iree-opt-const-eval=false", | ||
"--iree-codegen-transform-dialect-library=${IREE_TEST_PATH_EXTENSION}/attention_and_matmul_spec.mlir" | ||
"--iree-rocm-target-chip=gfx90a" | ||
], | ||
"iree_run_module_flags": [ | ||
"--device=hip" | ||
], | ||
"skip_compile_tests": [ | ||
"pytorch/models/sdxl-scheduled-unet-3-tank", | ||
"pytorch/models/sdxl-vae-decode-tank", | ||
"pytorch/models/sdxl-prompt-encoder-tank" | ||
], | ||
"skip_compile_tests": [], | ||
"skip_run_tests": [], | ||
"expected_compile_failures": [ | ||
"pytorch/models/opt-125M", // TODO(#17344): need to regenerate .mlirbc | ||
"pytorch/models/resnet50", | ||
"pytorch/models/direct/opt-125M", // TODO(#17344): need to regenerate .mlirbc | ||
"pytorch/models/direct/resnet50", | ||
// error: 'builtin.module' op failed to run transform dialect passes | ||
// (might need to drop the iree-codegen-transform-dialect-library flag) | ||
Comment on lines
15
to
16
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Can drop this comment since the How about we just leave the reason comments off? Also on my PR there, if we run with |
||
"sharktank/llama/open-llama-3b-v2-f16" | ||
"sharktank/llama/open-llama-3b-v2-f16", | ||
"pytorch/models/onnx-export/mit-b0", | ||
"pytorch/models/onnx-export/mobilebert-uncased", | ||
"pytorch/models/onnx-export/t5-base", | ||
"pytorch/models/onnx-export/t5-large" | ||
], | ||
"expected_run_failures": [] | ||
} |
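For context, the "iree_compile_flags" list above is what ends up on the iree-compile command line for each model. A rough sketch of that translation follows, assuming iree-compile is on PATH and a hypothetical per-model .mlirbc/.vmfb naming; the suite's real invocation may differ.

```python
import subprocess

# Flags taken from the gpu_rocm config above.
compile_flags = [
    "--iree-hal-target-backends=rocm",
    "--iree-rocm-target-chip=gfx90a",
]

def compile_model(mlirbc_path: str, vmfb_path: str) -> None:
    """Compile one model artifact with the config's flags (illustrative only)."""
    cmd = ["iree-compile", mlirbc_path, *compile_flags, "-o", vmfb_path]
    subprocess.run(cmd, check=True)

# compile_model("model.mlirbc", "model.vmfb")  # hypothetical file names
```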
That seems rather roundabout... I guess ONNX there is used as a serialization format? IMO if we're adding tests for these models we should add both the direct and onnx-export versions.
@@ -0,0 +1,3 @@
+--input=1x3x512x512xf32=@inference_input.0.bin
+--expected_output=1x1000xf32=@inference_output.0.bin
+--expected_f32_threshold=0.01f
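For context, this flagfile is combined with the config's "iree_run_module_flags" when the test runs. A hedged sketch of what that invocation could look like, assuming iree-run-module is on PATH, that it accepts a --flagfile argument, and a hypothetical model.vmfb name; the harness may expand the flagfile itself instead.

```python
import subprocess

run_flags = ["--device=local-task"]       # from the cpu_llvm_task config above
flagfile = "real_weights_data_flags.txt"  # the file shown above

cmd = [
    "iree-run-module",
    "--module=model.vmfb",                # hypothetical compiled module name
    *run_flags,
    f"--flagfile={flagfile}",
]
subprocess.run(cmd, check=True)
```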
@@ -0,0 +1,13 @@ | ||
{ | ||
"file_format": "test_cases_v0", | ||
"test_cases": [ | ||
{ | ||
"name": "real_weights", | ||
"runtime_flagfile": "real_weights_data_flags.txt", | ||
"remote_files": [ | ||
"https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/mit-b0/inference_input.0.bin", | ||
"https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/mit-b0/inference_output.0.bin" | ||
] | ||
} | ||
] | ||
} |
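For context, the "remote_files" URLs above have to be fetched into the test's working directory before the test can compile or run. A minimal downloader sketch, not the suite's actual fetch logic:

```python
import json
import urllib.request
from pathlib import Path

def fetch_remote_files(test_cases_path: Path, dest_dir: Path) -> None:
    """Download every remote_files URL from a test_cases.json into dest_dir."""
    spec = json.loads(test_cases_path.read_text())
    dest_dir.mkdir(parents=True, exist_ok=True)
    for case in spec["test_cases"]:
        for url in case["remote_files"]:
            target = dest_dir / url.rsplit("/", 1)[-1]
            if not target.exists():  # simple cache across runs
                urllib.request.urlretrieve(url, target)

# fetch_remote_files(Path("test_cases.json"), Path("mit-b0"))
```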
@@ -0,0 +1,3 @@
+--input=1x128xi64=@inference_input.0.bin
+--expected_output=1x2xf32=@inference_output.0.bin
+--expected_f32_threshold=0.01f
@@ -0,0 +1,14 @@
+{
+  "file_format": "test_cases_v0",
+  "test_cases": [
+    {
+      "name": "real_weights",
+      "runtime_flagfile": "real_weights_data_flags.txt",
+      "remote_files": [
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/mobilebert-uncased/inference_input.0.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/mobilebert-uncased/inference_output.0.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/mobilebert-uncased/model.mlirbc"
+      ]
+    }
+  ]
+}
@@ -0,0 +1,54 @@
+--input=1x512xi64=@inference_input.0.bin
+--input=1x512xf32=@inference_input.1.bin
+--input=1x512xi64=@inference_input.2.bin
+--expected_output=1x512x768xf32=@inference_output.0.bin
+--expected_output=1x12x512x64xf32=@inference_output.1.bin
+--expected_output=1x12x512x64xf32=@inference_output.2.bin
+--expected_output=1x12x512x64xf32=@inference_output.3.bin
+--expected_output=1x12x512x64xf32=@inference_output.4.bin
+--expected_output=1x12x512x64xf32=@inference_output.5.bin
+--expected_output=1x12x512x64xf32=@inference_output.6.bin
+--expected_output=1x12x512x64xf32=@inference_output.7.bin
+--expected_output=1x12x512x64xf32=@inference_output.8.bin
+--expected_output=1x12x512x64xf32=@inference_output.9.bin
+--expected_output=1x12x512x64xf32=@inference_output.10.bin
+--expected_output=1x12x512x64xf32=@inference_output.11.bin
+--expected_output=1x12x512x64xf32=@inference_output.12.bin
+--expected_output=1x12x512x64xf32=@inference_output.13.bin
+--expected_output=1x12x512x64xf32=@inference_output.14.bin
+--expected_output=1x12x512x64xf32=@inference_output.15.bin
+--expected_output=1x12x512x64xf32=@inference_output.16.bin
+--expected_output=1x12x512x64xf32=@inference_output.17.bin
+--expected_output=1x12x512x64xf32=@inference_output.18.bin
+--expected_output=1x12x512x64xf32=@inference_output.19.bin
+--expected_output=1x12x512x64xf32=@inference_output.20.bin
+--expected_output=1x12x512x64xf32=@inference_output.21.bin
+--expected_output=1x12x512x64xf32=@inference_output.22.bin
+--expected_output=1x12x512x64xf32=@inference_output.23.bin
+--expected_output=1x12x512x64xf32=@inference_output.24.bin
+--expected_output=1x12x512x64xf32=@inference_output.25.bin
+--expected_output=1x12x512x64xf32=@inference_output.26.bin
+--expected_output=1x12x512x64xf32=@inference_output.27.bin
+--expected_output=1x12x512x64xf32=@inference_output.28.bin
+--expected_output=1x12x512x64xf32=@inference_output.29.bin
+--expected_output=1x12x512x64xf32=@inference_output.30.bin
+--expected_output=1x12x512x64xf32=@inference_output.31.bin
+--expected_output=1x12x512x64xf32=@inference_output.32.bin
+--expected_output=1x12x512x64xf32=@inference_output.33.bin
+--expected_output=1x12x512x64xf32=@inference_output.34.bin
+--expected_output=1x12x512x64xf32=@inference_output.35.bin
+--expected_output=1x12x512x64xf32=@inference_output.36.bin
+--expected_output=1x12x512x64xf32=@inference_output.37.bin
+--expected_output=1x12x512x64xf32=@inference_output.38.bin
+--expected_output=1x12x512x64xf32=@inference_output.39.bin
+--expected_output=1x12x512x64xf32=@inference_output.40.bin
+--expected_output=1x12x512x64xf32=@inference_output.41.bin
+--expected_output=1x12x512x64xf32=@inference_output.42.bin
+--expected_output=1x12x512x64xf32=@inference_output.43.bin
+--expected_output=1x12x512x64xf32=@inference_output.44.bin
+--expected_output=1x12x512x64xf32=@inference_output.45.bin
+--expected_output=1x12x512x64xf32=@inference_output.46.bin
+--expected_output=1x12x512x64xf32=@inference_output.47.bin
+--expected_output=1x12x512x64xf32=@inference_output.48.bin
+--expected_output=1x512x768xf32=@inference_output.49.bin
+--expected_f32_threshold=0.01f
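Since outputs 1 through 48 above all share the 1x12x512x64xf32 shape (presumably attention cache tensors, judging by the shapes), a flagfile like this is easier to generate than to write by hand. A sketch that reproduces the 54 lines above:

```python
# Regenerate the t5-base run flagfile from its regular structure.
lines = [
    "--input=1x512xi64=@inference_input.0.bin",
    "--input=1x512xf32=@inference_input.1.bin",
    "--input=1x512xi64=@inference_input.2.bin",
    "--expected_output=1x512x768xf32=@inference_output.0.bin",
]
lines += [
    f"--expected_output=1x12x512x64xf32=@inference_output.{i}.bin"
    for i in range(1, 49)
]
lines += [
    "--expected_output=1x512x768xf32=@inference_output.49.bin",
    "--expected_f32_threshold=0.01f",
]
with open("real_weights_data_flags.txt", "w") as f:
    f.write("\n".join(lines) + "\n")
```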
@@ -0,0 +1,65 @@
+{
+  "file_format": "test_cases_v0",
+  "test_cases": [
+    {
+      "name": "real_weights",
+      "runtime_flagfile": "real_weights_data_flags.txt",
+      "remote_files": [
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_input.0.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_input.1.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_input.2.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.0.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.1.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.2.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.3.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.4.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.5.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.6.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.7.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.8.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.9.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.10.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.11.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.12.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.13.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.14.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.15.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.16.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.17.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.18.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.19.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.20.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.21.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.22.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.23.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.24.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.25.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.26.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.27.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.28.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.29.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.30.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.31.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.32.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.33.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.34.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.35.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.36.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.37.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.38.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.39.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.40.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.41.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.42.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.43.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.44.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.45.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.46.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.47.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.48.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/inference_output.49.bin",
+        "https://sharkpublic.blob.core.windows.net/sharkpublic/shark-test-suite/iree-tests/pytorch/models/onnx-export/t5-base/model.mlirbc"
+      ]
+    }
+  ]
+}

Comment on lines +57 to +60:
o_o that's a lot of outputs. Fine for now, but let's file an issue to use archive files (.zip or .tar.gz). If we use something like Hugging Face repositories, we could also lean on their download API to fetch an entire repo.
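To illustrate the suggestion above: if these artifacts lived in a (hypothetical) Hugging Face dataset repository instead of 54 individual blob URLs, a single snapshot_download call could fetch everything. The repo_id below is illustrative only, not an existing repository, and this requires `pip install huggingface_hub`.

```python
from huggingface_hub import snapshot_download

# Download all test artifacts for one model in a single call (hypothetical repo).
local_dir = snapshot_download(
    repo_id="example-org/iree-test-artifacts-t5-base",  # illustrative, does not exist
    repo_type="dataset",
    allow_patterns=["inference_*.bin", "model.mlirbc"],
)
print(local_dir)
```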
I'm not sure I agree with this. I'm worried about the number of flags we have developers using, and I'd like to have more visibility into which models require which flags and why. One way we can do that is by having users of the test suite test with default flags.

In this case, the `--iree-input-` flags are sort of special in that they are generic across backends, so I do see a case for using some of them... maybe in a `_compatibility_flags` test suite config, then we could diff the XFAILs between that and the `_default_flags` config.
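To make that suggestion concrete: given a hypothetical `_default_flags` config and a `_compatibility_flags` config (assumed here to be plain JSON without // comments), the XFAIL diff could be computed roughly like this; the file names are illustrative, not actual files in this repository.

```python
import json
from pathlib import Path

def xfails(path: Path) -> set[str]:
    """Collect all expected compile/run failures from one config file."""
    cfg = json.loads(path.read_text())
    return set(cfg.get("expected_compile_failures", [])) | set(
        cfg.get("expected_run_failures", [])
    )

# Models that fail under default flags but pass once extra flags
# (e.g. --iree-input-demote-i64-to-i32) are added.
only_fixed_by_extra_flags = xfails(Path("config_default_flags.json")) - xfails(
    Path("config_compatibility_flags.json")
)
print(sorted(only_fixed_by_extra_flags))
```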