@@ -197,7 +197,6 @@ def testBenchmark8B_f16_Decomposed(self):
197197 )
198198
199199 @skipif_run_quick_llama_test
200- @pytest .mark .xfail (reason = "Compile Error" , strict = True , raises = IreeCompileException )
201200 def testBenchmark8B_f16_Non_Decomposed_Prefill (self ):
202201 output_file_name = self .dir_path_8b / "f16_torch_prefill"
203202 output_mlir = self .llama8b_f16_torch_sdpa_artifacts .create_file (
@@ -780,7 +779,9 @@ def testBenchmark405B_f16_TP8_Decomposed(self):
780779 cwd = self .repo_root ,
781780 )
782781
783- @pytest .mark .xfail (reason = "Compile Error" , strict = True , raises = IreeCompileException )
782+ @pytest .mark .xfail (
783+ reason = "Benchmarking Error" , strict = True , raises = IreeBenchmarkException
784+ )
784785 def testBenchmark405B_f16_TP8_Non_Decomposed (self ):
785786 output_file_name = self .dir_path_405b / "f16_torch"
786787 output_mlir = self .llama405b_f16_torch_sdpa_artifacts .create_file (
@@ -828,7 +829,9 @@ def testBenchmark405B_f16_TP8_Non_Decomposed(self):
828829 cwd = self .repo_root ,
829830 )
830831
831- @pytest .mark .xfail (reason = "Compile Error" , strict = True , raises = IreeCompileException )
832+ @pytest .mark .xfail (
833+ reason = "KeyError in theta.py" , strict = True , raises = ExportMlirException
834+ )
832835 def testBenchmark405B_fp8_TP8_Decomposed (self ):
833836 output_file_name = self .dir_path_405b / "fp8_decomposed"
834837 output_mlir = self .llama405b_fp8_decomposed_artifacts .create_file (
@@ -874,7 +877,9 @@ def testBenchmark405B_fp8_TP8_Decomposed(self):
874877 cwd = self .repo_root ,
875878 )
876879
877- @pytest .mark .xfail (reason = "Compile Error" , strict = True , raises = IreeCompileException )
880+ @pytest .mark .xfail (
881+ reason = "KeyError in theta.py" , strict = True , raises = ExportMlirException
882+ )
878883 def testBenchmark405B_fp8_TP8_Non_Decomposed (self ):
879884 output_file_name = self .dir_path_405b / "fp8_torch"
880885 output_mlir = self .llama405b_fp8_torch_sdpa_artifacts .create_file (
0 commit comments