Merge remote-tracking branch 'origin/bench-gpu-profiling' into model_shapes_config

jainapurva · jainapurva · commit 6e8830665005 · 2025-04-10T12:42:34.000-07:00
diff --git a/benchmarks/microbenchmarks/benchmark_inference.py b/benchmarks/microbenchmarks/benchmark_inference.py
@@ -99,9 +99,10 @@ def run(config: BenchmarkConfig) -> BenchmarkResult:
                 result.profiler_json_path = generate_model_profile(
                     m_copy, input_data, config.profiler_file_name
                 )
-            except Exception:
-                print(f"Error running profiler for {config.name}")
+            except Exception as e:
+                print(f"Error running profiler for {config.name} with error: {e}")
+
         return result
-    except Exception:
-        print(f"Error in benchmark run: {config.name}")
-        return
+    except Exception as e:
+        print(f"Error in benchmark run: {config.name} with error: {e}")
+        return None
diff --git a/benchmarks/microbenchmarks/test/benchmark_config.yml b/benchmarks/microbenchmarks/test/benchmark_config.yml
@@ -5,7 +5,8 @@ quantization_config_recipe_names:
   - "int8wo"
   - "int8dq"
   - "float8dq"
-sparsity_config_recipe_names:
+  - "float8wo"
+# sparsity_config_recipe_names:
   # Will run a baseline inference for model by default, without sparsity for comparison
   - "semi-sparse"
   - "block"
diff --git a/benchmarks/microbenchmarks/utils.py b/benchmarks/microbenchmarks/utils.py
@@ -77,7 +77,7 @@ def generate_model_profile(model, input_data, profile_file_path):
         record_shapes=True,
         with_stack=True,
         profile_memory=True,
-        with_flops=True,  # Excperiemntal; might be unreliable for some layers
+        with_flops=True,  # Experimental; might be unreliable for some layers
     )
 
     # Warm up

Original file line number	Diff line number	Diff line change
`@@ -77,7 +77,7 @@ def generate_model_profile(model, input_data, profile_file_path):`
`77`	`77`	`record_shapes=True,`
`78`	`78`	`with_stack=True,`
`79`	`79`	`profile_memory=True,`
`80`		`- with_flops=True, # Excperiemntal; might be unreliable for some layers`
	`80`	`+ with_flops=True, # Experimental; might be unreliable for some layers`
`81`	`81`	`)`
`82`	`82`
`83`	`83`	`# Warm up`