Skip to content

Commit 6e88306

Browse files
committed
Merge remote-tracking branch 'origin/bench-gpu-profiling' into model_shapes_config
2 parents 345a00c + 5ee6b58 commit 6e88306

File tree

3 files changed

+9
-7
lines changed

3 files changed

+9
-7
lines changed

benchmarks/microbenchmarks/benchmark_inference.py

+6-5
Original file line numberDiff line numberDiff line change
@@ -99,9 +99,10 @@ def run(config: BenchmarkConfig) -> BenchmarkResult:
 result.profiler_json_path = generate_model_profile(
 m_copy, input_data, config.profiler_file_name
 )
-except Exception:
-print(f"Error running profiler for {config.name}")
+except Exception as e:
+print(f"Error running profiler for {config.name} with error: {e}")
+
 return result
-except Exception:
-print(f"Error in benchmark run: {config.name}")
-return
+except Exception as e:
+print(f"Error in benchmark run: {config.name} with error: {e}")
+return None

benchmarks/microbenchmarks/test/benchmark_config.yml

+2-1
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,8 @@ quantization_config_recipe_names:
 - "int8wo"
 - "int8dq"
 - "float8dq"
-sparsity_config_recipe_names:
+- "float8wo"
+# sparsity_config_recipe_names:
 # Will run a baseline inference for model by default, without sparsity for comparison
 - "semi-sparse"
 - "block"

benchmarks/microbenchmarks/utils.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -77,7 +77,7 @@ def generate_model_profile(model, input_data, profile_file_path):
 record_shapes=True,
 with_stack=True,
 profile_memory=True,
-with_flops=True, # Excperiemntal; might be unreliable for some layers
+with_flops=True, # Experimental; might be unreliable for some layers
 )
 
 # Warm up

0 commit comments

Comments
 (0)