Commit 2550f4f (1 parent: 4a1357d)
File tree: 3 files changed, +0 -58 lines changed
benchmark_tests/llm/sglang_benchmarks
3 files changed, +0 -58 lines changed
Original file line number | Diff line number | Diff line change
@@ -75,28 +75,6 @@ def write_config(request, pre_process_model):
75
75
/ f"{ '_' .join (str (bs ) for bs in batch_sizes )} _{ prefix_sharing_algorithm } .json"
76
76
)
77
77
78
- config = {
79
- "module_name" : "module" ,
80
- "module_abi_version" : 1 ,
81
- "max_seq_len" : 131072 ,
82
- "attn_head_count" : 8 ,
83
- "attn_head_dim" : 128 ,
84
- "prefill_batch_sizes" : batch_sizes ,
85
- "decode_batch_sizes" : batch_sizes ,
86
- "transformer_block_count" : 32 ,
87
- "paged_kv_cache" : {
88
- "block_seq_stride" : 16 ,
89
- "device_block_count" : 256 ,
90
- "prefix_sharing_algorithm" : prefix_sharing_algorithm ,
91
- },
92
- }
93
-
94
- logger .info (f"Saving edited config to: { config_path } \n " )
95
- logger .info (f"Config: { json .dumps (config , indent = 2 )} " )
96
- with open (config_path , "w" ) as f :
97
- json .dump (config , f )
98
-
99
- logger .info ("Config file successfully written" + end_log_group ())
100
78
yield config_path
101
79
102
80
Original file line number | Diff line number | Diff line change
@@ -64,21 +64,6 @@ def pre_process_model(request, tmp_path_factory):
64
64
device_settings ,
65
65
)
66
66
67
- config = {
68
- "module_name" : "module" ,
69
- "module_abi_version" : 1 ,
70
- "max_seq_len" : 131072 ,
71
- "attn_head_count" : 8 ,
72
- "attn_head_dim" : 128 ,
73
- "prefill_batch_sizes" : [1 , 4 ],
74
- "decode_batch_sizes" : [1 , 4 ],
75
- "transformer_block_count" : 32 ,
76
- "paged_kv_cache" : {"block_seq_stride" : 16 , "device_block_count" : 256 },
77
- }
78
- config_path = tmp_dir / "config.json"
79
- with open (config_path , "w" ) as f :
80
- json .dump (config , f )
81
-
82
67
return tmp_dir
83
68
84
69
Original file line number | Diff line number | Diff line change
@@ -91,27 +91,6 @@ def write_config(request, model_test_dir):
91
91
model_test_dir
92
92
/ f"{ '_' .join (str (bs ) for bs in batch_sizes )} _{ prefix_sharing_algorithm } .json"
93
93
)
94
-
95
- config = {
96
- "module_name" : "module" ,
97
- "module_abi_version" : 1 ,
98
- "max_seq_len" : 2048 ,
99
- "attn_head_count" : 32 ,
100
- "attn_head_dim" : 100 ,
101
- "prefill_batch_sizes" : batch_sizes ,
102
- "decode_batch_sizes" : batch_sizes ,
103
- "transformer_block_count" : 26 ,
104
- "paged_kv_cache" : {
105
- "block_seq_stride" : 16 ,
106
- "device_block_count" : 256 ,
107
- "prefix_sharing_algorithm" : prefix_sharing_algorithm ,
108
- },
109
- }
110
- logger .info (f"Saving edited config to: { config_path } \n " )
111
- logger .info (f"Config: { json .dumps (config , indent = 2 )} " )
112
- with open (config_path , "w" ) as f :
113
- json .dump (config , f )
114
-
115
94
yield config_path
116
95
117
96
You can’t perform that action at this time.
0 commit comments