File tree Expand file tree Collapse file tree 1 file changed +5
-0
lines changed
llmc/compression/quantization Expand file tree Collapse file tree 1 file changed +5
-0
lines changed Original file line number Diff line number Diff line change @@ -185,6 +185,7 @@ def search_scale_subset(
185
185
torch .cuda .empty_cache ()
186
186
187
187
x_tmp = self .scaling_input (x , scales , is_gqa )
188
+ logger .info (f"x_tmp:{ x_tmp .shape } " )
188
189
189
190
if not check_w_only (
190
191
self .block_idx ,
@@ -205,13 +206,17 @@ def search_scale_subset(
205
206
).fake_quant_act_dynamic (_x )
206
207
outs .append (_x )
207
208
x_tmp = torch .stack (outs )
209
+ logger .info (f"x_tmp:{ x_tmp .shape } " )
208
210
209
211
out = self .inspect_module_forward (x_tmp , inspect_module , kwargs )
210
212
211
213
if self .padding_mask and org_out .shape [1 ] == self .padding_mask [i ].shape [- 1 ]:
212
214
org_out = org_out * self .padding_mask [i ].unsqueeze (dim = - 1 ).to (org_out .device ) # noqa
213
215
out = out * self .padding_mask [i ].unsqueeze (dim = - 1 ).to (out .device )
214
216
217
+ logger .info (f"org_out:{ org_out .shape } " )
218
+ logger .info (f"out:{ out .shape } " )
219
+
215
220
loss = self .calculate_loss (org_out , out )
216
221
217
222
if len (input ) == 1 :
You can’t perform that action at this time.
0 commit comments