Skip to content

Commit 99aade7

Browse files
authored
quant: avoid assign empty rowwise layers (#922)
1 parent 75aa594 commit 99aade7

1 file changed

Lines changed: 7 additions & 6 deletions

File tree

src/cache_dit/quantize/torchao/quantize_ao.py

Lines changed: 7 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -295,12 +295,13 @@ def _maybe_fill_fallback_layers(self):
295295
if self.module_ref is not None and self.is_float8_dynamic_per_row():
296296
if not ENV.CACHE_DIT_DISABLE_EXCLUDE_FOR_QUANTIZE_AFTER_TP:
297297
rowwise_layers = getattr(self.module_ref, "_rowwise_layers", [])
298-
if self.float8_per_tensor_fallback and rowwise_layers:
299-
fallback_layers = fallback_layers + rowwise_layers
300-
logger.info(f"Set float8 per tensor fallback layers: {rowwise_layers}.")
301-
else:
302-
exclude_layers = exclude_layers + rowwise_layers
303-
logger.info(f"Add rowwise layers to exclude layers: {rowwise_layers}.")
298+
if rowwise_layers:
299+
if self.float8_per_tensor_fallback:
300+
fallback_layers = fallback_layers + rowwise_layers
301+
logger.info(f"Add fallback layers: {rowwise_layers}.")
302+
else:
303+
exclude_layers = exclude_layers + rowwise_layers
304+
logger.info(f"Add exclude layers: {rowwise_layers}.")
304305
self.rowwise_layers = copy.deepcopy(rowwise_layers)
305306
# Case 1/2/3/...: Future cases ...
306307
# We may add more cases in the future where we need to automatically fill the

0 commit comments

Comments
 (0)