Commit 3aba051

fix: correcting whitespaces
Signed-off-by: Omobayode Fagbohungbe <omobayode.fagbohungbe@ibm.com>
1 parent 71b5aa4 commit 3aba051

4 files changed (+6, -10 lines)

fms_mo/dq.py

Lines changed: 2 additions & 1 deletion
@@ -198,7 +198,8 @@ def run_dq(model_args, data_args, opt_args, fms_mo_args):
 
     qcfg["model"] = model_args.model_name_or_path
     # config layers to skip, smooth scale
-    config_quantize_smooth_layers(qcfg)
+    if not inference:
+        config_quantize_smooth_layers(qcfg)
 
     use_dynamo = True
     # use dynamo as default unless really needed, False -> fallback to TorchScript tracing

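Note on the dq.py hunk: the new guard derives the skip/smooth-scale layer settings only when the run is not inference-only. A minimal, self-contained sketch of the pattern follows; the `inference` flag and the `config_quantize_smooth_layers` name come from the diff, while the stub body and the `prepare_dq_config` wrapper are illustrative assumptions, not fms_mo code.

def config_quantize_smooth_layers(qcfg: dict) -> None:
    # Stub for illustration only: the real helper in fms_mo.dq selects
    # layers to skip and attaches smooth-scale settings to qcfg.
    qcfg["smooth_layers_configured"] = True


def prepare_dq_config(qcfg: dict, inference: bool = False) -> dict:
    # Mirrors the guard added in this commit: an inference-only run reuses
    # settings already carried by the checkpoint/config, so the
    # configuration step is skipped.
    if not inference:
        config_quantize_smooth_layers(qcfg)
    return qcfg


print(prepare_dq_config({"model": "my-model"}, inference=True))
# {'model': 'my-model'}  -> smooth-layer configuration was skipped
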
fms_mo/modules/linear.py

Lines changed: 1 addition & 4 deletions
@@ -281,7 +281,6 @@ def forward(self, x):
             )
 
             # pylint: disable=not-callable
-
             return F.linear(x, self.W_fp, self.bias)
         else:
             qinput = self.quantize_feature(x / scale).to(x.dtype)
@@ -294,10 +293,8 @@
             else:
                 qweight = self.quantize_weight(self.weight * scale).to(
                     self.weight.dtype
-                )
-
+                )
                 qbias = self.bias
-
                 # pylint: disable=not-callable
                 output = F.linear(qinput, qweight, qbias)
 

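Note on the linear.py hunks: apart from the blank-line cleanup, the surrounding forward() follows a fake-quantize-then-F.linear shape. A self-contained sketch of that shape, assuming simple symmetric per-tensor quantizers (the real quantize_feature / quantize_weight modules in fms_mo are configurable and more involved):

import torch
import torch.nn.functional as F
from torch import nn


class QLinearSketch(nn.Module):
    """Illustrative stand-in for the quantized Linear forward() touched above."""

    def __init__(self, in_features: int, out_features: int, n_bits: int = 8):
        super().__init__()
        self.weight = nn.Parameter(torch.randn(out_features, in_features) * 0.02)
        self.bias = nn.Parameter(torch.zeros(out_features))
        self.n_levels = 2 ** (n_bits - 1) - 1

    def _fake_quant(self, t: torch.Tensor) -> torch.Tensor:
        # Symmetric per-tensor fake quantization; stands in for the
        # configurable quantizers used by fms_mo.
        step = t.abs().max().clamp(min=1e-8) / self.n_levels
        return (t / step).round().clamp(-self.n_levels, self.n_levels) * step

    def forward(self, x: torch.Tensor, scale: float = 1.0) -> torch.Tensor:
        # Same shape as the diff context: quantize the (scaled) activation and
        # weight, then fall through to a plain F.linear call.
        qinput = self._fake_quant(x / scale).to(x.dtype)
        qweight = self._fake_quant(self.weight * scale).to(self.weight.dtype)
        qbias = self.bias
        # pylint: disable=not-callable
        return F.linear(qinput, qweight, qbias)


print(QLinearSketch(16, 4)(torch.randn(2, 16)).shape)  # torch.Size([2, 4])
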
fms_mo/prep.py

Lines changed: 1 addition & 3 deletions
@@ -392,9 +392,7 @@ def make_quant_module(module, curr_full_name, qcfg, verbose=False):
     # For nn.Linear
     elif isinstance(module, nn.Linear):
         if module.__class__ != nn.Linear:
-            if isinstance(
-                module, compressed_tensors.linear.compressed_linear.CompressedLinear
-            ):
+            if isinstance(module, compressed_tensors.linear.compressed_linear.CompressedLinear):
                 pass
             else:
                 logger.warning(

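Note on the prep.py hunk: the reflowed isinstance check is part of make_quant_module's module-swapping logic, which warns when an unfamiliar nn.Linear subclass is about to be replaced. A sketch of the pattern, with compressed_tensors treated as an optional import (the try/except fallback and the helper name are assumptions for self-containment, not fms_mo code):

import logging

from torch import nn

try:
    from compressed_tensors.linear.compressed_linear import CompressedLinear
except ImportError:  # optional dependency; make the isinstance check a no-op
    CompressedLinear = ()

logger = logging.getLogger(__name__)


def check_linear_subclass(module: nn.Module) -> None:
    # Mirrors the check in the diff: a plain nn.Linear or a recognized
    # CompressedLinear is accepted silently; any other subclass triggers a
    # warning because its customized forward() may be lost when swapped.
    if isinstance(module, nn.Linear) and module.__class__ != nn.Linear:
        if isinstance(module, CompressedLinear):
            pass
        else:
            logger.warning(
                "Replacing unrecognized nn.Linear subclass %s",
                module.__class__.__name__,
            )
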
fms_mo/utils/dq_inf.py

Lines changed: 2 additions & 2 deletions
@@ -102,7 +102,7 @@ def save_vllm_fp8(model: nn.Module, qcfg: dict, tokenizer=None, folder: str = No
     )
     tokenizer.save_pretrained(folder)
 
-    with open(folder + "/config.json", "w+", encoding='utf-8') as f:
+    with open(folder + "/config.json", "w+", encoding="utf-8") as f:
         json.dump(config, f, indent=4)
 
 
@@ -133,7 +133,7 @@ def convert_fms_mo_to_vllm_fp8_format(checkpoint: str = None, folder: str = None
     save_torch_state_dict(
         fms_dict, folder, filename_pattern="fms_mo{suffix}.safetensors"
     )
-    with open(folder + "/config.json", "w+", encoding='utf-8') as f:
+    with open(folder + "/config.json", "w+", encoding="utf-8") as f:
         json.dump(config, f, indent=4)
 
 

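Note on the dq_inf.py hunks: both call sites now use double quotes for the encoding argument, consistent with the rest of the file; passing encoding="utf-8" explicitly keeps the config.json write independent of the platform's default encoding. A small self-contained sketch of the same write pattern (write_vllm_config and the example dict are illustrative, not fms_mo code):

import json
import os


def write_vllm_config(config: dict, folder: str) -> None:
    # Same pattern as the two functions above: dump the config dict as
    # pretty-printed JSON with an explicit UTF-8 encoding so the output does
    # not depend on the locale default.
    os.makedirs(folder, exist_ok=True)
    with open(os.path.join(folder, "config.json"), "w+", encoding="utf-8") as f:
        json.dump(config, f, indent=4)


write_vllm_config({"example_key": "example_value"}, "./vllm_export")
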