Address review comments

Gasoonjia · Gasoonjia · commit 1599c2b6c18d · 2024-09-11T01:17:48.000-07:00
diff --git a/torchchat/cli/builder.py b/torchchat/cli/builder.py
@@ -37,7 +37,6 @@
 
 # bypass the import issue before torchao is ready on macos
 try:
-    from torchtune.training import set_default_dtype
     from torchtune.models.convert_weights import meta_to_tune
 except:
     pass
diff --git a/torchchat/model.py b/torchchat/model.py
@@ -281,7 +281,7 @@ def update(self, input_pos, k_val, v_val):
         return k_out, v_out
 
 
-class Model(nn.Module):
+class Model(ABC, nn.Module):
     """
     The entrance for model construction in torchchat.
     """
@@ -301,10 +301,10 @@ def build_model(self) -> nn.Module:
         recipe = ModelRecipe.get_recipe(self.config.model_type)
         modules = {}
         for name, module_class in recipe.modules.items():
-            if isinstance(self.config.transformer_args[name], dict):
-                modules[name] = module_class(**self.config.transformer_args[name])
+            if isinstance(config_args := self.config.transformer_args[name], dict):
+                modules[name] = module_class(**config_args)
             else:
-                modules[name] = module_class(self.config.transformer_args[name])
+                modules[name] = module_class(config_args)
 
         return recipe.fusion_class(**modules)
     
@@ -369,7 +369,12 @@ def reset_caches(self):
 
 
 class FlamingoModel(Model):
-    def forward(self, tokens: Tensor, encoder_input: Optional[Dict[str, Tensor]] = None, encoder_mask: Optional[Tensor] = None) -> Tensor:
+    def forward(
+        self,
+        tokens: Tensor,
+        encoder_input: Optional[Dict[str, Tensor]] = None,
+        encoder_mask: Optional[Tensor] = None,
+    ) -> Tensor:
         if encoder_input is None:
             return self.model(tokens, encoder_mask=encoder_mask)
         return self.model(tokens, encoder_input=encoder_input, encoder_mask=encoder_mask)