norm / vllm / Commits

Commit c84e9242 (Unverified)
Authored May 06, 2023 by Woosuk Kwon; committed by GitHub on May 06, 2023
Parent: c9d5b6d4

[Minor] Fix a dtype bug (#79)

Showing 1 changed file with 5 additions and 1 deletion (+5 -1): cacheflow/models/model_utils.py
cacheflow/models/model_utils.py

@@ -37,7 +37,11 @@ _MEMORY_ANALYZERS = {
 def _get_dtype(config: PretrainedConfig, dtype: str) -> torch.dtype:
-    config_dtype: torch.dtype = getattr(config, 'torch_dtype', torch.float32)
+    # NOTE: getattr(config, 'torch_dtype', torch.float32) is not correct
+    # because config.torch_dtype can be None.
+    config_dtype = getattr(config, 'torch_dtype', None)
+    if config_dtype is None:
+        config_dtype = torch.float32
     if dtype == 'default':
         if config_dtype == torch.float32:
             # Following the common practice, we use float16 for float32 models.
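A minimal sketch of the bug this commit fixes: `getattr` only falls back to its default when the attribute is *missing*, so a config that explicitly sets `torch_dtype = None` slips past the old one-liner. The sketch below is not the vllm source; it uses the string 'float32' as a stand-in for torch.dtype values to stay dependency-free.

```python
class Config:
    # Hugging Face-style configs may carry an explicit torch_dtype = None.
    torch_dtype = None

config = Config()

# Buggy pattern: the default is ignored because the attribute exists.
buggy = getattr(config, 'torch_dtype', 'float32')
assert buggy is None

# Fixed pattern, mirroring the commit: fall back only after a None check.
fixed = getattr(config, 'torch_dtype', None)
if fixed is None:
    fixed = 'float32'
assert fixed == 'float32'
```

The explicit `is None` check is the whole fix: it handles both a missing attribute and an attribute set to None, which the `getattr` default alone cannot.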