Unverified Commit 97c9a41f authored by Yifan Xiong's avatar Yifan Xiong Committed by GitHub
Browse files

Benchmark - Update TE FP8 model conversion (#499)

__Description__

Update TE FP8 model conversion.

__Major Revisions__
* Add 16-byte alignment comment.
* Fix TE layer parameters type.
parent c88c9709
...@@ -63,15 +63,16 @@ def _to_te_model(self, model): ...@@ -63,15 +63,16 @@ def _to_te_model(self, model):
return return
for name, m in model.named_children(): for name, m in model.named_children():
if isinstance(m, torch.nn.Linear): if isinstance(m, torch.nn.Linear):
# check 16-byte alignment
if any(p % 16 != 0 for p in m.weight.shape): if any(p % 16 != 0 for p in m.weight.shape):
return return
te_m = te.Linear(m.in_features, m.out_features, bias=(m.bias is not None)) te_m = te.Linear(m.in_features, m.out_features, bias=(m.bias is not None), params_dtype=m.weight.dtype)
te_m.weight.copy_(m.weight) te_m.weight.copy_(m.weight)
if m.bias is not None: if m.bias is not None:
te_m.bias.copy_(m.bias) te_m.bias.copy_(m.bias)
setattr(model, name, te_m) setattr(model, name, te_m)
elif isinstance(m, torch.nn.LayerNorm): elif isinstance(m, torch.nn.LayerNorm):
te_m = te.LayerNorm(m.normalized_shape[0], eps=m.eps) te_m = te.LayerNorm(m.normalized_shape[0], eps=m.eps, params_dtype=m.weight.dtype)
if hasattr(te_m, 'weight'): if hasattr(te_m, 'weight'):
te_m.weight.copy_(m.weight) te_m.weight.copy_(m.weight)
te_m.bias.copy_(m.bias) te_m.bias.copy_(m.bias)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment