Simplify training step in av-asr recipe (#3598)

* Simplify training step in av-asr recipe * Run pre-commit

Simplify training step in av-asr recipe (#3598)
* Simplify training step in av-asr recipe * Run pre-commit
5e893d6f · Pingchuan Ma · GitHub · 3e1d8f3c · 5e893d6f · 5e893d6f
Unverified Commit 5e893d6f authored Sep 08, 2023 by Pingchuan Ma Committed by GitHub Sep 08, 2023
Showing with 1 addition and 24 deletions

examples/avsr/lightning.py examples/avsr/lightning.py +0 -12

examples/avsr/lightning_av.py examples/avsr/lightning_av.py +0 -12

examples/avsr/train.py examples/avsr/train.py +1 -0

No files found.
--- a/examples/avsr/lightning.py
+++ b/examples/avsr/lightning.py
@@ -84,8 +84,6 @@ class ConformerRNNTModule(LightningModule):
            betas=(0.9, 0.98),
        )

-        self.automatic_optimization = False
-
    def _step(self, batch, _, step_type):
        if batch is None:
            return None
@@ -123,20 +121,10 @@ class ConformerRNNTModule(LightningModule):
        return post_process_hypos(hypotheses, self.sp_model)[0][0]

    def training_step(self, batch, batch_idx):
-        opt = self.optimizers()
-        opt.zero_grad()
        loss = self._step(batch, batch_idx, "train")
        batch_size = batch.inputs.size(0)
        batch_sizes = self.all_gather(batch_size)
-
        loss *= batch_sizes.size(0) / batch_sizes.sum()  # world size / batch size
-        self.manual_backward(loss)
-        torch.nn.utils.clip_grad_norm_(self.model.parameters(), 10)
-        opt.step()
-
-        sch = self.lr_schedulers()
-        sch.step()
-
        self.log("monitoring_step", torch.tensor(self.global_step, dtype=torch.float32))

        return loss

--- a/examples/avsr/lightning_av.py
+++ b/examples/avsr/lightning_av.py
@@ -80,8 +80,6 @@ class AVConformerRNNTModule(LightningModule):
            betas=(0.9, 0.98),
        )

-        self.automatic_optimization = False
-
    def _step(self, batch, _, step_type):
        if batch is None:
            return None
@@ -128,20 +126,10 @@ class AVConformerRNNTModule(LightningModule):
        return post_process_hypos(hypotheses, self.sp_model)[0][0]

    def training_step(self, batch, batch_idx):
-        opt = self.optimizers()
-        opt.zero_grad()
        loss = self._step(batch, batch_idx, "train")
        batch_size = batch.videos.size(0)
        batch_sizes = self.all_gather(batch_size)
-
        loss *= batch_sizes.size(0) / batch_sizes.sum()  # world size / batch size
-        self.manual_backward(loss)
-        torch.nn.utils.clip_grad_norm_(self.model.parameters(), 10)
-        opt.step()
-
-        sch = self.lr_schedulers()
-        sch.step()
-
        self.log("monitoring_step", torch.tensor(self.global_step, dtype=torch.float32))

        return loss

--- a/examples/avsr/train.py
+++ b/examples/avsr/train.py
@@ -36,6 +36,7 @@ def get_trainer(args):
        strategy=DDPStrategy(find_unused_parameters=False),
        callbacks=callbacks,
        reload_dataloaders_every_n_epochs=1,
+        gradient_clip_val=10.0,
    )