Commit 872787b9 authored by Gustaf Ahdritz's avatar Gustaf Ahdritz
Browse files

Add gradient clipping to DeepSpeed config generator

parent ac058f54
...@@ -20,6 +20,8 @@ parser = argparse.ArgumentParser(description='''Outputs a DeepSpeed ...@@ -20,6 +20,8 @@ parser = argparse.ArgumentParser(description='''Outputs a DeepSpeed
configuration file to configuration file to
stdout''') stdout''')
# Top-level option holding the gradient clipping value; it is parsed as a
# float and is None when the flag is not given on the command line.
parser.add_argument(
    "--gradient_clipping",
    default=None,
    type=float,
    help="Value of gradient clipping",
)
p = parser.add_argument_group("Optimizer") p = parser.add_argument_group("Optimizer")
p.add_argument("--optimizer", default=None, p.add_argument("--optimizer", default=None,
help='''Choice of optimizer. Choose between "Adam" or help='''Choice of optimizer. Choose between "Adam" or
...@@ -295,4 +297,7 @@ flops_profiler["top_modules"] = args.top_modules ...@@ -295,4 +297,7 @@ flops_profiler["top_modules"] = args.top_modules
flops_profiler["detailed"] = args.detailed_flops_profile flops_profiler["detailed"] = args.detailed_flops_profile
d ["flops_profiler"] = flops_profiler d ["flops_profiler"] = flops_profiler
# Copy the clipping value into the config whenever the flag was supplied.
# Comparing against None (the argparse default) instead of relying on
# truthiness keeps an explicit 0.0 in the output rather than dropping it.
if args.gradient_clipping is not None:
    d["gradient_clipping"] = args.gradient_clipping
print(json.dumps(d, indent=2)) print(json.dumps(d, indent=2))
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment