# First, plot the time taken by the different operations.
fork,marker,ls,color,namein[
('standard_gx+standard_gw+standard_fwd','s','-','C2','Standard fp16 (sum of parts)'),
('x_quantize_rowwise+g_quantize_rowwise+w_quantize_global+w_quantize_global_transpose+standard_gw+global_fwd+global_bwd','o','-','C4','SwitchBack int8 (sum of parts)'),