Unverified commit 665b99bf, authored by Rick Ho, committed by GitHub
Browse files

Merge pull request #107 from laekov/faster-bug

fix bug: skip computeFn when batch is empty
parents 59bcec8e d90ff389
......@@ -80,6 +80,9 @@ void computeFn(py::function fn, c10::Device device,
scalar_t* inp_buf, scalar_t* out_buf,
long idx, long offset, long micro_batch_size, long d_model,
CudaStreamManager* smgr) {
if(micro_batch_size == 0) {
return;
}
auto options = torch::TensorOptions()
.dtype(c10::CppTypeToScalarType<scalar_t>::value)
.device(device)
......
......@@ -69,5 +69,5 @@ def get_shadow_policy(d_model=None):
if d_model is not None and 'FMOE_FASTER_GLBPLC_DMODEL' not in os.environ:
os.environ['FMOE_FASTER_GLBPLC_DMODEL'] = str(d_model)
if not switch_from_env('FMOE_FASTER_SHADOW_ENABLE'):
return no_policy
return no_shadow_policy
return global_policy
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment