Commit f107780a authored by zhangqha
Browse files

Merge branch 'v0.15.1-dev-custom' into 'v0.15.1-dev'

解决custom allreduce在K100AI上新模型报错问题

See merge request dcutoolkit/deeplearing/vllm!459
parents db85ab07 02effa65
......@@ -651,7 +651,7 @@ class CustomAllreduce {
#define KL(ngpus, name) \
{ \
void* kernelArgs[] = { \
- &ptrs, &sg_, &self_sg_, &output, &rank_, &size \
+ &ptrs, &sg_, &self_sg_, &output, &rank_, &size, &dev_curr_hdp_reg, &world_size_ \
}; \
hipExtLaunchKernel( \
(void*)name<T, ngpus>, \
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment