"src/include/ConstantTensorDescriptor.cuh" did not exist on "24d2f034fac9ec797477baee9fd36f4a930db068"
Unverified Commit e9f832df authored by J-shang's avatar J-shang Committed by GitHub
Browse files

change SIGKILL to SIGTERM in local mode cancel trial job (#3173)

parent 12a5e3de
...@@ -253,7 +253,20 @@ class LocalTrainingService implements TrainingService { ...@@ -253,7 +253,20 @@ class LocalTrainingService implements TrainingService {
return Promise.resolve(); return Promise.resolve();
} }
tkill(trialJob.pid, 'SIGKILL'); tkill(trialJob.pid, 'SIGTERM');
const startTime = Date.now();
while(await isAlive(trialJob.pid)) {
if (Date.now() - startTime > 4999) {
tkill(trialJob.pid, 'SIGKILL', (err) => {
if (err) {
this.log.error(`kill trial job error: ${err}`);
}
});
break;
}
await delay(500);
}
this.setTrialJobStatus(trialJob, getJobCancelStatus(isEarlyStopped)); this.setTrialJobStatus(trialJob, getJobCancelStatus(isEarlyStopped));
return Promise.resolve(); return Promise.resolve();
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment