// Copyright (c) Microsoft Corporation. // Licensed under the MIT license. import assert from 'assert'; import { MethodNotImplementedError, NNIError, NNIErrorNames } from 'common/errors'; import { getLogger, Logger } from 'common/log'; import { TrialJobStatus } from 'common/trainingService'; import { KubernetesCRDClient } from './kubernetesApiClient'; import { KubernetesTrialJobDetail } from './kubernetesData'; /** * Collector Kubeflow jobs info from Kubernetes cluster, and update kubeflow job status locally */ export class KubernetesJobInfoCollector { protected readonly trialJobsMap: Map; protected readonly log: Logger = getLogger('KubernetesJobInfoCollector'); protected readonly statusesNeedToCheck: TrialJobStatus[]; constructor(jobMap: Map) { this.trialJobsMap = jobMap; this.statusesNeedToCheck = ['RUNNING', 'WAITING']; } public async retrieveTrialStatus(kubernetesCRDClient: KubernetesCRDClient | undefined): Promise { assert(kubernetesCRDClient !== undefined); const updateKubernetesTrialJobs: Promise[] = []; for (const [trialJobId, kubernetesTrialJob] of this.trialJobsMap) { if (kubernetesTrialJob === undefined) { throw new NNIError(NNIErrorNames.NOT_FOUND, `trial job id ${trialJobId} not found`); } updateKubernetesTrialJobs.push(this.retrieveSingleTrialJobInfo(kubernetesCRDClient, kubernetesTrialJob)); } return Promise.all(updateKubernetesTrialJobs); } protected async retrieveSingleTrialJobInfo(_kubernetesCRDClient: KubernetesCRDClient | undefined, _kubernetesTrialJob: KubernetesTrialJobDetail): Promise { throw new MethodNotImplementedError(); } }