localTrainingService.test.ts 5.26 KB
Newer Older
liuzhe-lz's avatar
liuzhe-lz committed
1
2
// Copyright (c) Microsoft Corporation.
// Licensed under the MIT license.
Deshui Yu's avatar
Deshui Yu committed
3
4
5

'use strict';

SparkSnail's avatar
SparkSnail committed
6
7
8
import * as chai from 'chai';
import * as chaiAsPromised from 'chai-as-promised';
import * as fs from 'fs';
9
import * as path from 'path';
SparkSnail's avatar
SparkSnail committed
10
import * as tmp from 'tmp';
Deshui Yu's avatar
Deshui Yu committed
11
import * as component from '../../common/component';
12
13
import { TrialJobApplicationForm, TrialJobDetail} from '../../common/trainingService';
import { cleanupUnitTest, delay, prepareUnitTest, getExperimentRootDir } from '../../common/utils';
SparkSnail's avatar
SparkSnail committed
14
import { TrialConfigMetadataKey } from '../common/trialConfigMetadataKey';
15
import { LocalTrainingService } from '../local/localTrainingService';
16
import { ExperimentConfig } from '../../common/experimentConfig';
SparkSnail's avatar
SparkSnail committed
17
18

// TODO: copy mockedTrail.py to local folder
19
const localCodeDir: string = tmp.dirSync().name.split('\\').join('\\\\');
SparkSnail's avatar
SparkSnail committed
20
21
const mockedTrialPath: string = './training_service/test/mockedTrial.py'
fs.copyFileSync(mockedTrialPath, localCodeDir + '/mockedTrial.py')
Deshui Yu's avatar
Deshui Yu committed
22
23

describe('Unit Test for LocalTrainingService', () => {
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
    const config = <ExperimentConfig>{
        trialCommand: 'sleep 1h && echo hello',
        trialCodeDirectory: `${localCodeDir}`,
        trialGpuNumber: 1,
        trainingService: {
            platform: 'local'
        }
    };

    const config2 = <ExperimentConfig>{
        trialCommand: 'python3 mockedTrial.py',
        trialCodeDirectory: `${localCodeDir}`,
        trialGpuNumber: 0,
        trainingService: {
            platform: 'local'
        }
    };
SparkSnail's avatar
SparkSnail committed
41
42
43
44
45
46
47
48
49
50
51

    before(() => {
        chai.should();
        chai.use(chaiAsPromised);
        prepareUnitTest();
    });

    after(() => {
        cleanupUnitTest();
    });

52
53
    it('List empty trial jobs', async () => {
        const localTrainingService = new LocalTrainingService(config);
SparkSnail's avatar
SparkSnail committed
54
55
56
57
        localTrainingService.run();

        //trial jobs should be empty, since there are no submitted jobs
        chai.expect(await localTrainingService.listTrialJobs()).to.be.empty;
58

59
        localTrainingService.cleanUp();
SparkSnail's avatar
SparkSnail committed
60
61
62
    });

    it('Submit job and Cancel job', async () => {
63
64
        const localTrainingService = new LocalTrainingService(config);
        localTrainingService.run();
SparkSnail's avatar
SparkSnail committed
65
66
67

        // submit job
        const form: TrialJobApplicationForm = {
68
            sequenceId: 0,
SparkSnail's avatar
SparkSnail committed
69
70
71
72
73
74
75
76
77
            hyperParameters: {
                value: 'mock hyperparameters',
                index: 0
            }
        };
        const jobDetail: TrialJobDetail = await localTrainingService.submitTrialJob(form);
        chai.expect(jobDetail.status).to.be.equals('WAITING');
        await localTrainingService.cancelTrialJob(jobDetail.id);
        chai.expect(jobDetail.status).to.be.equals('USER_CANCELED');
78
79

        localTrainingService.cleanUp();
SparkSnail's avatar
SparkSnail committed
80
    }).timeout(20000);
81

82
    it('Get trial log', async () => {
83
84
        const localTrainingService = new LocalTrainingService(config);
        localTrainingService.run();
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110

        // submit job
        const form: TrialJobApplicationForm = {
            sequenceId: 0,
            hyperParameters: {
                value: 'mock hyperparameters',
                index: 0
            }
        };

        const jobDetail: TrialJobDetail = await localTrainingService.submitTrialJob(form);

        // get trial log
        const rootDir: string = getExperimentRootDir()
        fs.mkdirSync(path.join(rootDir, 'trials'))
        fs.mkdirSync(jobDetail.workingDirectory)
        fs.writeFileSync(path.join(jobDetail.workingDirectory, 'trial.log'), 'trial log')
        fs.writeFileSync(path.join(jobDetail.workingDirectory, 'stderr'), 'trial stderr')
        chai.expect(await localTrainingService.getTrialLog(jobDetail.id, 'TRIAL_LOG')).to.be.equals('trial log');
        chai.expect(await localTrainingService.getTrialLog(jobDetail.id, 'TRIAL_ERROR')).to.be.equals('trial stderr');
        fs.unlinkSync(path.join(jobDetail.workingDirectory, 'trial.log'))
        fs.unlinkSync(path.join(jobDetail.workingDirectory, 'stderr'))
        fs.rmdirSync(jobDetail.workingDirectory)
        fs.rmdirSync(path.join(rootDir, 'trials'))

        await localTrainingService.cancelTrialJob(jobDetail.id);
111
        localTrainingService.cleanUp();
112
113
    }).timeout(20000);

SparkSnail's avatar
SparkSnail committed
114
    it('Read metrics, Add listener, and remove listener', async () => {
115
116
        const localTrainingService = new LocalTrainingService(config2);
        localTrainingService.run();
SparkSnail's avatar
SparkSnail committed
117

118
        // set meta data
SparkSnail's avatar
SparkSnail committed
119
120
        // submit job
        const form: TrialJobApplicationForm = {
121
            sequenceId: 0,
SparkSnail's avatar
SparkSnail committed
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
            hyperParameters: {
                value: 'mock hyperparameters',
                index: 0
            }
        };
        const jobDetail: TrialJobDetail = await localTrainingService.submitTrialJob(form);
        chai.expect(jobDetail.status).to.be.equals('WAITING');
        localTrainingService.listTrialJobs().then((jobList)=>{
            chai.expect(jobList.length).to.be.equals(1);
        });
        // Add metrics listeners
        const listener1 = function f1(metric: any) {
            chai.expect(metric.id).to.be.equals(jobDetail.id);
        }
        localTrainingService.addTrialJobMetricListener(listener1);
        // Wait to collect metric
        await delay(1000);

        await localTrainingService.cancelTrialJob(jobDetail.id);
        localTrainingService.removeTrialJobMetricListener(listener1);
142
        localTrainingService.cleanUp();
SparkSnail's avatar
SparkSnail committed
143
    }).timeout(20000);
144
});