manager.ts 3.91 KB
Newer Older
liuzhe-lz's avatar
liuzhe-lz committed
1
2
// Copyright (c) Microsoft Corporation.
// Licensed under the MIT license.
Deshui Yu's avatar
Deshui Yu committed
3
4
5
6

'use strict';

import { MetricDataRecord, MetricType, TrialJobInfo } from './datastore';
7
import { TrialJobStatus, LogType } from './trainingService';
Deshui Yu's avatar
Deshui Yu committed
8

QuanluZhang's avatar
QuanluZhang committed
9
type ProfileUpdateType = 'TRIAL_CONCURRENCY' | 'MAX_EXEC_DURATION' | 'SEARCH_SPACE' | 'MAX_TRIAL_NUM';
chicm-ms's avatar
chicm-ms committed
10
type ExperimentStatus = 'INITIALIZED' | 'RUNNING' | 'ERROR' | 'STOPPING' | 'STOPPED' | 'DONE' | 'NO_MORE_TRIAL' | 'TUNER_NO_MORE_TRIAL';
SparkSnail's avatar
SparkSnail committed
11
12
13
14
namespace ExperimentStartUpMode {
    export const NEW = 'new';
    export const RESUME = 'resume';
}
Deshui Yu's avatar
Deshui Yu committed
15
16
17
18

interface ExperimentParams {
    authorName: string;
    experimentName: string;
19
    description?: string;
Deshui Yu's avatar
Deshui Yu committed
20
21
22
23
    trialConcurrency: number;
    maxExecDuration: number; //seconds
    maxTrialNum: number;
    searchSpace: string;
24
    trainingServicePlatform: string;
chicm-ms's avatar
chicm-ms committed
25
    multiPhase?: boolean;
chicm-ms's avatar
chicm-ms committed
26
    multiThread?: boolean;
27
    versionCheck?: boolean;
SparkSnail's avatar
SparkSnail committed
28
    logCollection?: string;
QuanluZhang's avatar
QuanluZhang committed
29
    tuner?: {
chicm-ms's avatar
chicm-ms committed
30
        className?: string;
31
32
33
34
35
        builtinTunerName?: string;
        codeDir?: string;
        classArgs?: any;
        classFileName?: string;
        checkpointDir: string;
36
        includeIntermediateResults?: boolean;
37
        gpuIndices?: string;
Deshui Yu's avatar
Deshui Yu committed
38
39
    };
    assessor?: {
chicm-ms's avatar
chicm-ms committed
40
        className?: string;
41
42
43
44
45
        builtinAssessorName?: string;
        codeDir?: string;
        classArgs?: any;
        classFileName?: string;
        checkpointDir: string;
Deshui Yu's avatar
Deshui Yu committed
46
    };
QuanluZhang's avatar
QuanluZhang committed
47
    advisor?: {
chicm-ms's avatar
chicm-ms committed
48
        className?: string;
QuanluZhang's avatar
QuanluZhang committed
49
50
51
52
53
        builtinAdvisorName?: string;
        codeDir?: string;
        classArgs?: any;
        classFileName?: string;
        checkpointDir: string;
54
        gpuIndices?: string;
QuanluZhang's avatar
QuanluZhang committed
55
    };
Deshui Yu's avatar
Deshui Yu committed
56
57
58
59
60
61
62
63
64
65
    clusterMetaData?: {
        key: string;
        value: string;
    }[];
}

interface ExperimentProfile {
    params: ExperimentParams;
    id: string;
    execDuration: number;
66
    logDir?: string;
67
68
    startTime?: number;
    endTime?: number;
69
    nextSequenceId: number;
Deshui Yu's avatar
Deshui Yu committed
70
71
72
73
74
75
76
77
    revision: number;
}

interface TrialJobStatistics {
    trialJobStatus: TrialJobStatus;
    trialJobNumber: number;
}

78
interface NNIManagerStatus {
chicm-ms's avatar
chicm-ms committed
79
    status: ExperimentStatus;
80
81
82
    errors: string[];
}

Deshui Yu's avatar
Deshui Yu committed
83
84
abstract class Manager {
    public abstract startExperiment(experimentParams: ExperimentParams): Promise<string>;
SparkSnail's avatar
SparkSnail committed
85
    public abstract resumeExperiment(readonly: boolean): Promise<void>;
Deshui Yu's avatar
Deshui Yu committed
86
    public abstract stopExperiment(): Promise<void>;
87
88
    public abstract stopExperimentTopHalf(): Promise<void>;
    public abstract stopExperimentBottomHalf(): Promise<void>;
Deshui Yu's avatar
Deshui Yu committed
89
90
    public abstract getExperimentProfile(): Promise<ExperimentProfile>;
    public abstract updateExperimentProfile(experimentProfile: ExperimentProfile, updateType: ProfileUpdateType): Promise<void>;
91
    public abstract importData(data: string): Promise<void>;
92
    public abstract getImportedData(): Promise<string[]>;
93
    public abstract exportData(): Promise<string>;
Deshui Yu's avatar
Deshui Yu committed
94

95
    public abstract addCustomizedTrialJob(hyperParams: string): Promise<number>;
Deshui Yu's avatar
Deshui Yu committed
96
97
98
99
100
101
102
    public abstract cancelTrialJobByUser(trialJobId: string): Promise<void>;

    public abstract listTrialJobs(status?: TrialJobStatus): Promise<TrialJobInfo[]>;
    public abstract getTrialJob(trialJobId: string): Promise<TrialJobInfo>;
    public abstract setClusterMetadata(key: string, value: string): Promise<void>;
    public abstract getClusterMetadata(key: string): Promise<string>;

103
    public abstract getMetricData(trialJobId?: string, metricType?: MetricType): Promise<MetricDataRecord[]>;
104
105
106
    public abstract getMetricDataByRange(minSeqId: number, maxSeqId: number): Promise<MetricDataRecord[]>;
    public abstract getLatestMetricData(): Promise<MetricDataRecord[]>;

107
108
    public abstract getTrialLog(trialJobId: string, logType: LogType): Promise<string>;

Deshui Yu's avatar
Deshui Yu committed
109
    public abstract getTrialJobStatistics(): Promise<TrialJobStatistics[]>;
110
    public abstract getStatus(): NNIManagerStatus;
Deshui Yu's avatar
Deshui Yu committed
111
112
}

SparkSnail's avatar
SparkSnail committed
113
export { Manager, ExperimentParams, ExperimentProfile, TrialJobStatistics, ProfileUpdateType, NNIManagerStatus, ExperimentStatus, ExperimentStartUpMode };