config_hybrid.yml 1.49 KB
Newer Older
qianyj's avatar
qianyj committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
# Experiment-level settings: search space file, trial command, and trial limits.
searchSpaceFile: 'search_space.json'
trialCommand: 'python3 mnist.py'
trialGpuNumber: 0
trialConcurrency: 5
maxTrialNumber: 20

# Tuner selection and the class arguments supplied to it.
tuner:
  name: TPE
  classArgs:
    optimize_mode: maximize
# NNI can use multiple training services at one time: add one list entry per
# platform. This is stated for local, remote, openpai, and aml.
# NOTE(review): kubeflow and frameworkcontroller entries are also listed
# further down — confirm they are supported in a multi-service setup.
trainingService:
  - platform: local
  - platform: remote
    machineList:
      # Replace each ${...} placeholder with a real value before use.
      # Placeholders are quoted because they contain braces, quotes and spaces.
      - host: "${your server's IP or domain name}"
        user: "${your user name}"
        # camelCase to match the other keys in this file (machineList, ...).
        sshKeyFile: '~/.ssh/id_rsa'
  # aml platform entry; replace each ${...} placeholder with a real value.
  - platform: aml
    dockerImage: 'msranni/nni'
    subscriptionId: "${your subscription ID}"
    resourceGroup: "${your resource group}"
    workspaceName: "${your workspace name}"
    computeTarget: "${your compute target}"
  # kubeflow platform entry.
  # Fields written as null are left unset in this template — presumably they
  # must be filled in before the entry is usable (TODO confirm which are required).
  - platform: kubeflow
    reuseMode: true
    worker:
      command: null
      # camelCase to match the sibling keys (dockerImage, cpuNumber, ...).
      codeDirectory: null
      dockerImage: 'msranni/nni'
      cpuNumber: null
      gpuNumber: null
      memorySize: null
      replicas: null
    operator: tf-operator
    storage:
      storageType: null
      azureAccount: null
      azureShare: null
      keyVaultName: null
      keyVaultKey: null
    apiVersion: v1
  # frameworkcontroller platform entry.
  # Fields written as null are left unset in this template — presumably they
  # must be filled in before the entry is usable (TODO confirm which are required).
  - platform: frameworkcontroller
    reuseMode: true
    serviceAccountName: null
    taskRoles:
      - name: worker
        dockerImage: 'msranni/nni:latest'
        taskNumber: null
        command: null
        gpuNumber: null
        cpuNumber: null
        memorySize: null
        # Keys below use camelCase to match minSucceedTaskCount and the rest
        # of this file.
        frameworkAttemptCompletionPolicy:
          minFailedTaskCount: 1
          minSucceedTaskCount: 1
    storage:
      storageType: null
      azureAccount: null
      azureShare: null
      keyVaultName: null
      keyVaultKey: null