"src/include/ConstantMatrixDescriptor.hpp" did not exist on "acd7082fe109aa4228dfca652e87cab96bc6837f"
Unverified commit 043fb758, authored by QuanluZhang and committed by GitHub

Fix hyperband (#571)

* fix

* update

* fix

* fix

* fix
parent 96bab1a6
@@ -26,7 +26,9 @@ advisor:
```
Note that once you use an advisor, you can no longer add a tuner or assessor spec to the config file.
If you use Hyperband, among the hyperparameters (i.e., key-value pairs) received by a trial, there is one more key called `STEPS` besides the hyperparameters defined by the user. **By using this `STEPS`, the trial can control how long it runs**.
For `report_intermediate_result(metric)` and `report_final_result(metric)` in your trial code, **`metric` should be either a number or a dict which has a key `default` with a number as its value**. This number is the one you want to maximize or minimize, for example, accuracy or loss.
`R` and `eta` are the Hyperband parameters that you can change. `R` is the maximum amount of STEPS that can be allocated to a single configuration; here, STEPS could mean the number of epochs or mini-batches. The trial should use this `STEPS` value to control how long it runs. Refer to the example under `examples/trials/mnist-hyperband/` for details.
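Below is a hedged sketch (not taken from this commit) of a trial that consumes `STEPS` and reports metrics in the accepted format. `nni.get_next_parameter`, `nni.report_intermediate_result`, and `nni.report_final_result` are the standard NNI trial APIs; `train_one_epoch` and the `learning_rate` hyperparameter are hypothetical placeholders.
```
import nni

def train_one_epoch(lr):
    # Hypothetical placeholder: run one epoch of training and return accuracy.
    return 0.0

if __name__ == '__main__':
    params = nni.get_next_parameter()
    steps = params['STEPS']                 # budget injected by Hyperband
    lr = params.get('learning_rate', 0.01)  # user-defined hyperparameter (example name)

    accuracy = 0.0
    for _ in range(steps):
        accuracy = train_one_epoch(lr)
        # The metric may be a plain number or a dict with a 'default' key.
        nni.report_intermediate_result(accuracy)

    nni.report_final_result({'default': accuracy})
```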
...
@@ -22,6 +22,7 @@ hyperband_tuner.py
'''
from enum import Enum, unique
import sys
import math
import copy
import logging
@@ -140,13 +141,6 @@ class Bracket():
        value: latest result with sequence number seq
        '''
        if parameter_id in self.configs_perf[i]:
            # this should always be true if there is no retry in training service
            _logger.debug('assertion: %d %d, %s %s\n',
                          self.configs_perf[i][parameter_id][0],
                          seq,
                          str(type(self.configs_perf[i][parameter_id][0])),
                          str(type(seq)))
            # assert self.configs_perf[i][parameter_id][0] < seq
            if self.configs_perf[i][parameter_id][0] < seq:
                self.configs_perf[i][parameter_id] = [seq, value]
        else:
@@ -214,6 +208,14 @@ class Bracket():
        self.num_configs_to_run.append(len(hyper_configs))
        self.increase_i()
def extract_scalar_reward(value, scalar_key='default'):
    # Accept either a bare number or a dict that carries the scalar under `scalar_key`.
    if isinstance(value, (float, int)):
        reward = value
    elif isinstance(value, dict) and scalar_key in value and isinstance(value[scalar_key], (float, int)):
        reward = value[scalar_key]
    else:
        raise RuntimeError('Incorrect final result: the final result should be float/int, '
                           'or a dict which has a key named "default" whose value is float/int.')
    return reward
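As an illustrative aside (not part of the diff), and assuming the `extract_scalar_reward` helper above is in scope, both metric shapes described in the documentation change resolve to the same scalar:
```
# Illustrative only: both reported metric shapes yield the same scalar reward.
assert extract_scalar_reward(0.93) == 0.93
assert extract_scalar_reward({'default': 0.93, 'loss': 0.21}) == 0.93
# Any other shape (e.g. a string, or a dict without a 'default' key) raises RuntimeError.
```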
class Hyperband(MsgDispatcherBase):
    '''
@@ -345,12 +347,16 @@ class Hyperband(MsgDispatcherBase):
        '''
        data: it is an object which has keys 'parameter_id', 'value', 'trial_job_id', 'type', 'sequence'.
        '''
        value = extract_scalar_reward(data['value'])
        bracket_id, i, _ = data['parameter_id'].split('_')
        bracket_id = int(bracket_id)
        if data['type'] == 'FINAL':
            # sys.maxsize indicates this value is from FINAL metric data, because data['sequence'] from FINAL metric
            # and PERIODICAL metric are independent, thus, not comparable.
            self.brackets[bracket_id].set_config_perf(int(i), data['parameter_id'], sys.maxsize, value)
            self.completed_hyper_configs.append(data)
        elif data['type'] == 'PERIODICAL':
            self.brackets[bracket_id].set_config_perf(int(i), data['parameter_id'], data['sequence'], value)
        else:
            raise ValueError('Data type not supported: {}'.format(data['type']))
...