# params.yaml
# Runtime settings: distribution strategy, numeric precision, and device counts.
runtime:
  all_reduce_alg: null
  batchnorm_spatial_persistent: false
  dataset_num_private_threads: null
  default_shard_dim: -1
  distribution_strategy: mirrored
  enable_xla: false
  gpu_thread_mode: null
  loss_scale: dynamic
  mixed_precision_dtype: float16
  num_cores_per_replica: 1
  num_gpus: 2
  num_packs: 1
  per_gpu_thread_count: 0
  run_eagerly: false
  task_index: -1
  tpu: null
  worker_hosts: null
# Task definition: losses, the model, and the train/validation input pipelines.
task:
  gradient_clip_norm: 0.0
  init_checkpoint: ''
  logging_dir: null
  losses:
    l2_weight_decay: 0.0005
    label_smoothing: 0.0
    one_hot: true
  model:
    add_head_batch_norm: false
    backbone:
      darknet:
        model_id: darknet53
      type: darknet
    dropout_rate: 0.0
    input_size: [256, 256, 3]
    norm_activation:
      activation: relu
      norm_epsilon: 0.001
      norm_momentum: 0.99
      use_sync_bn: false
    num_classes: 1001
  train_data:
    block_length: 1
    cache: false
    cycle_length: 10
    deterministic: null
    drop_remainder: true
    dtype: float16
    enable_tf_data_service: false
    global_batch_size: 16
    input_path: ''
    is_training: true
    sharding: true
    shuffle_buffer_size: 100
    tf_data_service_address: null
    tf_data_service_job_name: null
    tfds_as_supervised: false
    # Quoted so the leading '~' is never mistaken for the YAML null scalar.
    tfds_data_dir: '~/tensorflow_datasets/'
    tfds_download: true
    tfds_name: imagenet2012
    tfds_skip_decoding_feature: ''
    tfds_split: train
  validation_data:
    block_length: 1
    cache: false
    cycle_length: 10
    deterministic: null
    drop_remainder: false
    dtype: float16
    enable_tf_data_service: false
    global_batch_size: 16
    input_path: ''
    # NOTE(review): is_training is true for the validation split as well;
    # confirm this is intended before relying on evaluation results.
    is_training: true
    sharding: true
    shuffle_buffer_size: 100
    tf_data_service_address: null
    tf_data_service_job_name: null
    tfds_as_supervised: false
    # Quoted so the leading '~' is never mistaken for the YAML null scalar.
    tfds_data_dir: '~/tensorflow_datasets/'
    tfds_download: true
    tfds_name: imagenet2012
    tfds_skip_decoding_feature: ''
    tfds_split: validation
# Trainer settings: checkpointing, evaluation cadence, optimizer, and step counts.
trainer:
  allow_tpu_summary: false
  best_checkpoint_eval_metric: ''
  best_checkpoint_export_subdir: ''
  best_checkpoint_metric_comp: higher
  checkpoint_interval: 10000
  continuous_eval_timeout: 3600
  eval_tf_function: true
  max_to_keep: 5
  optimizer_config:
    ema: null
    learning_rate:
      polynomial:
        cycle: false
        # decay_steps (6392000) + warmup_steps (8000) equals train_steps (6400000).
        decay_steps: 6392000
        end_learning_rate: 1.25e-05
        initial_learning_rate: 0.0125
        name: PolynomialDecay
        power: 4.0
      type: polynomial
    optimizer:
      sgd:
        clipnorm: null
        clipvalue: null
        decay: 0.0
        momentum: 0.9
        name: SGD
        nesterov: false
      type: sgd
    warmup:
      linear:
        name: linear
        warmup_learning_rate: 0
        warmup_steps: 8000
      type: linear
  steps_per_loop: 10000
  summary_interval: 10000
  train_steps: 6400000
  train_tf_function: true
  train_tf_while_loop: true
  validation_interval: 10000
  validation_steps: 3200