|
93 | 93 | LARS_OPT_END_LR = "lars_opt_end_learning_rate"
|
94 | 94 | LARS_OPT_LR_DECAY_POLY_POWER = "lars_opt_learning_rate_decay_poly_power"
|
95 | 95 | LARS_OPT_LR_DECAY_STEPS = "lars_opt_learning_rate_decay_steps"
|
96 |
| -LARS_OPT_LR_MIN = "lars_opt_learning_rate_min" |
97 | 96 | LARS_OPT_WEIGHT_DECAY = "lars_opt_weight_decay"
|
98 |
| -LARS_OPT_BETA_1 = "lars_beta_1" |
99 |
| -LARS_OPT_BETA_2 = "lars_beta_2" |
100 | 97 | MAX_IMAGE_SIZE = "max_image_size"
|
101 | 98 | MAX_SAMPLES = "max_samples"
|
102 | 99 | MAX_SEQUENCE_LENGTH = "max_sequence_length"
|
|
120 | 117 | OPT_LR_WARMUP_EPOCHS = "opt_learning_rate_warmup_epochs"
|
121 | 118 | OPT_LR_WARMUP_FACTOR = "opt_learning_rate_warmup_factor"
|
122 | 119 | OPT_LR_WARMUP_STEPS = "opt_learning_rate_warmup_steps"
|
123 |
| -OPT_LR_HOLD_EPOCHS = "opt_learning_rate_hold_epochs" |
124 | 120 | OPT_WEIGHT_DECAY = "opt_weight_decay"
|
125 |
| -OPT_GRADIENT_CLIP_NORM = "opt_gradient_clip_norm" |
126 |
| -DATA_SPEED_PERTURBATON_MAX = "data_speed_perturbaton_max" |
127 |
| -DATA_SPEED_PERTURBATON_MIN = "data_speed_perturbaton_min" |
128 |
| -DATA_SPEC_AUGMENT_FREQ_N = "data_spec_augment_freq_n" |
129 |
| -DATA_SPEC_AUGMENT_FREQ_MIN = "data_spec_augment_freq_min" |
130 |
| -DATA_SPEC_AUGMENT_FREQ_MAX = "data_spec_augment_freq_max" |
131 |
| -DATA_SPEC_AUGMENT_TIME_N = "data_spec_augment_time_n" |
132 |
| -DATA_SPEC_AUGMENT_TIME_MIN = "data_spec_augment_time_min" |
133 |
| -DATA_SPEC_AUGMENT_TIME_MAX = "data_spec_augment_time_max" |
134 |
| -DATA_NUM_BUCKETS = "data_num_buckets" |
135 |
| -EMA_FACTOR = "ema_factor" |
136 | 121 |
|
137 | 122 | # Log keys - misc.
|
138 | 123 | BBOX = "bbox"
|
|
0 commit comments