-
Notifications
You must be signed in to change notification settings - Fork 13
/
default_config.yaml
32 lines (27 loc) · 1.42 KB
/
default_config.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
# This file contains the default training settings.
device: 'cuda:0'  # Device to use: 'cuda:0' or 'cpu'
amp: false  # Enable automatic mixed precision
# Model
variant: 'F0'  # Model variant, F0 - F7
num_classes: 1000  # Number of classes
activation: 'gelu'  # 'gelu' or 'relu'
stochdepth_rate: 0.25  # 0-1, probability that a layer is dropped in one step
alpha: 0.2  # Scaling factor at the end of each block
se_ratio: 0.5  # Squeeze-Excite expansion ratio
# Use 16-bit floats, which lowers the memory footprint. This currently sets
# the complete model to FP16 (will be changed to match FP16 ops from paper).
use_fp16: false
# Dataset
# Dataset root directory.
# NOTE(review): this default looks machine-specific - override it with the
# location of the dataset on your own system.
dataset: '/media/benjs/ext/'
num_workers: 8  # Number of workers in dataloader
# Pinned memory can speed up or slow down data loading depending on your
# hardware.
pin_memory: true
# Training
batch_size: 64  # Batch size
epochs: 360  # Number of epochs
overfit: false  # Train on one batch only
learning_rate: 0.1  # Learning rate
scale_lr: true  # Scale learning rate with batch size: lr = lr*batch_size/256
momentum: 0.9  # Contribution of earlier gradients to the gradient update
weight_decay: 0.00002  # Factor with which weights are added to the gradient
nesterov: true  # Enable Nesterov correction
do_clip: true  # Enable adaptive gradient clipping
clipping: 0.1  # Adaptive gradient clipping parameter