---
# Training configuration for the run named by `save_name` below.
# Key meanings are defined by the consuming training script, which is not
# part of this file; notes marked "presumably" are assumptions to confirm.

# --- Run identity and checkpointing ---
algorithm: supervised
save_dir: ./saved_models/usb_nlp
save_name: supervised_ag_news_200_0
resume: true
# Points inside <save_dir>/<save_name>/, i.e. this run's own checkpoint.
load_path: ./saved_models/usb_nlp/supervised_ag_news_200_0/latest_model.pth
overwrite: true
use_tensorboard: true

# --- Schedule ---
epoch: 100
num_train_iter: 102400
# 5120 / 102400 = 5% of num_train_iter.
num_warmup_iter: 5120
num_log_iter: 256
# 102400 / 2048 = 50 evaluation points over the run (presumably).
num_eval_iter: 2048

# --- Data budget and batching ---
num_labels: 200
batch_size: 8
eval_batch_size: 8
uratio: 1
use_cat: false
# NOTE(review): 0.0 presumably disables EMA; confirm in the trainer.
ema_m: 0.0

# --- Optimisation ---
optim: AdamW
# Written with an explicit decimal point: a bare `5e-05` is loaded as a
# *string* by YAML 1.1 resolvers (e.g. PyYAML) and as a float only by
# YAML 1.2 loaders. `5.0e-05` is the same float under both.
lr: 5.0e-05
momentum: 0.9
weight_decay: 0.0005
layer_decay: 0.65
amp: false
# NOTE(review): 0.0 presumably means "no gradient clipping"; confirm.
clip: 0.0

# --- Model ---
net: bert_base_uncased
net_from_name: false

# --- Dataset ---
data_dir: ./data
dataset: ag_news
train_sampler: RandomSampler
num_classes: 4
num_workers: 4
max_length: 512

# --- Reproducibility and distributed setup ---
seed: 0
world_size: 1
rank: 0
multiprocessing_distributed: false
dist_url: tcp://127.0.0.1:10032
dist_backend: nccl
# NOTE(review): `None` is not a YAML null; it loads as the string "None".
# Left unchanged because the consumer presumably checks for that string.
# Switch to `null` only after confirming the loader side.
gpu: None
