---
# Flat mapping of three numeric settings, one key per line.
# NOTE(review): the key names suggest training hyperparameters and the
# long decimals look machine-generated (e.g. by a tuning run) - confirm
# with whatever consumes this file before editing values by hand.
learning_rate: 0.0005480015685663855
# Scientific notation with a decimal point and a signed exponent, so
# YAML 1.1 and 1.2 loaders should both resolve it as a float.
weight_decay: 1.544480236681167e-05
batch_size: 2