--n_epochs = 100 --patience = 15 --mbatch_size = 64 --lr = 0.003 --lr_scheduler = null --lr_scheduler_kwargs = {} --param_lr_map = {} --grad_clip = null --grad_clip_kwargs = {} --regularization = 0.0 --l1_reg = 0.0 --l2_reg = 0.0 --optimizer = "Adam" --loss = "L1Loss" --initializer = null --initialization_seed = 0 --batch_shuffle_seed = 0