{ "train_config": { "model_name": "microsoft/graphcodebert-base", "num_epochs": 3, "batch_size": 256, "learning_rate": 2e-05, "max_length": 512, "num_labels": 2, "loss_type": "ce", "focal_alpha": 1.0, "focal_gamma": 2.0, "r_drop_alpha": 6.0, "infonce_temperature": 0.07, "infonce_weight": 0.5, "label_smoothing": 0, "adversarial_epsilon": 0, "use_swa": false, "swa_start_epoch": 0, "swa_lr": 1e-05, "data_augmentation": false, "aug_rename_prob": 0.0, "aug_format_prob": 0.0, "freeze_base": true, "seed": 42, "use_wandb": true, "mixup_alpha": 0.0, "low_pass_keep_ratio": 0.5, "freq_consistency_weight": 0.0 }, "training_arguments": { "output_dir": "output_checkpoints/graphcodebert-vanilla/", "num_train_epochs": 3, "per_device_train_batch_size": 256, "per_device_eval_batch_size": 512, "learning_rate": 2e-05, "warmup_steps": 612, "weight_decay": 0.1, "logging_steps": 5, "eval_steps": 50, "save_steps": 100, "metric_for_best_model": "macro_f1", "greater_is_better": true, "save_total_limit": 5, "fp16": true, "seed": 42 }, "training_state": { "global_step": 300, "epoch": 0.29354207436399216, "best_metric": 0.5962545254252696, "best_model_checkpoint": "output_checkpoints/graphcodebert-vanilla/checkpoint-200" } }