diff options
| author | Zitian Gao <zitian.gao@outlook.com> | 2025-05-30 17:57:24 +0800 |
|---|---|---|
| committer | GitHub <noreply@github.com> | 2025-05-30 17:57:24 +0800 |
| commit | ac6cda0b04f9b84935a2480740b1ea2b84cf1eaa (patch) | |
| tree | 97fb0424cf80e09e431fddf0bb87c37ea176a37d | |
| parent | cd24bc8775320ee306583f3246977503516a7da9 (diff) | |
update args
| -rw-r--r-- | train.py | 8 |
1 files changed, 3 insertions, 5 deletions
@@ -33,14 +33,12 @@ def parse_args(): parser.add_argument('--learning_rate', type=float, default=2e-5, help='Learning rate') parser.add_argument('--log_steps', type=int, default=1, help='Logging step interval') parser.add_argument('--save_steps', type=int, default=1, help='Checkpoint saving step interval') - parser.add_argument('--max_steps', type=int, default=1000, help='Maximum training steps') + parser.add_argument('--max_steps', type=int, default=50, help='Maximum training steps') parser.add_argument('--sample_temp', type=float, default=0.5, help='Generation temperature parameter') parser.add_argument('--run_name', type=str, default=None, help='Experiment run name') - parser.add_argument('--wandb_project', type=str, default='entropy-maximization-ft', help='W&B project name') + parser.add_argument('--wandb_project', type=str, default='one-shot-em', help='W&B project name') parser.add_argument('--wandb_name', type=str, default=None, help='W&B run name') - parser.add_argument('--enable_self_distill', action='store_true', help='Enable self-distillation MSE constraint') - parser.add_argument('--self_distill_gamma', type=float, default=0.0, help='Self-distillation MSE weight γ') - parser.add_argument('--seed', type=int, default=42, help='Random seed') + parser.add_argument('--seed', type=int, default=15, help='Random seed') return parser.parse_args() class FTDataset(Dataset): |
