From dc801c07cf38b0c495686463e6ca6f871a64440e Mon Sep 17 00:00:00 2001 From: YurenHao0426 Date: Tue, 27 Jan 2026 09:57:37 -0600 Subject: Add collaborativeagents module and update gitignore - Add collaborativeagents subproject with adapters, agents, and evaluation modules - Update .gitignore to exclude large binary files (.whl, .tar), wandb logs, and results Co-Authored-By: Claude Opus 4.5 --- .../outputs/sft_reflection_lf/trainer_log.jsonl | 20 ++++++++++++++++++++ 1 file changed, 20 insertions(+) create mode 100644 collaborativeagents/training/outputs/sft_reflection_lf/trainer_log.jsonl (limited to 'collaborativeagents/training/outputs/sft_reflection_lf') diff --git a/collaborativeagents/training/outputs/sft_reflection_lf/trainer_log.jsonl b/collaborativeagents/training/outputs/sft_reflection_lf/trainer_log.jsonl new file mode 100644 index 0000000..d53e55c --- /dev/null +++ b/collaborativeagents/training/outputs/sft_reflection_lf/trainer_log.jsonl @@ -0,0 +1,20 @@ +{"current_steps": 10, "total_steps": 260, "loss": 2.0947, "lr": 3.461538461538461e-07, "epoch": 0.15579357351509251, "percentage": 3.85, "elapsed_time": "0:01:32", "remaining_time": "0:38:20"} +{"current_steps": 20, "total_steps": 260, "loss": 1.4871, "lr": 7.307692307692307e-07, "epoch": 0.31158714703018503, "percentage": 7.69, "elapsed_time": "0:02:56", "remaining_time": "0:35:23"} +{"current_steps": 30, "total_steps": 260, "loss": 0.4596, "lr": 9.995944990857847e-07, "epoch": 0.4673807205452775, "percentage": 11.54, "elapsed_time": "0:04:23", "remaining_time": "0:33:39"} +{"current_steps": 40, "total_steps": 260, "loss": 0.0813, "lr": 9.92403876506104e-07, "epoch": 0.6231742940603701, "percentage": 15.38, "elapsed_time": "0:05:49", "remaining_time": "0:32:01"} +{"current_steps": 50, "total_steps": 260, "loss": 0.0687, "lr": 9.763511454798266e-07, "epoch": 0.7789678675754625, "percentage": 19.23, "elapsed_time": "0:07:12", "remaining_time": "0:30:18"} +{"current_steps": 60, "total_steps": 260, "loss": 0.058, "lr": 9.517252173051911e-07, "epoch": 0.934761441090555, "percentage": 23.08, "elapsed_time": "0:08:38", "remaining_time": "0:28:49"} +{"current_steps": 70, "total_steps": 260, "loss": 0.063, "lr": 9.189693006092905e-07, "epoch": 1.0778967867575462, "percentage": 26.92, "elapsed_time": "0:09:56", "remaining_time": "0:26:57"} +{"current_steps": 80, "total_steps": 260, "loss": 0.0525, "lr": 8.786729246380899e-07, "epoch": 1.2336903602726388, "percentage": 30.77, "elapsed_time": "0:11:21", "remaining_time": "0:25:33"} +{"current_steps": 90, "total_steps": 260, "loss": 0.0485, "lr": 8.315613291203976e-07, "epoch": 1.3894839337877314, "percentage": 34.62, "elapsed_time": "0:12:43", "remaining_time": "0:24:03"} +{"current_steps": 100, "total_steps": 260, "loss": 0.047, "lr": 7.784824116632196e-07, "epoch": 1.5452775073028238, "percentage": 38.46, "elapsed_time": "0:14:05", "remaining_time": "0:22:33"} +{"current_steps": 110, "total_steps": 260, "loss": 0.0476, "lr": 7.203914675945928e-07, "epoch": 1.7010710808179161, "percentage": 42.31, "elapsed_time": "0:16:16", "remaining_time": "0:22:11"} +{"current_steps": 120, "total_steps": 260, "loss": 0.0448, "lr": 6.583339969007363e-07, "epoch": 1.8568646543330087, "percentage": 46.15, "elapsed_time": "0:17:40", "remaining_time": "0:20:37"} +{"current_steps": 130, "total_steps": 260, "loss": 0.0442, "lr": 5.934268876921025e-07, "epoch": 2.0, "percentage": 50.0, "elapsed_time": "0:18:59", "remaining_time": "0:18:59"} +{"current_steps": 140, "total_steps": 260, "loss": 0.0409, "lr": 5.268383148515607e-07, "epoch": 2.1557935735150924, "percentage": 53.85, "elapsed_time": "0:20:24", "remaining_time": "0:17:29"} +{"current_steps": 150, "total_steps": 260, "loss": 0.0383, "lr": 4.5976671564163703e-07, "epoch": 2.311587147030185, "percentage": 57.69, "elapsed_time": "0:21:48", "remaining_time": "0:15:59"} +{"current_steps": 160, "total_steps": 260, "loss": 0.0397, "lr": 3.9341922066029205e-07, "epoch": 2.4673807205452776, "percentage": 61.54, "elapsed_time": "0:23:12", "remaining_time": "0:14:30"} +{"current_steps": 170, "total_steps": 260, "loss": 0.0398, "lr": 3.2898992833716563e-07, "epoch": 2.62317429406037, "percentage": 65.38, "elapsed_time": "0:24:37", "remaining_time": "0:13:02"} +{"current_steps": 180, "total_steps": 260, "loss": 0.0389, "lr": 2.676384139781157e-07, "epoch": 2.7789678675754628, "percentage": 69.23, "elapsed_time": "0:26:04", "remaining_time": "0:11:35"} +{"current_steps": 190, "total_steps": 260, "loss": 0.0391, "lr": 2.1046886014456054e-07, "epoch": 2.934761441090555, "percentage": 73.08, "elapsed_time": "0:27:29", "remaining_time": "0:10:07"} +{"current_steps": 200, "total_steps": 260, "loss": 0.0366, "lr": 1.5851018397157917e-07, "epoch": 3.077896786757546, "percentage": 76.92, "elapsed_time": "0:28:45", "remaining_time": "0:08:37"} -- cgit v1.2.3