/collaborativeagents/training/
../
dataset_info.json
ds_z3_config.json
estimate_token_lengths.py
generate_training_data.py
grpo
grpo_verl
llama_factory_config.yaml
llama_factory_lora_config.yaml
llama_factory_qlora_config.yaml
llama_factory_resume_config.yaml
outputs
run_train.sh
sft
sft_config.yaml
train_grpo.py
train_sft.py
train_sft.sbatch
train_sft_lf.sbatch
train_sft_lora.sbatch
train_sft_qlora.sbatch
train_sft_resume.sbatch
training_data
training_script.sh