diff options
Diffstat (limited to 'configs/accelerate')
| -rw-r--r-- | configs/accelerate/1xa5000_bf16.yaml | 16 | ||||
| -rw-r--r-- | configs/accelerate/4xa5000_bf16.yaml | 16 | ||||
| -rw-r--r-- | configs/accelerate/default_config.yaml | 16 |
3 files changed, 45 insertions, 3 deletions
diff --git a/configs/accelerate/1xa5000_bf16.yaml b/configs/accelerate/1xa5000_bf16.yaml new file mode 100644 index 0000000..1470ad5 --- /dev/null +++ b/configs/accelerate/1xa5000_bf16.yaml @@ -0,0 +1,16 @@ +compute_environment: LOCAL_MACHINE +distributed_type: NO +downcast_bf16: 'no' +dynamo_backend: 'NO' +fsdp_config: {} +gpu_ids: 0 +machine_rank: 0 +main_process_ip: null +main_process_port: 29500 +main_training_function: main +mixed_precision: bf16 +num_machines: 1 +num_processes: 1 +rdzv_backend: static +same_network: true +use_cpu: false diff --git a/configs/accelerate/4xa5000_bf16.yaml b/configs/accelerate/4xa5000_bf16.yaml new file mode 100644 index 0000000..a874c61 --- /dev/null +++ b/configs/accelerate/4xa5000_bf16.yaml @@ -0,0 +1,16 @@ +compute_environment: LOCAL_MACHINE +distributed_type: MULTI_GPU +downcast_bf16: 'no' +dynamo_backend: 'NO' +fsdp_config: {} +gpu_ids: 0,1,2,3 +machine_rank: 0 +main_process_ip: null +main_process_port: 29500 +main_training_function: main +mixed_precision: bf16 +num_machines: 1 +num_processes: 4 +rdzv_backend: static +same_network: true +use_cpu: false diff --git a/configs/accelerate/default_config.yaml b/configs/accelerate/default_config.yaml index f290654..1470ad5 100644 --- a/configs/accelerate/default_config.yaml +++ b/configs/accelerate/default_config.yaml @@ -1,6 +1,16 @@ -# Accelerate default config placeholder (customize as needed) compute_environment: LOCAL_MACHINE -distributed_type: MULTI_GPU -mixed_precision: no +distributed_type: NO +downcast_bf16: 'no' +dynamo_backend: 'NO' +fsdp_config: {} +gpu_ids: 0 +machine_rank: 0 +main_process_ip: null +main_process_port: 29500 +main_training_function: main +mixed_precision: bf16 +num_machines: 1 num_processes: 1 +rdzv_backend: static +same_network: true use_cpu: false |
