---
# deepspeed_zero3.yaml
# Launcher configuration: DeepSpeed ZeRO stage 3 with optimizer and parameter
# offload to CPU, for 4 processes on a single local machine.

# Where and how the job is launched.
compute_environment: LOCAL_MACHINE
distributed_type: DEEPSPEED
num_processes: 4
machine_rank: 0
num_machines: 1
gpu_ids: all
mixed_precision: fp16

# DeepSpeed-specific settings; every key below must stay nested under
# `deepspeed_config`, otherwise it is read as an unrelated top-level option.
deepspeed_config:
  gradient_accumulation_steps: 4
  gradient_clipping: 1.0
  offload_optimizer_device: cpu  # offload optimizer state to CPU
  offload_param_device: cpu  # offload parameters to CPU
  zero3_init_flag: true
  zero_stage: 3  # ZeRO-3