Save some VRAM for single-GPU training

main
BlinkDL 3 years ago
parent 69e7cfbf39
commit c1f7a72724

@ -217,7 +217,18 @@ if __name__ == '__main__':
"gradient_clipping": 1.0, "gradient_clipping": 1.0,
"gradient_accumulation_steps": 1, "gradient_accumulation_steps": 1,
} }
if NUM_GPUS == 1:
    # Single-GPU run: add a 'zero_optimization' section to the DeepSpeed
    # config. Stage 1 is selected because it saves some VRAM; every
    # gradient-layout / communication switch below is turned off.
    DEEPSPEED_CFG["zero_optimization"] = dict(
        stage=1,  # saves some VRAM
        contiguous_gradients=False,
        overlap_comm=False,
        allgather_partitions=False,
        reduce_scatter=False,
        allgather_bucket_size=200_000_000,
        reduce_bucket_size=200_000_000,
        sub_group_size=1_000_000_000_000,
    )
if os.environ['RWKV_FLOAT_MODE'] == 'fp16': if os.environ['RWKV_FLOAT_MODE'] == 'fp16':
DEEPSPEED_CFG["fp16"] = { DEEPSPEED_CFG["fp16"] = {
"fp16": True, "fp16": True,

Loading…
Cancel
Save