@ -63,6 +63,11 @@ os.environ['RWKV_NUM_GPUS'] = '1' # num of GPUs to use
# Float mode: 'bf16' (stable), 'fp16' (will overflow after training a large
# model for very long; can be solved in the future), or 'fp32'.
# Set exactly once -- the assignment was previously duplicated verbatim.
os.environ['RWKV_FLOAT_MODE'] = 'bf16'

# Use DeepSpeed? '0' = False, '1' = True.
os.environ['RWKV_DEEPSPEED'] = '1'
ifint(os.environ['RWKV_NUM_GPUS'])==1andos.environ['RWKV_FLOAT_MODE']=='fp32':# the only case where DeepSpeed is worse