Traceback (most recent call last):
File "/root/Llama2-Chinese/train/sft/finetune_clm_lora.py", line 691, in <module>
main()
File "/root/Llama2-Chinese/train/sft/finetune_clm_lora.py", line 281, in main
model_args, data_args, training_args = parser.parse_args_into_dataclasses()
File "/usr/local/lib/python3.10/site-packages/transformers/hf_argparser.py", line 338, in parse_args_into_dataclasses
obj = dtype(**inputs)
File "<string>", line 112, in __init__
File "/usr/local/lib/python3.10/site-packages/transformers/training_args.py", line 1607, in __post_init__
self.hf_deepspeed_config = HfTrainerDeepSpeedConfig(self.deepspeed)
File "/usr/local/lib/python3.10/site-packages/transformers/deepspeed.py", line 76, in __init__
super().__init__(config_file_or_dict)
File "/usr/local/lib/python3.10/site-packages/transformers/deepspeed.py", line 66, in __init__
super().__init__(config_file_or_dict)
File "/usr/local/lib/python3.10/site-packages/accelerate/utils/deepspeed.py", line 55, in __init__
raise ValueError(
ValueError: Expected a string path to an existing deepspeed config, or a dictionary, or a base64 encoded string. Received: ds_config_zero2.json
Traceback (most recent call last):
File "/root/Llama2-Chinese/train/sft/finetune_clm_lora.py", line 691, in <module>
main()
File "/root/Llama2-Chinese/train/sft/finetune_clm_lora.py", line 281, in main
model_args, data_args, training_args = parser.parse_args_into_dataclasses()
File "/usr/local/lib/python3.10/site-packages/transformers/hf_argparser.py", line 338, in parse_args_into_dataclasses
obj = dtype(**inputs)
File "<string>", line 112, in __init__
File "/usr/local/lib/python3.10/site-packages/transformers/training_args.py", line 1607, in __post_init__
self.hf_deepspeed_config = HfTrainerDeepSpeedConfig(self.deepspeed)
File "/usr/local/lib/python3.10/site-packages/transformers/deepspeed.py", line 76, in __init__
super().__init__(config_file_or_dict)
File "/usr/local/lib/python3.10/site-packages/transformers/deepspeed.py", line 66, in __init__
super().__init__(config_file_or_dict)
File "/usr/local/lib/python3.10/site-packages/accelerate/utils/deepspeed.py", line 55, in __init__
raise ValueError(
ValueError: Expected a string path to an existing deepspeed config, or a dictionary, or a base64 encoded string. Received: ds_config_zero2.json