First, install PyTorch 2.0 by following the instructions at https://pytorch.org/get-started/locally/ and then install the remaining dependencies with `pip install -r requirements.txt`.
https://pytorch.org/get-started/locally/
pip install -r requirements.txt
bash run.sh
bash run-reward.sh
bash run-rlhf.sh
Refer to sft-data-construction
sft-data-construction
Refer to rlhf-ppo
rlhf-ppo