First, install PyTorch 2.0 by following the instructions at https://pytorch.org/get-started/locally/
Then install the remaining dependencies:
pip install -r requirements.txt
bash run.sh
bash run-reward.sh
bash run-rlhf.sh
Refer to sft-data-construction.
Refer to rlhf-ppo.
First, install PyTorch 2.0 by following the instructions at https://pytorch.org/get-started/locally/
Then install the remaining dependencies:
pip install -r requirements.txt
bash run.sh
bash run-reward.sh
bash run-rlhf.sh
Refer to sft-data-construction.
Refer to rlhf-ppo.