- Set the MODEL environment variable to the path of the Llama 2 70B model in Hugging Face (HF) format.
export MODEL=<path>
- Build the Docker image and run the container
./docker_build.sh && ./docker_run.sh
- Prepare the dataset
python3 prepare_dataset.py
- Convert the model to NeMo format (`.nemo`)
python NeMo/scripts/nlp_language_modeling/convert_hf_llama_to_nemo.py --in-file=/model/llama2-70b-hf/ --out-file=./model/llama2-70b.nemo
- Run training
./run.sh