-
Notifications
You must be signed in to change notification settings - Fork 85
/
example_instchat_ft_3bv1.1_low_budget.sh
executable file
·53 lines (52 loc) · 1.92 KB
/
example_instchat_ft_3bv1.1_low_budget.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
#!/bin/bash
EXP_NAME="example_instchat_ft_3bv1.1_low_budget"
python3 -m instruction_fine_tuning.fine_tuning \
--run_name "$EXP_NAME" \
--output_dir "$EXP_NAME"/ \
--model_path "syzymon/long_llama_3b_v1_1" \
--torch_dtype float32 \
--data_type "instructions,chat" \
--data_path "Open-Orca/OpenOrca,zetavg/ShareGPT-Processed" \
--data_revision "f0823c7ffc48c9d33a42f16cf0b885fed4a7d0a1,15968d6dfa02529988da12e382af3ab7c857ebcd" \
--data_filter "<,>lang<M>^en$<;>conversations.<int>*^.value<M>(?i)^((?!openai).)*$<;>conversations.<int>*^.value<M>^((?!DAN).)*$<;>conversations.<int>0.value<LENLT>8000" \
--dataset_split "train,train" \
--data_proportions 0.99 0.01 \
--prompt_field "system_prompt" \
--post_prompt_text "
" \
--question_field "question" \
--post_question_text "
" \
--response_field "response" \
--chat_conversations_field "conversations" \
--chat_data_field "markdown" \
--chat_source_name_field "from" \
--chat_model_source_name "gpt" \
--chat_initial_prompt "A chat between a user (denoted as USER:) and an artificial intelligence assistant (denoted as ASSISTANT:). The assistant gives helpful, detailed, and polite answers to the user's questions.
" \
--chat_model_response_prefix "
ASSISTANT: " \
--chat_human_response_prefix "
USER: " \
--last_context_length 1024 \
--max_input_length 2048 \
--max_output_length 2048 \
--max_total_length 2048 \
--always_pad True \
--random_pad True \
--max_steps 4000 \
--per_device_train_batch_size 4 \
--gradient_accumulation_steps 16 \
--learning_rate 1e-5 \
--weight_decay 0. \
--warmup_steps 200 \
--lr_scheduler_type "cosine" \
--evaluation_strategy "no" \
--save_strategy "steps" \
--save_total_limit 3 \
--save_steps 500 \
--logging_strategy "steps" \
--logging_steps 25 \
--gradient_checkpointing True \
--tf32 True \
--bf16 True