Update README.md
Browse files
README.md
CHANGED
@@ -202,7 +202,7 @@ The evaluation code for this can be found [here](https://drive.google.com/file/d
|
|
202 |
|
203 |
```yaml
|
204 |
### model
|
205 |
-
model_name_or_path: deepseek-ai/DeepSeek-R1-Distill-Qwen-
|
206 |
|
207 |
### method
|
208 |
stage: sft
|
@@ -219,7 +219,7 @@ preprocessing_num_workers: 16
|
|
219 |
packing: true
|
220 |
|
221 |
### output
|
222 |
-
output_dir: /root/train_outputs/DeepSeek-R1-Distill-Qwen-
|
223 |
logging_steps: 1
|
224 |
save_steps: 0.99999
|
225 |
plot_loss: true
|
@@ -250,11 +250,10 @@ echo '{
|
|
250 |
}
|
251 |
}' > /root/LLaMA-Factory/data/dataset_info.json
|
252 |
|
253 |
-
#
|
254 |
-
cd /root/LLaMA-Factory && llamafactory-cli train /root/
|
255 |
-
rm -r /root/train_outputs/DeepSeek-R1-Distill-Qwen-
|
256 |
-
huggingface-cli upload lightblue/DeepSeek-R1-Distill-Qwen-
|
257 |
-
|
258 |
```
|
259 |
|
260 |
# License
|
|
|
202 |
|
203 |
```yaml
|
204 |
### model
|
205 |
+
model_name_or_path: deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
|
206 |
|
207 |
### method
|
208 |
stage: sft
|
|
|
219 |
packing: true
|
220 |
|
221 |
### output
|
222 |
+
output_dir: /root/train_outputs/DeepSeek-R1-Distill-Qwen-1.5B/reasoning-multilingual-R1-Llama-70B-train
|
223 |
logging_steps: 1
|
224 |
save_steps: 0.99999
|
225 |
plot_loss: true
|
|
|
250 |
}
|
251 |
}' > /root/LLaMA-Factory/data/dataset_info.json
|
252 |
|
253 |
+
# # 1.5B Llama
|
254 |
+
cd /root/LLaMA-Factory && llamafactory-cli train /root/reasoning_multilingual_train_1.5B.yaml
|
255 |
+
rm -r /root/train_outputs/DeepSeek-R1-Distill-Qwen-1.5B/reasoning-multilingual-R1-Llama-70B-train/checkpoint*
|
256 |
+
huggingface-cli upload lightblue/DeepSeek-R1-Distill-Qwen-1.5B-Multilingual /root/train_outputs/DeepSeek-R1-Distill-Qwen-1.5B/reasoning-multilingual-R1-Llama-70B-train
|
|
|
257 |
```
|
258 |
|
259 |
# License
|