We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 69112cb commit 2010891 (Copy full SHA for 2010891)
recipes/A5000_24GB_x8/Mistral-7B-v0.1/i18n-ja-wikipedia-sakura.yaml
@@ -0,0 +1,18 @@
1
+target_task: tasks/i18n/ja.md
2
+base_model_id: yuiseki/Mistral-7B-v0.1-ja-wikipedia-v0.1
3
+model_name: Mistral-7B-v0.1-ja-wikipedia-sakura-v0.1
4
+output_base_dir: output
5
+dataset_id: saldra/sakura_japanese_dataset
6
+dataset_context_field_name: input
7
+dataset_input_field_name: instruction
8
+dataset_output_field_name: output
9
+dataset_filter_field_value: 0
10
+dataset_train_split_seed: 42
11
+dataset_train_split_test_size: 0.2
12
+lora_r: 8
13
+lora_alpha: 16
14
+lora_dropout: 0.05
15
+train_claim_gpu_num: 2
16
+train_per_device_train_batch_size: 2
17
+train_gradient_accumulation_steps: 16
18
+train_num_train_epochs: 4
0 commit comments