|
4 | 4 | from datasets.load import load_dataset
|
5 | 5 |
|
6 | 6 | # Used by TinyLlama
|
7 |
| -load_dataset("HuggingFaceH4/ultrafeedback_binarized", trust_remote_code=True) |
| 7 | +# load_dataset("HuggingFaceH4/ultrafeedback_binarized", trust_remote_code=True) |
8 | 8 | # Used by TinyLlama
|
9 |
| -load_dataset("HuggingFaceH4/ultrachat_200k", trust_remote_code=True) |
| 9 | +# load_dataset("HuggingFaceH4/ultrachat_200k", trust_remote_code=True) |
10 | 10 | # Used by dolphin
|
11 |
| -load_dataset("ise-uiuc/Magicoder-Evol-Instruct-110K", trust_remote_code=True) |
| 11 | +# load_dataset("ise-uiuc/Magicoder-Evol-Instruct-110K", trust_remote_code=True) |
12 | 12 | # Multi-turn dialogue
|
13 |
| -load_dataset("LDJnr/Capybara", trust_remote_code=True) |
| 13 | +# load_dataset("LDJnr/Capybara", trust_remote_code=True) |
14 | 14 |
|
15 | 15 | # Instruction
|
16 |
| -load_dataset("OpenAssistant/oasst1", trust_remote_code=True) |
17 |
| -load_dataset("OpenAssistant/oasst2", trust_remote_code=True) |
| 16 | +# load_dataset("OpenAssistant/oasst1", trust_remote_code=True) |
| 17 | +# load_dataset("OpenAssistant/oasst2", trust_remote_code=True) |
18 | 18 | # RLHF
|
19 |
| -load_dataset("Anthropic/hh-rlhf", trust_remote_code=True) |
20 |
| -load_dataset("shi3z/anthropic_hh_rlhf_japanese", trust_remote_code=True) |
| 19 | +# load_dataset("Anthropic/hh-rlhf", trust_remote_code=True) |
| 20 | +# load_dataset("shi3z/anthropic_hh_rlhf_japanese", trust_remote_code=True) |
21 | 21 |
|
22 | 22 |
|
23 | 23 | # Datasets on the order of gigabytes
|
24 |
| -load_dataset("cognitivecomputations/dolphin", "all", trust_remote_code=True) |
| 24 | +load_dataset("cognitivecomputations/dolphin", "flan1m-alpaca-uncensored", trust_remote_code=True) |
| 25 | +load_dataset("cognitivecomputations/dolphin", "flan5m-alpaca-uncensored", trust_remote_code=True) |
25 | 26 | load_dataset("Open-Orca/OpenOrca", trust_remote_code=True)
|
26 | 27 |
|
27 | 28 | # Very large datasets
|
|
0 commit comments