4
4
from datasets .load import load_dataset
5
5
6
6
# load_dataset("oscar")
7
- load_dataset ("cc100" , "en" )
8
- load_dataset ("cc100" , "ja" )
9
- load_dataset ("cerebras/SlimPajama-627B" )
10
- load_dataset ("bigcode/starcoderdata" )
11
- load_dataset ("Open-Orca/OpenOrca" )
12
- load_dataset ("HuggingFaceH4/ultrafeedback_binarized" )
13
- load_dataset ("HuggingFaceH4/ultrachat_200k" )
14
- load_dataset ("cognitivecomputations/dolphin" )
15
- load_dataset ("LDJnr/Capybara" )
16
- load_dataset ("ise-uiuc/Magicoder-Evol-Instruct-110K" )
17
- load_dataset ("allenai/c4" , "en" )
18
- load_dataset ("allenai/c4" , "ja" )
19
- load_dataset ("the_pile" , "all" )
7
+ load_dataset ("cc100" , "en" , trust_remote_code = True )
8
+ load_dataset ("cc100" , "ja" , trust_remote_code = True )
9
+ load_dataset ("cerebras/SlimPajama-627B" , trust_remote_code = True )
10
+ load_dataset ("bigcode/starcoderdata" , trust_remote_code = True )
11
+ load_dataset ("Open-Orca/OpenOrca" , trust_remote_code = True )
12
+ load_dataset ("HuggingFaceH4/ultrafeedback_binarized" , trust_remote_code = True )
13
+ load_dataset ("HuggingFaceH4/ultrachat_200k" , trust_remote_code = True )
14
+ load_dataset ("cognitivecomputations/dolphin" , trust_remote_code = True )
15
+ load_dataset ("LDJnr/Capybara" , trust_remote_code = True )
16
+ load_dataset ("ise-uiuc/Magicoder-Evol-Instruct-110K" , trust_remote_code = True )
17
+ load_dataset ("allenai/c4" , "en" , trust_remote_code = True )
18
+ load_dataset ("allenai/c4" , "ja" , trust_remote_code = True )
19
+ load_dataset ("the_pile" , "all" , trust_remote_code = True )
20
20
21
21
22
22
# 指定されたファイルパスからyamlファイルを読み込む
@@ -43,7 +43,7 @@ def load_yaml(file_path):
43
43
is_lte_10gb_dataset = data ["converted_size" ][- 2 :] == "GB" and float (data ["converted_size" ][:- 2 ]) <= 10
44
44
# MBオーダーか10GB以下のデータセットの場合のみ読み込む
45
45
if is_mb_dataset or is_lte_10gb_dataset :
46
- dataset = load_dataset (data ["id" ])
46
+ dataset = load_dataset (data ["id" ], trust_remote_code = True )
47
47
print (dataset )
48
48
except Exception as e :
49
49
print (f"Error loading dataset: { e } " )
0 commit comments