File tree 1 file changed +6
-6
lines changed
1 file changed +6
-6
lines changed Original file line number Diff line number Diff line change 26
26
load_dataset ("Open-Orca/OpenOrca" , trust_remote_code = True )
27
27
28
28
# Large
29
- load_dataset ("cc100" , "en" , trust_remote_code = True )
30
- load_dataset ("cc100" , "ja" , trust_remote_code = True )
31
- load_dataset ("allenai/c4" , "en" , trust_remote_code = True )
32
- load_dataset ("allenai/c4" , "ja" , trust_remote_code = True )
29
+ # load_dataset("cc100", "en", trust_remote_code=True)
30
+ # load_dataset("cc100", "ja", trust_remote_code=True)
31
+ # load_dataset("allenai/c4", "en", trust_remote_code=True)
32
+ # load_dataset("allenai/c4", "ja", trust_remote_code=True)
33
33
34
34
# Too large
35
35
# Used by TinyLlama, 895 GB
36
- # load_dataset("cerebras/SlimPajama-627B", trust_remote_code=True)
36
+ load_dataset ("cerebras/SlimPajama-627B" , trust_remote_code = True )
37
37
# Used by TinyLlama, 311 GB
38
- # load_dataset("bigcode/starcoderdata", trust_remote_code=True)
38
+ load_dataset ("bigcode/starcoderdata" , trust_remote_code = True )
39
39
# 886 GB
40
40
# load_dataset("EleutherAI/pile", "all", trust_remote_code=True)
41
41
# load_dataset("oscar")
You can’t perform that action at this time.
0 commit comments