Skip to content

Commit dc16faf

Browse files
committed
Update src/dataset/load.py
1 parent acf93fa commit dc16faf

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

src/dataset/load.py

+5 -5
Original file line number | Diff line number | Diff line change
@@ -21,9 +21,9 @@
21 21

22 22

23 23
# GBオーダー
24-
load_dataset("cognitivecomputations/dolphin", "flan1m-alpaca-uncensored", trust_remote_code=True)
25-
load_dataset("cognitivecomputations/dolphin", "flan5m-alpaca-uncensored", trust_remote_code=True)
26-
load_dataset("Open-Orca/OpenOrca", trust_remote_code=True)
24+
# load_dataset("cognitivecomputations/dolphin", "flan1m-alpaca-uncensored", trust_remote_code=True)
25+
# load_dataset("cognitivecomputations/dolphin", "flan5m-alpaca-uncensored", trust_remote_code=True)
26+
# load_dataset("Open-Orca/OpenOrca", trust_remote_code=True)
27 27

28 28
# デカい
29 29
# load_dataset("cc100", "en", trust_remote_code=True)
@@ -33,9 +33,9 @@
33 33

34 34
# デカすぎる
35 35
# TinyLlamaが使ってる、895 GB
36-
load_dataset("cerebras/SlimPajama-627B", trust_remote_code=True)
36+
# load_dataset("cerebras/SlimPajama-627B", trust_remote_code=True)
37 37
# TinyLlamaが使ってる、311 GB
38-
load_dataset("bigcode/starcoderdata", trust_remote_code=True)
38+
# load_dataset("bigcode/starcoderdata", trust_remote_code=True)
39 39
# 886 GB
40 40
# load_dataset("EleutherAI/pile", "all", trust_remote_code=True)
41 41
# load_dataset("oscar")

0 commit comments

Comments
 (0)