Skip to content

Commit 853311a

Browse files
committed
Add DeepSeek-R1 distilled Llama models (8B and 70B) as options
1 parent 1874be7 commit 853311a

File tree

2 files changed

+4
-0
lines changed

2 files changed

+4
-0
lines changed

jetstream_pt/fetch_models.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -93,6 +93,8 @@ class ModelInfo:
9393
"google/gemma-7b-it": _gemma_7b,
9494
"mistralai/Mixtral-8x7B-v0.1": _mixtral_87,
9595
"mistralai/Mixtral-8x7B-Instruct-v0.1": _mixtral_87,
96+
"deepseek-ai/DeepSeek-R1-Distill-Llama-8B": _llama3_1_8b,
97+
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B": _llama3_3_70b,
9698
}
9799

98100

jetstream_pt/third_party/llama/model_exportable.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -344,6 +344,8 @@ def from_hf_model_id(cls, model_id, env, is_tiny=False):
344344
"meta-llama/Llama-3.2-1B-Instruct": "llama-3.2-1b",
345345
"meta-llama/Llama-3.3-70B": "llama-3.3-70b",
346346
"meta-llama/Llama-3.3-70B-Instruct": "llama-3.3-70b",
347+
"deepseek-ai/DeepSeek-R1-Distill-Llama-8B": "llama-3.1-8b",
348+
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B": "llama-3.3-70b",
347349
}.get(model_id)
348350
assert name
349351
args = model_args.get_model_args(

0 commit comments

Comments
 (0)