File tree: 2 files changed, +4 -1 lines changed
tensorrt_llm/_torch/speculative
tests/unittest/llmapi/apps
2 files changed, +4 -1 lines changed
Original file line number | Diff line number | Diff line change
@@ -689,7 +689,7 @@ def sample_and_accept_draft_tokens(
689
689
num_accepted_tokens = torch .ones (batch_size ,
690
690
dtype = torch .int ,
691
691
device = logits .device )
692
-
692
+
693
693
if self .spec_config .use_relaxed_acceptance_for_thinking :
694
694
mtp_relaxed_delta_pool = spec_metadata .mtp_hidden_states_manager .mtp_relaxed_delta_pool
695
695
Original file line number | Diff line number | Diff line change
@@ -34,6 +34,9 @@ def test_health(client):
34
34
response = client .get ("/health" )
35
35
assert response .status_code == 200
36
36
37
+ def test_health_generate (client ):
38
+ response = client .get ("/health_generate" )
39
+ assert response .status_code == 200
37
40
38
41
def test_generate (client ):
39
42
response = client .post ("/generate" , json = {"prompt" : "A B C" })
You can’t perform that action at this time.
0 commit comments