server : adjust spec tests to generate up to 16 tokens (#19093)
This commit is contained in:
parent
c5c64f72ac
commit
b931f81b5a
|
|
@ -30,6 +30,7 @@ def test_with_and_without_draft():
|
||||||
"prompt": "I believe the meaning of life is",
|
"prompt": "I believe the meaning of life is",
|
||||||
"temperature": 0.0,
|
"temperature": 0.0,
|
||||||
"top_k": 1,
|
"top_k": 1,
|
||||||
|
"n_predict": 16,
|
||||||
})
|
})
|
||||||
assert res.status_code == 200
|
assert res.status_code == 200
|
||||||
content_no_draft = res.body["content"]
|
content_no_draft = res.body["content"]
|
||||||
|
|
@ -42,6 +43,7 @@ def test_with_and_without_draft():
|
||||||
"prompt": "I believe the meaning of life is",
|
"prompt": "I believe the meaning of life is",
|
||||||
"temperature": 0.0,
|
"temperature": 0.0,
|
||||||
"top_k": 1,
|
"top_k": 1,
|
||||||
|
"n_predict": 16,
|
||||||
})
|
})
|
||||||
assert res.status_code == 200
|
assert res.status_code == 200
|
||||||
content_draft = res.body["content"]
|
content_draft = res.body["content"]
|
||||||
|
|
@ -68,6 +70,7 @@ def test_different_draft_min_draft_max():
|
||||||
"prompt": "I believe the meaning of life is",
|
"prompt": "I believe the meaning of life is",
|
||||||
"temperature": 0.0,
|
"temperature": 0.0,
|
||||||
"top_k": 1,
|
"top_k": 1,
|
||||||
|
"n_predict": 16,
|
||||||
})
|
})
|
||||||
assert res.status_code == 200
|
assert res.status_code == 200
|
||||||
if last_content is not None:
|
if last_content is not None:
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue