server : do not return error out of context (with ctx shift disabled) (#13577)
This commit is contained in:
parent
aea9f8b4e7
commit
6aa892ec2a
2 changed files with 26 additions and 0 deletions
|
@ -65,3 +65,21 @@ def test_ctx_shift_disabled_long_prompt():
|
|||
assert res.status_code != 200
|
||||
assert "error" in res.body
|
||||
assert "exceeds the available context size" in res.body["error"]["message"]
|
||||
|
||||
def test_ctx_shift_disabled_stream():
|
||||
global server
|
||||
server.disable_ctx_shift = True
|
||||
server.start()
|
||||
res = server.make_stream_request("POST", "/v1/completions", data={
|
||||
"n_predict": 256,
|
||||
"prompt": "Once",
|
||||
"stream": True,
|
||||
})
|
||||
content = ""
|
||||
for data in res:
|
||||
choice = data["choices"][0]
|
||||
if choice["finish_reason"] == "length":
|
||||
assert len(content) > 0
|
||||
else:
|
||||
assert choice["finish_reason"] is None
|
||||
content += choice["text"]
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue