server : add tests

2025-02-04 15:43:53 +01:00 · 2024-12-04 13:11:26 +02:00 · 2024-12-04 13:11:26 +02:00 · 81611bef72
commit 81611bef72
parent b436edaad9
1 changed files with 31 additions and 0 deletions
--- a/examples/server/tests/unit/test_speculative.py
+++ b/examples/server/tests/unit/test_speculative.py
@ -82,6 +82,37 @@ def test_different_draft_min_draft_max():
        last_content = res.body["content"]
 def test_slot_ctx_not_exceeded():
    """Request a completion from a server started with ``n_ctx = 64``.

    The prompt is ``"Hello "`` repeated 56 times. The test passes when the
    server answers with HTTP 200 and a non-empty ``content`` field.
    """
    global server
    server.n_ctx = 64
    server.start()

    # Greedy sampling settings plus a speculative p_min of 0.0.
    # NOTE(review): presumably p_min = 0.0 makes the server accept every
    # drafted token regardless of probability -- confirm against server docs.
    payload = {
        "prompt": "Hello " * 56,
        "temperature": 0.0,
        "top_k": 1,
        "speculative.p_min": 0.0,
    }
    response = server.make_request("POST", "/completion", data=payload)

    assert response.status_code == 200
    generated = response.body["content"]
    assert len(generated) > 0
 def test_with_ctx_shift():
    """Request 64 predicted tokens from a server started with ``n_ctx = 64``.

    The prompt is ``"Hello "`` repeated 56 times and ``n_predict`` is 64.
    The test passes when the server answers with HTTP 200, returns non-empty
    ``content``, reports ``tokens_predicted == 64`` and flags the result as
    ``truncated``.
    """
    global server
    server.n_ctx = 64
    server.start()

    # NOTE(review): prompt plus n_predict presumably exceeds the 64-token
    # context, which is what should force the context shift -- confirm.
    payload = {
        "prompt": "Hello " * 56,
        "temperature": 0.0,
        "top_k": 1,
        "n_predict": 64,
        "speculative.p_min": 0.0,
    }
    response = server.make_request("POST", "/completion", data=payload)

    assert response.status_code == 200
    body = response.body
    assert len(body["content"]) > 0
    assert body["tokens_predicted"] == 64
    assert body["truncated"] == True
@pytest.mark.parametrize("n_slots,n_requests", [
    (1, 2),
    (2, 2),