-
-
Notifications
You must be signed in to change notification settings - Fork 5.3k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
[Bugfix][Frontend] Fix missing `/metrics` endpoint (#6463)
- Loading branch information
1 parent
dbe5588
commit 6366efc
Showing 2 changed files with 70 additions and 5 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,61 @@ | ||
from http import HTTPStatus | ||
|
||
import openai | ||
import pytest | ||
import requests | ||
|
||
from vllm.version import __version__ as VLLM_VERSION | ||
|
||
from ...utils import RemoteOpenAIServer | ||
|
||
MODEL_NAME = "HuggingFaceH4/zephyr-7b-beta" | ||
|
||
|
||
@pytest.fixture(scope="module")
def server():
    """Yield a ``RemoteOpenAIServer`` for ``MODEL_NAME``, shared module-wide.

    The fixture is module-scoped, so every test in this module that requests
    it receives the same server object. The server is used as a context
    manager and the fixture yields from inside the ``with`` block, so the
    context is exited only after the module's tests are done with it.
    """
    # use half precision for speed and memory savings in CI environment
    launch_args = ["--dtype", "bfloat16"]
    launch_args += ["--max-model-len", "8192"]
    launch_args.append("--enforce-eager")
    launch_args += ["--max-num-seqs", "128"]

    with RemoteOpenAIServer(MODEL_NAME, launch_args) as running_server:
        yield running_server
|
||
|
||
@pytest.fixture(scope="module")
def client(server):
    """Return the async client obtained from the ``server`` fixture.

    Module-scoped, so the same client object is handed to every test in this
    module that requests it.
    """
    async_client = server.get_async_client()
    return async_client
|
||
|
||
@pytest.mark.asyncio
async def test_show_version(client: openai.AsyncOpenAI):
    """Check that ``GET /version`` reports the installed vLLM version.

    Args:
        client: Async OpenAI client from the ``client`` fixture; only its
            ``base_url`` is used here.
    """
    # Drop the last three characters of the client URL (presumably the
    # "v1/" API suffix -- confirm against the client's base_url format) and
    # any surrounding slashes, so the endpoint is addressed from the root.
    base_url = str(client.base_url)[:-3].strip("/")

    # Bound the request: requests applies no timeout by default, so an
    # unresponsive server would otherwise hang the test run indefinitely.
    response = requests.get(base_url + "/version", timeout=30)
    response.raise_for_status()

    assert response.json() == {"version": VLLM_VERSION}
|
||
|
||
@pytest.mark.asyncio
async def test_check_health(client: openai.AsyncOpenAI):
    """Check that ``GET /health`` answers with HTTP 200.

    Args:
        client: Async OpenAI client from the ``client`` fixture; only its
            ``base_url`` is used here.
    """
    # Drop the last three characters of the client URL (presumably the
    # "v1/" API suffix -- confirm against the client's base_url format) and
    # any surrounding slashes, so the endpoint is addressed from the root.
    base_url = str(client.base_url)[:-3].strip("/")

    # Bound the request: requests applies no timeout by default, so an
    # unresponsive server would otherwise hang the test run indefinitely.
    response = requests.get(base_url + "/health", timeout=30)

    assert response.status_code == HTTPStatus.OK
|
||
|
||
@pytest.mark.asyncio
async def test_log_metrics(client: openai.AsyncOpenAI):
    """Check that ``GET /metrics`` answers with HTTP 200.

    Args:
        client: Async OpenAI client from the ``client`` fixture; only its
            ``base_url`` is used here.
    """
    # Drop the last three characters of the client URL (presumably the
    # "v1/" API suffix -- confirm against the client's base_url format) and
    # any surrounding slashes, so the endpoint is addressed from the root.
    base_url = str(client.base_url)[:-3].strip("/")

    # Bound the request: requests applies no timeout by default, so an
    # unresponsive server would otherwise hang the test run indefinitely.
    response = requests.get(base_url + "/metrics", timeout=30)

    assert response.status_code == HTTPStatus.OK
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters