| .. |
|
rpc
|
[Frontend] error suppression cleanup (#7786)
|
2024-08-22 21:50:21 +00:00 |
|
__init__.py
|
[CI/Build] [3/3] Reorganize entrypoints tests (#5966)
|
2024-06-30 12:58:49 +08:00 |
|
test_accuracy.py
|
[Bugfix][Frontend] Fix Issues Under High Load With zeromq Frontend (#7394)
|
2024-08-21 13:34:14 -04:00 |
|
test_audio.py
|
[Model] Add UltravoxModel and UltravoxConfig (#7615)
|
2024-08-21 22:49:39 +00:00 |
|
test_basic.py
|
[ Bugfix ] Fix Prometheus Metrics With zeromq Frontend (#7279)
|
2024-08-18 20:19:48 +00:00 |
|
test_chat.py
|
[mypy] Enable following imports for entrypoints (#7248)
|
2024-08-20 23:28:21 -07:00 |
|
test_completion.py
|
[mypy] Enable following imports for entrypoints (#7248)
|
2024-08-20 23:28:21 -07:00 |
|
test_embedding.py
|
[Bugfix] Fix encoding_format in examples/openai_embedding_client.py (#6755)
|
2024-07-24 22:48:07 -07:00 |
|
test_encoder_decoder.py
|
[Core] Support serving encoder/decoder models (#7258)
|
2024-08-09 10:39:41 +08:00 |
|
test_guided_processors.py
|
[Misc] add fixture to guided processor tests (#6341)
|
2024-07-12 09:55:39 -07:00 |
|
test_metrics.py
|
[ Bugfix ] Fix Prometheus Metrics With zeromq Frontend (#7279)
|
2024-08-18 20:19:48 +00:00 |
|
test_models.py
|
[Doc][CI/Build] Update docs and tests to use vllm serve (#6431)
|
2024-07-17 07:43:21 +00:00 |
|
test_mp_api_server.py
|
[Frontend] Improve Startup Failure UX (#7716)
|
2024-08-21 19:53:01 +00:00 |
|
test_oot_registration.py
|
[misc][plugin] add plugin system implementation (#7426)
|
2024-08-13 16:24:17 -07:00 |
|
test_return_tokens_as_ids.py
|
[Frontend] Represent tokens with identifiable strings (#6626)
|
2024-07-25 09:51:00 +08:00 |
|
test_run_batch.py
|
[Frontend] Support embeddings in the run_batch API (#7132)
|
2024-08-09 09:48:21 -07:00 |
|
test_serving_chat.py
|
[Misc] improve logits processors logging message (#7435)
|
2024-08-13 02:29:34 +00:00 |
|
test_shutdown.py
|
[Frontend] Kill the server on engine death (#6594)
|
2024-08-08 09:47:48 -07:00 |
|
test_tokenization.py
|
[BugFix][Frontend] Use LoRA tokenizer in OpenAI APIs (#6227)
|
2024-07-18 15:13:30 +08:00 |
|
test_vision.py
|
[Misc] Manage HTTP connections in one place (#6600)
|
2024-07-22 21:32:02 -07:00 |