| .. |
|
rpc
|
[Frontend] error suppression cleanup (#7786)
|
2024-08-22 21:50:21 +00:00 |
|
__init__.py
|
[CI/Build] [3/3] Reorganize entrypoints tests (#5966)
|
2024-06-30 12:58:49 +08:00 |
|
test_accuracy.py
|
[Bugfix][Frontend] Fix Issues Under High Load With zeromq Frontend (#7394)
|
2024-08-21 13:34:14 -04:00 |
|
test_audio.py
|
[Tests] Disable retries and use context manager for openai client (#7565)
|
2024-08-26 21:33:17 -07:00 |
|
test_basic.py
|
[Tests] Disable retries and use context manager for openai client (#7565)
|
2024-08-26 21:33:17 -07:00 |
|
test_chat.py
|
[Tests] Disable retries and use context manager for openai client (#7565)
|
2024-08-26 21:33:17 -07:00 |
|
test_completion.py
|
[Tests] Disable retries and use context manager for openai client (#7565)
|
2024-08-26 21:33:17 -07:00 |
|
test_embedding.py
|
[Tests] Disable retries and use context manager for openai client (#7565)
|
2024-08-26 21:33:17 -07:00 |
|
test_encoder_decoder.py
|
[Tests] Disable retries and use context manager for openai client (#7565)
|
2024-08-26 21:33:17 -07:00 |
|
test_guided_processors.py
|
[Misc] add fixture to guided processor tests (#6341)
|
2024-07-12 09:55:39 -07:00 |
|
test_metrics.py
|
[Tests] Disable retries and use context manager for openai client (#7565)
|
2024-08-26 21:33:17 -07:00 |
|
test_models.py
|
[Tests] Disable retries and use context manager for openai client (#7565)
|
2024-08-26 21:33:17 -07:00 |
|
test_mp_api_server.py
|
[Frontend] Improve Startup Failure UX (#7716)
|
2024-08-21 19:53:01 +00:00 |
|
test_oot_registration.py
|
[misc][plugin] add plugin system implementation (#7426)
|
2024-08-13 16:24:17 -07:00 |
|
test_prompt_validation.py
|
[BugFix] Fix server crash on empty prompt (#7746)
|
2024-08-23 13:12:44 +00:00 |
|
test_return_tokens_as_ids.py
|
[Tests] Disable retries and use context manager for openai client (#7565)
|
2024-08-26 21:33:17 -07:00 |
|
test_run_batch.py
|
[Frontend] Create ErrorResponse instead of raising exceptions in run_batch (#8347)
|
2024-09-11 05:30:11 +00:00 |
|
test_serving_chat.py
|
[Frontend][VLM] Add support for multiple multi-modal items (#8049)
|
2024-08-31 16:35:53 -07:00 |
|
test_serving_engine.py
|
[Core] Support load and unload LoRA in api server (#6566)
|
2024-09-05 18:10:33 -07:00 |
|
test_shutdown.py
|
[Tests] Disable retries and use context manager for openai client (#7565)
|
2024-08-26 21:33:17 -07:00 |
|
test_tokenization.py
|
[Tests] Disable retries and use context manager for openai client (#7565)
|
2024-08-26 21:33:17 -07:00 |
|
test_vision.py
|
[Frontend][VLM] Add support for multiple multi-modal items (#8049)
|
2024-08-31 16:35:53 -07:00 |