| .. |
|
__init__.py
|
[CI/Build] [3/3] Reorganize entrypoints tests (#5966)
|
2024-06-30 12:58:49 +08:00 |
|
test_accuracy.py
|
Add output streaming support to multi-step + async while ensuring RequestOutput obj reuse (#8335)
|
2024-09-23 15:38:04 -07:00 |
|
test_audio.py
|
[Core][VLM] Test registration for OOT multimodal models (#8717)
|
2024-10-04 10:38:25 -07:00 |
|
test_basic.py
|
[Bugfix] fix OpenAI API server startup with --disable-frontend-multiprocessing (#8537)
|
2024-10-08 09:38:40 -07:00 |
|
test_chat_template.py
|
[Frontend] Added support for HF's new continue_final_message parameter (#8942)
|
2024-09-29 17:59:47 +00:00 |
|
test_chat.py
|
[BugFix] Fix chat API continuous usage stats (#9357)
|
2024-10-14 23:19:48 -07:00 |
|
test_chunked_prompt.py
|
[Bugfix] Fix vLLM UsageInfo and logprobs None AssertionError with empty token_ids (#9034)
|
2024-10-15 15:40:43 -07:00 |
|
test_cli_args.py
|
[Frontend] Add Early Validation For Chat Template / Tool Call Parser (#9151)
|
2024-10-08 14:31:26 +00:00 |
|
test_completion.py
|
[Frontend] API support for beam search for MQLLMEngine (#9117)
|
2024-10-08 05:51:43 +00:00 |
|
test_embedding.py
|
Adds truncate_prompt_tokens param for embeddings creation (#8999)
|
2024-10-04 18:31:40 +00:00 |
|
test_encoder_decoder.py
|
[Tests] Disable retries and use context manager for openai client (#7565)
|
2024-08-26 21:33:17 -07:00 |
|
test_lora_lineage.py
|
[Core] Support Lora lineage and base model metadata management (#6315)
|
2024-09-20 06:20:56 +00:00 |
|
test_metrics.py
|
[misc] hide best_of from engine (#9261)
|
2024-10-10 21:30:44 -07:00 |
|
test_models.py
|
[Core] Support Lora lineage and base model metadata management (#6315)
|
2024-09-20 06:20:56 +00:00 |
|
test_oot_registration.py
|
[misc][plugin] add plugin system implementation (#7426)
|
2024-08-13 16:24:17 -07:00 |
|
test_prompt_validation.py
|
[BugFix] Fix server crash on empty prompt (#7746)
|
2024-08-23 13:12:44 +00:00 |
|
test_return_tokens_as_ids.py
|
[Tests] Disable retries and use context manager for openai client (#7565)
|
2024-08-26 21:33:17 -07:00 |
|
test_run_batch.py
|
[Frontend] Create ErrorResponse instead of raising exceptions in run_batch (#8347)
|
2024-09-11 05:30:11 +00:00 |
|
test_serving_chat.py
|
[BugFix] Fix test breakages from transformers 4.45 upgrade (#8829)
|
2024-09-26 16:46:43 -07:00 |
|
test_serving_engine.py
|
[Core] Support Lora lineage and base model metadata management (#6315)
|
2024-09-20 06:20:56 +00:00 |
|
test_shutdown.py
|
[Core][Bugfix][Perf] Introduce MQLLMEngine to avoid asyncio OH (#8157)
|
2024-09-18 13:56:58 +00:00 |
|
test_tokenization.py
|
[Frontend] Added support for HF's new continue_final_message parameter (#8942)
|
2024-09-29 17:59:47 +00:00 |
|
test_vision.py
|
[Core][VLM] Test registration for OOT multimodal models (#8717)
|
2024-10-04 10:38:25 -07:00 |