| .. |
|
data
|
[mypy] Enable type checking for test directory (#5017)
|
2024-06-15 04:45:31 +00:00 |
|
__init__.py
|
[Experimental] Add multi-LoRA support (#1804)
|
2024-01-23 15:26:37 -08:00 |
|
conftest.py
|
[MISC] Consolidate cleanup() and refactor offline_inference_with_prefix.py (#9510)
|
2024-10-18 14:30:55 -07:00 |
|
test_baichuan.py
|
[MISC] Consolidate cleanup() and refactor offline_inference_with_prefix.py (#9510)
|
2024-10-18 14:30:55 -07:00 |
|
test_chatglm3.py
|
[mypy] Enable type checking for test directory (#5017)
|
2024-06-15 04:45:31 +00:00 |
|
test_gemma.py
|
[CI] Change test input in Gemma LoRA test (#8163)
|
2024-09-04 13:05:50 -07:00 |
|
test_layers.py
|
[Misc] Standardize RoPE handling for Qwen2-VL (#9250)
|
2024-10-16 13:56:17 +08:00 |
|
test_llama.py
|
[MISC] Consolidate cleanup() and refactor offline_inference_with_prefix.py (#9510)
|
2024-10-18 14:30:55 -07:00 |
|
test_long_context.py
|
[CI/Build][LoRA] Temporarily fix long context failure issue (#9579)
|
2024-10-22 11:32:51 +00:00 |
|
test_lora_checkpoints.py
|
[Misc][LoRA] Support loading LoRA weights for target_modules in reg format (#9275)
|
2024-10-11 12:31:21 +00:00 |
|
test_lora_huggingface.py
|
[Core] Support dynamically loading Lora adapter from HuggingFace (#6234)
|
2024-07-22 15:42:40 -07:00 |
|
test_lora_manager.py
|
[Misc/Testing] Use torch.testing.assert_close (#7324)
|
2024-08-16 04:24:04 +00:00 |
|
test_minicpmv_tp.py
|
[Model][LoRA]LoRA support added for MiniCPMV2.5 (#7199)
|
2024-09-29 06:59:45 +00:00 |
|
test_minicpmv.py
|
🐛 Fixup more test failures from memory profiling (#9563)
|
2024-10-21 17:10:56 -07:00 |
|
test_mixtral.py
|
[Model] add a bunch of supported lora modules for mixtral (#9008)
|
2024-10-04 16:24:40 +00:00 |
|
test_phi.py
|
[mypy] Enable type checking for test directory (#5017)
|
2024-06-15 04:45:31 +00:00 |
|
test_punica_sizes.py
|
[Kernel][LoRA] Add assertion for punica sgmv kernels (#7585)
|
2024-09-23 18:57:42 +00:00 |
|
test_punica_variation.py
|
[Kernel][LoRA] Add assertion for punica sgmv kernels (#7585)
|
2024-09-23 18:57:42 +00:00 |
|
test_quant_model.py
|
[MISC] Consolidate cleanup() and refactor offline_inference_with_prefix.py (#9510)
|
2024-10-18 14:30:55 -07:00 |
|
test_tokenizer_group.py
|
[BugFix] Fix test breakages from transformers 4.45 upgrade (#8829)
|
2024-09-26 16:46:43 -07:00 |
|
test_utils.py
|
[Core] Support dynamically loading Lora adapter from HuggingFace (#6234)
|
2024-07-22 15:42:40 -07:00 |
|
test_worker.py
|
[Model] Add user-configurable task for models that support both generation and embedding (#9424)
|
2024-10-18 11:31:58 -07:00 |
|
utils.py
|
[Kernel][RFC] Refactor the punica kernel based on Triton (#5036)
|
2024-07-31 17:12:24 -07:00 |