| .. |
|
test_basic.py
|
a7a98e0fff
SvelteKit-based WebUI (#14839)
|
4 mesi fa |
|
test_chat_completion.py
|
2b6b55a59f
server : include usage statistics only when user request them (#16052)
|
4 mesi fa |
|
test_completion.py
|
4afb0a746f
server : Support multimodal completion and embeddings prompts in JSON format (#15108)
|
4 mesi fa |
|
test_ctx_shift.py
|
e81b8e4b7f
llama: use FA + max. GPU layers by default (#15434)
|
4 mesi fa |
|
test_embedding.py
|
d2fcd91cf9
server : disable context shift by default (#15416)
|
5 mesi fa |
|
test_infill.py
|
d2fcd91cf9
server : disable context shift by default (#15416)
|
5 mesi fa |
|
test_lora.py
|
d2fcd91cf9
server : disable context shift by default (#15416)
|
5 mesi fa |
|
test_rerank.py
|
d2fcd91cf9
server : disable context shift by default (#15416)
|
5 mesi fa |
|
test_security.py
|
d2fcd91cf9
server : disable context shift by default (#15416)
|
5 mesi fa |
|
test_slot_save.py
|
d2fcd91cf9
server : disable context shift by default (#15416)
|
5 mesi fa |
|
test_speculative.py
|
e81b8e4b7f
llama: use FA + max. GPU layers by default (#15434)
|
4 mesi fa |
|
test_template.py
|
3c3635d2f2
server : speed up tests (#15836)
|
4 mesi fa |
|
test_tokenize.py
|
d2fcd91cf9
server : disable context shift by default (#15416)
|
5 mesi fa |
|
test_tool_call.py
|
3c3635d2f2
server : speed up tests (#15836)
|
4 mesi fa |
|
test_vision_api.py
|
3c3635d2f2
server : speed up tests (#15836)
|
4 mesi fa |