cturan/llama.cpp @ ce8784bdb153ff7794dde5a50b0ebfa51baa6171

Xuan Son Nguyen ce8784bdb1 server : fix format_infill (#10724)		hace 1 año
..
batched	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
batched-bench	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
batched.swift	0abc6a2c25 llama : llama_perf + option to disable timings during decode (#9355)	hace 1 año
convert-llama2c-to-ggml	8648c52101 make : deprecate (#10514)	hace 1 año
cvector-generator	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
deprecation-warning	f112d198cd Update deprecation-warning.cpp (#10619)	hace 1 año
embedding	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
eval-callback	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
export-lora	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
gbnf-validator	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
gen-docs	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
gguf	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
gguf-hash	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
gguf-split	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
gritlm	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
imatrix	8648c52101 make : deprecate (#10514)	hace 1 año
infill	82bca2257b readme : add option, update default value, fix formatting (#10271)	hace 1 año
jeopardy	1c641e6aac `build`: rename main → llama-cli, server → llama-server, llava-cli → llama-llava-cli, etc... (#7809)	hace 1 año
llama-bench	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
llama.android	cda0e4b648 llama : remove all_pos_0, all_pos_1, all_seq_id from llama_batch (#9745)	hace 1 año
llama.swiftui	43ed389a3f llama : use cmake for swift build (#10525)	hace 1 año
llava	01e6d9bb71 clip : add sycl support (#10574)	hace 1 año
lookahead	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
lookup	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
main	82bca2257b readme : add option, update default value, fix formatting (#10271)	hace 1 año
main-cmake-pkg	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
parallel	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
passkey	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
perplexity	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
quantize	19d8762ab6 ggml : refactor online repacking (#10446)	hace 1 año
quantize-stats	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
retrieval	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
rpc	9f40989351 ggml : move CPU backend to a separate file (#10144)	hace 1 año
run	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
save-load-state	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
server	ce8784bdb1 server : fix format_infill (#10724)	hace 1 año
simple	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
simple-chat	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
speculative	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
speculative-simple	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
sycl	faf67b3de4 [SYCL]set context default value to avoid memory issue, update guide (#9476)	hace 1 año
tokenize	7cc2d2c889 ggml : move AMX to the CPU backend (#10570)	hace 1 año
CMakeLists.txt	ab96610b1e cmake : enable warnings in llama (#10474)	hace 1 año
Miku.sh	1c641e6aac `build`: rename main → llama-cli, server → llama-server, llava-cli → llama-llava-cli, etc... (#7809)	hace 1 año
chat-13B.bat	d9ad104440 Create chat-13B.bat (#592)	hace 2 años
chat-13B.sh	1c641e6aac `build`: rename main → llama-cli, server → llama-server, llava-cli → llama-llava-cli, etc... (#7809)	hace 1 año
chat-persistent.sh	8fc393f246 scripts : fix pattern and get n_tokens in one go (#10221)	hace 1 año
chat-vicuna.sh	1c641e6aac `build`: rename main → llama-cli, server → llama-server, llava-cli → llama-llava-cli, etc... (#7809)	hace 1 año
chat.sh	1c641e6aac `build`: rename main → llama-cli, server → llama-server, llava-cli → llama-llava-cli, etc... (#7809)	hace 1 año
convert_legacy_llama.py	a0ec17b32e metadata: Detailed Dataset Authorship Metadata (#8875)	hace 1 año
json_schema_pydantic_example.py	3fd62a6b1c py : type-check all Python scripts with Pyright (#8341)	hace 1 año
json_schema_to_grammar.py	66c2c93082 grammar : fix JSON Schema for string regex with top-level alt. (#9903)	hace 1 año
llama.vim	2d3aba9ee8 llama.vim : bump generation time limit to 3s [no ci]	hace 1 año
llm.vim	ad9ddcff6e llm.vim : stop generation at multiple linebreaks, bind to <F2> (#2879)	hace 2 años
pydantic_models_to_grammar.py	090fca7a07 pydantic : replace uses of __annotations__ with get_type_hints (#8474)	hace 1 año
pydantic_models_to_grammar_examples.py	22f281aa16 examples : Rewrite pydantic_models_to_grammar_examples.py (#8493)	hace 1 año
reason-act.sh	1c641e6aac `build`: rename main → llama-cli, server → llama-server, llava-cli → llama-llava-cli, etc... (#7809)	hace 1 año
regex_to_grammar.py	e235b267a2 py : switch to snake_case (#8305)	hace 1 año
server-llama2-13B.sh	1c641e6aac `build`: rename main → llama-cli, server → llama-server, llava-cli → llama-llava-cli, etc... (#7809)	hace 1 año
server_embd.py	3fd62a6b1c py : type-check all Python scripts with Pyright (#8341)	hace 1 año
ts-type-to-grammar.sh	ab9a3240a9 JSON schema conversion: ⚡️ faster repetitions, min/maxLength for strings, cap number length (#6555)	hace 1 año