cturan/llama.cpp @ 9e2b1e83c68a38ea0c64f726dd979439bd02189b

Eric Curtin badb80cadb Document the new max GPU layers default in help (#15771)		4 месяца назад
..
CMakeLists.txt	a457551332 cmake : do not search for curl libraries by ourselves (#14613)	6 месяцев назад
arg.cpp	badb80cadb Document the new max GPU layers default in help (#15771)	4 месяца назад
arg.h	2d451c8059 common : add common_remote_get_content (#13123)	8 месяцев назад
base64.hpp	381efbf480 llava : expose as a shared library for downstream projects (#3613)	2 года назад
build-info.cpp.in	cc8d081879 cmake: Add ability to pass in LLAMA_BUILD_NUMBER/COMMIT (#14167)	7 месяцев назад
chat-parser.cpp	3db4da56a5 chat : support Granite model reasoning and tool call (#14864)	5 месяцев назад
chat-parser.h	3cb203c89f llama-chat : Do not throw when tool parsing fails (#14012)	7 месяцев назад
chat.cpp	60e5eee31f chat : Seed OSS thinking + tool call support (#15552)	4 месяца назад
chat.h	60e5eee31f chat : Seed OSS thinking + tool call support (#15552)	4 месяца назад
common.cpp	e81b8e4b7f llama: use FA + max. GPU layers by default (#15434)	4 месяца назад
common.h	0d161f021a server : enable /slots by default and make it secure (#15630)	4 месяца назад
console.cpp	8277a817f1 console : utf-8 fix for windows stdin (#9690)	1 год назад
console.h	6381d4e110 gguf : new file format with flexible meta data (beta) (#2398)	2 года назад
json-partial.cpp	53f925074d sync : vendor (#13901)	7 месяцев назад
json-partial.h	53f925074d sync : vendor (#13901)	7 месяцев назад
json-schema-to-grammar.cpp	40bfa04c95 common : use std::string_view now that we target c++17 (#14319)	6 месяцев назад
json-schema-to-grammar.h	53f925074d sync : vendor (#13901)	7 месяцев назад
llguidance.cpp	43dfd741a5 llguidance : set tokenizer slices to default (#13424)	8 месяцев назад
log.cpp	bfd11a2344 Fix: Compile failure due to Microsoft STL breaking change (#11836)	11 месяцев назад
log.h	fef0cbeadf cleanup: fix compile warnings associated with gnu_printf (#11811)	11 месяцев назад
ngram-cache.cpp	5bbe6a9fe9 ggml : portability fixes for VS 2017 (#12150)	10 месяцев назад
ngram-cache.h	727368c60f llama : use LLAMA_TOKEN_NULL (#11062)	1 год назад
regex-partial.cpp	3198405e98 `common`: add partial regex support (#12808)	8 месяцев назад
regex-partial.h	3198405e98 `common`: add partial regex support (#12808)	8 месяцев назад
sampling.cpp	e92d53b29e sampling : optimize samplers by reusing bucket sort (#15665)	4 месяца назад
sampling.h	e92d53b29e sampling : optimize samplers by reusing bucket sort (#15665)	4 месяца назад
speculative.cpp	e92d53b29e sampling : optimize samplers by reusing bucket sort (#15665)	4 месяца назад
speculative.h	94933c8c2e server : implement universal assisted decoding (#12635)	5 месяцев назад