| .. |
|
internal
|
chore: fix some inconsistent function name in comment
|
2025-08-13 09:50:27 -07:00 |
|
auth.go
|
…
|
|
|
create.go
|
remove support for multiple ggufs in a single file (#10722)
|
2025-05-21 13:55:31 -07:00 |
|
create_test.go
|
server: validate local path on safetensor create (#9379)
|
2025-02-28 16:10:43 -08:00 |
|
download.go
|
server: abort download on empty digest
|
2025-05-27 11:28:48 -07:00 |
|
fixblobs.go
|
…
|
|
|
fixblobs_test.go
|
…
|
|
|
images.go
|
update vendored llama.cpp and ggml (#11823)
|
2025-08-14 14:42:58 -07:00 |
|
images_test.go
|
Reapply "feat: incremental gguf parser (#10822)" (#11114) (#11119)
|
2025-06-20 11:11:40 -07:00 |
|
layer.go
|
…
|
|
|
manifest.go
|
…
|
|
|
manifest_test.go
|
…
|
|
|
model.go
|
tools: refactor tool call parsing and enable streaming (#10415)
|
2025-05-23 14:19:31 -07:00 |
|
modelpath.go
|
server: add hint to the error message when model path access fails (#10843)
|
2025-05-24 13:17:04 -07:00 |
|
modelpath_test.go
|
lint: enable usetesting, disable tenv (#10594)
|
2025-05-08 11:42:14 -07:00 |
|
prompt.go
|
fix(openai): handle reasoning_effort (#11868)
|
2025-08-12 11:02:01 -07:00 |
|
prompt_test.go
|
gpt-oss (#11672)
|
2025-08-05 12:21:16 -07:00 |
|
quantization.go
|
skip quantizing per_layer_token_embd (#11207)
|
2025-06-26 21:49:35 -07:00 |
|
quantization_test.go
|
Reapply "feat: incremental gguf parser (#10822)" (#11114) (#11119)
|
2025-06-20 11:11:40 -07:00 |
|
routes.go
|
server: skip parsing initial <think> if provided in the prompt (#12024)
|
2025-08-22 12:00:16 -07:00 |
|
routes_create_test.go
|
Move quantization to new backend (#10363)
|
2025-05-06 11:20:48 -07:00 |
|
routes_debug_test.go
|
server: add debug option for printing out prompt instead of calling model
|
2025-08-15 13:52:50 -07:00 |
|
routes_delete_test.go
|
…
|
|
|
routes_generate_test.go
|
server: skip parsing initial <think> if provided in the prompt (#12024)
|
2025-08-22 12:00:16 -07:00 |
|
routes_harmony_streaming_test.go
|
llm: New memory management
|
2025-08-14 15:24:01 -07:00 |
|
routes_list_test.go
|
…
|
|
|
routes_test.go
|
server: use slices.Equal to simplify code (#11502)
|
2025-07-23 14:25:39 -07:00 |
|
sched.go
|
llm: New memory management
|
2025-08-14 15:24:01 -07:00 |
|
sched_test.go
|
llm: New memory management
|
2025-08-14 15:24:01 -07:00 |
|
sparse_common.go
|
…
|
|
|
sparse_windows.go
|
…
|
|
|
upload.go
|
server: always print upload/download part info (#8832)
|
2025-02-04 19:30:49 -08:00 |