On windows, detect large multi-socket systems and reduce to the number of cores in one socket for best performance |
||
|---|---|---|
| .. | ||
| ext_server | ||
| generate | ||
| llama.cpp@8962422b1c | ||
| patches | ||
| filetype.go | ||
| ggla.go | ||
| ggml_test.go | ||
| ggml.go | ||
| gguf.go | ||
| llm_darwin.go | ||
| llm_linux.go | ||
| llm_windows.go | ||
| memory_test.go | ||
| memory.go | ||
| server.go | ||
| status.go | ||