Revert n_threads and n_threads_batch change

This commit is contained in:
Aleksandras Kostarevas 2024-04-23 15:21:53 -04:00
parent 15eb04895d
commit f261de9fab

View File

@@ -52,9 +52,8 @@ LanguageModel *LlamaAdapter::createLanguageModel(const std::string &modelPath) {
llama_context_params ctx_params = llama_context_default_params();
ctx_params.n_ctx = LLAMA_CONTEXT_SIZE;
ctx_params.n_threads = 4;
ctx_params.n_threads_batch = 4;
ctx_params.n_batch = 128;
ctx_params.n_threads = 1;
ctx_params.n_threads_batch = 1;
adapter->n_batch = ctx_params.n_batch;