Skip to content

Commit

Permalink
fix two more public APIs to use int32_t for n_threads
Browse files Browse the repository at this point in the history
  • Loading branch information
max-krasnyansky committed Aug 29, 2024
1 parent c49d634 commit 3b5f7c2
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 4 deletions.
4 changes: 2 additions & 2 deletions include/llama.h
Original file line number Diff line number Diff line change
Expand Up @@ -847,10 +847,10 @@ extern "C" {
LLAMA_API void llama_set_n_threads(struct llama_context * ctx, int32_t n_threads, int32_t n_threads_batch);

// Get the number of threads used for generation of a single token.
- LLAMA_API int llama_n_threads(struct llama_context * ctx);
+ LLAMA_API int32_t llama_n_threads(struct llama_context * ctx);

// Get the number of threads used for prompt and batch processing (multiple tokens).
- LLAMA_API int llama_n_threads_batch(struct llama_context * ctx);
+ LLAMA_API int32_t llama_n_threads_batch(struct llama_context * ctx);

// Set whether the model is in embeddings mode or not
// If true, embeddings will be returned but logits will not
Expand Down
4 changes: 2 additions & 2 deletions src/llama.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -19394,11 +19394,11 @@ void llama_set_n_threads(struct llama_context * ctx, int32_t n_threads, int32_t
ctx->cparams.n_threads_batch = n_threads_batch;
}

- int llama_n_threads(struct llama_context * ctx) {
+ int32_t llama_n_threads(struct llama_context * ctx) {
return ctx->cparams.n_threads;
}

- int llama_n_threads_batch(struct llama_context * ctx) {
+ int32_t llama_n_threads_batch(struct llama_context * ctx) {
return ctx->cparams.n_threads_batch;
}

Expand Down

0 comments on commit 3b5f7c2

Please sign in to comment.