llama : allow getting n_batch from llama_context in c api (#4540)

MarcusDunn · ggerganov · web-flow · commit 31f27758faf4 · 2023-12-21T21:57:48.000+02:00
* allowed getting n_batch from llama_context in c api

* changed to use `uint32_t` instead of `int`

* changed to use `uint32_t` instead of `int` in `llama_n_ctx`

* Update llama.h

---------

Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
diff --git a/llama.cpp b/llama.cpp
@@ -9532,10 +9532,14 @@ const llama_model * llama_get_model(const struct llama_context * ctx) {
     return &ctx->model;
 }
 
-int llama_n_ctx(const struct llama_context * ctx) {
+uint32_t llama_n_ctx(const struct llama_context * ctx) {
     return ctx->cparams.n_ctx;
 }
 
+uint32_t llama_n_batch(const struct llama_context * ctx) {
+    return ctx->cparams.n_batch;
+}
+
 enum llama_vocab_type llama_vocab_type(const struct llama_model * model) {
     return model->vocab.type;
 }
diff --git a/llama.h b/llama.h
@@ -314,7 +314,9 @@ extern "C" {
 
     LLAMA_API const struct llama_model * llama_get_model(const struct llama_context * ctx);
 
-    LLAMA_API int llama_n_ctx      (const struct llama_context * ctx);
+    // TODO: become more consistent with returned int types across the API
+    LLAMA_API uint32_t llama_n_ctx      (const struct llama_context * ctx);
+    LLAMA_API uint32_t llama_n_batch    (const struct llama_context * ctx);
 
     LLAMA_API enum llama_vocab_type llama_vocab_type(const struct llama_model * model);
 

Original file line number	Diff line number	Diff line change
`@@ -9532,10 +9532,14 @@ const llama_model * llama_get_model(const struct llama_context * ctx) {`
`9532`	`9532`	`return &ctx->model;`
`9533`	`9533`	`}`
`9534`	`9534`
`9535`		`-int llama_n_ctx(const struct llama_context * ctx) {`
	`9535`	`+uint32_t llama_n_ctx(const struct llama_context * ctx) {`
`9536`	`9536`	`return ctx->cparams.n_ctx;`
`9537`	`9537`	`}`
`9538`	`9538`
	`9539`	`+uint32_t llama_n_batch(const struct llama_context * ctx) {`
	`9540`	`+ return ctx->cparams.n_batch;`
	`9541`	`+}`
	`9542`	`+`
`9539`	`9543`	`enum llama_vocab_type llama_vocab_type(const struct llama_model * model) {`
`9540`	`9544`	`return model->vocab.type;`
`9541`	`9545`	`}`