Skip to content

Commit b637bc6

Browse files
author
pockers21
committed
make memset range dynamic
1 parent 2f74c35 commit b637bc6

File tree

3 files changed

+6
-0
lines changed

3 files changed

+6
-0
lines changed

ggml/include/ggml-backend.h

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -224,6 +224,7 @@ extern "C" {
224224
// = ggml_backend_dev_init(ggml_backend_dev_by_type(GPU) OR ggml_backend_dev_by_type(CPU), NULL)
225225
GGML_API ggml_backend_t ggml_backend_init_best(void);
226226

227+
// Overwrite the size recorded on `buffer` with `cur_size`
// NOTE(review): only the recorded size changes; presumably cur_size must not exceed the real allocation - confirm
GGML_API void ggml_backend_set_size(ggml_backend_buffer_t buffer, size_t cur_size);
227228
// Load a backend from a dynamic library and register it
228229
GGML_API ggml_backend_reg_t ggml_backend_load(const char * path);
229230
// Unload a backend if loaded dynamically and unregister it

ggml/src/ggml-backend.cpp

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -536,6 +536,10 @@ struct ggml_backend_multi_buffer_context {
536536
size_t n_buffers;
537537
};
538538

539+
// Overwrite the size recorded on a backend buffer.
//
//   buffer   - buffer handle whose `size` field is updated; a null handle is ignored
//   cur_size - new value stored in `buffer->size`
//
// Only the `size` field is written here; nothing in this function reallocates
// or touches the underlying memory.
// NOTE(review): presumably callers must keep cur_size within the range that was
// actually allocated, since later size-based operations on the buffer would use
// this value - confirm against the call sites.
void ggml_backend_set_size(ggml_backend_buffer_t buffer, size_t cur_size) {
    // guard against a null handle instead of dereferencing it
    if (!buffer) {
        return;
    }

    buffer->size = cur_size;
}
542+
539543
static void ggml_backend_multi_buffer_free_buffer(ggml_backend_buffer_t buffer) {
540544
ggml_backend_multi_buffer_context * ctx = (ggml_backend_multi_buffer_context *) buffer->context;
541545
for (size_t i = 0; i < ctx->n_buffers; i++) {

src/llama-context.cpp

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1548,6 +1548,7 @@ int32_t llama_context::output_reserve(int32_t n_outputs) {
15481548
std::fill(output_ids.begin(), output_ids.end(), -1);
15491549

15501550
ggml_backend_buffer_clear(buf_output.get(), 0);
1551+
ggml_backend_set_size(buf_output.get(), new_size);
15511552

15521553
this->n_outputs = 0;
15531554
this->n_outputs_max = n_outputs_max;

0 commit comments

Comments
 (0)