From 0000000000000000000000000000000000000000 Mon Sep 17 00:00:00 2001
From: jmorganca <jmorganca@gmail.com>
Date: Thu, 6 Jun 2024 23:55:47 -0700
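Subject: [PATCH] cuda

Stop ggml_backend_buffer_free() from deleting the buffer object itself and
release it inside the CUDA and Metal free_buffer callbacks instead, right
after each backend frees its own context.

NOTE(review): after this change nothing visible here releases the buffer
when iface.free_buffer is NULL, or for a backend whose callback is not
touched by this patch -- confirm those paths are handled elsewhere. The
removed line used `delete`, while the Metal callback uses `free()`; confirm
that matches how the buffer is allocated.
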
---
 ggml/src/ggml-backend.cpp        | 1 -
 ggml/src/ggml-cuda/ggml-cuda.cu  | 1 +
 ggml/src/ggml-metal/ggml-metal.m | 1 +
 3 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/ggml/src/ggml-backend.cpp b/ggml/src/ggml-backend.cpp
index e2d6c405..a12172dc 100644
--- a/ggml/src/ggml-backend.cpp
+++ b/ggml/src/ggml-backend.cpp
@@ -106,7 +106,6 @@ void ggml_backend_buffer_free(ggml_backend_buffer_t buffer) {
     if (buffer->iface.free_buffer != NULL) {
         buffer->iface.free_buffer(buffer);
     }
-    delete buffer;
 }
 
 size_t ggml_backend_buffer_get_size(ggml_backend_buffer_t buffer) {
diff --git a/ggml/src/ggml-cuda/ggml-cuda.cu b/ggml/src/ggml-cuda/ggml-cuda.cu
index 0b06be72..be29e979 100644
--- a/ggml/src/ggml-cuda/ggml-cuda.cu
+++ b/ggml/src/ggml-cuda/ggml-cuda.cu
@@ -424,6 +424,7 @@ struct ggml_backend_cuda_buffer_context {
 static void ggml_backend_cuda_buffer_free_buffer(ggml_backend_buffer_t buffer) {
     ggml_backend_cuda_buffer_context * ctx = (ggml_backend_cuda_buffer_context *)buffer->context;
     delete ctx;
+    delete buffer;
 }
 
 static bool ggml_backend_buffer_is_cuda(ggml_backend_buffer_t buffer) {
diff --git a/ggml/src/ggml-metal/ggml-metal.m b/ggml/src/ggml-metal/ggml-metal.m
index a85502ee..cd8ef741 100644
--- a/ggml/src/ggml-metal/ggml-metal.m
+++ b/ggml/src/ggml-metal/ggml-metal.m
@@ -4187,6 +4187,7 @@ static void ggml_backend_metal_buffer_free_buffer(ggml_backend_buffer_t buffer)
     }
 
     free(ctx);
+    free(buffer);
 }
 
 static void * ggml_backend_metal_buffer_get_base(ggml_backend_buffer_t buffer) {