Spaces:
Running
Running
CUDA: fix DEBUG_CUDA_MALLOC (llama/5729)
Browse files - ggml-cuda.cu +4 -4
ggml-cuda.cu
CHANGED
|
@@ -8079,8 +8079,8 @@ static void * ggml_cuda_pool_malloc_leg(int device, size_t size, size_t * actual
|
|
| 8079 |
*actual_size = look_ahead_size;
|
| 8080 |
g_cuda_pool_size[device] += look_ahead_size;
|
| 8081 |
#ifdef DEBUG_CUDA_MALLOC
|
| 8082 |
-
fprintf(stderr, "%s[%d]: %d buffers, max_size = %u MB, pool_size = %u MB, requested %u MB\n", __func__,
|
| 8083 |
-
(uint32_t)(max_size/1024/1024), (uint32_t)(g_cuda_pool_size[
|
| 8084 |
#endif
|
| 8085 |
return ptr;
|
| 8086 |
}
|
|
@@ -8166,7 +8166,7 @@ static void * ggml_cuda_pool_malloc_vmm(int device, size_t size, size_t * actual
|
|
| 8166 |
g_cuda_pool_used[device] += size;
|
| 8167 |
|
| 8168 |
#ifdef DEBUG_CUDA_MALLOC
|
| 8169 |
-
printf("cuda pool[%d]: allocated %llu bytes at %llx
|
| 8170 |
#endif
|
| 8171 |
|
| 8172 |
return ptr;
|
|
@@ -8176,7 +8176,7 @@ static void ggml_cuda_pool_free_vmm(int device, void * ptr, size_t size) {
|
|
| 8176 |
scoped_spin_lock lock(g_cuda_pool_lock);
|
| 8177 |
|
| 8178 |
#ifdef DEBUG_CUDA_MALLOC
|
| 8179 |
-
printf("cuda pool[%d]: freed %llu bytes at %llx\n",
|
| 8180 |
#endif
|
| 8181 |
|
| 8182 |
g_cuda_pool_used[device] -= size;
|
|
|
|
| 8079 |
*actual_size = look_ahead_size;
|
| 8080 |
g_cuda_pool_size[device] += look_ahead_size;
|
| 8081 |
#ifdef DEBUG_CUDA_MALLOC
|
| 8082 |
+
fprintf(stderr, "%s[%d]: %d buffers, max_size = %u MB, pool_size = %u MB, requested %u MB\n", __func__, device, nnz,
|
| 8083 |
+
(uint32_t)(max_size/1024/1024), (uint32_t)(g_cuda_pool_size[device]/1024/1024), (uint32_t)(size/1024/1024));
|
| 8084 |
#endif
|
| 8085 |
return ptr;
|
| 8086 |
}
|
|
|
|
| 8166 |
g_cuda_pool_used[device] += size;
|
| 8167 |
|
| 8168 |
#ifdef DEBUG_CUDA_MALLOC
|
| 8169 |
+
printf("cuda pool[%d]: allocated %llu bytes at %llx\n", device, (unsigned long long) size, ptr);
|
| 8170 |
#endif
|
| 8171 |
|
| 8172 |
return ptr;
|
|
|
|
| 8176 |
scoped_spin_lock lock(g_cuda_pool_lock);
|
| 8177 |
|
| 8178 |
#ifdef DEBUG_CUDA_MALLOC
|
| 8179 |
+
printf("cuda pool[%d]: freed %llu bytes at %llx\n", device, (unsigned long long) size, ptr);
|
| 8180 |
#endif
|
| 8181 |
|
| 8182 |
g_cuda_pool_used[device] -= size;
|