ggerganov committed on
Commit
43d5a06
·
1 Parent(s): c5e24da

metal : reduce command encoding overhead (llama/9698)

Browse files
ggml/include/ggml-metal.h CHANGED
@@ -25,9 +25,6 @@
25
  #include <stddef.h>
26
  #include <stdbool.h>
27
 
28
- // max memory buffers that can be mapped to the device
29
- #define GGML_METAL_MAX_BUFFERS 64
30
-
31
  struct ggml_tensor;
32
  struct ggml_cgraph;
33
 
@@ -48,8 +45,6 @@ GGML_API bool ggml_backend_is_metal(ggml_backend_t backend);
48
 
49
  GGML_API GGML_CALL ggml_backend_buffer_t ggml_backend_metal_buffer_from_ptr(void * data, size_t size, size_t max_size);
50
 
51
- GGML_API void ggml_backend_metal_set_n_cb(ggml_backend_t backend, int n_cb);
52
-
53
  GGML_API void ggml_backend_metal_set_abort_callback(ggml_backend_t backend, ggml_abort_callback abort_callback, void * user_data);
54
 
55
  GGML_API GGML_CALL ggml_backend_buffer_type_t ggml_backend_metal_buffer_type(void);
 
25
  #include <stddef.h>
26
  #include <stdbool.h>
27
 
 
 
 
28
  struct ggml_tensor;
29
  struct ggml_cgraph;
30
 
 
45
 
46
  GGML_API GGML_CALL ggml_backend_buffer_t ggml_backend_metal_buffer_from_ptr(void * data, size_t size, size_t max_size);
47
 
 
 
48
  GGML_API void ggml_backend_metal_set_abort_callback(ggml_backend_t backend, ggml_abort_callback abort_callback, void * user_data);
49
 
50
  GGML_API GGML_CALL ggml_backend_buffer_type_t ggml_backend_metal_buffer_type(void);
ggml/src/ggml-metal.m CHANGED
The diff for this file is too large to render. See raw diff