Skip to content

Commit

Permalink
metal : reduce command encoding overhead (llama/9698)
Browse files (browse the repository at this point in the history)
  • Loading branch information
ggerganov committed Oct 2, 2024
1 parent fce227e commit f083908
Show file tree
Hide file tree
Showing 2 changed files with 1,898 additions and 1,792 deletions.
5 changes: 0 additions & 5 deletions ggml/include/ggml-metal.h
Original file line number | Diff line number | Diff line change
Expand Up @@ -25,9 +25,6 @@
#include <stddef.h>
#include <stdbool.h>

// max memory buffers that can be mapped to the device
#define GGML_METAL_MAX_BUFFERS 64

struct ggml_tensor;
struct ggml_cgraph;

Expand All @@ -48,8 +45,6 @@ GGML_API bool ggml_backend_is_metal(ggml_backend_t backend);

GGML_API GGML_CALL ggml_backend_buffer_t ggml_backend_metal_buffer_from_ptr(void * data, size_t size, size_t max_size);

GGML_API void ggml_backend_metal_set_n_cb(ggml_backend_t backend, int n_cb);

GGML_API void ggml_backend_metal_set_abort_callback(ggml_backend_t backend, ggml_abort_callback abort_callback, void * user_data);

GGML_API GGML_CALL ggml_backend_buffer_type_t ggml_backend_metal_buffer_type(void);
Expand Down
Loading

0 comments on commit f083908

Please sign in to comment.