Skip to content

Commit

Permalink
metal : reduce command encoding overhead (llama/9698)
Browse files Browse the repository at this point in the history
ggml-ci
  • Loading branch information
ggerganov committed Oct 1, 2024
1 parent 4de6ee8 commit b302031
Show file tree
Hide file tree
Showing 3 changed files with 1,900 additions and 1,793 deletions.
5 changes: 0 additions & 5 deletions include/ggml-metal.h
Original file line number Diff line number Diff line change
Expand Up @@ -25,9 +25,6 @@
#include <stddef.h>
#include <stdbool.h>

-// max memory buffers that can be mapped to the device
-#define GGML_METAL_MAX_BUFFERS 64
-
struct ggml_tensor;
struct ggml_cgraph;

Expand All @@ -48,8 +45,6 @@ GGML_API bool ggml_backend_is_metal(ggml_backend_t backend);

GGML_API GGML_CALL ggml_backend_buffer_t ggml_backend_metal_buffer_from_ptr(void * data, size_t size, size_t max_size);

-GGML_API void ggml_backend_metal_set_n_cb(ggml_backend_t backend, int n_cb);
-
GGML_API void ggml_backend_metal_set_abort_callback(ggml_backend_t backend, ggml_abort_callback abort_callback, void * user_data);

GGML_API GGML_CALL ggml_backend_buffer_type_t ggml_backend_metal_buffer_type(void);
Expand Down
2 changes: 1 addition & 1 deletion scripts/sync-llama.last
Original file line number Diff line number Diff line change
@@ -1 +1 @@
-c919d5db39c8a7fcb64737f008e4b105ee0acd20
+f1b8c4271125c2bfb9cfebd72a8b9e9f99061a30
Loading

0 comments on commit b302031

Please sign in to comment.