Skip to content

Commit afd6d35

Browse files
committed
Merge branch 'master' into crokeso
2 parents 9e6ff33 + 67d1ef2 commit afd6d35

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

46 files changed

+15583
-453
lines changed

ggml/include/ggml-kompute.h

Lines changed: 0 additions & 50 deletions
This file was deleted.

ggml/include/ggml.h

Lines changed: 35 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -686,6 +686,8 @@ extern "C" {
686686
GGML_GLU_OP_REGLU,
687687
GGML_GLU_OP_GEGLU,
688688
GGML_GLU_OP_SWIGLU,
689+
GGML_GLU_OP_GEGLU_ERF,
690+
GGML_GLU_OP_GEGLU_QUICK,
689691

690692
GGML_GLU_OP_COUNT,
691693
};
@@ -1295,6 +1297,22 @@ extern "C" {
12951297
struct ggml_context * ctx,
12961298
struct ggml_tensor * a);
12971299

1300+
GGML_API struct ggml_tensor * ggml_geglu_erf(
1301+
struct ggml_context * ctx,
1302+
struct ggml_tensor * a);
1303+
1304+
GGML_API struct ggml_tensor * ggml_geglu_erf_swapped(
1305+
struct ggml_context * ctx,
1306+
struct ggml_tensor * a);
1307+
1308+
GGML_API struct ggml_tensor * ggml_geglu_quick(
1309+
struct ggml_context * ctx,
1310+
struct ggml_tensor * a);
1311+
1312+
GGML_API struct ggml_tensor * ggml_geglu_quick_swapped(
1313+
struct ggml_context * ctx,
1314+
struct ggml_tensor * a);
1315+
12981316
// A: n columns, r rows,
12991317
// B: n columns, r rows,
13001318
GGML_API struct ggml_tensor * ggml_glu_split(
@@ -1318,6 +1336,16 @@ extern "C" {
13181336
struct ggml_tensor * a,
13191337
struct ggml_tensor * b);
13201338

1339+
GGML_API struct ggml_tensor * ggml_geglu_erf_split(
1340+
struct ggml_context * ctx,
1341+
struct ggml_tensor * a,
1342+
struct ggml_tensor * b);
1343+
1344+
GGML_API struct ggml_tensor * ggml_geglu_quick_split(
1345+
struct ggml_context * ctx,
1346+
struct ggml_tensor * a,
1347+
struct ggml_tensor * b);
1348+
13211349
// normalize along rows
13221350
GGML_API struct ggml_tensor * ggml_norm(
13231351
struct ggml_context * ctx,
@@ -2175,15 +2203,16 @@ extern "C" {
21752203

21762204
#define GGML_KQ_MASK_PAD 64
21772205

2178-
// q: [n_embd_k, n_batch, n_head, ne3]
2179-
// k: [n_embd_k, n_kv, n_head_kv, ne3]
2180-
// v: [n_embd_v, n_kv, n_head_kv, ne3] !! not transposed !!
2181-
// mask: [n_kv, n_batch_pad, ne32, 1] !! n_batch_pad = GGML_PAD(n_batch, GGML_KQ_MASK_PAD) !!
2182-
// res: [n_embd_v, n_head, n_batch, ne3] !! permuted !!
2206+
// q: [n_embd_k, n_batch, n_head, ne3 ]
2207+
// k: [n_embd_k, n_kv, n_head_kv, ne3 ]
2208+
// v: [n_embd_v, n_kv, n_head_kv, ne3 ] !! not transposed !!
2209+
// mask: [n_kv, n_batch_pad, ne32, ne33] !! n_batch_pad = GGML_PAD(n_batch, GGML_KQ_MASK_PAD) !!
2210+
// res: [n_embd_v, n_head, n_batch, ne3 ] !! permuted !!
21832211
//
21842212
// broadcast:
21852213
// n_head % n_head_kv == 0
2186-
// ne3 % ne32 == 0
2214+
// n_head % ne32 == 0
2215+
// ne3 % ne33 == 0
21872216
//
21882217
GGML_API struct ggml_tensor * ggml_flash_attn_ext(
21892218
struct ggml_context * ctx,

ggml/src/ggml-backend-reg.cpp

Lines changed: 0 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -61,10 +61,6 @@
6161
#include "ggml-cann.h"
6262
#endif
6363

64-
#ifdef GGML_USE_KOMPUTE
65-
#include "ggml-kompute.h"
66-
#endif
67-
6864
// disable C++17 deprecation warning for std::codecvt_utf8
6965
#if defined(__clang__)
7066
# pragma clang diagnostic push
@@ -189,9 +185,6 @@ struct ggml_backend_registry {
189185
#ifdef GGML_USE_RPC
190186
register_backend(ggml_backend_rpc_reg());
191187
#endif
192-
#ifdef GGML_USE_KOMPUTE
193-
register_backend(ggml_backend_kompute_reg());
194-
#endif
195188
#ifdef GGML_USE_CPU
196189
register_backend(ggml_backend_cpu_reg());
197190
#endif
@@ -576,7 +569,6 @@ void ggml_backend_load_all_from_path(const char * dir_path) {
576569
ggml_backend_load_best("cann", silent, dir_path);
577570
ggml_backend_load_best("cuda", silent, dir_path);
578571
ggml_backend_load_best("hip", silent, dir_path);
579-
ggml_backend_load_best("kompute", silent, dir_path);
580572
ggml_backend_load_best("metal", silent, dir_path);
581573
ggml_backend_load_best("rpc", silent, dir_path);
582574
ggml_backend_load_best("sycl", silent, dir_path);

0 commit comments

Comments
 (0)