Skip to content

Commit bbe7b22

Browse files
committed
build_rwkv6: Simplify graph
Signed-off-by: Molly Sophia <mollysophia379@gmail.com>
1 parent 7f9de4a commit bbe7b22

File tree

1 file changed

+12
-34
lines changed

1 file changed

+12
-34
lines changed

src/llama.cpp

Lines changed: 12 additions & 34 deletions
Original file line number | Diff line number | Diff line change
@@ -8592,40 +8592,18 @@ static struct ggml_tensor * llm_build_time_mix_rwkv6(
8592 8592
xxx
8593 8593
);
8594 8594

8595-
struct ggml_tensor *mw = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embed * n_tokens);
8596-
mw = ggml_reshape_2d(
8597-
ctx,
8598-
ggml_set_1d(ctx, mw, ggml_view_1d(ctx, xxx, n_embed * n_tokens, 0), 0),
8599-
n_embed, n_tokens
8600-
);
8601-
8602-
struct ggml_tensor *mk = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embed * n_tokens);
8603-
mk = ggml_reshape_2d(
8604-
ctx,
8605-
ggml_set_1d(ctx, mk, ggml_view_1d(ctx, xxx, n_embed * n_tokens, n_embed * n_tokens * sizeof(float)), 0),
8606-
n_embed, n_tokens
8607-
);
8608-
8609-
struct ggml_tensor *mv = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embed * n_tokens);
8610-
mv = ggml_reshape_2d(
8611-
ctx,
8612-
ggml_set_1d(ctx, mv, ggml_view_1d(ctx, xxx, n_embed * n_tokens, n_embed * n_tokens * 2 * sizeof(float)), 0),
8613-
n_embed, n_tokens
8614-
);
8615-
8616-
struct ggml_tensor *mr = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embed * n_tokens);
8617-
mr = ggml_reshape_2d(
8618-
ctx,
8619-
ggml_set_1d(ctx, mr, ggml_view_1d(ctx, xxx, n_embed * n_tokens, n_embed * n_tokens * 3 * sizeof(float)), 0),
8620-
n_embed, n_tokens
8621-
);
8622-
8623-
struct ggml_tensor *mg = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embed * n_tokens);
8624-
mg = ggml_reshape_2d(
8625-
ctx,
8626-
ggml_set_1d(ctx, mg, ggml_view_1d(ctx, xxx, n_embed * n_tokens, n_embed * n_tokens * 4 * sizeof(float)), 0),
8627-
n_embed, n_tokens
8628-
);
8595+
// struct ggml_tensor *mw = ggml_new_tensor_1d(ctx, GGML_TYPE_F32, n_embed * n_tokens);
8596+
// mw = ggml_reshape_2d(
8597+
// ctx,
8598+
// ggml_set_1d(ctx, mw, ggml_view_1d(ctx, xxx, n_embed * n_tokens, 0), 0),
8599+
// n_embed, n_tokens
8600+
// );
8601+
8602+
struct ggml_tensor *mw = ggml_view_2d(ctx, xxx, n_embed, n_tokens, xxx->nb[1], 0);
8603+
struct ggml_tensor *mk = ggml_view_2d(ctx, xxx, n_embed, n_tokens, xxx->nb[1], n_embed * n_tokens * sizeof(float));
8604+
struct ggml_tensor *mv = ggml_view_2d(ctx, xxx, n_embed, n_tokens, xxx->nb[1], n_embed * n_tokens * 2 * sizeof(float));
8605+
struct ggml_tensor *mr = ggml_view_2d(ctx, xxx, n_embed, n_tokens, xxx->nb[1], n_embed * n_tokens * 3 * sizeof(float));
8606+
struct ggml_tensor *mg = ggml_view_2d(ctx, xxx, n_embed, n_tokens, xxx->nb[1], n_embed * n_tokens * 4 * sizeof(float));
8629 8607

8630 8608
struct ggml_tensor * xw = ggml_add(
8631 8609
ctx,

0 commit comments

Comments
 (0)