Skip to content

Commit 5b0373e

Browse files
committed
mamba : recurrent inference WORKS!!!
1 parent 711c77b commit 5b0373e

File tree

2 files changed

+1
-4
lines changed

2 files changed

+1
-4
lines changed

ggml.c

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -5148,8 +5148,6 @@ static struct ggml_tensor * ggml_soft_plus_impl(
 5148 5148          struct ggml_tensor * a,
 5149 5149          bool inplace) {
 5150 5150
 5151      -    // TODO: does `a` need to be contiguous?
 5152      -
 5153 5151      bool is_node = false;
 5154 5152
 5155 5153      if (a->grad) {
@@ -11736,7 +11734,7 @@ static void ggml_compute_forward_soft_plus_f32(
 11736 11734          float * x = (float *) ((char *) dst->data + i*( dst->nb[1]));
 11737 11735          float * y = (float *) ((char *) src0->data + i*(src0->nb[1]));
 11738 11736          for (int j = 0; j < nc; ++j) {
 11739       -            x[j] = logf(1.0f + expf(y[i]));
       11737 +            x[j] = logf(1.0f + expf(y[j]));
 11740 11738          }
 11741 11739      }
 11742 11740 }

llama.cpp

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6946,7 +6946,6 @@ struct llm_build_context {
 6946 6946          cur = llm_build_norm(ctx0, inpL, hparams,
 6947 6947                  model.layers[il].attn_norm, NULL,
 6948 6948                  LLM_NORM_RMS, cb, il);
 6949      -        // TODO: that's probably the wrong name.
 6950 6949          cb(cur, "attn_norm", il);
 6951 6950
 6952 6951          // {n_embd, batch} * {n_embd, 2*d_inner} = {batch, 2*d_inner}

0 commit comments

Comments
 (0)