diff --git a/ggml.c b/ggml.c
index 3f72379c3..6ff9d8a34 100644
--- a/ggml.c
+++ b/ggml.c
@@ -9658,6 +9658,14 @@ static void ggml_compute_forward_div_f32(
             }
         }
     }
+    // Debug trace: first three floats of dst->data. The label names the enclosing
+    // function (div_f32). NOTE(review): assumes dst->data holds >= 3 f32 values — confirm.
+    {
+        const float * dbg_vals = (const float *) dst->data;
+        printf("lj.ggml_compute_forward_div = %f", dbg_vals[0]);
+        for (int k = 1; k <= 2; ++k) { printf("   %f", dbg_vals[k]); }
+        printf("\n");
+    }
 }
 
 static void ggml_compute_forward_div(
@@ -10897,6 +10905,14 @@ static void ggml_compute_forward_rms_norm_f32(
             }
         }
     }
+    // Debug trace: print the first three floats stored in dst->data on one line.
+    // NOTE(review): assumes dst->data holds at least 3 f32 values — confirm.
+    {
+        const float * dbg_vals = (const float *) dst->data;
+        printf("lj.ggml_compute_forward_rms = %f", dbg_vals[0]);
+        for (int k = 1; k <= 2; ++k) { printf("   %f", dbg_vals[k]); }
+        printf("\n");
+    }
 }
 
 static void ggml_compute_forward_rms_norm(
@@ -11423,6 +11439,14 @@ static void ggml_compute_forward_mul_mat(
             }
         }
     }
+    // Debug trace: emit dst->data[0..2] as floats, space-separated, then a newline.
+    // NOTE(review): assumes dst->data holds at least 3 f32 values — confirm.
+    {
+        const float * head = (const float *) dst->data;
+        printf("lj.ggml_compute_forward_mul_mat = %f", head[0]);
+        for (int idx = 1; idx != 3; ++idx) { printf("   %f", head[idx]); }
+        printf("\n");
+    }
 }
 
 // ggml_compute_forward_out_prod
@@ -12256,6 +12280,14 @@ static void ggml_compute_forward_soft_max_f32(
         }
 #endif
     }
+    // Debug trace: show the leading three float entries of dst->data.
+    // NOTE(review): assumes dst->data holds at least 3 f32 values — confirm.
+    {
+        const float * first = (const float *) dst->data;
+        printf("lj.ggml_compute_forward_softmax = %f", first[0]);
+        for (int j = 1; j < 3; ++j) { printf("   %f", first[j]); }
+        printf("\n");
+    }
 }
 
 static void ggml_compute_forward_soft_max(
@@ -12744,9 +12776,19 @@ static void ggml_compute_forward_rope_f32(
                 }
             }
         }
+
     }
+    // Debug trace: write the first three floats of dst->data followed by a newline.
+    // NOTE(review): assumes dst->data holds at least 3 f32 values — confirm.
+    {
+        const float * probe = (const float *) dst->data;
+        printf("lj.ggml_compute_forward_rope = %f", probe[0]);
+        for (int n = 1; n <= 2; n++) { printf("   %f", probe[n]); }
+        printf("\n");
+    }
 }
 
+
 static void ggml_compute_forward_rope_f16(
         const struct ggml_compute_params * params,
         const struct ggml_tensor * src0,
diff --git a/llama.cpp b/llama.cpp
index 2a2a0c9c6..1134ad9a5 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -1966,7 +1966,7 @@ static void llm_load_tensors(
 
                     model.layers.resize(n_layer);
 
-                    for (uint32_t i = 0; i < n_layer; ++i) {
+                    for (uint32_t i = 0; i < 1; ++i) { // NOTE(review): bound hard-coded to 1 (the removed line used n_layer) while model.layers is still resized to n_layer above — presumably debug-only; confirm before merging
                         const ggml_backend backend = int(i) < i_gpu_start ? GGML_BACKEND_CPU : LLAMA_BACKEND_OFFLOAD; // NOLINT
                         const ggml_backend backend_split = int(i) < i_gpu_start ? GGML_BACKEND_CPU : LLAMA_BACKEND_OFFLOAD_SPLIT; // NOLINT
 
@@ -2515,6 +2515,7 @@ static struct ggml_cgraph * llm_build_llama(
 
         // input for next layer
         inpL = cur;
+        if (inpL->data != nullptr) { printf(" Final inpL = %f  \n", *(float*)inpL->data); } // debug trace, skipped when no buffer is attached; NOTE(review): this runs while the graph is being built, so the value may not be computed yet — confirm
     }
 
     cur = inpL;