From 094046077456566a140edea96af36211c267e416 Mon Sep 17 00:00:00 2001 From: Daniel Bevenius Date: Fri, 20 Sep 2024 04:41:29 +0200 Subject: [PATCH 1/3] baby-llama : rename llama_layer to baby_llama_layer This commit renames the struct llama_layer to baby_llama_layer in the baby-llama example. This is to avoid a symbol conflict with the llama_layer struct in llama.cpp. I ran into this when investigating an issue related to the baby-llama example and stepping through the code I noticed the following in `init_model`: ```console $ gdb --args ./llama-baby-llama Reading symbols from ./llama-baby-llama... (gdb) br init_model Breakpoint 1 at 0x251767: file examples/baby-llama/baby-llama.cpp, line 190. (gdb) r ... (gdb) 204 model->layers.resize(n_layer); ``` If we inspect the size of `model->layers` we see that it is 0: ```console (gdb) p model->layers.size() $1 = 0 ``` And also `n_layer` is 1: ```console (gdb) p n_layer $3 = 1 ``` And we can inspect the type of `model->layers`: ```console (gdb) ptype model->layers type = std::vector<llama_layer> ``` Now if we step over the resize function we will see something interesting: ```console (gdb) p model->layers.size() $2 = 12 ``` I also added two print statements to show the size of `n_layer` and `model->layers.size()`: ```console n_layer: 1 layers.size(): 2049638230412172414 ``` I later realized that there is a symbol conflict.
There is a `llama_layer` in llama.cpp and this object file is compiled into the `llama-baby-llama` binary: ```console /usr/bin/ccache c++ -std=c++11 -fPIC -O0 -g -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wmissing-declarations -Wmissing-noreturn -pthread -fopenmp -march=native -mtune=native -Wno-array-bounds -Wno-format-truncation -Wextra-semi -Iggml/include -Iggml/src -Iinclude -Isrc -Icommon -D_XOPEN_SOURCE=600 -D_GNU_SOURCE -D_GLIBCXX_ASSERTIONS -DGGML_USE_OPENMP -DGGML_USE_LLAMAFILE ggml/src/llamafile/sgemm.o ggml/src/ggml.o ggml/src/ggml-alloc.o ggml/src/ggml-backend.o ggml/src/ggml-quants.o ggml/src/ggml-aarch64.o src/llama.o src/llama-vocab.o src/llama-grammar.o src/llama-sampling.o src/unicode.o src/unicode-data.o common/common.o common/arg.o common/log.o common/console.o common/ngram-cache.o common/sampling.o common/train.o common/build-info.o common/json-schema-to-grammar.o examples/baby-llama/baby-llama.o -o llama-baby-llama -g ``` This could be worked around by renaming the `llama_layer` in baby-llama.cpp to `baby_llama_layer`, or use a namespace in baby-llama.cpp. I initially considered not compiling llama.o into the llama-baby-llama binary, but it looks like the baby-llama example uses `train.h` so it needs llama.cpp indirectly, so I opted to rename the struct. 
After renaming, the resize function works as expected: ```console (gdb) p model->layers.size() $1 = 0 (gdb) ptype model->layers type = std::vector<baby_llama_layer> (gdb) p model->layers.size() $2 = 1 ``` --- examples/baby-llama/baby-llama.cpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/examples/baby-llama/baby-llama.cpp b/examples/baby-llama/baby-llama.cpp index 3ce91070b..bd9359801 100644 --- a/examples/baby-llama/baby-llama.cpp +++ b/examples/baby-llama/baby-llama.cpp @@ -105,7 +105,7 @@ struct llama_hparams_lora { } }; -struct llama_layer { +struct baby_llama_layer { // normalization struct ggml_tensor * attention_norm; @@ -169,7 +169,7 @@ struct llama_model { struct ggml_tensor * norm; struct ggml_tensor * output; - std::vector<llama_layer> layers; + std::vector<baby_llama_layer> layers; }; struct llama_model_lora { From c93300f02fec5ccfa70158969c39dc0278c3280c Mon Sep 17 00:00:00 2001 From: Daniel Bevenius Date: Fri, 20 Sep 2024 15:05:00 +0200 Subject: [PATCH 2/3] squash! baby-llama : rename llama_layer to baby_llama_layer Rename baby_llama_layer to gpt_layer. --- examples/baby-llama/baby-llama.cpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/examples/baby-llama/baby-llama.cpp b/examples/baby-llama/baby-llama.cpp index bd9359801..28a40dde1 100644 --- a/examples/baby-llama/baby-llama.cpp +++ b/examples/baby-llama/baby-llama.cpp @@ -105,7 +105,7 @@ struct llama_hparams_lora { } }; -struct baby_llama_layer { +struct gpt_layer { // normalization struct ggml_tensor * attention_norm; @@ -169,7 +169,7 @@ struct llama_model { struct ggml_tensor * norm; struct ggml_tensor * output; - std::vector<baby_llama_layer> layers; + std::vector<gpt_layer> layers; }; struct llama_model_lora { From f9c2155158c4f71e9a30f65e43bbf513873b66af Mon Sep 17 00:00:00 2001 From: Daniel Bevenius Date: Fri, 20 Sep 2024 15:45:22 +0200 Subject: [PATCH 3/3] squash! baby-llama : rename llama_layer to baby_llama_layer Use an unnamed namespace to make identifiers unique to the translation unit.
--- examples/baby-llama/baby-llama.cpp | 14 +++++++++++--- 1 file changed, 11 insertions(+), 3 deletions(-) diff --git a/examples/baby-llama/baby-llama.cpp b/examples/baby-llama/baby-llama.cpp index 28a40dde1..ebce9a997 100644 --- a/examples/baby-llama/baby-llama.cpp +++ b/examples/baby-llama/baby-llama.cpp @@ -11,6 +11,8 @@ #pragma warning(disable: 4244 4267) // possible loss of data #endif +namespace { + #ifdef LLAMA_DEFAULT_RMS_EPS constexpr float rms_norm_eps = LLAMA_DEFAULT_RMS_EPS; #else @@ -105,7 +107,7 @@ struct llama_hparams_lora { } }; -struct gpt_layer { +struct llama_layer { // normalization struct ggml_tensor * attention_norm; @@ -169,7 +171,7 @@ struct llama_model { struct ggml_tensor * norm; struct ggml_tensor * output; - std::vector<gpt_layer> layers; + std::vector<llama_layer> layers; }; struct llama_model_lora { @@ -1432,7 +1434,7 @@ static struct ggml_tensor * cross_entropy_loss( ggml_new_f32(ctx, eps))))))); } -int main(int argc, char ** argv) { +int baby_llama_main(int argc, char ** argv) { if (argc < 1) { fprintf(stderr, "usage: %s\n", argv[0]); @@ -1637,3 +1639,9 @@ int main(int argc, char ** argv) { return 0; } + +} + +int main(int argc, char ** argv) { + return baby_llama_main(argc, argv); +}