add stub example for finetuning, based on train-text-from-scratch

2023-08-15 13:54:28 +02:00 · 2023-08-15 13:54:28 +02:00 · 5e059ace25
commit 5e059ace25
parent 316b0707f4
4 changed files with 2816 additions and 0 deletions
--- a/examples/CMakeLists.txt
+++ b/examples/CMakeLists.txt
@@ -42,6 +42,7 @@ else()
    add_subdirectory(benchmark)
    add_subdirectory(baby-llama)
    add_subdirectory(train-text-from-scratch)
    add_subdirectory(finetune)
    add_subdirectory(simple)
    add_subdirectory(embd-input)
    if (LLAMA_METAL)
--- a/examples/finetune/CMakeLists.txt
+++ b/examples/finetune/CMakeLists.txt
@@ -0,0 +1,5 @@
 # Build script for the `finetune` example: one executable compiled from
 # finetune.cpp. TARGET holds the executable's name for the commands below.
 set(TARGET finetune)
 add_executable(${TARGET}
     finetune.cpp
 )

 # Request at least C++11 when compiling this target's own sources.
 target_compile_features(${TARGET}
     PRIVATE
         cxx_std_11
 )

 # Link against `common` and `llama`, plus whatever CMAKE_THREAD_LIBS_INIT
 # expands to (presumably populated by a find_package(Threads) call made
 # elsewhere in the project -- confirm against the top-level CMakeLists.txt).
 target_link_libraries(${TARGET}
     PRIVATE
         common
         llama
         ${CMAKE_THREAD_LIBS_INIT}
 )

 # Include the executable in the install step as a runtime artifact.
 install(TARGETS ${TARGET} RUNTIME)
--- a/examples/finetune/README.md
+++ b/examples/finetune/README.md
@@ -0,0 +1,22 @@
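 # finetune
 Basic usage instructions (stub: the commands below are carried over unchanged from the train-text-from-scratch example this one is based on):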
 ```bash
 # get training data
 wget https://raw.githubusercontent.com/brunoklein99/deep-learning-notes/master/shakespeare.txt
 # train
 ./bin/train-text-from-scratch \
        --vocab-model ../models/ggml-vocab.bin \
        --ctx 64 --embd 256 --head 8 --layer 16 \
        --checkpoint-in  chk-shakespeare-256x16.bin \
        --checkpoint-out chk-shakespeare-256x16.bin \
        --model-out ggml-shakespeare-256x16-f32.bin \
        --train-data "shakespeare.txt" \
        -t 6 -b 16 -n 32 --seed 1 --adam-iter 16 \
        --print-details-interval 0 --predict 16 --use-flash
 # predict
 ./bin/main -m ggml-shakespeare-256x16-f32.bin
 ```
--- a/examples/finetune/finetune.cpp
+++ b/examples/finetune/finetune.cpp