add test
commit 753782ae35 (parent 9ae4d8a96d)

5 changed files with 122 additions and 33 deletions

Makefile (6 changes)
@@ -43,6 +43,7 @@ BUILD_TARGETS = \
 
 # Binaries only useful for tests
 TEST_TARGETS = \
+    tests/test-arg-parser \
     tests/test-autorelease \
     tests/test-backend-ops \
     tests/test-chat-template \
@@ -1505,6 +1506,11 @@ run-benchmark-matmult: llama-benchmark-matmult
 
 .PHONY: run-benchmark-matmult swift
 
+tests/test-arg-parser: tests/test-arg-parser.cpp \
+    $(OBJ_ALL)
+    $(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
+    $(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
+
 tests/test-llama-grammar: tests/test-llama-grammar.cpp \
     $(OBJ_ALL)
     $(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
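With the new TEST_TARGETS entry and build rule in place, the test binary can be built and run standalone; a usage sketch, assuming the usual llama.cpp make prerequisites:

    make tests/test-arg-parser
    ./tests/test-arg-parser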

common/common.cpp

@@ -383,8 +383,8 @@ bool gpt_params_parse_ex(int argc, char ** argv, gpt_params & params, std::vecto
     const std::string arg_prefix = "--";
     llama_sampling_params & sparams = params.sparams;
 
-    std::unordered_map<std::string, const llama_arg *> arg_to_options;
-    for (const auto & opt : options) {
+    std::unordered_map<std::string, llama_arg *> arg_to_options;
+    for (auto & opt : options) {
         for (const auto & arg : opt.args) {
             arg_to_options[arg] = &opt;
         }
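Note the dropped const: to_string(bool) is declared non-const in this commit, and the catch block below calls it through this map, which would not compile via a const llama_arg *.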
@@ -404,8 +404,8 @@ bool gpt_params_parse_ex(int argc, char ** argv, gpt_params & params, std::vecto
         if (arg_to_options.find(arg) == arg_to_options.end()) {
             throw std::invalid_argument(format("error: invalid argument: %s", arg.c_str()));
         }
+        auto opt = *arg_to_options[arg];
         try {
-            auto opt = *arg_to_options[arg];
             if (opt.handler_void) {
                 opt.handler_void();
                 continue;
@@ -431,7 +431,10 @@ bool gpt_params_parse_ex(int argc, char ** argv, gpt_params & params, std::vecto
                 continue;
             }
         } catch (std::exception & e) {
-            throw std::invalid_argument(format("error: %s", e.what()));
+            throw std::invalid_argument(format(
+                "error while handling argument \"%s\": %s\n\n"
+                "usage:\n%s\n\nto show complete usage, run with -h",
+                arg.c_str(), e.what(), arg_to_options[arg]->to_string(false).c_str()));
         }
     }
 
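For illustration, an invalid value such as "-sm hello" should now fail with a message of roughly this shape (the text after the colon is whatever the option handler throws, so it will vary):

    error while handling argument "-sm": <handler message>

    usage:
    -sm,   --split-mode {none,layer,row}    how to split the model across multiple GPUs, ...

    to show complete usage, run with -h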
@@ -592,39 +595,49 @@ static std::vector<std::string> break_str_into_lines(std::string input, size_t m
     return result;
 }
 
-void gpt_params_print_usage(std::vector<llama_arg> & options) {
+std::string llama_arg::to_string(bool markdown) {
+    // params for printing to console
     const static int n_leading_spaces = 40;
     const static int n_char_per_line_help = 70; // TODO: detect this based on current console
-    auto print_options = [](std::vector<const llama_arg *> & options) {
-        std::string leading_spaces(n_leading_spaces, ' ');
-        for (const auto & opt : options) {
-            std::ostringstream ss;
-            for (const auto & arg : opt->args) {
-                if (&arg == &opt->args.front()) {
-                    ss << (opt->args.size() == 1 ? arg : format("%-7s", (arg + ",").c_str()));
-                } else {
-                    ss << arg << (&arg != &opt->args.back() ? ", " : "");
-                }
-            }
-            if (!opt->value_hint.empty()) ss << " " << opt->value_hint;
-            if (ss.tellp() > n_leading_spaces - 3) {
-                // current line is too long, add new line
-                ss << "\n" << leading_spaces;
-            } else {
-                // padding between arg and help, same line
-                ss << std::string(leading_spaces.size() - ss.tellp(), ' ');
-            }
-            const auto help_lines = break_str_into_lines(opt->help, n_char_per_line_help);
-            for (const auto & line : help_lines) {
-                ss << (&line == &help_lines.front() ? "" : leading_spaces) << line << "\n";
-            }
-            printf("%s", ss.str().c_str());
+    std::string leading_spaces(n_leading_spaces, ' ');
+
+    std::ostringstream ss;
+    if (markdown) ss << "| `";
+    for (const auto & arg : args) {
+        if (arg == args.front()) {
+            ss << (args.size() == 1 ? arg : format("%-7s", (arg + ",").c_str()));
+        } else {
+            ss << arg << (arg != args.back() ? ", " : "");
+        }
+    }
+    if (!value_hint.empty()) ss << " " << value_hint;
+    if (!markdown) {
+        if (ss.tellp() > n_leading_spaces - 3) {
+            // current line is too long, add new line
+            ss << "\n" << leading_spaces;
+        } else {
+            // padding between arg and help, same line
+            ss << std::string(leading_spaces.size() - ss.tellp(), ' ');
+        }
+        const auto help_lines = break_str_into_lines(help, n_char_per_line_help);
+        for (const auto & line : help_lines) {
+            ss << (&line == &help_lines.front() ? "" : leading_spaces) << line << "\n";
+        }
+    } else {
+        ss << "` | " << help << " |";
+    }
+    return ss.str();
+}
+
+void gpt_params_print_usage(std::vector<llama_arg> & options) {
+    auto print_options = [](std::vector<llama_arg *> & options) {
+        for (llama_arg * opt : options) {
+            printf("%s", opt->to_string(false).c_str());
         }
     };
 
-    std::vector<const llama_arg *> common_options;
-    std::vector<const llama_arg *> specific_options;
+    std::vector<llama_arg *> common_options;
+    std::vector<llama_arg *> specific_options;
     for (auto & opt : options) {
        if (opt.in_example(LLAMA_EXAMPLE_COMMON)) {
            common_options.push_back(&opt);
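Since to_string(true) emits one markdown table row per option, the same machinery can drive documentation output. A minimal sketch built only on the declarations in this diff (the table header strings are illustrative, not part of this commit):

    #include <cstdio>
    #include "common.h"

    int main(void) {
        gpt_params params;
        auto options = gpt_params_parser_init(params, LLAMA_EXAMPLE_COMMON);
        printf("| Argument | Explanation |\n");
        printf("| -------- | ----------- |\n");
        for (auto & opt : options) {
            // markdown mode yields one "| `args` | help |" row per option
            printf("%s\n", opt.to_string(true).c_str());
        }
        return 0;
    }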
@@ -1688,7 +1701,7 @@ std::vector<llama_arg> gpt_params_parser_init(gpt_params & params, llama_example
         }
     ));
     add_opt(llama_arg(
-        {"-sm", "--split-mode"}, "SPLIT_MODE",
+        {"-sm", "--split-mode"}, "{none,layer,row}",
         "how to split the model across multiple GPUs, one of:\n"
         "- none: use one GPU only\n"
         "- layer (default): split layers and KV across GPUs\n"
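Spelling out {none,layer,row} as the value hint means the accepted values now appear anywhere the option is stringified: the -h listing, markdown output, and the enriched parse error above.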

common/common.h

@@ -331,6 +331,8 @@ struct llama_arg {
     bool in_example(enum llama_example ex) {
         return examples.find(ex) != examples.end();
     }
+
+    std::string to_string(bool markdown);
 };
 
 std::vector<llama_arg> gpt_params_parser_init(gpt_params & params, llama_example ex);

tests/CMakeLists.txt

@@ -108,6 +108,7 @@ llama_test(test-tokenizer-1-spm NAME test-tokenizer-1-llama-spm ARGS ${CMAKE_CU
 #llama_test(test-tokenizer-1-spm NAME test-tokenizer-1-baichuan ARGS ${CMAKE_CURRENT_SOURCE_DIR}/../models/ggml-vocab-baichuan.gguf)
 
 # llama_target_and_test(test-double-float.cpp) # SLOW
+llama_target_and_test(test-arg-parser.cpp)
 llama_target_and_test(test-quantize-fns.cpp)
 llama_target_and_test(test-quantize-perf.cpp)
 llama_target_and_test(test-sampling.cpp)

tests/test-arg-parser.cpp (new file, 67 lines)

@@ -0,0 +1,67 @@
+#include <string>
+#include <vector>
+#include <sstream>
+
+#undef NDEBUG
+#include <cassert>
+
+#include "common.h"
+
+int main(void) {
+    gpt_params params;
+
+    printf("test-arg-parser: make sure there is no duplicated arguments in any examples\n\n");
+    for (int ex = 0; ex < LLAMA_EXAMPLE_COUNT; ex++) {
+        try {
+            gpt_params_parser_init(params, (enum llama_example)ex);
+        } catch (std::exception & e) {
+            printf("%s\n", e.what());
+            assert(false);
+        }
+    }
+
+    auto list_str_to_char = [](std::vector<std::string> & argv) -> std::vector<char *> {
+        std::vector<char *> res;
+        for (auto & arg : argv) {
+            res.push_back(const_cast<char *>(arg.data()));
+        }
+        return res;
+    };
+
+    std::vector<std::string> argv;
+    auto options = gpt_params_parser_init(params, LLAMA_EXAMPLE_COMMON);
+
+    printf("test-arg-parser: test invalid usage\n\n");
+
+    argv = {"binary_name", "-m"};
+    assert(false == gpt_params_parse(argv.size(), list_str_to_char(argv).data(), params, options));
+
+    argv = {"binary_name", "-ngl", "hello"};
+    assert(false == gpt_params_parse(argv.size(), list_str_to_char(argv).data(), params, options));
+
+    argv = {"binary_name", "-sm", "hello"};
+    assert(false == gpt_params_parse(argv.size(), list_str_to_char(argv).data(), params, options));
+
+
+    printf("test-arg-parser: test valid usage\n\n");
+
+    argv = {"binary_name", "-m", "model_file.gguf"};
+    assert(true == gpt_params_parse(argv.size(), list_str_to_char(argv).data(), params, options));
+    assert(params.model == "model_file.gguf");
+
+    argv = {"binary_name", "-t", "1234"};
+    assert(true == gpt_params_parse(argv.size(), list_str_to_char(argv).data(), params, options));
+    assert(params.cpuparams.n_threads == 1234);
+
+    argv = {"binary_name", "--verbose"};
+    assert(true == gpt_params_parse(argv.size(), list_str_to_char(argv).data(), params, options));
+    assert(params.verbosity == 1);
+
+    argv = {"binary_name", "-m", "abc.gguf", "--predict", "6789", "--batch-size", "9090"};
+    assert(true == gpt_params_parse(argv.size(), list_str_to_char(argv).data(), params, options));
+    assert(params.model == "abc.gguf");
+    assert(params.n_predict == 6789);
+    assert(params.n_batch == 9090);
+
+    printf("test-arg-parser: all tests OK\n\n");
+}
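The test is registered through llama_target_and_test above, so in a CMake build tree it should also be reachable via CTest; assuming the default test naming:

    ctest -R test-arg-parser --output-on-failure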