Detect multi-byte responses and wait

2023-04-28 12:50:30 +02:00 · 2023-04-28 12:50:30 +02:00 · 441d30811a
commit 441d30811a
parent 36b3494332
1 changed file with 1 addition and 1 deletion
--- a/examples/low_level_api_chat_cpp.py
+++ b/examples/low_level_api_chat_cpp.py
@@ -96,7 +96,7 @@ specified) expect poor results""", file=sys.stderr)
        print(file=sys.stderr)
        print(f"system_info: n_threads = {self.params.n_threads} / {cpu_count()} \
-| {llama_cpp.llama_print_system_info().decode('utf8', errors='ignore')}", file=sys.stderr)
+| {llama_cpp.llama_print_system_info().decode('utf8')}", file=sys.stderr)
        # determine the required inference memory per token:
        if (self.params.mem_test):