Detect multi-byte responses and wait
This commit is contained in:
parent
36b3494332
commit
441d30811a
1 changed file with 1 addition and 1 deletion
|
@@ -96,7 +96,7 @@ specified) expect poor results""", file=sys.stderr)
|
||||||
|
|
||||||
print(file=sys.stderr)
|
print(file=sys.stderr)
|
||||||
print(f"system_info: n_threads = {self.params.n_threads} / {cpu_count()} \
|
print(f"system_info: n_threads = {self.params.n_threads} / {cpu_count()} \
|
||||||
| {llama_cpp.llama_print_system_info().decode('utf8', errors='ignore')}", file=sys.stderr)
|
| {llama_cpp.llama_print_system_info().decode('utf8')}", file=sys.stderr)
|
||||||
|
|
||||||
# determine the required inference memory per token:
|
# determine the required inference memory per token:
|
||||||
if (self.params.mem_test):
|
if (self.params.mem_test):
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue