default horde name and better handling for horde (+3 squashed commit)
Squashed commit: [fadfa60] better idle handling for horde worker [a3971e6] updated lite [2ca2b79] seems to not generate rubbish
This commit is contained in:
parent
c7136f03d9
commit
825e34baa3
3 changed files with 10 additions and 5 deletions
|
@ -99,7 +99,7 @@ if (LLAMA_CUBLAS)
|
||||||
if (LLAMA_CUDA_DMMV_F16)
|
if (LLAMA_CUDA_DMMV_F16)
|
||||||
set(CMAKE_CUDA_ARCHITECTURES "60;61") # needed for f16 CUDA intrinsics
|
set(CMAKE_CUDA_ARCHITECTURES "60;61") # needed for f16 CUDA intrinsics
|
||||||
else()
|
else()
|
||||||
set(CMAKE_CUDA_ARCHITECTURES "37;86") # lowest CUDA 12 standard + lowest for integer intrinsics
|
set(CMAKE_CUDA_ARCHITECTURES "37;61") # lowest CUDA 12 standard + lowest for integer intrinsics
|
||||||
endif()
|
endif()
|
||||||
endif()
|
endif()
|
||||||
message(STATUS "Using CUDA architectures: ${CMAKE_CUDA_ARCHITECTURES}")
|
message(STATUS "Using CUDA architectures: ${CMAKE_CUDA_ARCHITECTURES}")
|
||||||
|
|
File diff suppressed because one or more lines are too long
11
koboldcpp.py
11
koboldcpp.py
|
@ -978,7 +978,7 @@ def show_new_gui():
|
||||||
else:
|
else:
|
||||||
item.grid_forget()
|
item.grid_forget()
|
||||||
labels[idx].grid_forget()
|
labels[idx].grid_forget()
|
||||||
if usehorde_var.get()==1 and horde_name_var.get()=="koboldcpp" and model_var.get()!="":
|
if usehorde_var.get()==1 and (horde_name_var.get()=="koboldcpp" or horde_name_var.get()=="") and model_var.get()!="":
|
||||||
basefile = os.path.basename(model_var.get())
|
basefile = os.path.basename(model_var.get())
|
||||||
horde_name_var.set(os.path.splitext(basefile)[0])
|
horde_name_var.set(os.path.splitext(basefile)[0])
|
||||||
|
|
||||||
|
@ -1388,6 +1388,7 @@ def run_horde_worker(args, api_key, worker_name):
|
||||||
current_id = None
|
current_id = None
|
||||||
current_payload = None
|
current_payload = None
|
||||||
current_generation = None
|
current_generation = None
|
||||||
|
sleepy_counter = 0 #if this exceeds a value, worker becomes sleepy (slower)
|
||||||
print("===\nEmbedded Horde Worker '"+worker_name+"' Starting...\n(To use your own KAI Bridge/Scribe worker instead, don't set your API key)")
|
print("===\nEmbedded Horde Worker '"+worker_name+"' Starting...\n(To use your own KAI Bridge/Scribe worker instead, don't set your API key)")
|
||||||
BRIDGE_AGENT = f"KoboldCppEmbedWorker:1:https://github.com/LostRuins/koboldcpp"
|
BRIDGE_AGENT = f"KoboldCppEmbedWorker:1:https://github.com/LostRuins/koboldcpp"
|
||||||
cluster = "https://horde.koboldai.net"
|
cluster = "https://horde.koboldai.net"
|
||||||
|
@ -1424,9 +1425,13 @@ def run_horde_worker(args, api_key, worker_name):
|
||||||
time.sleep(5)
|
time.sleep(5)
|
||||||
continue
|
continue
|
||||||
if not pop["id"]:
|
if not pop["id"]:
|
||||||
#print(f"Server {cluster} has no valid generations to do for us.")
|
slp = (2 if sleepy_counter<10 else (3 if sleepy_counter<20 else 4))
|
||||||
time.sleep(3)
|
#print(f"Server {cluster} has no valid generations for us. Sleep for {slp}s")
|
||||||
|
time.sleep(slp)
|
||||||
|
sleepy_counter += 1
|
||||||
continue
|
continue
|
||||||
|
|
||||||
|
sleepy_counter = 0
|
||||||
current_id = pop['id']
|
current_id = pop['id']
|
||||||
current_payload = pop['payload']
|
current_payload = pop['payload']
|
||||||
print(f"\nJob received from {cluster} for {current_payload.get('max_length',80)} tokens and {current_payload.get('max_context_length',1024)} max context. Starting generation...")
|
print(f"\nJob received from {cluster} for {current_payload.get('max_length',80)} tokens and {current_payload.get('max_context_length',1024)} max context. Starting generation...")
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue