app_local.py  CHANGED  (+6 -5)
@@ -17,7 +17,7 @@ llm_model = None
 def respond(
     message,
     history: list[tuple[str, str]],
-
+    selected_model,
     system_message,
     max_tokens,
     temperature,
@@ -29,16 +29,17 @@ def respond(
 
     global llm
     global llm_model
-
-
+
+    # Check if the selected model has changed
+    if llm is None or llm_model != selected_model:
         llm = Llama(
-            model_path=f"models/{
+            model_path=f"models/{selected_model}",
            flash_attn=True,
            n_gpu_layers=81,
            n_batch=1024,
            n_ctx=8192,
        )
-        llm_model =
+        llm_model = selected_model
 
    provider = LlamaCppPythonProvider(llm)
 
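Taken together, the two hunks make respond() lazy-load the GGUF weights: the Llama instance is rebuilt only when no model is loaded yet or the dropdown selection has changed, so repeated messages to the same model skip the load cost. A minimal standalone sketch of that pattern (the helper name get_llm is illustrative, not part of the Space's code):

from llama_cpp import Llama

llm = None        # cached Llama instance
llm_model = None  # model filename the cache was built from

def get_llm(selected_model):
    # Reload the weights only when nothing is loaded yet or the
    # selection no longer matches the cached model.
    global llm, llm_model
    if llm is None or llm_model != selected_model:
        llm = Llama(
            model_path=f"models/{selected_model}",
            flash_attn=True,
            n_gpu_layers=81,
            n_batch=1024,
            n_ctx=8192,
        )
        llm_model = selected_model
    return llm

# Usage inside respond(); the filename is a placeholder, not from the Space:
# provider = LlamaCppPythonProvider(get_llm("example-model.Q4_K_M.gguf"))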
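On the UI side, the new selected_model argument presumably arrives from a Gradio component passed as the first additional input to the chat handler. A hedged sketch of that wiring, assuming gr.ChatInterface and placeholder model filenames; the real Space may pass further sampling parameters after temperature:

import gradio as gr

demo = gr.ChatInterface(
    respond,  # the handler patched above
    additional_inputs=[
        # Components here are appended to (message, history) in order,
        # matching respond()'s new signature.
        gr.Dropdown(
            choices=["model-a.Q4_K_M.gguf", "model-b.Q4_K_M.gguf"],  # placeholder filenames under models/
            value="model-a.Q4_K_M.gguf",
            label="Model",
        ),
        gr.Textbox(value="You are a helpful assistant.", label="System message"),
        gr.Slider(minimum=1, maximum=8192, value=2048, step=1, label="Max tokens"),
        gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.1, label="Temperature"),
    ],
)

if __name__ == "__main__":
    demo.launch()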