Refactor code for local models

2024-01-16 17:52:33 +09:00
parent 9db4810bbc
commit 1b1c6ad2fd
3 changed files with 47 additions and 10 deletions
--- a/src-tauri/src-python/main.py
+++ b/src-tauri/src-python/main.py
@@ -66,17 +66,39 @@ def stream_chat_llamacpp(item:LlamaItem):
    chunks = app.llm.create_completion(
        prompt = item.prompt,
        temperature = item.temperature,
-        top_p = item.top_p,
-        top_k = item.top_k,
-        max_tokens = item.max_tokens,
-        presence_penalty = item.presence_penalty,
-        frequency_penalty = item.frequency_penalty,
-        repeat_penalty = item.repeat_penalty,
-        stop=item.stop,
-        stream=True
+        # top_p = item.top_p,
+        # top_k = item.top_k,
+        # max_tokens = item.max_tokens,
+        # presence_penalty = item.presence_penalty,
+        # frequency_penalty = item.frequency_penalty,
+        # repeat_penalty = item.repeat_penalty,
+        # stop=item.stop,
+        stream=False,
    )
+    if(type(chunks) == str):
+        print(chunks, end="")
+        yield chunks
+        return
+    if(type(chunks) == bytes):
+        print(chunks.decode('utf-8'), end="")
+        yield chunks.decode('utf-8')
+        return
+    if(type(chunks) == dict and "choices" in chunks):
+        print(chunks["choices"][0]["text"], end="")
+        yield chunks["choices"][0]["text"]
+        return
+
    for chunk in chunks:
+        if(type(chunk) == str):
+            print(chunk, end="")
+            yield chunk
+            continue
+        if(type(chunk) == bytes):
+            print(chunk.decode('utf-8'), end="")
+            yield chunk.decode('utf-8')
+            continue
        cont:CompletionChunk  = chunk
+        print(cont)
        encoded = cont["choices"][0]["text"]
        print(encoded, end="")
        yield encoded