theotherdylan committed on
Commit
b50e8e0
·
1 Parent(s): 13dde62

switch back to ollama

Browse files
Files changed (2) hide show
  1. app.py +25 -1
  2. requirements.txt +1 -2
app.py CHANGED
@@ -1,6 +1,11 @@
1
- from transformers import pipeline
 
 
2
  import gradio
3
 
 
 
 
4
  history = []
5
 
6
 
@@ -13,8 +18,27 @@ def get_history_messages():
13
 
14
 
15
  def predict(prompt):
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
16
  print("Predict:", prompt)
 
17
  pipe = pipeline("conversational", model="cognitivecomputations/TinyDolphin-2.8-1.1b")
 
18
  response = pipe(
19
  [
20
  *get_history_messages(),
 
1
import subprocess
#from transformers import pipeline
import ollama
import gradio


# Install the Ollama runtime at container startup.
# shell=True is required here: the command is a shell pipeline
# ("curl ... | sh"); without a shell, POSIX treats the whole string as a
# single executable name and subprocess.run raises FileNotFoundError.
# check=True makes a failed install fail loudly instead of being ignored.
# NOTE(review): piping a remote script into sh is a supply-chain risk —
# consider pinning/verifying the installer.
subprocess.run(
    "curl -fsSL https://ollama.com/install.sh | sh",
    shell=True,
    check=True,
)

# Chat transcript shared with the gradio UI: list of (prompt, reply) pairs.
history = []
 
18
 
19
 
20
def predict(prompt):
    """Stream a reply to *prompt* from the local "tinydolphin" Ollama model.

    Generator for the gradio UI: appends a new (prompt, partial_reply)
    pair to the module-level ``history`` and, after every streamed chunk,
    yields ``("", history)`` so the textbox clears and the chat view
    updates live.
    """
    chunks = ollama.chat(
        model="tinydolphin",
        messages=[
            *get_history_messages(),
            {"role": "user", "content": prompt},
        ],
        stream=True,
    )
    history.append((prompt, ""))
    reply = ""
    for part in chunks:
        reply = reply + part["message"]["content"]
        # Replace the pair in place so the UI shows the growing answer.
        history[-1] = (prompt, reply)
        yield "", history
35
+
36
+
37
+ def predict_t(prompt):
38
  print("Predict:", prompt)
39
+ print("Loading model")
40
  pipe = pipeline("conversational", model="cognitivecomputations/TinyDolphin-2.8-1.1b")
41
+ print("Running pipeline")
42
  response = pipe(
43
  [
44
  *get_history_messages(),
requirements.txt CHANGED
@@ -1,4 +1,3 @@
1
- torch
2
- transformers
3
  gradio
4
  sentencepiece
 
1
+ ollama
 
2
  gradio
3
  sentencepiece