Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -1,8 +1,12 @@
|
|
| 1 |
import gradio as gr
|
| 2 |
-
|
|
|
|
|
|
|
| 3 |
from llama_cpp import Llama
|
|
|
|
| 4 |
|
| 5 |
-
|
|
|
|
| 6 |
|
| 7 |
history = []
|
| 8 |
history.append(["Hi there!", "Hello, how can I help you?"])
|
|
@@ -30,6 +34,3 @@ demo.launch()
|
|
| 30 |
|
| 31 |
|
| 32 |
|
| 33 |
-
|
| 34 |
-
|
| 35 |
-
|
|
|
|
| 1 |
import gradio as gr
|
| 2 |
+
import time
|
| 3 |
+
import ctypes  # to run on the C API directly
|
| 4 |
+
import llama_cpp
|
| 5 |
from llama_cpp import Llama
|
| 6 |
+
from huggingface_hub import hf_hub_download  # load from Hugging Face
|
| 7 |
|
| 8 |
+
|
| 9 |
+
llm = Llama(model_path= hf_hub_download(repo_id="TheBloke/airoboros-l2-13b-gpt4-m2.0-GGML", filename="airoboros-l2-13b-gpt4-m2.0.ggmlv3.q6_K.bin"), n_ctx=2048)  # download model from HF; n_ctx=2048 for high context length
|
| 10 |
|
| 11 |
history = []
|
| 12 |
history.append(["Hi there!", "Hello, how can I help you?"])
|
|
|
|
| 34 |
|
| 35 |
|
| 36 |
|
|
|
|
|
|
|
|
|