AlexandreScriptsMT committed on
Commit
3e76c04
·
verified ·
1 Parent(s): c78952a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +18 -3
app.py CHANGED
@@ -1,6 +1,21 @@
1
  import gradio as gr
 
2
 
3
- # Usa a API gratuita do Hugging Face para rodar o modelo sem consumir sua RAM
4
- demo = gr.load("models/Qwen/Qwen2.5-0.5B-Instruct")
 
 
5
 
6
- demo.launch()
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  import gradio as gr
2
+ from transformers import pipeline
3
 
4
# Model setup: the text-generation pipeline is created once at import time
# and placed on the CPU. The 0.5B-parameter checkpoint is chosen because,
# per the original author's note, it fits in the 16 GB of RAM of a free Space.
model_id = "Qwen/Qwen2.5-0.5B-Instruct"
pipe = pipeline(
    "text-generation",
    model=model_id,
    device_map="cpu",
)
8
 
9
def _content_to_text(content):
    """Return the plain text carried by a chat message's content.

    Handles a bare string, or a list of content parts where text parts are
    dicts with a string ``"text"`` value. Anything else (files, components,
    ``None``) yields an empty string.
    """
    if isinstance(content, str):
        return content
    if isinstance(content, list):
        texts = [
            part["text"]
            for part in content
            if isinstance(part, dict) and isinstance(part.get("text"), str)
        ]
        return "\n".join(texts)
    return ""


def _history_to_messages(history):
    """Convert a chat history into a list of ``{"role", "content"}`` dicts.

    Two history layouts are accepted:

    * pair style: ``[[user_text, assistant_text], ...]``
    * message style: ``[{"role": ..., "content": ...}, ...]``

    Entries without usable text, with an unknown role, or with an
    unrecognised shape are skipped. Extra keys on message dicts are dropped
    so that only ``role`` and ``content`` reach the model.
    """
    messages = []
    for turn in history or []:
        if isinstance(turn, dict):
            pairs = [(turn.get("role"), turn.get("content"))]
        elif isinstance(turn, (list, tuple)) and len(turn) == 2:
            pairs = [("user", turn[0]), ("assistant", turn[1])]
        else:
            continue
        for role, content in pairs:
            text = _content_to_text(content)
            if role in ("system", "user", "assistant") and text:
                messages.append({"role": role, "content": text})
    return messages


def chat_function(message, history):
    """Generate the assistant's reply to ``message``.

    Args:
        message: The text the user just sent.
        history: The earlier turns of the conversation, in either layout
            accepted by ``_history_to_messages``. May be empty or ``None``.

    Returns:
        The ``content`` of the last message in the pipeline's generated
        conversation.
    """
    # Include the earlier turns so the model keeps the conversation context;
    # sending only the newest message makes every reply stateless.
    messages = _history_to_messages(history)
    messages.append({"role": "user", "content": message})

    # The pipeline returns the whole conversation with the newly generated
    # assistant message appended as the last entry.
    results = pipe(messages, max_new_tokens=512, truncation=True)
    return results[0]["generated_text"][-1]["content"]
16
+
17
# Build the chat UI around chat_function.
demo = gr.ChatInterface(
    fn=chat_function,
    title="Meu Chat Qwen Local",
)

# Start the web server only when this file is executed as a script.
if __name__ == "__main__":
    demo.launch()