Spaces:

seckdaara
/

chatbot

Build error

seckdaara committed on Aug 10

Commit

fe60596

verified ·

1 Parent(s): bd9b66b

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,8 +1,15 @@
 import gradio as gr
 from llama_cpp import Llama
-model_path = "gemma-2b-it-Q4_K_M.gguf"
 llm = Llama(model_path=model_path, n_ctx=2048, n_threads=2)
 def chatbot(message, history):
@@ -15,11 +22,11 @@ def chatbot(message, history):
         "Ne fais pas de diagnostic médical et précise toujours que l'utilisateur doit consulter "
         "un médecin pour tout problème grave. Réponds avec bienveillance et clarté.\n\n"
     )
     for human, bot in history:
         prompt += f"Utilisateur: {human}\nAssistant: {bot}\n"
     prompt += f"Utilisateur: {message}\nAssistant:"
     output = llm(prompt, max_tokens=300)
     return output["choices"][0]["text"]

 import gradio as gr
+from huggingface_hub import hf_hub_download
 from llama_cpp import Llama
+# Téléchargement automatique du modèle depuis Hugging Face Hub
+model_path = hf_hub_download(
+    repo_id="google/gemma-2b-it-GGUF",
+    filename="gemma-2b-it-Q4_K_M.gguf",
+    cache_dir="./model_cache"  # dossier local pour stocker le modèle
+)
+# Chargement du modèle en CPU
 llm = Llama(model_path=model_path, n_ctx=2048, n_threads=2)
 def chatbot(message, history):
         "Ne fais pas de diagnostic médical et précise toujours que l'utilisateur doit consulter "
         "un médecin pour tout problème grave. Réponds avec bienveillance et clarté.\n\n"
     )
     for human, bot in history:
         prompt += f"Utilisateur: {human}\nAssistant: {bot}\n"
     prompt += f"Utilisateur: {message}\nAssistant:"
     output = llm(prompt, max_tokens=300)
     return output["choices"][0]["text"]