Spaces:
Sleeping
Update app.py
app.py
CHANGED
@@ -2,8 +2,7 @@ import gradio as gr
 from huggingface_hub import InferenceClient
 import os
 
-#
-# Make sure you have done 'Request Access' on the HF page of this model!
+# Use Llama-3.1-8B-Instruct (make sure you have done 'Request Access' on HF!)
 client = InferenceClient(
     "meta-llama/Llama-3.1-8B-Instruct",
     token=os.getenv("HF_TOKEN")
@@ -11,27 +10,27 @@ client = InferenceClient(
 
 def respond(
     message,
-    history,
+    history,
     system_message,
     max_tokens,
     temperature,
     top_p,
 ):
-    # We start with the system prompt
     messages = [{"role": "system", "content": system_message}]
 
-    #
-
-
-
+    # Safe way to process the history (works in Gradio 4, 5 and 6)
+    for val in history:
+        if isinstance(val, dict):  # modern Gradio style
+            messages.append(val)
+        elif isinstance(val, (list, tuple)):  # classic Gradio style
+            if val[0]: messages.append({"role": "user", "content": val[0]})
+            if val[1]: messages.append({"role": "assistant", "content": val[1]})
 
-    # Add the user's latest question
     messages.append({"role": "user", "content": message})
 
     response = ""
 
     try:
-        # Call the AI
         for msg in client.chat_completion(
             messages,
             max_tokens=max_tokens,
@@ -43,12 +42,11 @@ def respond(
             response += token
             yield response
     except Exception as e:
-        yield f"Verbindingsfout: {str(e)}."
+        yield f"Verbindingsfout: {str(e)}. Controleer of je 'Request Access' hebt gedaan voor Llama-3.1 op Hugging Face."
 
-#
+# NO 'type' argument any more, so it never crashes with a TypeError
 demo = gr.ChatInterface(
     respond,
-    type="messages",  # THIS IS THE IMPORTANT FIX: tells Gradio to use the new message format
     additional_inputs=[
         gr.Textbox(
             value="Bismillah. You are Noor AI, a wise Islamic scholar. Answer accurately based on Quran and Sunnah. End with Wa Allahu a'la wa a'lam.",
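
The history loop added in the second hunk is the heart of this change: older Gradio ChatInterface builds pass history as (user, assistant) tuples, while newer builds pass OpenAI-style role/content dicts, and the loop folds both into one message list. A minimal standalone sketch of that normalization, with made-up sample histories for illustration:

# Standalone sketch of the history normalization used in respond() above.
# The sample histories below are illustrative, not taken from the Space.
def normalize_history(history):
    messages = []
    for val in history:
        if isinstance(val, dict):             # modern Gradio style: {"role": ..., "content": ...}
            messages.append(val)
        elif isinstance(val, (list, tuple)):  # classic Gradio style: (user_text, assistant_text)
            if val[0]: messages.append({"role": "user", "content": val[0]})
            if val[1]: messages.append({"role": "assistant", "content": val[1]})
    return messages

classic = [("Salaam", "Wa alaykum as-salaam")]
modern = [{"role": "user", "content": "Salaam"},
          {"role": "assistant", "content": "Wa alaykum as-salaam"}]
assert normalize_history(classic) == normalize_history(modern)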
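The diff elides the middle of the chat_completion call (the lines between the second and third hunks), but the `response += token` / `yield response` lines show the call is consumed as a stream. A hedged sketch of the usual huggingface_hub streaming pattern those elided lines presumably follow; stream=True and the delta-content extraction are assumptions, not shown in this commit:

import os
from huggingface_hub import InferenceClient

client = InferenceClient("meta-llama/Llama-3.1-8B-Instruct", token=os.getenv("HF_TOKEN"))

response = ""
for msg in client.chat_completion(
    [{"role": "user", "content": "Salaam"}],
    max_tokens=64,
    stream=True,        # assumption: needed for the token-by-token loop in respond()
    temperature=0.7,    # assumption: illustrative values; the real ones come from the UI sliders
    top_p=0.95,
):
    token = msg.choices[0].delta.content or ""  # assumption: standard streamed-chunk field
    response += token
print(response)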
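Because the client reads its token with os.getenv("HF_TOKEN"), the Space only works if HF_TOKEN is configured as a Space secret (or exported in the environment when running locally) for an account that has accepted the Llama-3.1 license. A small optional guard, not part of this commit, that fails at startup with a clear message instead of surfacing a Verbindingsfout on the first chat turn:

import os

# Hypothetical startup check (not in this commit): complain early if the
# gated-model token is missing instead of failing inside respond().
if not os.getenv("HF_TOKEN"):
    raise RuntimeError(
        "HF_TOKEN is not set. Add it as a Space secret, or export it locally, "
        "using a token from an account with access to meta-llama/Llama-3.1-8B-Instruct."
    )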