Update app.py
app.py CHANGED
@@ -4,18 +4,24 @@ from ctransformers import AutoModelForCausalLM
 # Load the GGUF model
 model = AutoModelForCausalLM.from_pretrained(
     "tinyllama-1.1b-chat-v1.0.Q4_0.gguf",
-    model_type="llama"
+    model_type="llama",
+    gpu_layers=0,
+    threads=4
 )
 
 def chat_fn(message, history):
-
+    prompt = (
+        "<|system|>Eres un asistente útil especializado en trámites y administración en España.<|end|>\n"
+        f"<|user|>{message}<|end|>\n"
+        "<|assistant|>"
+    )
+
     output = model(
-
+        prompt,
         max_new_tokens=200,
         temperature=0.7
     )
 
-    # Convert to a string just to be safe
     if isinstance(output, bytes):
         output = output.decode("utf-8", errors="ignore")
 
@@ -29,4 +35,3 @@ demo = gr.ChatInterface(
 
 demo.launch()
 
-
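For context, here is a minimal sketch of what the complete app.py should look like after this commit. The diff only shows the two hunks above, so the gradio import, the function's return statement, and the arguments to gr.ChatInterface(...) are assumptions inferred from the hunk context lines, not part of the commit itself.

import gradio as gr
from ctransformers import AutoModelForCausalLM

# Load the GGUF model on CPU (gpu_layers=0) with 4 inference threads
model = AutoModelForCausalLM.from_pretrained(
    "tinyllama-1.1b-chat-v1.0.Q4_0.gguf",
    model_type="llama",
    gpu_layers=0,
    threads=4
)

def chat_fn(message, history):
    # Wrap the user message in the chat template this commit introduces;
    # before the change, model() was called with no prompt at all.
    prompt = (
        "<|system|>Eres un asistente útil especializado en trámites y administración en España.<|end|>\n"
        f"<|user|>{message}<|end|>\n"
        "<|assistant|>"
    )

    output = model(
        prompt,
        max_new_tokens=200,
        temperature=0.7
    )

    # ctransformers returns str, but decode defensively if bytes appear
    if isinstance(output, bytes):
        output = output.decode("utf-8", errors="ignore")

    return output  # assumed: the return statement is not visible in the diff

# Assumed arguments: the hunk context only shows "demo = gr.ChatInterface("
demo = gr.ChatInterface(chat_fn)

demo.launch()

One caveat on the generation call: with no stop sequence, the model can keep generating past the assistant turn. ctransformers accepts one via the stop parameter, e.g. model(prompt, max_new_tokens=200, temperature=0.7, stop=["<|end|>"]). It is also worth double-checking the template itself, since TinyLlama-1.1B-Chat-v1.0 was tuned on a Zephyr-style format that ends turns with </s> rather than <|end|>.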