Update app.py
app.py CHANGED
@@ -3,6 +3,7 @@ from pydantic import BaseModel
 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
 import torch, gradio as gr
 
+# --- Load the model ---
 MODEL_ID = "Gopu-poss/gopu-agent-2k-fdf"
 
 tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
@@ -12,6 +13,7 @@ model = AutoModelForCausalLM.from_pretrained(
     device_map="auto"
 )
 
+# --- FastAPI ---
 app = FastAPI()
 
 class Input(BaseModel):
@@ -28,14 +30,15 @@ def infer(data: Input):
     return {"generated_text": text}
 
 # --- Gradio multimodal ---
-#
-
-
-
+# Speech-recognition pipeline (optional)
+try:
+    asr = pipeline("automatic-speech-recognition", model="openai/whisper-small")
+except Exception:
+    asr = None
 
 def gopu_chat(system_prompt, prompt, audio=None, image=None, video=None):
     # If audio is provided, transcribe it and use the transcription as the prompt
-    if audio is not None:
+    if audio is not None and asr is not None:
         transcription = asr(audio)["text"]
         prompt = transcription
 
@@ -53,11 +56,12 @@ demo = gr.Interface(
         gr.Textbox(label="Texte utilisateur"),
         gr.Audio(label="Voix (optionnel)", type="filepath"),
         gr.Image(label="Image (optionnel)", type="filepath"),
-        gr.Video(label="Vidéo (optionnel)"
+        gr.Video(label="Vidéo (optionnel)")
     ],
     outputs="text",
     title="GopuOS Agentic Endpoint",
     description="Ajoute un prompt système, parle avec ta voix, ou envoie texte/image/vidéo."
 )
 
+# Mount the Gradio UI inside FastAPI
 app = gr.mount_gradio_app(app, demo, path="/gradio")
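The main changes in this commit are the defensive Whisper pipeline load (so the Space still starts if the ASR model cannot be downloaded) and the fixed gr.Video call plus mounting the Gradio UI under the existing FastAPI app at /gradio. A minimal smoke test for the mounted app could look like the sketch below; it assumes the file is importable as app and that the model downloads succeed in the test environment (both are assumptions, not part of this commit):

# Hedged sketch: check that the Gradio UI is reachable under the FastAPI app.
# Assumes app.py is importable here and that model/pipeline downloads work.
from fastapi.testclient import TestClient
from app import app  # the FastAPI instance returned by gr.mount_gradio_app

client = TestClient(app)
response = client.get("/gradio")   # same path passed to gr.mount_gradio_app above
print(response.status_code)        # expect 200 once the UI is mounted

Wrapping the Whisper pipeline in try/except means a failed download degrades the Space to text-only input instead of crashing at startup, since gopu_chat only transcribes when asr is not None.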