Spaces:

Alejo760
/

heraudio

Sleeping

App Files Files Community

Alejo760 committed on Feb 17

Commit

6a77f47

verified ·

1 Parent(s): 29c5abd

Update app.py

Browse files

Files changed (1) hide show

app.py +141 -18

app.py CHANGED Viewed

@@ -4,6 +4,112 @@ import fitz  # PyMuPDF
 from groq import Groq
 from langchain_groq import ChatGroq
 # Inicialización del cliente
 api_key = os.environ.get("GROQ_API_KEY")
 if not api_key:
@@ -107,18 +213,19 @@ def process_input(audio, pdfs, current_text):
     except Exception as e:
         transcription_text = ""
         print(f"Error en transcripción de audio: {e}")
     try:
         pdf_text = extract_texts_from_pdfs(pdfs)
     except Exception as e:
         pdf_text = ""
         print(f"Error en extracción de PDFs: {e}")
-    # Now process the transcription_text and pdf_text in batches
     updated_text = current_text
-    # Define the maximum words per chunk (adjust as needed)
-    max_chunk_words = 2500  # Adjust this number based on your API limits
     for text_label, text_content in [("Audio", transcription_text), ("PDF", pdf_text)]:
         if not text_content:
             continue
@@ -128,15 +235,18 @@ def process_input(audio, pdfs, current_text):
         for chunk in text_chunks:
             transcription_chunk = chunk if text_label == "Audio" else ""
             pdf_chunk = chunk if text_label == "PDF" else ""
             organized_record = organize_clinical_record(updated_text, transcription_chunk, pdf_chunk)
             if organized_record:
                 updated_text = organized_record.content
-            else:
-                # Handle error
-                print("Error processing chunk.")
-                continue
-    return updated_text, "Información de depuración"
@@ -178,17 +288,30 @@ initial_text = """
 # Interfaz de Gradio
 with gr.Blocks(theme=theme) as iface:
-    gr.Markdown("# Aplicación de Procesamiento de Audio y PDFs")
-    iterative_output = gr.Textbox(
-        label="Registro Clínico Organizado",
-        value=initial_text,
-        lines=20
-    )
     current_state = gr.State(value=initial_text)
-    audio_filepath = gr.Audio(sources=["microphone"], type="filepath", label="Entrada de Audio")
-    pdf_files = gr.File(file_types=[".pdf"], label="Subir PDF", file_count="multiple")
-    debug_output = gr.Textbox(label="Información de Depuración", lines=10)
     # Función para capturar cambios en el iterative_output
     def on_text_change(updated_text):

 from groq import Groq
 from langchain_groq import ChatGroq
+# Weight applied to each RAID category when computing the total score.
+# The seven weights sum to 1.00, so a total built from 0-10 category scores
+# also falls in the 0-10 range.
+RAID_WEIGHTS = {
+    "Dolor": 0.21,
+    "Discapacidad Funcional": 0.16,
+    "Fatiga": 0.15,
+    "Sueño": 0.12,
+    "Bienestar Físico": 0.12,
+    "Bienestar Emocional": 0.12,
+    "Afronte": 0.12
+}
+# Prompt sent to the LLM. It is filled with str.format(), so the placeholders
+# are {patient_text}, {clinical_record} and {weights}; the literal braces of
+# the JSON example are escaped as {{ and }}.
+# The example "raid_total" must equal the weighted sum of the example scores
+# under RAID_WEIGHTS (8*0.21 + 6*0.16 + 7*0.15 + (5+6+7+4)*0.12 = 6.33);
+# keep it in sync if the weights or the example scores change.
+RAID_PROMPT_TEMPLATE = """
+Analiza la siguiente conversación y registro clínico del paciente con artritis reumatoide.
+Asigna un puntaje de 0 a 10 para cada categoría del RAID según la escala proporcionada.
+La respuesta DEBE ser SOLO un JSON válido con los puntajes y el cálculo final.
+Escalas:
+1. Dolor (0 = Ninguno, 10 = Extremo)
+2. Discapacidad Funcional (0 = Sin dificultad, 10 = Dificultad extrema)
+3. Fatiga (0 = Sin fatiga, 10 = Totalmente exhausto)
+4. Sueño (0 = Sin dificultad, 10 = Dificultad extrema)
+5. Bienestar Físico (0 = Muy bueno, 10 = Muy malo)
+6. Bienestar Emocional (0 = Muy bueno, 10 = Muy malo)
+7. Afronte (0 = Muy bien, 10 = Muy mal)
+Texto del paciente:
+{patient_text}
+Registro clínico relevante:
+{clinical_record}
+Calcula el puntaje total usando estos pesos:
+{weights}
+Respuesta JSON (ejemplo):
+{{
+    "raid_scores": {{
+        "Dolor": 8,
+        "Discapacidad Funcional": 6,
+        "Fatiga": 7,
+        "Sueño": 5,
+        "Bienestar Físico": 6,
+        "Bienestar Emocional": 7,
+        "Afronte": 4
+    }},
+    "raid_total": 6.33
+}}
+"""
+def evaluate_raid(patient_text, clinical_record):
+    """Ask the LLM to score each RAID category and return the parsed result.
+
+    The prompt is built from ``RAID_PROMPT_TEMPLATE`` and sent through
+    ``chat_groq``. The reply is parsed as JSON, taking the span from the
+    first ``{`` to the last ``}`` so surrounding chatter is tolerated.
+
+    Args:
+        patient_text: Conversation text; only the first 2000 characters
+            are placed in the prompt.
+        clinical_record: Clinical record text; truncated the same way.
+
+    Returns:
+        A dict with ``"raid_scores"`` (one numeric 0-10 score per key of
+        ``RAID_WEIGHTS``, in that key order) and ``"raid_total"`` (the
+        weighted sum, computed here rather than taken from the model).
+        On any failure the scores and total are all zero and an extra
+        ``"error"`` key holds the failure message, so callers can tell a
+        failed evaluation apart from a genuinely low score.
+    """
+    # Function-scope import keeps this block self-contained.
+    import json
+
+    try:
+        prompt = RAID_PROMPT_TEMPLATE.format(
+            patient_text=patient_text[:2000],  # keep the prompt within context limits
+            clinical_record=clinical_record[:2000],
+            weights=RAID_WEIGHTS
+        )
+        response = chat_groq.invoke(prompt)
+        # Extract the JSON object embedded in the reply.
+        content = response.content
+        start = content.find('{')
+        end = content.rfind('}') + 1
+        if start == -1 or end <= start:
+            raise ValueError("La respuesta no contiene un objeto JSON")
+        json_response = json.loads(content[start:end])
+        # Validate structure: every RAID category must be present.
+        raw_scores = json_response.get('raid_scores') if isinstance(json_response, dict) else None
+        if not isinstance(raw_scores, dict) or not all(key in raw_scores for key in RAID_WEIGHTS):
+            raise ValueError("Faltan componentes del RAID en la respuesta")
+        # Validate values: the prompt asks for numbers between 0 and 10.
+        for key in RAID_WEIGHTS:
+            value = raw_scores[key]
+            is_number = isinstance(value, (int, float)) and not isinstance(value, bool)
+            if not is_number or not 0 <= value <= 10:
+                raise ValueError(f"Puntaje inválido para {key}: {value!r}")
+        # Re-key in RAID_WEIGHTS order so consumers see a stable category order.
+        scores = {key: raw_scores[key] for key in RAID_WEIGHTS}
+        json_response['raid_scores'] = scores
+        # Do the arithmetic locally instead of trusting the model's total.
+        json_response['raid_total'] = round(
+            sum(scores[key] * weight for key, weight in RAID_WEIGHTS.items()), 2
+        )
+        return json_response
+    except Exception as e:
+        # Deliberately broad: this wraps a remote LLM call plus parsing, and
+        # the caller expects a result dict rather than an exception.
+        print(f"Error en evaluación RAID: {e}")
+        return {
+            "raid_scores": {k: 0 for k in RAID_WEIGHTS},
+            "raid_total": 0,
+            "error": str(e)
+        }
+def format_raid_results(raid_data):
+    """Render a RAID evaluation as Markdown for display.
+
+    Args:
+        raid_data: Dict with ``"raid_scores"`` (category -> score) and
+            ``"raid_total"``, or a falsy value when nothing was evaluated.
+
+    Returns:
+        Markdown text with the total, a per-category breakdown and an
+        interpretation of the total (>= 7 high, >= 4 moderate, otherwise
+        low). Returns a fixed "could not compute" message when
+        ``raid_data`` is falsy, carries a truthy ``"error"`` entry, or has
+        a total that is not a number.
+    """
+    unavailable = "No se pudo calcular el RAID score"
+    # A payload flagged with an error must not be shown as a low score.
+    if not raid_data or raid_data.get('error'):
+        return unavailable
+    scores = raid_data.get('raid_scores', {})
+    try:
+        # The total may arrive as a string when it comes from parsed JSON.
+        total = float(raid_data.get('raid_total', 0))
+    except (TypeError, ValueError):
+        return unavailable
+    # Look weights up by category name; pairing by position would mislabel
+    # the weights whenever the scores arrive in a different order.
+    breakdown = "\n".join(
+        f"- {category}: {scores[category]} (Peso: {weight*100}%)"
+        for category, weight in RAID_WEIGHTS.items()
+        if category in scores
+    )
+    interpretation = "Interpretación del puntaje:\n"
+    if total >= 7:
+        interpretation += "RAID alto: Impacto significativo en la calidad de vida. Considerar ajuste terapéutico."
+    elif total >= 4:
+        interpretation += "RAID moderado: Impacto notable. Monitoreo cercano recomendado."
+    else:
+        interpretation += "RAID bajo: Buen control sintomático. Mantener seguimiento."
+    # Join unindented paragraphs with blank lines: Markdown treats lines
+    # indented by four spaces as a code block, which would show the ** markers
+    # literally instead of rendering bold text.
+    return "\n\n".join([
+        f"**Puntaje Total RAID: {total:.2f}/10**",
+        "**Desglose:**",
+        breakdown,
+        interpretation,
+    ])
 # Inicialización del cliente
 api_key = os.environ.get("GROQ_API_KEY")
 if not api_key:
     except Exception as e:
         transcription_text = ""
         print(f"Error en transcripción de audio: {e}")
     try:
         pdf_text = extract_texts_from_pdfs(pdfs)
     except Exception as e:
         pdf_text = ""
         print(f"Error en extracción de PDFs: {e}")
     updated_text = current_text
+    raid_results = None
+    # Procesamiento en lotes
+    max_chunk_words = 2500
     for text_label, text_content in [("Audio", transcription_text), ("PDF", pdf_text)]:
         if not text_content:
             continue
         for chunk in text_chunks:
             transcription_chunk = chunk if text_label == "Audio" else ""
             pdf_chunk = chunk if text_label == "PDF" else ""
+            # Actualizar registro clínico
             organized_record = organize_clinical_record(updated_text, transcription_chunk, pdf_chunk)
             if organized_record:
                 updated_text = organized_record.content
+            # Evaluar RAID solo con el audio (conversación actual)
+            if text_label == "Audio" and chunk:
+                raid_results = evaluate_raid(chunk, updated_text)
+    return updated_text, format_raid_results(raid_results), ""
 # Interfaz de Gradio
 with gr.Blocks(theme=theme) as iface:
+    gr.Markdown("# Sistema de Evaluación Reumatológica")
+    with gr.Row():
+        iterative_output = gr.Textbox(
+            label="Registro Clínico",
+            value=initial_text,
+            lines=20,
+            elem_id="clinical_record"
+        )
+        raid_output = gr.Markdown(
+            "### Resultados RAID\nEsperando evaluación...",
+            elem_id="raid_results"
+        )
     current_state = gr.State(value=initial_text)
+    with gr.Row():
+        audio_filepath = gr.Audio(sources=["microphone"], type="filepath",
+                                label="Conversación con el Paciente")
+        pdf_files = gr.File(file_types=[".pdf"], label="Documentos Médicos",
+                          file_count="multiple")
+    debug_output = gr.Textbox(label="Registros", lines=5, visible=False)
     # Función para capturar cambios en el iterative_output
     def on_text_change(updated_text):