Spaces:

MalcomNavarro
/

hf-gaia-agents-course-MN

Sleeping

App Files Files Community

Mahynlo committed 13 days ago

Commit

0abe794

1 Parent(s): 29ccd55

Soporte para archivos Excel y audio + mejoras en procesamiento de archivos

Browse files

Files changed (4) hide show

agents.py +24 -7
requirements.txt +1 -1
test_answers.py +58 -0
tools.py +60 -0

agents.py CHANGED Viewed

@@ -163,14 +163,15 @@ IMPORTANT: GAIA uses exact string matching. Be precise!"""
         if files and len(files) > 0:
             context_parts.append("\n📁 FILES PROVIDED:")
-            from tools import read_image_text
             import requests
             for file_url in files:
                 try:
-                    # Determinar tipo de archivo
-                    if any(ext in file_url.lower() for ext in ['.jpg', '.jpeg', '.png', '.gif', '.bmp']):
-                        # Procesar imagen con OCR
                         if self.verbose:
                             print(f"  📷 Procesando imagen: {file_url}")
                         text = read_image_text(file_url)
@@ -180,8 +181,24 @@ IMPORTANT: GAIA uses exact string matching. Be precise!"""
                         else:
                             context_parts.append(f"\n⚠️  Could not extract text from image: {file_url}")
-                    elif any(ext in file_url.lower() for ext in ['.txt', '.csv', '.json', '.py', '.md']):
-                        # Procesar archivo de texto
                         if self.verbose:
                             print(f"  📄 Procesando archivo texto: {file_url}")
                         response = requests.get(file_url, timeout=30)
@@ -191,7 +208,7 @@ IMPORTANT: GAIA uses exact string matching. Be precise!"""
                         context_parts.append(f"{content}")
                     else:
-                        # Solo mencionar archivo desconocido
                         context_parts.append(f"\n📎 File available: {file_url}")
                 except Exception as e:

         if files and len(files) > 0:
             context_parts.append("\n📁 FILES PROVIDED:")
+            from tools import read_image_text, read_excel_file, read_audio_file
             import requests
             for file_url in files:
                 try:
+                    file_lower = file_url.lower()
+                    # Procesar imágenes con OCR
+                    if any(ext in file_lower for ext in ['.jpg', '.jpeg', '.png', '.gif', '.bmp']):
                         if self.verbose:
                             print(f"  📷 Procesando imagen: {file_url}")
                         text = read_image_text(file_url)
                         else:
                             context_parts.append(f"\n⚠️  Could not extract text from image: {file_url}")
+                    # Procesar archivos Excel
+                    elif any(ext in file_lower for ext in ['.xlsx', '.xls']):
+                        if self.verbose:
+                            print(f"  📊 Procesando Excel: {file_url}")
+                        content = read_excel_file(file_url)
+                        context_parts.append(f"\n📊 EXCEL DATA from {file_url}:")
+                        context_parts.append(content)
+                    # Procesar archivos de audio (limitado)
+                    elif any(ext in file_lower for ext in ['.mp3', '.wav', '.ogg', '.m4a']):
+                        if self.verbose:
+                            print(f"  🎵 Detectado audio: {file_url}")
+                        info = read_audio_file(file_url)
+                        context_parts.append(f"\n🎵 AUDIO FILE:")
+                        context_parts.append(info)
+                    # Procesar archivos de texto
+                    elif any(ext in file_lower for ext in ['.txt', '.csv', '.json', '.py', '.md']):
                         if self.verbose:
                             print(f"  📄 Procesando archivo texto: {file_url}")
                         response = requests.get(file_url, timeout=30)
                         context_parts.append(f"{content}")
                     else:
+                        # Archivo de tipo desconocido
                         context_parts.append(f"\n📎 File available: {file_url}")
                 except Exception as e:

requirements.txt CHANGED Viewed

@@ -7,6 +7,7 @@ google-generativeai>=0.8.0
 # Procesamiento de datos
 pandas>=2.0.0
 requests>=2.31.0
 # Procesamiento de imágenes (OCR)
@@ -15,4 +16,3 @@ pytesseract>=0.3.10
 # Variables de entorno
 python-dotenv>=1.0.0

 # Procesamiento de datos
 pandas>=2.0.0
+openpyxl>=3.1.0  # Para leer archivos Excel
 requests>=2.31.0
 # Procesamiento de imágenes (OCR)
 # Variables de entorno
 python-dotenv>=1.0.0

test_answers.py ADDED Viewed

	@@ -0,0 +1,58 @@

+"""
+Script for reviewing specific answers and improving accuracy
+"""
+# Answers obtained in the last run (15%), keyed by question number
+respuestas_obtenidas = {
+    1: "4",          # Mercedes Sosa albums
+    2: "4",          # Bird species video
+    3: "right",      # Reversed text ✅ (probably correct)
+    4: "Ra1#",       # Chess move
+    5: "funkmonk",   # Wikipedia dinosaur
+    6: "b,e",        # Math table ✅ (probably correct)
+    7: "indeed",     # Teal'c quote ✅ (probably correct)
+    8: "silver",     # Equine veterinarian
+    9: "bell pepper,broccoli,celery,corn,green beans,lettuce,sweet potatoes,zucchini",  # Botany list
+    10: "cornstarch,lemon juice,salt,strawberries,sugar",  # Pie ingredients
+    11: "wojciech",  # Polish actor
+    12: "55",        # Python code output
+    13: "553",       # Baseball at bats
+    14: "21,22,23,24,25,26,27,28,29,30,31,32,33,34,35",  # Homework pages
+    15: "80GSFC21N0002",  # NASA article
+    16: "None",      # Vietnamese specimens
+    17: "HAI",       # 1928 Olympics
+    18: "Fujiwara,Ogasawara",  # Baseball pitchers
+    19: "$210.00",   # Excel sales
+    20: "dmitrij",   # Malko Competition
+}
+# Observed patterns of possible problems (category -> question numbers):
+problemas_potenciales = {
+    "Mayúsculas/minúsculas": [5, 7, 11, 17, 18, 20],  # funkmonk vs FunkMonk, indeed vs Indeed
+    "Formato numérico": [1, 12, 13],  # Numbers that might be wrong
+    "Listas de items": [9, 10, 14, 18],  # Lists that might have the wrong order or items
+    "Formato especial": [15, 19],  # NASA codes, currency
+    "Análisis de archivos": [8, 12, 14, 19, 20],  # Require reading files
+}
+# Report banner: rule, title, rule (one item per output line)
+print("=" * 60, "🔍 ANÁLISIS DE RESPUESTAS DEL ÚLTIMO RUN", "=" * 60, sep="\n")
+# Hard-coded score summary followed by the section heading
+print(
+    "\n✅ Correctas confirmadas: 3/20 (15%)",
+    "🎯 Objetivo: 6/20 (30%)",
+    "❌ Necesitamos mejorar: +3 respuestas correctas\n",
+    "📋 CATEGORÍAS DE PROBLEMAS POTENCIALES:\n",
+    sep="\n",
+)
+for categoria, preguntas in problemas_potenciales.items():
+    print(f"  • {categoria}:")
+    print(f"    Preguntas: {', '.join(str(p) for p in preguntas)}")
+    respuestas = [respuestas_obtenidas[p] for p in preguntas]
+    # Show only the first three answers when the category has more than three
+    if len(respuestas) > 3:
+        print(f"    Respuestas: {respuestas[:3]}...")
+    else:
+        print(f"    Respuestas: {respuestas}")
+    print()
+print(
+    "\n💡 RECOMENDACIONES:",
+    "  1. Verificar case-sensitivity (mayúsculas/minúsculas)",
+    "  2. Mejorar procesamiento de archivos (especialmente audio/Excel)",
+    "  3. Validar formato de listas (orden alfabético vs orden original)",
+    "  4. Revisar precisión numérica en cálculos",
+    sep="\n",
+)

tools.py CHANGED Viewed

@@ -20,6 +20,66 @@ def read_image_text(url: str):
         print(f"❌ Error al leer imagen {url}: {e}")
         return ""
 def web_search(query: str):
     """Return a placeholder string standing in for a web search of *query*.
     No request is made; the text only echoes the query (the original note
     suggests it could be improved with the Wikipedia API)."""
     simulated = f"(Simulación de búsqueda web para '{query}')"
     return simulated

         print(f"❌ Error al leer imagen {url}: {e}")
         return ""
+def read_excel_file(url: str):
+    """
+    Download an Excel workbook from *url* and render it as plain text.
+    Every sheet is emitted under a "Sheet: <name>" header showing at most
+    its first 50 rows, followed by a note with the number of omitted rows.
+    Returns the rendered text. If an import fails, an "ERROR: ..." string is
+    returned; any other failure is printed and returned as an
+    "ERROR reading Excel: ..." string.
+    NOTE(review): relies on `requests` and `BytesIO` being available at
+    module level; those imports are not visible in this hunk.
+    """
+    try:
+        import pandas as pd
+        reply = requests.get(url, timeout=30)
+        reply.raise_for_status()
+        # sheet_name=None loads every sheet into a {name: DataFrame} mapping
+        workbook = pd.read_excel(BytesIO(reply.content), sheet_name=None)
+        sections = []
+        for title, frame in workbook.items():
+            sections.append(f"\n📊 Sheet: {title}")
+            # Tabular rendering of the first 50 rows only
+            preview = frame.head(50)
+            sections.append(preview.to_string(index=False))
+            # Tell the reader how many rows were left out, if any
+            omitted = len(frame) - 50
+            if omitted > 0:
+                sections.append(f"\n... ({omitted} more rows)")
+        return "\n".join(sections)
+    except ImportError:
+        return "ERROR: pandas/openpyxl not installed for Excel processing"
+    except Exception as err:
+        print(f"❌ Error al leer Excel {url}: {err}")
+        return f"ERROR reading Excel: {str(err)}"
+def read_audio_file(url: str):
+    """
+    Report basic metadata for a remote audio file without transcribing it.
+    Audio transcription needs an external API, so this function only issues
+    a HEAD request and describes what the server reports about the file.
+    Returns a multi-line note containing the URL, the Content-Type and the
+    Content-Length headers ('unknown' when a header is absent). On any
+    failure the error is printed and an "ERROR accessing audio file: ..."
+    string is returned instead.
+    NOTE(review): relies on `requests` being imported at module level; that
+    import is not visible in this hunk.
+    """
+    try:
+        # requests.head() does not follow redirects by default. Without
+        # allow_redirects=True a 3xx answer passes raise_for_status() and the
+        # headers below would describe the redirect, not the audio file.
+        response = requests.head(url, timeout=10, allow_redirects=True)
+        response.raise_for_status()
+        # Metadata as reported by the server for the final response
+        content_type = response.headers.get('Content-Type', 'unknown')
+        content_length = response.headers.get('Content-Length', 'unknown')
+        return f"""⚠️ AUDIO FILE DETECTED: {url}
+Content-Type: {content_type}
+Size: {content_length} bytes
+NOTE: Audio transcription requires external API (e.g., Whisper, Google Speech-to-Text).
+This agent cannot directly process audio content.
+Try to answer based on the question context."""
+    except Exception as e:
+        print(f"❌ Error al verificar audio {url}: {e}")
+        return f"ERROR accessing audio file: {str(e)}"
 def web_search(query: str):
     """Return a placeholder string standing in for a web search of *query*.
     No request is made; the text only echoes the query (the original note
     suggests it could be improved with the Wikipedia API)."""
     simulated = f"(Simulación de búsqueda web para '{query}')"
     return simulated