Final_Assignment_Template

Sleeping

mchinea committed on May 30

Commit

e71f323

1 Parent(s): f8e3605

add new tool

Files changed (2) hide show

requirements.txt CHANGED Viewed

@@ -13,3 +13,4 @@ pydub
 tavily-python
 wikipedia
 pytesseract

 tavily-python
 wikipedia
 pytesseract
+openai-whisper

tools.py CHANGED Viewed

@@ -8,6 +8,7 @@ from typing import Dict
 from pathlib import Path
 #from markitdown import MarkItDown
 from urllib.parse import urlparse
 from langchain_core.tools import tool
@@ -364,6 +365,35 @@ def extract_text_from_image(image_path: str) -> str:
         return f"Unexpected error during OCR: {str(e)}"
 level1_tools = [
     multiply,
     add,
@@ -379,5 +409,6 @@ level1_tools = [
     download_file_from_url,
     save_and_read_file,
     read_python_file,
-    extract_text_from_image
 ]

 from pathlib import Path
 #from markitdown import MarkItDown
 from urllib.parse import urlparse
+from smolagents import Tool
 from langchain_core.tools import tool
         return f"Unexpected error during OCR: {str(e)}"
+@tool
+def transcribe_audio(audio_path: str) -> str:
+    """
+    Transcribes speech from an audio file using Whisper (local).
+    Failures are reported as a returned error string; nothing is raised.
+    Args:
+        audio_path: Path to the audio file (e.g., .mp3, .wav, .m4a).
+    Returns:
+        The transcribed text (whitespace-stripped) or an error message.
+    """
+    try:
+        # Imported lazily so a missing package is reported as an error
+        # string (see the ImportError handler) instead of failing earlier.
+        import whisper
+        # NOTE(review): relies on `os` being imported at module level, which
+        # is not visible in this diff -- confirm.
+        if not os.path.exists(audio_path):
+            return f"Error: File not found at '{audio_path}'."
+        # NOTE(review): the model is loaded on every call; consider caching
+        # it if this tool is invoked repeatedly.
+        model = whisper.load_model("base")  # You can use "small", "medium", "large"
+        result = model.transcribe(audio_path)
+        # Only the "text" entry of the result is returned to the caller.
+        return result["text"].strip()
+    except ImportError:
+        return (
+            "Error: 'whisper' library is not installed. "
+            "Install it using 'pip install openai-whisper'."
+        )
+    except Exception as e:
+        # Catch-all: any other failure is turned into an error string
+        # rather than propagated to the caller.
+        return f"Error during transcription: {str(e)}"
 level1_tools = [
     multiply,
     add,
     download_file_from_url,
     save_and_read_file,
     read_python_file,
+    extract_text_from_image,
+    transcribe_audio
 ]