# Source code for steamship.agents.tools.audio_transcription.whisper_speech_to_text_tool

"""Tool for generating images."""
from steamship import Steamship
from steamship.agents.llms import OpenAI
from steamship.agents.tools import AudioBlockifierTool
from steamship.agents.utils import with_llm
from steamship.utils.repl import ToolREPL


class WhisperSpeechToTextTool(AudioBlockifierTool):
    """Tool to generate text from spoken audio at a URL.

    This subclass defines no methods of its own; it only sets the descriptive
    metadata and the blockifier plugin handle, and relies on
    ``AudioBlockifierTool`` for everything else.
    """

    name: str = "WhisperSpeechToTextTool"
    human_description: str = "Generates text from spoken audio."
    # NOTE(review): presumably this text is what the agent's LLM reads when
    # deciding whether to call the tool -- confirm against the Tool base class.
    agent_description: str = (
        "Used to generate text from spoken audio at a URL. Only use if the user has asked directly for a text version of an audio file. "
        "The input is a URL. "
        "The output is the text from that URL."
    )
    # Handle of the blockifier plugin this tool is configured with.
    blockifier_plugin_handle: str = "whisper-s2t-blockifier"
if __name__ == "__main__":
    # Manual smoke test: print a sample audio URL, then run the tool in a REPL.
    print(
        "You can try: https://d3ctxlq1ktw2nl.cloudfront.net/staging/2023-4-14/2ba758be-d152-f80d-4ef0-9c63789e556b.mp3"
    )
    tool = WhisperSpeechToTextTool()
    # Try on: https://anchor.fm/s/e1369b4c/podcast/play/70381739/https%3A%2F%2Fd3ctxlq1ktw2nl.cloudfront.net%2Fstaging%2F2023-4-14%2Fda96d64d-3c27-3e84-eb63-d5bc55eaf52e.mp3
    # The REPL runs against the client yielded by Steamship.temporary_workspace().
    with Steamship.temporary_workspace() as client:
        ToolREPL(tool).run_with_client(client=client, context=with_llm(llm=OpenAI(client=client)))