mirror of
https://github.com/aljazceru/Auto-GPT.git
synced 2025-12-23 00:44:22 +01:00
* feat: pass config to call_ai_functions in coimmands * feat: config for read_audio_from_file * feat: file operations cfg NOTE: we replaced the CFG in the command enable with TRUE b/c not sure how to handle this yet * feat: git command conversion * feat: google search * feat: image generation * feat: extract cfg from browser commands * feat: remove cfg from execute code commands * fix: file operation related tests * fix: linting * fix: tests for read_audio * fix: test error * feat: update cassettes * fix: linting * fix: test typechecking * fix: google_search errors if unexpected kw arg is passed * fix: pass config param to google search test * fix: agent commands were broken + cassettes * fix: agent test * feat: cassettes * feat: enable/disable logic for commands * fix: some commands threw errors * feat: fix tests * Add new cassettes * Add new cassettes * ci: trigger ci * Update autogpt/commands/execute_code.py Co-authored-by: Reinier van der Leer <github@pwuts.nl> * fix prompt * fix prompt + rebase * add config remove useless imports * put back CFG just for download file * lint * The signature should be mandatory in the decorator * black isort * fix: remove the CFG * fix: non typed arg * lint: type some args * lint: add types for libraries * Add new cassettes * fix: windows compatibility * fix: add config access to decorator * fix: remove twitter mention * DDGS search works at 3.0.2 version * ci: linting --------- Co-authored-by: Auto-GPT-Bot <github-bot@agpt.co> Co-authored-by: merwanehamadi <merwanehamadi@gmail.com> Co-authored-by: Reinier van der Leer <github@pwuts.nl> Co-authored-by: kinance <kinance@gmail.com>
65 lines
1.6 KiB
Python
65 lines
1.6 KiB
Python
"""Commands for converting audio to text."""
|
|
import json
|
|
from typing import TYPE_CHECKING
|
|
|
|
import requests
|
|
|
|
from autogpt.commands.command import command
|
|
from autogpt.config import Config
|
|
|
|
if TYPE_CHECKING:
|
|
from autogpt.config import Config
|
|
|
|
|
|
@command(
|
|
"read_audio_from_file",
|
|
"Convert Audio to text",
|
|
'"filename": "<filename>"',
|
|
lambda config: config.huggingface_audio_to_text_model
|
|
and config.huggingface_api_token,
|
|
"Configure huggingface_audio_to_text_model and Hugging Face api token.",
|
|
)
|
|
def read_audio_from_file(filename: str, config: Config) -> str:
|
|
"""
|
|
Convert audio to text.
|
|
|
|
Args:
|
|
filename (str): The path to the audio file
|
|
|
|
Returns:
|
|
str: The text from the audio
|
|
"""
|
|
with open(filename, "rb") as audio_file:
|
|
audio = audio_file.read()
|
|
return read_audio(audio, config)
|
|
|
|
|
|
def read_audio(audio: bytes, config: Config) -> str:
|
|
"""
|
|
Convert audio to text.
|
|
|
|
Args:
|
|
audio (bytes): The audio to convert
|
|
|
|
Returns:
|
|
str: The text from the audio
|
|
"""
|
|
model = config.huggingface_audio_to_text_model
|
|
api_url = f"https://api-inference.huggingface.co/models/{model}"
|
|
api_token = config.huggingface_api_token
|
|
headers = {"Authorization": f"Bearer {api_token}"}
|
|
|
|
if api_token is None:
|
|
raise ValueError(
|
|
"You need to set your Hugging Face API token in the config file."
|
|
)
|
|
|
|
response = requests.post(
|
|
api_url,
|
|
headers=headers,
|
|
data=audio,
|
|
)
|
|
|
|
text = json.loads(response.content.decode("utf-8"))["text"]
|
|
return f"The audio says: {text}"
|