Maga222006
committed on
Commit
·
29082ec
1
Parent(s):
5cf48c0
MultiagentPersonalAssistant
Browse files
agent/file_preprocessing.py
CHANGED
|
@@ -1,6 +1,5 @@
|
|
| 1 |
from speechbrain.inference.classifiers import EncoderClassifier
|
| 2 |
from langchain_core.messages import HumanMessage
|
| 3 |
-
from agent.models import llm_image
|
| 4 |
import speech_recognition as sr
|
| 5 |
from pydub import AudioSegment
|
| 6 |
from dotenv import load_dotenv
|
|
@@ -69,6 +68,7 @@ def preprocess_audio(file_name: str):
|
|
| 69 |
|
| 70 |
|
| 71 |
async def preprocess_image(file_name: str):
|
|
|
|
| 72 |
with open(file_name, "rb") as f:
|
| 73 |
img_b64 = base64.b64encode(f.read()).decode("utf-8")
|
| 74 |
response = await llm_image.ainvoke([HumanMessage(
|
|
|
|
| 1 |
from speechbrain.inference.classifiers import EncoderClassifier
|
| 2 |
from langchain_core.messages import HumanMessage
|
|
|
|
| 3 |
import speech_recognition as sr
|
| 4 |
from pydub import AudioSegment
|
| 5 |
from dotenv import load_dotenv
|
|
|
|
| 68 |
|
| 69 |
|
| 70 |
async def preprocess_image(file_name: str):
|
| 71 |
+
from agent.models import llm_image
|
| 72 |
with open(file_name, "rb") as f:
|
| 73 |
img_b64 = base64.b64encode(f.read()).decode("utf-8")
|
| 74 |
response = await llm_image.ainvoke([HumanMessage(
|