56 lines
2.3 KiB
Python
56 lines
2.3 KiB
Python
import subprocess
|
|
import speech_recognition as sr
|
|
import os
|
|
from functions.loging import loging
|
|
|
|
|
|
class Converter:
|
|
def __init__(self, path_to_file: str, message, language: str = "ru-RU"):
|
|
self.language = language
|
|
self.path_to_file = path_to_file
|
|
self.service = None
|
|
self.message = message
|
|
|
|
def audio_to_text(self) -> str:
|
|
try:
|
|
try:
|
|
import mutagen
|
|
f = mutagen.File(self.path_to_file)
|
|
if float(f.info.length) >= 30.0:
|
|
self.service = "google"
|
|
return self.google()
|
|
else:
|
|
self.service = "yandex"
|
|
return self.yandex()
|
|
except:
|
|
return self.google()
|
|
except sr.RequestError:
|
|
return "Толи файл слишком большой, толи с ботом что-то случилось"
|
|
|
|
def google(self) -> str:
|
|
subprocess.run(['ffmpeg', '-v', 'quiet', '-i', self.path_to_file, self.path_to_file.replace(".ogg", ".wav")])
|
|
try:
|
|
os.remove(self.path_to_file)
|
|
wav_file = self.path_to_file.replace(".ogg", ".wav")
|
|
r = sr.Recognizer()
|
|
with sr.AudioFile(wav_file) as source:
|
|
audio = r.record(source)
|
|
r.adjust_for_ambient_noise(source)
|
|
try:
|
|
response = "google\n\n" + r.recognize_google(audio, language=self.language)
|
|
loging(self.message, "google", wav_file, response)
|
|
os.remove(wav_file)
|
|
return response
|
|
except sr.UnknownValueError:
|
|
return "google\n\n Слова не распознаны, вы что вообще мне впихнуть пытаетесь"
|
|
except FileNotFoundError:
|
|
return "Толи файл слишком большой, толи с ботом что-то случилось"
|
|
|
|
def yandex(self) -> str:
|
|
from speechkit import ShortAudioRecognition, Session
|
|
reg = ShortAudioRecognition(Session.from_api_key("AQVN3xNJamAFP4_FS6Gis0Uud0vONFk24umBSXvh"))
|
|
response = "yandex\n\n" + reg.recognize(open(str(self.path_to_file), str('rb')).read())
|
|
loging(self.message, "yandex", self.path_to_file, response)
|
|
os.remove(self.path_to_file)
|
|
return response
|