interstellar_ai/py/voice.py

import io

import speech_recognition as sr
from pydub import AudioSegment


class VoiceRecognition:
    """Transcribe an uploaded audio stream with the SpeechRecognition library."""

    def check_audio_format(self, file_path):
        """Report whether ``file_path`` can be decoded as Ogg audio.

        This is a diagnostic probe only: it prints what it found and never
        raises.

        Args:
            file_path: Anything ``AudioSegment.from_ogg`` accepts. Within this
                class it is called with an in-memory file-like object.

        Returns:
            bool: ``True`` if the input decoded as Ogg, ``False`` otherwise.
        """
        try:
            audio = AudioSegment.from_ogg(file_path)
        except Exception as e:
            # Deliberately broad: decoding can fail in many ways (missing
            # ffmpeg, bad container, unreadable stream) and a failed probe
            # must not abort the caller.
            print(f"Error reading audio file: {e}")
            return False

        # AudioSegment exposes no ``format`` attribute; report the decoded
        # stream properties instead so the probe can actually succeed.
        print(
            f"Audio format: ogg, {audio.channels} channel(s), "
            f"{audio.frame_rate} Hz"
        )
        return True

    def basic_recognition(self, audio, option):
        """Transcribe ``audio`` using the backend selected by ``option``.

        Args:
            audio: A readable binary stream (the original comment describes it
                as a ``FileStorage`` object). It is read once, to the end.
            option: ``"online"`` to use ``Recognizer.recognize_google_cloud``
                or ``"offline"`` to use ``Recognizer.recognize_sphinx``.

        Returns:
            The recognized text, or ``False`` when ``option`` is neither
            ``"online"`` nor ``"offline"``.

        Raises:
            Any exception raised by ``sr.AudioFile`` or the chosen recognizer
            is propagated unchanged.
        """
        print(type(audio))
        print("preparing")

        # Read the upload exactly once. Every later consumer gets its own
        # BytesIO over these bytes, so none of them sees an exhausted stream.
        audio_bytes = audio.read()

        # Debug dump of the raw upload, kept for backward compatibility.
        # NOTE(review): the bytes are written as-is, so the file is only a
        # real WAV if the upload was one, and concurrent calls overwrite it.
        with open('output.wav', 'wb') as file:
            file.write(audio_bytes)

        self.check_audio_format(io.BytesIO(audio_bytes))

        if option not in ("online", "offline"):
            print("nothing")
            return False

        r = sr.Recognizer()
        with sr.AudioFile(io.BytesIO(audio_bytes)) as source:
            print(type(source))
            print(option)
            # The recognize_* methods take AudioData, not the AudioFile
            # source, so the stream has to be recorded first.
            recorded = r.record(source)

        if option == "online":
            text = r.recognize_google_cloud(recorded)
        else:
            text = r.recognize_sphinx(recorded)

        print("recognized as: " + text)
        return text
google-help-me 2024-09-24 09:55:23 +02:00			`import speech_recognition as sr`
small fix? 2024-09-26 10:43:39 +02:00			`from pydub import AudioSegment`
google-help-me 2024-09-24 09:55:23 +02:00

			`class VoiceRecognition:`
small fix? 2024-09-26 10:43:39 +02:00			`def check_audio_format(self, file_path):`
			`try:`
			`audio = AudioSegment.from_ogg(file_path)`
			`print(f"Audio format: {audio.format}")`
			`return True`
			`except Exception as e:`
			`print(f"Error reading audio file: {e}")`
			`return False`

			`def basic_recognition(self, audio, option):`
backend audio fix woo 2024-09-26 09:52:31 +02:00			`print(type(audio))`
super cool fix 2024-09-26 09:32:14 +02:00			`print("preparing")`
google-help-me 2024-09-24 09:55:23 +02:00			`r = sr.Recognizer()`
small fix? 2024-09-26 10:43:39 +02:00
			`# Read the data from the FileStorage object`
			`audio_data = audio.read()`

			`# Write the audio data to a file`
			`with open('output.wav', 'wb') as file:`
			`file.write(audio_data)`

			`self.check_audio_format(audio)`
google-help-me 2024-09-24 09:55:23 +02:00			`if option == "online":`
backend audio fix woo 2024-09-26 09:52:31 +02:00			`with sr.AudioFile(audio) as source:`
small fix? 2024-09-26 10:43:39 +02:00			`print(type(source))`
backend audio fix woo 2024-09-26 09:52:31 +02:00			`print("online")`
super cool fix 2024-09-26 09:32:14 +02:00			`text = r.recognize_google_cloud(source)`
			`print("recognized as: " + text)`
			`return text`
Fixed the Backend and added Voice recognition API 2024-09-24 10:36:12 +02:00			`elif option == "offline":`
backend audio fix woo 2024-09-26 09:52:31 +02:00			`with sr.AudioFile(audio) as source:`
small fix? 2024-09-26 10:43:39 +02:00			`print(type(source))`
backend audio fix woo 2024-09-26 09:52:31 +02:00			`print("offline")`
super cool fix 2024-09-26 09:32:14 +02:00			`text = r.recognize_sphinx(source)`
			`print("recognized as: " + text)`
			`return text`
Fixed the Backend and added Voice recognition API 2024-09-24 10:36:12 +02:00
super cool fix 2024-09-26 09:32:14 +02:00			`print("nothing")`
Fixed the Backend and added Voice recognition API 2024-09-24 10:36:12 +02:00			`return False`