Merge pull request 'Updates' (#21 ) from React-Group/interstellar_ai:main into main

Reviewed-on: https://interstellardevelopment.org/code/code/sageTheDm/interstellar_ai/pulls/21
whisper is better
2024-09-26 12:32:17 +02:00 · 2024-09-26 11:01:15 +02:00 · 2024-09-26 10:43:47 +02:00 · 2024-09-26 10:43:39 +02:00 · 2024-09-26 09:55:40 +02:00
3 changed files with 10 additions and 30 deletions
--- a/py/api.py
+++ b/py/api.py
@@ -99,16 +99,9 @@ class API:

        @self.app.route('/interstellar_ai/api/voice_recognition', methods=['POST'])
        def voice_recognition():
-            print(request.args)
-            recog_type = request.form.get('type')
-            print(recog_type)
            audio = request.files.get('audio')
-            option = request.form.get('option')
-            if recog_type == "basic":
-                text = self.voice.basic_recognition(audio, option)
-                return jsonify({'status': 200, 'response': text})
-            else:
-                return jsonify({'status': 401, 'response': "Invalid type"})
+            text = self.voice.recognition(audio)
+            return jsonify({'status': 200, 'response': text})

        @self.app.route('/interstellar_ai/api/weather', methods=['POST'])
        def get_weather():
--- a/py/requirements.txt
+++ b/py/requirements.txt
@@ -14,3 +14,4 @@ pycouchdb
 pyttsx3
 pip-licenses
 openai-whisper
+pydub
--- a/py/voice.py
+++ b/py/voice.py
@@ -1,24 +1,10 @@
-import speech_recognition as sr
+import whisper


 class VoiceRecognition:
    @staticmethod
-    def basic_recognition(audio, option):
-        print(type(audio))
-        print("preparing")
-        r = sr.Recognizer()
-        if option == "online":
-            with sr.AudioFile(audio) as source:
-                print("online")
-                text = r.recognize_google_cloud(source)
-                print("recognized as: " + text)
-                return text
-        elif option == "offline":
-            with sr.AudioFile(audio) as source:
-                print("offline")
-                text = r.recognize_sphinx(source)
-                print("recognized as: " + text)
-                return text
-
-        print("nothing")
-        return False
+    def recognition(audio):
+        model = whisper.load_model("base")
+        result = model.transcribe(audio)
+        print(result["text"])
+        return result["text"]
Author	SHA1	Message	Date
sageTheDm	a07961d65d	Merge pull request 'Updates' (#21 ) from React-Group/interstellar_ai:main into main Reviewed-on: https://interstellardevelopment.org/code/code/sageTheDm/interstellar_ai/pulls/21	2024-09-26 12:32:17 +02:00
Patrick_Pluto	ab12b796ec	whisper is better	2024-09-26 11:01:15 +02:00
Patrick_Pluto	8cc9b1b015	Merge branch 'main' of interstellardevelopment.org:React-Group/interstellar_ai	2024-09-26 10:43:47 +02:00
Patrick_Pluto	58d1a68bac	small fix?	2024-09-26 10:43:39 +02:00
Patrick	9d27354c1e	Merge pull request 'models are broken' (#52 ) from sageTheDm/interstellar_ai:main into main Reviewed-on: https://interstellardevelopment.org/code/code/React-Group/interstellar_ai/pulls/52	2024-09-26 09:55:40 +02:00