Initial

2026-03-10 05:51:43 +01:00 · 2018-08-15 20:56:35 +02:00
commit 0eb65e4772
8 changed files with 51 additions and 0 deletions
--- a/.plan.txt.swp
+++ b/.plan.txt.swp
--- a/plan.txt
+++ b/plan.txt
@@ -0,0 +1,15 @@
+Smartphone:
+    - record
+    - play
+    - send to server
+    - receive text from server (?)
+
+Server:
+    - receive from smartphone
+    - use google api for recognition
+    - process/format result (i.e. templating)
+    - send resulting text
+
+Computer/Client:
+    - receive text
+    - place it somewhere
--- a/python-server/.main.py.swp
+++ b/python-server/.main.py.swp
--- a/python-server/main.py
+++ b/python-server/main.py
@@ -0,0 +1,8 @@
+#!/usr/bin/python3
+import s_input
+import sys
+
+if __name__ == "__main__":
+    path = sys.argv[1]
+    print("AudioFile: {}".format(path))
+    print(s_input.analyse_file_by_path(path))
--- a/python-server/s_input.py
+++ b/python-server/s_input.py
@@ -0,0 +1,6 @@
+import speech
+
+def analyse_file_by_path(file_path):
+    transcript = speech.analyse(file_path)
+
+    return transcript
--- a/python-server/speech.py
+++ b/python-server/speech.py
@@ -0,0 +1,17 @@
+import speech_recognition as spr
+def analyse(file_path):
+    ''' returns the transcripted audio, or None if the analysis fails '''
+    recognizer = spr.Recognizer()
+    with sr.AudioFile(file_path) as source:
+        audio = r.record(source)
+
+    try:
+        string = r.recognize_google(audio)
+    except spr.UnknownValueError:
+        log.log("Audio file is broken or not an audio file")
+        return None
+    except spr.RequestError as e:
+        log.log("Could not connect to google API: {}".format(e))
+        return None
+
+    return string
--- a/setup.sh
+++ b/setup.sh
@@ -0,0 +1,5 @@
+apt-get install python python-all-dev python-pip build-essential swig git libpulse-dev libasound2-dev
+pip3 install wheel
+pip3 install google-cloud-speech
+pip3 install pocketsphin
+pip3 install SpeechRecognition
--- a/test-data/das_ist_ein_test.wav
+++ b/test-data/das_ist_ein_test.wav