This api transcribes up to 1 min of audio to text. You'll need a google cloud account.
https://cloud.google.com/translate/docs/
#!/usr/bin/env python3
import speech_recognition as sr
from os import path
audio = "K:\\random\\part4.wav"
r = sr.Recognizer() #recognizer object, we can use various services with this including google, microsoft and ibm watson
with sr.AudioFile(audio) as source:
audio = r.record(source) # read the entire audio file
# Google Cloud Speech Recognition
Whisper = r"""<entire contents of json credentials from google>"""
try:
ish = r.recognize_google_cloud(audio, credentials_json=Whisper)
print("Transcribed:... " +ish)
#canwehassavedfile!
file = open("K:\\random\\part4.txt","w")
file.write(ish)
file.close()
except sr.RequestError as e:
print("Sorry, can't help you. ; {0}".format(e))
except sr.UnknownValueError:
print("What was that?")