noch kein weiches (fade) Ende und die Spracherkennung geht gar nicht
This commit is contained in:
@@ -3,7 +3,7 @@ import speech_recognition as sr
|
||||
import os
|
||||
|
||||
# Lade die MP3-Datei und konvertiere sie zu WAV
|
||||
audio = AudioSegment.from_mp3("input.mp3")
|
||||
audio = AudioSegment.from_mp3("dreiWorte.mp3")
|
||||
audio = audio.set_channels(1).set_frame_rate(16000) # Mono & 16kHz für bessere Erkennung
|
||||
|
||||
# Stille erkennen mit optimierten Werten
|
||||
@@ -25,21 +25,23 @@ recognizer = sr.Recognizer()
|
||||
for i, (start, end) in enumerate(word_segments):
|
||||
segment = audio[start:end]
|
||||
temp_file = f"temp_word_{i+1}.wav"
|
||||
print(temp_file)
|
||||
segment.export(temp_file, format="wav")
|
||||
|
||||
word_text = ""
|
||||
# Spracherkennung durchführen
|
||||
with sr.AudioFile(temp_file) as source:
|
||||
audio_data = recognizer.record(source)
|
||||
try:
|
||||
word_text = recognizer.recognize_google(audio_data, language="de-DE")
|
||||
word_text = recognizer.recognize_google(audio_data, language="sv-SV") # Schwedisch
|
||||
print("Erkanntes Wort:", word_text)
|
||||
except sr.UnknownValueError:
|
||||
try:
|
||||
word_text = recognizer.recognize_sphinx(audio_data, language="de-DE")
|
||||
except sr.UnknownValueError:
|
||||
word_text = f"unbekannt_{i+1}"
|
||||
print("Google konnte nichts erkennen.")
|
||||
except Exception as e:
|
||||
print(f"Fehler: {e}")
|
||||
|
||||
word_text = word_text.replace(" ", "_") # Leerzeichen durch Unterstrich ersetzen
|
||||
final_file = f"{word_text}.wav"
|
||||
#word_text = word_text.replace(" ", "_") # Leerzeichen durch Unterstrich ersetzen
|
||||
#final_file = f"{word_text}.wav"
|
||||
final_file = "1.wav"
|
||||
os.rename(temp_file, final_file)
|
||||
|
||||
print(f"Wort {i+1}: {word_text} -> Gespeichert als {final_file}")
|
||||
|
||||
Reference in New Issue
Block a user