diff --git a/mp3/01/5050.mp3 b/mp3/01/10.mp3 similarity index 100% rename from mp3/01/5050.mp3 rename to mp3/01/10.mp3 diff --git a/mp3/01/5053.mp3 b/mp3/01/12.mp3 similarity index 100% rename from mp3/01/5053.mp3 rename to mp3/01/12.mp3 diff --git a/mp3/01/5043.mp3 b/mp3/01/14.mp3 similarity index 100% rename from mp3/01/5043.mp3 rename to mp3/01/14.mp3 diff --git a/mp3/01/5035.mp3 b/mp3/01/16.mp3 similarity index 100% rename from mp3/01/5035.mp3 rename to mp3/01/16.mp3 diff --git a/mp3/01/5038.mp3 b/mp3/01/17.mp3 similarity index 100% rename from mp3/01/5038.mp3 rename to mp3/01/17.mp3 diff --git a/mp3/01/5052.mp3 b/mp3/01/2.mp3 similarity index 100% rename from mp3/01/5052.mp3 rename to mp3/01/2.mp3 diff --git a/mp3/01/5051.mp3 b/mp3/01/20.mp3 similarity index 100% rename from mp3/01/5051.mp3 rename to mp3/01/20.mp3 diff --git a/mp3/01/5042.mp3 b/mp3/01/4.mp3 similarity index 100% rename from mp3/01/5042.mp3 rename to mp3/01/4.mp3 diff --git a/mp3/01/5034.mp3 b/mp3/01/6.mp3 similarity index 100% rename from mp3/01/5034.mp3 rename to mp3/01/6.mp3 diff --git a/mp3/01/5037.mp3 b/mp3/01/7.mp3 similarity index 100% rename from mp3/01/5037.mp3 rename to mp3/01/7.mp3 diff --git a/mp3/01/5013.mp3 b/mp3/01/elva.mp3 similarity index 100% rename from mp3/01/5013.mp3 rename to mp3/01/elva.mp3 diff --git a/mp3/01/5012.mp3 b/mp3/01/ett.mp3 similarity index 100% rename from mp3/01/5012.mp3 rename to mp3/01/ett.mp3 diff --git a/mp3/01/5019.mp3 b/mp3/01/fem.mp3 similarity index 100% rename from mp3/01/5019.mp3 rename to mp3/01/fem.mp3 diff --git a/mp3/01/5020.mp3 b/mp3/01/femton.mp3 similarity index 100% rename from mp3/01/5020.mp3 rename to mp3/01/femton.mp3 diff --git a/mp3/01/5044.mp3 b/mp3/01/från.mp3 similarity index 100% rename from mp3/01/5044.mp3 rename to mp3/01/från.mp3 diff --git a/mp3/01/5021.mp3 b/mp3/01/god_kväll.mp3 similarity index 100% rename from mp3/01/5021.mp3 rename to mp3/01/god_kväll.mp3 diff --git a/mp3/01/5022.mp3 b/mp3/01/god_morgon.mp3 similarity index 100% rename from mp3/01/5022.mp3 rename to mp3/01/god_morgon.mp3 diff --git a/mp3/01/5125.mp3 b/mp3/01/gå.mp3 similarity index 100% rename from mp3/01/5125.mp3 rename to mp3/01/gå.mp3 diff --git a/mp3/01/5023.mp3 b/mp3/01/hej.mp3 similarity index 100% rename from mp3/01/5023.mp3 rename to mp3/01/hej.mp3 diff --git a/mp3/01/5024.mp3 b/mp3/01/hjälp.mp3 similarity index 100% rename from mp3/01/5024.mp3 rename to mp3/01/hjälp.mp3 diff --git a/mp3/01/5046.mp3 b/mp3/01/hur.mp3 similarity index 100% rename from mp3/01/5046.mp3 rename to mp3/01/hur.mp3 diff --git a/mp3/01/5027.mp3 b/mp3/01/ja.mp3 similarity index 100% rename from mp3/01/5027.mp3 rename to mp3/01/ja.mp3 diff --git a/mp3/01/5026.mp3 b/mp3/01/jag_föddes.mp3 similarity index 100% rename from mp3/01/5026.mp3 rename to mp3/01/jag_föddes.mp3 diff --git a/mp3/01/5028.mp3 b/mp3/01/komma.mp3 similarity index 100% rename from mp3/01/5028.mp3 rename to mp3/01/komma.mp3 diff --git a/mp3/01/5029.mp3 b/mp3/01/leva.mp3 similarity index 100% rename from mp3/01/5029.mp3 rename to mp3/01/leva.mp3 diff --git a/mp3/01/5008.mp3 b/mp3/01/lovet.mp3 similarity index 100% rename from mp3/01/5008.mp3 rename to mp3/01/lovet.mp3 diff --git a/mp3/01/5007.mp3 b/mp3/01/namnet.mp3 similarity index 100% rename from mp3/01/5007.mp3 rename to mp3/01/namnet.mp3 diff --git a/mp3/01/5030.mp3 b/mp3/01/nej.mp3 similarity index 100% rename from mp3/01/5030.mp3 rename to mp3/01/nej.mp3 diff --git a/mp3/01/5032.mp3 b/mp3/01/nio.mp3 similarity index 100% rename from mp3/01/5032.mp3 rename to mp3/01/nio.mp3 diff --git a/mp3/01/5033.mp3 b/mp3/01/nitton.mp3 similarity index 100% rename from mp3/01/5033.mp3 rename to mp3/01/nitton.mp3 diff --git a/mp3/01/5003.mp3 b/mp3/01/på_återseende.mp3 similarity index 100% rename from mp3/01/5003.mp3 rename to mp3/01/på_återseende.mp3 diff --git a/mp3/01/5036.mp3 b/mp3/01/se.mp3 similarity index 100% rename from mp3/01/5036.mp3 rename to mp3/01/se.mp3 diff --git a/mp3/01/5039.mp3 b/mp3/01/senare.mp3 similarity index 100% rename from mp3/01/5039.mp3 rename to mp3/01/senare.mp3 diff --git a/mp3/01/5004.mp3 b/mp3/01/sverige.mp3 similarity index 100% rename from mp3/01/5004.mp3 rename to mp3/01/sverige.mp3 diff --git a/mp3/01/5005.mp3 b/mp3/01/tack.mp3 similarity index 100% rename from mp3/01/5005.mp3 rename to mp3/01/tack.mp3 diff --git a/mp3/01/5009.mp3 b/mp3/01/tre.mp3 similarity index 100% rename from mp3/01/5009.mp3 rename to mp3/01/tre.mp3 diff --git a/mp3/01/5040.mp3 b/mp3/01/treffa.mp3 similarity index 100% rename from mp3/01/5040.mp3 rename to mp3/01/treffa.mp3 diff --git a/mp3/01/5010.mp3 b/mp3/01/tretton.mp3 similarity index 100% rename from mp3/01/5010.mp3 rename to mp3/01/tretton.mp3 diff --git a/mp3/01/5031.mp3 b/mp3/01/trevlig.mp3 similarity index 100% rename from mp3/01/5031.mp3 rename to mp3/01/trevlig.mp3 diff --git a/mp3/01/5014.mp3 b/mp3/01/tyskland.mp3 similarity index 100% rename from mp3/01/5014.mp3 rename to mp3/01/tyskland.mp3 diff --git a/mp3/01/5015.mp3 b/mp3/01/ursäkta.mp3 similarity index 100% rename from mp3/01/5015.mp3 rename to mp3/01/ursäkta.mp3 diff --git a/mp3/01/5049.mp3 b/mp3/01/var.mp3 similarity index 100% rename from mp3/01/5049.mp3 rename to mp3/01/var.mp3 diff --git a/mp3/01/5045.mp3 b/mp3/01/varför.mp3 similarity index 100% rename from mp3/01/5045.mp3 rename to mp3/01/varför.mp3 diff --git a/mp3/01/5047.mp3 b/mp3/01/välkommen.mp3 similarity index 100% rename from mp3/01/5047.mp3 rename to mp3/01/välkommen.mp3 diff --git a/mp3/01/5006.mp3 b/mp3/01/året.mp3 similarity index 100% rename from mp3/01/5006.mp3 rename to mp3/01/året.mp3 diff --git a/mp3/01/5002.mp3 b/mp3/01/årton.mp3 similarity index 100% rename from mp3/01/5002.mp3 rename to mp3/01/årton.mp3 diff --git a/mp3/01/5001.mp3 b/mp3/01/åtta.mp3 similarity index 100% rename from mp3/01/5001.mp3 rename to mp3/01/åtta.mp3 diff --git a/mp3/02/5054.mp3 b/mp3/02/5054.mp3 deleted file mode 100644 index 9bd5c8d..0000000 Binary files a/mp3/02/5054.mp3 and /dev/null differ diff --git a/mp3/02/5055.mp3 b/mp3/02/5055.mp3 deleted file mode 100644 index 1374c92..0000000 Binary files a/mp3/02/5055.mp3 and /dev/null differ diff --git a/mp3/02/5056.mp3 b/mp3/02/5056.mp3 deleted file mode 100644 index b2aa86a..0000000 Binary files a/mp3/02/5056.mp3 and /dev/null differ diff --git a/mp3/på_återseende.mp3 b/mp3/på_återseende.mp3 deleted file mode 100644 index d4c9c82..0000000 Binary files a/mp3/på_återseende.mp3 and /dev/null differ diff --git a/mp3/toRightName.py b/mp3/toRightName.py new file mode 100644 index 0000000..13235cf --- /dev/null +++ b/mp3/toRightName.py @@ -0,0 +1,53 @@ +import sys + +import whisper +import os +import re +import ssl + + +def transcribe_and_fix(mp3_file): + # 1. Whisper Modell laden (Base reicht für einzelne Wörter meist aus) + + # 1. SSL-Check für Standard-Python-Tools deaktivieren + if (not os.environ.get('PYTHONHTTPSVERIFY', '') and + getattr(ssl, '_create_unverified_context', None)): + ssl._create_default_https_context = ssl._create_unverified_context + + # 2. Umgebungsvariable setzen, die viele Bibliotheken (wie certifi) erkennen + os.environ['CURL_CA_BUNDLE'] = "" + os.environ['PYTHONHTTPSVERIFY'] = "0" + + model = whisper.load_model("large-v3") + + directory = os.path.dirname(mp3_file) + + #ssl._create_default_https_context = ssl._create_unverified_context + + print("Analysiere Audio...") + # 'language="sv"' zwingt Whisper auf Schwedisch + result = model.transcribe(mp3_file, language="sv", fp16=False) + text = result['text'].strip() + + # 2. Fehlerhafte Zeichen & Leerzeichen korrigieren + # Wir entfernen alles, was kein Buchstabe oder Zahl ist + # und ersetzen Leerzeichen durch Unterstriche + clean_text = re.sub(r'[^\w\säöåÄÖÅ]', '', text) # Behält schwedische Zeichen + clean_text = clean_text.replace(" ", "_").lower() + + if not clean_text: + print("Konnte keinen Text extrahieren.") + return + + new_filename = f"{clean_text}.mp3" + + # 3. Umbenennen + try: + os.rename(mp3_file, directory +"/" + new_filename) + print(f"Erfolg: '{mp3_file}' -> '{new_filename}'") + except Exception as e: + print(f"Fehler beim Umbenennen: {e}") + + +# Testlauf +transcribe_and_fix(sys.argv[1]) \ No newline at end of file diff --git a/mp3/åtta.mp3 b/mp3/åtta.mp3 deleted file mode 100644 index 58be7ad..0000000 Binary files a/mp3/åtta.mp3 and /dev/null differ diff --git a/mp3cut/mp3cut.py b/mp3cut/mp3cut.py index 37d8138..ca40647 100644 --- a/mp3cut/mp3cut.py +++ b/mp3cut/mp3cut.py @@ -3,13 +3,13 @@ import speech_recognition as sr import os # Lade die MP3-Datei und konvertiere sie zu WAV -audio = AudioSegment.from_mp3("20250614.mp3") +audio = AudioSegment.from_mp3("/Users/svenriwoldt/PycharmProjects/CSV2ANKI/mp3/01/5002.mp3") audio = audio.set_channels(2).set_frame_rate(48000) # Mono & 16kHz für bessere Erkennung BUFFER_BEFORE = 300 BUFFER_AFTER = 300 # Stille erkennen mit optimierten Werten -silent_ranges = silence.detect_silence(audio, min_silence_len=400, silence_thresh=-45) +silent_ranges = silence.detect_silence(audio, min_silence_len=400, silence_thresh=0) silent_ranges = [(start, end) for start, end in silent_ranges if end - start > 200] # Kurze Pausen filtern # Wortsegmente bestimmen