redfr
/

easyGUI

Model card Files Files and versions Community

Blane187 committed on Jul 16, 2024

Commit

ad8a960

verified ·

1 Parent(s): e52d4e5

Update infer/lib/audio.py

Browse files

Files changed (1) hide show

infer/lib/audio.py +56 -57

infer/lib/audio.py CHANGED Viewed

@@ -1,57 +1,56 @@
-import platform, os
-import ffmpeg
-import numpy as np
-import av
-from io import BytesIO
-def wav2(i, o, format):
-    inp = av.open(i, "rb")
-    if format == "m4a":
-        format = "mp4"
-    out = av.open(o, "wb", format=format)
-    if format == "ogg":
-        format = "libvorbis"
-    if format == "mp4":
-        format = "aac"
-    ostream = out.add_stream(format)
-    for frame in inp.decode(audio=0):
-        for p in ostream.encode(frame):
-            out.mux(p)
-    for p in ostream.encode(None):
-        out.mux(p)
-    out.close()
-    inp.close()
-def load_audio(file, sr):
-    try:
-        # https://github.com/openai/whisper/blob/main/whisper/audio.py#L26
-        # This launches a subprocess to decode audio while down-mixing and resampling as necessary.
-        # Requires the ffmpeg CLI and `ffmpeg-python` package to be installed.
-        file = clean_path(file)  # 防止小白拷路径头尾带了空格和"和回车
-        if os.path.exists(file) == False:
-            raise RuntimeError(
-                "You input a wrong audio path that does not exists, please fix it!"
-            )
-        out, _ = (
-            ffmpeg.input(file, threads=0)
-            .output("-", format="f32le", acodec="pcm_f32le", ac=1, ar=sr)
-            .run(cmd=["ffmpeg", "-nostdin"], capture_stdout=True, capture_stderr=True)
-        )
-    except Exception as e:
-        traceback.print_exc()
-        raise RuntimeError(f"Failed to load audio: {e}")
-    return np.frombuffer(out, np.float32).flatten()
-def clean_path(path_str):
-    if platform.system() == "Windows":
-        path_str = path_str.replace("/", "\\")
-    return path_str.strip(" ").strip('"').strip("\n").strip('"').strip(" ")

+import platform
+import os
+import ffmpeg
+import numpy as np
+import av
+import traceback
+from io import BytesIO
+def wav2(i, o, format):
+    inp = av.open(i, "rb")
+    if format == "m4a":
+        format = "mp4"
+    out = av.open(o, "wb", format=format)
+    if format == "ogg":
+        format = "libvorbis"
+    elif format == "mp4":
+        format = "aac"
+    ostream = out.add_stream(format)
+    for frame in inp.decode(audio=0):
+        for p in ostream.encode(frame):
+            out.mux(p)
+    for p in ostream.encode(None):
+        out.mux(p)
+    out.close()
+    inp.close()
+def load_audio(file, sr):
+    try:
+        # Clean the file path
+        file = clean_path(file)
+        if not os.path.exists(file):
+            raise RuntimeError(
+                "You input a wrong audio path that does not exist, please fix it!"
+            )
+        out, _ = (
+            ffmpeg.input(file, threads=0)
+            .output("-", format="f32le", acodec="pcm_f32le", ac=1, ar=sr)
+            .run(cmd=["ffmpeg", "-nostdin"], capture_stdout=True, capture_stderr=True)
+        )
+    except Exception as e:
+        traceback.print_exc()
+        raise RuntimeError(f"Failed to load audio: {e}")
+    return np.frombuffer(out, np.float32).flatten()
+def clean_path(path_str):
+    if platform.system() == "Windows":
+        path_str = path_str.replace("/", "\\")
+    return path_str.strip().strip('"').strip("\n").strip('"').strip()