Spaces:

Vgjkmhf
/

cctvoi

Runtime error

App Files Community

Vgjkmhf committed on 19 days ago

Commit

6de1485

verified ·

1 Parent(s): 5031d1a

Update app.py

Browse files

Files changed (1) hide show

app.py +28 -29

app.py CHANGED Viewed

@@ -14,7 +14,7 @@ import scipy.signal as signal
 from datetime import datetime
 # ==========================================
-# 1. تنظیمات اولیه
 # ==========================================
 print(">>> System Startup: RVC Pro Max...")
@@ -27,7 +27,7 @@ except ImportError as e:
     print(f"Import Error: {e}")
     sys.exit(1)
-# تنظیم مسیر FFmpeg
 try:
     static_ffmpeg.add_paths()
     ffmpeg_exe = imageio_ffmpeg.get_ffmpeg_exe()
@@ -41,7 +41,7 @@ os.environ["TEMP"] = TEMP_DIR
 os.environ["TMPDIR"] = TEMP_DIR
 # ==========================================
-# 2. توابع پردازش صدا (DSP)
 # ==========================================
 def log_message(message):
@@ -49,18 +49,19 @@ def log_message(message):
     return f"[{timestamp}] {message}"
 def apply_clarity_eq(y, sr):
-    """اعمال EQ برای شفاف‌سازی و رفع تودماغی"""
     try:
-        # 1. Low-Cut (حذف نویز زیر 60 هرتز)
         sos_hp = signal.butter(4, 60, 'hp', fs=sr, output='sos')
         y = signal.sosfilt(sos_hp, y)
-        # 2. کاهش فرکانس‌های تودماغی (حدود 1000 هرتز)
         sos_mid = signal.butter(2, [800, 1200], 'bandstop', fs=sr, output='sos')
         y_filtered = signal.sosfilt(sos_mid, y)
         y = (y * 0.7) + (y_filtered * 0.3)
-        # 3. High Boost (شفافیت)
         sos_high = signal.butter(2, 5000, 'hp', fs=sr, output='sos')
         y_high = signal.sosfilt(sos_high, y)
         y = y + (y_high * 0.15)
@@ -102,7 +103,7 @@ def cleanup_temp():
         pass
 # ==========================================
-# 3. موتور تبدیل (اصلاح شده)
 # ==========================================
 def rvc_process_pipeline(
@@ -125,18 +126,18 @@ def rvc_process_pipeline(
         model_path = model_file.name
         index_path = index_file.name if index_file else None
-        # پیش‌پردازش
         clean_audio, msg = preprocess_audio(audio_path)
         logs.append(log_message(msg))
-        # بارگذاری مدل
         logs.append(log_message(f"Model: {os.path.basename(model_path)}"))
         rvc = RVCInference(device="cpu")
         rvc.load_model(model_path)
         output_temp = os.path.join(TEMP_DIR, f"rvc_out_{int(time.time())}.wav")
-        # پارامترها
         kwargs = {
             "input_path": clean_audio,
             "output_path": output_temp,
@@ -151,7 +152,7 @@ def rvc_process_pipeline(
             "hop_length": int(hop_length)
         }
-        # فیلتر کردن پارامترهای نامعتبر
         sig = inspect.signature(rvc.infer_file)
         valid_keys = sig.parameters.keys()
@@ -169,7 +170,7 @@ def rvc_process_pipeline(
         start_time = time.time()
         rvc.infer_file(**final_kwargs)
-        # پس‌پردازش
         final_output = output_temp
         if enable_clarity and os.path.exists(output_temp):
             logs.append(log_message("Applying clarity filter..."))
@@ -178,9 +179,7 @@ def rvc_process_pipeline(
         duration = time.time() - start_time
         logs.append(log_message(f"Done! ({duration:.2f}s)"))
-        # === رفع خطای Syntax Error ===
-        # استفاده از chr(10) به جای "
-" برای جلوگیری از شکستن خط در کپی
         separator = chr(10)
         log_text = separator.join(logs)
@@ -193,7 +192,7 @@ def rvc_process_pipeline(
         return None, err_msg
 # ==========================================
-# 4. رابط کاربری
 # ==========================================
 custom_css = """
@@ -201,35 +200,35 @@ custom_css = """
 """
 with gr.Blocks(title="RVC Pro Persian", theme=gr.themes.Soft(), css=custom_css) as demo:
-    gr.Markdown("## 🎙️ RVC Pro: مبدل صدای حرفه‌ای (اصلاح شده)")
     with gr.Row():
         with gr.Column():
-            audio_input = gr.Audio(label="ورودی صدا", type="filepath")
             with gr.Row():
-                model_input = gr.File(label="مدل (.pth)", file_types=[".pth"])
-                index_input = gr.File(label="ایندکس (.index)", file_types=[".index"])
             algo_dropdown = gr.Dropdown(
                 choices=["rmvpe", "fcpe", "crepe", "harvest", "pm"],
                 value="rmvpe",
-                label="الگوریتم"
             )
-            pitch_slider = gr.Slider(-24, 24, value=0, step=1, label="تغییر گام")
-            btn_run = gr.Button("🚀 تبدیل صدا", elem_id="run_btn", variant="primary")
         with gr.Column():
-            with gr.Accordion("تنظیمات کیفیت", open=True):
-                enable_clarity = gr.Checkbox(value=True, label="رفع تودماغی (Clarity)")
-                index_rate = gr.Slider(0, 1, value=0.4, step=0.05, label="تاثیر ایندکس")
                 envelope_mix = gr.Slider(0, 1, value=0.25, step=0.05, label="Volume Mix")
                 protect_val = gr.Slider(0, 0.5, value=0.33, step=0.01, label="Protect")
                 filter_radius = gr.Slider(0, 7, value=3, step=1, label="Filter Radius")
                 resample_sr = gr.Slider(0, 48000, value=0, step=1000, label="Resample SR")
                 hop_len = gr.Slider(1, 512, value=128, step=1, label="Hop Length")
-            output_audio = gr.Audio(label="خروجی نهایی", type="filepath")
-            logs = gr.Textbox(label="گزارش", lines=5)
     btn_run.click(
         rvc_process_pipeline,

 from datetime import datetime
 # ==========================================
+# 1. SETUP & IMPORTS
 # ==========================================
 print(">>> System Startup: RVC Pro Max...")
     print(f"Import Error: {e}")
     sys.exit(1)
+# Setup FFmpeg
 try:
     static_ffmpeg.add_paths()
     ffmpeg_exe = imageio_ffmpeg.get_ffmpeg_exe()
 os.environ["TMPDIR"] = TEMP_DIR
 # ==========================================
+# 2. AUDIO PROCESSING (DSP)
 # ==========================================
 def log_message(message):
     return f"[{timestamp}] {message}"
 def apply_clarity_eq(y, sr):
+    # Apply EQ to fix nasal sound and boost clarity
     try:
+        # 1. Low-Cut (remove rumble < 60Hz)
         sos_hp = signal.butter(4, 60, 'hp', fs=sr, output='sos')
         y = signal.sosfilt(sos_hp, y)
+        # 2. Cut Nasal Frequencies (around 1000Hz)
         sos_mid = signal.butter(2, [800, 1200], 'bandstop', fs=sr, output='sos')
         y_filtered = signal.sosfilt(sos_mid, y)
+        # Mix: 70% original, 30% filtered
         y = (y * 0.7) + (y_filtered * 0.3)
+        # 3. High Boost (Air/Clarity > 5000Hz)
         sos_high = signal.butter(2, 5000, 'hp', fs=sr, output='sos')
         y_high = signal.sosfilt(sos_high, y)
         y = y + (y_high * 0.15)
         pass
 # ==========================================
+# 3. CORE INFERENCE LOGIC
 # ==========================================
 def rvc_process_pipeline(
         model_path = model_file.name
         index_path = index_file.name if index_file else None
+        # Pre-process
         clean_audio, msg = preprocess_audio(audio_path)
         logs.append(log_message(msg))
+        # Load Model
         logs.append(log_message(f"Model: {os.path.basename(model_path)}"))
         rvc = RVCInference(device="cpu")
         rvc.load_model(model_path)
         output_temp = os.path.join(TEMP_DIR, f"rvc_out_{int(time.time())}.wav")
+        # Params
         kwargs = {
             "input_path": clean_audio,
             "output_path": output_temp,
             "hop_length": int(hop_length)
         }
+        # Filter invalid params based on installed library version
         sig = inspect.signature(rvc.infer_file)
         valid_keys = sig.parameters.keys()
         start_time = time.time()
         rvc.infer_file(**final_kwargs)
+        # Post-process
         final_output = output_temp
         if enable_clarity and os.path.exists(output_temp):
             logs.append(log_message("Applying clarity filter..."))
         duration = time.time() - start_time
         logs.append(log_message(f"Done! ({duration:.2f}s)"))
+        # SAFE STRING JOINING
         separator = chr(10)
         log_text = separator.join(logs)
         return None, err_msg
 # ==========================================
+# 4. GRADIO UI
 # ==========================================
 custom_css = """
 """
 with gr.Blocks(title="RVC Pro Persian", theme=gr.themes.Soft(), css=custom_css) as demo:
+    gr.Markdown("## RVC Pro: Professional Voice Converter")
     with gr.Row():
         with gr.Column():
+            audio_input = gr.Audio(label="Input Audio", type="filepath")
             with gr.Row():
+                model_input = gr.File(label="Model (.pth)", file_types=[".pth"])
+                index_input = gr.File(label="Index (.index)", file_types=[".index"])
             algo_dropdown = gr.Dropdown(
                 choices=["rmvpe", "fcpe", "crepe", "harvest", "pm"],
                 value="rmvpe",
+                label="Algorithm"
             )
+            pitch_slider = gr.Slider(-24, 24, value=0, step=1, label="Pitch Change")
+            btn_run = gr.Button("Start Conversion", elem_id="run_btn", variant="primary")
         with gr.Column():
+            with gr.Accordion("Quality Settings", open=True):
+                enable_clarity = gr.Checkbox(value=True, label="Fix Nasal Sound (Clarity)")
+                index_rate = gr.Slider(0, 1, value=0.4, step=0.05, label="Index Rate")
                 envelope_mix = gr.Slider(0, 1, value=0.25, step=0.05, label="Volume Mix")
                 protect_val = gr.Slider(0, 0.5, value=0.33, step=0.01, label="Protect")
                 filter_radius = gr.Slider(0, 7, value=3, step=1, label="Filter Radius")
                 resample_sr = gr.Slider(0, 48000, value=0, step=1000, label="Resample SR")
                 hop_len = gr.Slider(1, 512, value=128, step=1, label="Hop Length")
+            output_audio = gr.Audio(label="Final Output", type="filepath")
+            logs = gr.Textbox(label="Logs", lines=5)
     btn_run.click(
         rvc_process_pipeline,