abus-aikorea
diff --git a/‎.env.example‎
Lines changed: 12 additions & 0 deletions b/‎.env.example‎
Lines changed: 12 additions & 0 deletions
diff --git a/‎LICENSE‎
Lines changed: 674 additions & 21 deletions b/‎LICENSE‎
Lines changed: 674 additions & 21 deletions
diff --git a/‎README.md‎
Lines changed: 95 additions & 114 deletions b/‎README.md‎
Lines changed: 95 additions & 114 deletions
diff --git a/‎app/abus_aicover.py‎
Lines changed: 60 additions & 0 deletions b/‎app/abus_aicover.py‎
Lines changed: 60 additions & 0 deletions
diff --git a/‎app/abus_app_aria.py‎
Lines changed: 83 additions & 0 deletions b/‎app/abus_app_aria.py‎
Lines changed: 83 additions & 0 deletions
diff --git a/‎app/abus_app_gulliver.py‎
Lines changed: 153 additions & 0 deletions b/‎app/abus_app_gulliver.py‎
Lines changed: 153 additions & 0 deletions
@@ -0,0 +1,12 @@
+# Azure Configuration
+# Copy this file to .env and fill in your Azure credentials
+# Do NOT commit .env to version control
+
+# Azure Speech Service (TTS)
+AZURE_SPEECH_KEY=your_azure_speech_key_here
+AZURE_SPEECH_REGION=eastus
+
+# Azure Translator Service
+AZURE_TRANSLATOR_KEY=your_azure_translator_key_here
+AZURE_TRANSLATOR_ENDPOINT=https://your-translator-resource.cognitiveservices.azure.com/
+AZURE_TRANSLATOR_REGION=eastus
@@ -0,0 +1,60 @@
+import gc
+import librosa
+import soundfile as sf
+from pydub import AudioSegment
+from pedalboard import Pedalboard, Reverb, Compressor, HighpassFilter
+from pedalboard.io import AudioFile
+
+from src.aicover.rvc import Config, load_hubert, get_vc, rvc_infer
+
+
+from app.abus_path import *
+
+
+def rvc_change_voice(input_path, output_path, rvc_voice, pitch_change, f0_method, index_rate, filter_radius, rms_mix_rate, protect, crepe_hop_length):
+    """Run RVC voice conversion on ``input_path`` using the ``rvc_voice`` model.
+
+    The voice model folder is ``<cwd>/model/rvc-voice/<rvc_voice>``; its
+    ``.pth`` and ``.index`` files are resolved with ``path_subfile``
+    (presumably the file in that folder with the given extension - confirm
+    against ``app.abus_path``).  The HuBERT checkpoint is read from
+    ``<cwd>/model/rvc-model/hubert_base.pt``.
+
+    ``input_path``, ``output_path`` and every tuning argument (``pitch_change``,
+    ``f0_method``, ``index_rate``, ``filter_radius``, ``rms_mix_rate``,
+    ``protect``, ``crepe_hop_length``) are forwarded unchanged to ``rvc_infer``.
+
+    Inference is pinned to the ``cuda:0`` device with half precision disabled.
+    """
+    voice_model_folder = os.path.join(os.getcwd(), 'model', 'rvc-voice', rvc_voice)
+    voice_pth_path = path_subfile(voice_model_folder, ".pth")
+    voice_index_path = path_subfile(voice_model_folder, ".index")
+
+    device = 'cuda:0'
+    config = Config(device, False)
+    hubert_model = load_hubert(device, config.is_half, os.path.join(os.getcwd(), 'model', 'rvc-model', 'hubert_base.pt'))
+    cpt, version, net_g, tgt_sr, vc = get_vc(device, config.is_half, config, voice_pth_path)
+
+    try:
+        # convert main vocals
+        rvc_infer(voice_index_path, index_rate, input_path, output_path, pitch_change, f0_method, cpt, version, net_g, filter_radius, tgt_sr, rms_mix_rate, protect, crepe_hop_length, vc, hubert_model)
+    finally:
+        # Release the loaded models even when inference raises, so a failed
+        # conversion does not skip the cleanup that the success path performs.
+        del hubert_model, cpt, net_g, vc
+        gc.collect()
+    
+    
+def rvc_add_effects(input_path, output_path, reverb_rm_size, reverb_wet, reverb_dry, reverb_damping):
+    """Apply a high-pass, compressor and reverb chain to an audio file.
+
+    ``input_path`` is read in one-second chunks, each chunk is passed through
+    the effect chain, and the result is written to ``output_path`` with the
+    same sample rate and channel count as the input.  The four ``reverb_*``
+    arguments are handed to ``Reverb`` as room size, wet level, dry level and
+    damping respectively.
+    """
+    highpass = HighpassFilter()
+    compressor = Compressor(ratio=4, threshold_db=-15)
+    reverb = Reverb(room_size=reverb_rm_size, dry_level=reverb_dry, wet_level=reverb_wet, damping=reverb_damping)
+    effect_chain = Pedalboard([highpass, compressor, reverb])
+
+    with AudioFile(input_path) as src:
+        with AudioFile(output_path, 'w', src.samplerate, src.num_channels) as dst:
+            # Keep pulling one second of frames until the read position
+            # reaches the end of the input.
+            while src.tell() < src.frames:
+                raw_chunk = src.read(int(src.samplerate))
+                # reset=False keeps the effect state between chunks.
+                processed_chunk = effect_chain(raw_chunk, src.samplerate, reset=False)
+                dst.write(processed_chunk)
+                
+
+def rvc_shift_pitch(input_path, output_path, n_steps):
+    """Write a pitch-shifted copy of ``input_path`` to ``output_path``.
+
+    Nothing is done when ``output_path`` already exists, so an earlier result
+    is reused instead of being recomputed.
+
+    ``n_steps`` is passed to ``librosa.effects.pitch_shift`` as the shift
+    amount.  The audio is loaded with ``librosa.load`` defaults.
+    NOTE(review): those defaults are documented as resampling to 22050 Hz
+    mono - confirm that this is intended for the instrumental/backup stems.
+    """
+    if os.path.exists(output_path):
+        return
+
+    y, sr = librosa.load(input_path)
+    # ``sr`` must be passed by keyword: librosa >= 0.10 made it keyword-only,
+    # and the keyword form is accepted by older releases as well.
+    y_changed = librosa.effects.pitch_shift(y, sr=sr, n_steps=n_steps)
+    sf.write(output_path, y_changed, sr)
+
+ 
+def rvc_combine_audio(audio_paths: list, output_path: str, main_gain: int, backup_gain: int, inst_gain: int, output_format: str):
+    """Mix three WAV stems into a single exported file.
+
+    ``audio_paths`` supplies, in order, the main vocal, the backup vocal and
+    the instrumental.  Each stem has its gain argument added to it, then the
+    backup vocal and the instrumental are overlaid onto the main vocal and the
+    mix is exported to ``output_path`` in ``output_format``.
+    """
+    # Load and gain-adjust each stem in turn: main, backup, instrumental.
+    main_track = AudioSegment.from_wav(audio_paths[0])
+    main_track = main_track + main_gain
+    backup_track = AudioSegment.from_wav(audio_paths[1])
+    backup_track = backup_track + backup_gain
+    inst_track = AudioSegment.from_wav(audio_paths[2])
+    inst_track = inst_track + inst_gain
+
+    # The main vocal is the base segment that the other stems are laid over.
+    mixed = main_track.overlay(backup_track)
+    mixed = mixed.overlay(inst_track)
+    mixed.export(output_path, format=output_format)
@@ -0,0 +1,83 @@
+import os
+import sys
+from pathlib import Path
+import random
+
+current_dir = os.path.dirname(os.path.abspath(__file__))
+parent_dir = os.path.dirname(current_dir)
+sys.path.append(parent_dir)
+
+import platform
+import torch
+import gradio as gr
+from src.config import UserConfig
+
+import src.ui as ui
+from src.i18n.i18n import I18nAuto
+i18n = I18nAuto()
+
+import structlog
+import logging
+
+# Resolve the LOG_LEVEL environment variable (default "INFO") to a numeric
+# logging level.
+level = os.environ.get("LOG_LEVEL", "INFO").upper()
+LOG_LEVEL = getattr(logging, level, None)
+if not isinstance(LOG_LEVEL, int):
+    # An unrecognised LOG_LEVEL value must not abort startup with an
+    # AttributeError at import time; fall back to the default instead.
+    LOG_LEVEL = logging.INFO
+
+# NOTE(review): the structlog filter threshold is fixed at WARNING here and
+# does not consult LOG_LEVEL - confirm whether that is intended.
+structlog.configure(
+    wrapper_class=structlog.make_filtering_bound_logger(logging.WARNING)
+)
+logger = structlog.get_logger()
+
+
+from app.abus_genuine import *  
+from app.tab_aicover import aicover_tab
+from app.tab_demixing import demixing_tab
+
+
+##############################################################################################
+# Gradio
+##############################################################################################    
+
+def create_ui(user_config: UserConfig):
+    """Build the "Aria CoverSong" Gradio interface and launch it.
+
+    The interface has an "AI Cover" tab and a "Demixing" tab, each populated
+    by its tab builder with ``user_config``, followed by the app footer.  The
+    app is launched on port 7910 with ``share=False`` and ``inbrowser=True``.
+    """
+    # Script from src.ui that is run when the page loads.
+    page_js = ui.js
+
+    with gr.Blocks(title='Aria CoverSong', css=ui.css, theme=ui.theme) as gradio_interface:
+        gr.HTML(f'<center><h6>{i18n("")}</h6></center>')
+
+        with gr.Tab(i18n("AI Cover")):
+            aicover_tab(user_config)
+
+        with gr.Tab(i18n("Demixing")):
+            demixing_tab(user_config)
+
+        create_app_footer()
+
+        # Page-load hooks: first add the 'dark' class to <body>, then run the
+        # UI script.
+        dark_mode_js = "() => document.getElementsByTagName('body')[0].classList.add('dark')"
+        gradio_interface.load(None, None, None, js=dark_mode_js)
+        gradio_interface.load(None, None, None, js=f"() => {{{page_js}}}")
+
+    launch_options = dict(
+        share=False,
+        server_name=None,
+        server_port=7910,
+        inbrowser=True,
+    )
+    gradio_interface.launch(**launch_options)
+
+def create_app_footer():
+    """Render the footer line: project link, runtime versions and status.
+
+    The entries are joined with " | " and emitted as a single Markdown
+    component carrying the "no-translate" element class.
+    """
+    genuine = "activated version"
+    footer_items = [
+        "🔊 [aria-coversong](https://github.com/abus-aikorea/aria-coversong)",
+        f"python: `{platform.python_version()}`",
+        f"torch: `{torch.__version__}`",
+        f"gradio: `{gr.__version__}`",
+        f"{genuine}",
+    ]
+
+    footer_text = " | ".join(footer_items)
+    gr.Markdown(footer_text, elem_classes=["no-translate"])
+
@@ -0,0 +1,153 @@
+import os
+import sys
+from pathlib import Path
+import random
+import requests
+
+
+current_dir = os.path.dirname(os.path.abspath(__file__))
+parent_dir = os.path.dirname(current_dir)
+sys.path.append(parent_dir)
+
+matcha_dir = os.path.join(parent_dir, 'third_party', 'Matcha-TTS')
+sys.path.append(matcha_dir)
+
+
+import platform
+import torch
+import gradio as gr
+from src.config import UserConfig
+
+import src.ui as ui
+from src.i18n.i18n import I18nAuto
+i18n = I18nAuto()
+
+import structlog
+import logging
+
+# Per-library log levels: these third-party loggers are limited to WARNING...
+logging.getLogger("httpx").setLevel(logging.WARNING)
+logging.getLogger("httpcore").setLevel(logging.WARNING)
+logging.getLogger("fairseq").setLevel(logging.WARNING)
+logging.getLogger("azure.core").setLevel(logging.WARNING)
+logging.getLogger('matplotlib').setLevel(logging.WARNING)
+# ...while faster_whisper is set to DEBUG.
+logging.getLogger("faster_whisper").setLevel(logging.DEBUG)
+
+
+# Resolve the LOG_LEVEL environment variable (default "INFO") to a numeric
+# logging level.
+level = os.environ.get("LOG_LEVEL", "INFO").upper()
+LOG_LEVEL = getattr(logging, level, None)
+if not isinstance(LOG_LEVEL, int):
+    # An unrecognised LOG_LEVEL value must not abort startup with an
+    # AttributeError at import time; fall back to the default instead.
+    LOG_LEVEL = logging.INFO
+
+# NOTE(review): the structlog filter threshold is fixed at DEBUG here and
+# does not consult LOG_LEVEL - confirm whether that is intended.
+structlog.configure(
+    wrapper_class=structlog.make_filtering_bound_logger(logging.DEBUG)
+)
+logger = structlog.get_logger()
+
+
+from app.abus_genuine import *
+from app.tab_gulliver import gulliver_tab
+from app.tab_subtitle import subtitle_tab
+from app.tab_tts_edge import tts_edge_tab
+from app.tab_tts_f5_single import tts_f5_single_tab
+from app.tab_tts_f5_multi import tts_f5_multi_tab
+from app.tab_tts_cosyvoice import tts_cosyvoice_tab
+from app.tab_tts_kokoro import tts_kokoro_tab
+from app.tab_translate import translate_tab
+from app.tab_live_translate import live_translate_tab
+from app.tab_vsr import vsr_tab
+from app.tab_aicover import aicover_tab
+from app.tab_demixing import demixing_tab
+from app.tab_tts_rvc import tts_rvc_tab
+from app.tab_rvc import rvc_tab
+from app.tab_batch_tts import batch_tts_tab
+
+
+##############################################################################################
+# Gradio
+##############################################################################################    
+
+
+def create_ui(user_config: UserConfig):
+    """Build the "Voice Gulliver" Gradio interface and launch it.
+
+    Each tab is populated by its ``*_tab`` builder, called with
+    ``user_config``.  The first speech-generation tab is labelled "Azure-TTS"
+    when ``azure_text_api_working()`` is truthy and "Edge-TTS" otherwise; in
+    both cases it is filled by ``tts_edge_tab``.  The app is launched on port
+    7860 with ``share=False`` and ``inbrowser=True``.
+    """
+    # Script from src.ui that is run when the page loads.
+    page_js = ui.js
+
+    with gr.Blocks(title='Voice Gulliver', css=ui.css, theme=ui.theme) as gradio_interface:
+        gr.HTML(f'<center><h6>{i18n("")}</h6></center>')
+
+        with gr.Tab(i18n("Dubbing Studio")):
+            gulliver_tab(user_config)
+
+        with gr.Tab(i18n("Whisper subtitles")):
+            subtitle_tab(user_config)
+
+        # Translation: recorded (VOD) and live sub-tabs.
+        with gr.Tab(i18n("Translation")):
+            with gr.Tabs():
+                with gr.Tab(i18n("VOD")):
+                    translate_tab(user_config)
+                with gr.Tab(i18n("Live")):
+                    live_translate_tab(user_config)
+
+        # Speech generation: one sub-tab per TTS engine.
+        with gr.Tab(i18n("Speech Generation")):
+            with gr.Tabs():
+                if azure_text_api_working():
+                    speech_tab_label = i18n('Azure-TTS')
+                else:
+                    speech_tab_label = i18n('Edge-TTS')
+                with gr.Tab(speech_tab_label):
+                    tts_edge_tab(user_config)
+                with gr.Tab(i18n("F5-TTS (Single)")):
+                    tts_f5_single_tab(user_config)
+                with gr.Tab(i18n("F5-TTS (Multi)")):
+                    tts_f5_multi_tab(user_config)
+                with gr.Tab(i18n("CosyVoice")):
+                    tts_cosyvoice_tab(user_config)
+                with gr.Tab(i18n("kokoro")):
+                    tts_kokoro_tab(user_config)
+
+        # AI cover: cover studio and stem demixing sub-tabs.
+        with gr.Tab(i18n("AI Cover")):
+            with gr.Tabs():
+                with gr.Tab(i18n("Cover Studio")):
+                    aicover_tab(user_config)
+                with gr.Tab(i18n("Demixing")):
+                    demixing_tab(user_config)
+
+        with gr.Tab(i18n("Batch processing")):
+            batch_tts_tab(user_config)
+
+        with gr.Tab(i18n("RVC")):
+            rvc_tab(user_config)
+
+        with gr.Tab(i18n("TTS + RVC")):
+            tts_rvc_tab(user_config)
+
+        with gr.Tab(i18n("NVIDIA RTX")):
+            vsr_tab(user_config)
+
+        create_app_footer()
+
+        # Page-load hooks: first add the 'dark' class to <body>, then run the
+        # UI script.
+        dark_mode_js = "() => document.getElementsByTagName('body')[0].classList.add('dark')"
+        gradio_interface.load(None, None, None, js=dark_mode_js)
+        gradio_interface.load(None, None, None, js=f"() => {{{page_js}}}")
+
+    launch_options = dict(
+        share=False,
+        server_name=None,
+        server_port=7860,
+        inbrowser=True,
+    )
+    gradio_interface.launch(**launch_options)
+    
+def create_app_footer():
+    """Render the footer line: project link, runtime versions and status.
+
+    The entries are joined with " | " and emitted as a single Markdown
+    component carrying the "no-translate" element class.
+    """
+    genuine = "activated version"
+    footer_items = [
+        "🔊 [voice-gulliver](https://github.com/abus-aikorea/voice-gulliver)",
+        f"python: `{platform.python_version()}`",
+        f"torch: `{torch.__version__}`",
+        f"gradio: `{gr.__version__}`",
+        f"{genuine}",
+    ]
+
+    footer_text = " | ".join(footer_items)
+    gr.Markdown(footer_text, elem_classes=["no-translate"])
+
+