import os
import re
import random

import gradio as gr
import numpy as np
import yt_dlp
from scipy.io.wavfile import read, write

from rvc_infer import download_online_model


def download_model(url, dir_name):
    """Download an RVC model from a URL into the given directory name."""
    download_online_model(url, dir_name)
    return dir_name


# Mapping of display names to the checkpoint filenames expected by audio-separator.
uvr_models = {
    'BS-Roformer-Viperx-1297.ckpt': 'model_bs_roformer_ep_317_sdr_12.9755.ckpt',
    'MDX23C-8KFFT-InstVoc_HQ.ckpt': 'MDX23C-8KFFT-InstVoc_HQ.ckpt',
    'BS-Roformer-Viperx-1053.ckpt': 'model_bs_roformer_ep_937_sdr_10.5309.ckpt',
    'Mel-Roformer-Viperx-1143.ckpt': 'model_mel_band_roformer_ep_3005_sdr_11.4360.ckpt',
    'Kim_Vocal_2.onnx': 'Kim_Vocal_2.onnx',
    'UVR-De-Echo-Aggressive.pth': 'UVR-De-Echo-Aggressive.pth',
}

output_format = [
    'wav',
    'flac',
    'mp3',
]

mdxnet_overlap_values = [
    '0.25',
    '0.5',
    '0.75',
    '0.99',
]

vrarch_window_size_values = [
    '320',
    '512',
    '1024',
]


def download_audio(url):
    """Download a video's audio track as WAV and return it as (sample_rate, int16 array)."""
    ydl_opts = {
        'format': 'bestaudio/best',
        'outtmpl': 'ytdl/%(title)s.%(ext)s',
        'postprocessors': [{
            'key': 'FFmpegExtractAudio',
            'preferredcodec': 'wav',
            'preferredquality': '192',
        }],
    }

    with yt_dlp.YoutubeDL(ydl_opts) as ydl:
        info_dict = ydl.extract_info(url, download=True)
        file_path = ydl.prepare_filename(info_dict).rsplit('.', 1)[0] + '.wav'
        sample_rate, audio_data = read(file_path)
        audio_array = np.asarray(audio_data, dtype=np.int16)

    return sample_rate, audio_array


def roformer_separator(roformer_audio, roformer_model, roformer_output_format, roformer_overlap,
                       roformer_segment_size, mdx23c_denoise, mdxnet_denoise, vrarch_tta,
                       vrarch_high_end_process):
    """Run audio-separator on the input audio and return the two resulting stem files."""
    directory = "./outputs"
    random_id = str(random.randint(10000, 99999))
    os.makedirs("outputs", exist_ok=True)

    # roformer_audio is a (sample_rate, data) tuple, as produced by a numpy-typed gr.Audio input.
    write(f'{random_id}.wav', roformer_audio[0], roformer_audio[1])

    full_roformer_model = uvr_models[roformer_model]
    command = (
        f"audio-separator {random_id}.wav --model_filename {full_roformer_model} "
        f"--output_dir=./outputs --output_format={roformer_output_format} --normalization=0.9 "
        f"--mdxc_overlap={roformer_overlap} --mdxc_segment_size={roformer_segment_size}"
    )

    # Both denoise options map to the same CLI flag.
    if mdx23c_denoise or mdxnet_denoise:
        command += " --mdx_enable_denoise"
    if vrarch_tta:
        command += " --vr_enable_tta"
    if vrarch_high_end_process:
        command += " --vr_high_end_process"

    os.system(command)

    # Collect the output files tagged with this run's random id.
    files_list = [
        os.path.join(directory, file)
        for file in os.listdir(directory)
        if re.search(random_id, file)
    ]

    stem1_file = files_list[0]
    stem2_file = files_list[1]

    return stem1_file, stem2_file


CSS = """
"""

with gr.Blocks(theme="Hev832/Applio", fill_width=True, css=CSS) as demo:
    with gr.Tabs():
        with gr.Tab("Inference"):
            gr.Markdown("in progress")
        with gr.Tab("Download model"):
            gr.Markdown("## Download Model for Inference")
            url_input = gr.Textbox(label="Model URL", placeholder="Enter the URL of the model")
            dir_name_input = gr.Textbox(label="Directory Name", placeholder="Enter the directory name")
            download_button = gr.Button("Download Model")
            download_button.click(download_model, inputs=[url_input, dir_name_input], outputs=url_input)
        with gr.Tab("UVR5"):
            roformer_model = gr.Dropdown(
                label="Select the Model",
                choices=list(uvr_models.keys()),
                interactive=True,
            )
            roformer_output_format = gr.Dropdown(
                label="Select the Output Format",
                choices=output_format,
                interactive=True,
            )
            roformer_overlap = gr.Slider(
                minimum=2,
                maximum=4,
                step=1,
                label="Overlap",
                info="Amount of overlap between prediction windows.",
                value=4,
                interactive=True,
            )
            roformer_segment_size = gr.Slider(
                minimum=32,
                maximum=4000,
                step=32,
                label="Segment Size",
                info="Larger consumes more resources, but may give better results.",
                value=256,
                interactive=True,
            )
            mdx23c_denoise = gr.Checkbox(
                label="Denoise",
                info="Enable denoising during separation.",
                value=False,
                interactive=True,
            )
        with gr.Tab("Credits"):
            gr.Markdown(
                """
                This project was made by [Blane187](https://huggingface.co/Blane187), with improvements by [John6666](https://huggingface.co/John6666).
                """
            )

demo.launch(debug=True, show_api=False)