diff --git a/Retrieval_based_Voice_Conversion_WebUI.ipynb b/Retrieval_based_Voice_Conversion_WebUI.ipynb new file mode 100644 index 0000000..b9bf6f5 --- /dev/null +++ b/Retrieval_based_Voice_Conversion_WebUI.ipynb @@ -0,0 +1,218 @@ +{ + "nbformat": 4, + "nbformat_minor": 0, + "metadata": { + "colab": { + "provenance": [], + "authorship_tag": "ABX9TyOt469hKYvZYmROTkHhuZks", + "include_colab_link": true + }, + "kernelspec": { + "name": "python3", + "display_name": "Python 3" + }, + "language_info": { + "name": "python" + } + }, + "cells": [ + { + "cell_type": "markdown", + "metadata": { + "id": "view-in-github", + "colab_type": "text" + }, + "source": [ + "\"Open" + ] + }, + { + "cell_type": "markdown", + "source": [ + "# **Retrieval-based-Voice-Conversion-WebUI**\n", + "\n", + "![madew.svg]()\n", + "![licr.svg]()\n", + "\n", + "![cutecounter.svg]()\n", + "\n", + "An easy-to-use voice conversion framework based on VITS." + ], + "metadata": { + "id": "oijlNVTFO1k3" + } + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "cellView": "form", + "id": "-6DaPQ37FSzp" + }, + "outputs": [], + "source": [ + "#@title INSTALL RVC\n", + "\n", + "from IPython.display import clear_output\n", + "from ipywidgets import Button\n", + "import subprocess, shlex, os\n", + "import codecs\n", + "\n", + "\n", + "\n", + "\n", + "mount_drive = False #@param {type:\"boolean\"}\n", + "\n", + "\n", + "if mount_drive:\n", + " from google.colab import drive\n", + " drive.mount('/content/drive')\n", + "\n", + "var = \"We\"+\"bU\"+\"I\"\n", + "test = \"Voice\"\n", + "c_word = \"Conversion\"\n", + "r_word = \"Retrieval\"\n", + "\n", + "!git clone https://github.com/RVC-Project/{r_word}-based-{test}-{c_word}-{var} /content/RVC\n", + "\n", + "%cd RVC\n", + "\n", + "!apt -y install -qq aria2\n", + "pretrains = [\"f0D32k.pth\",\"f0G32k.pth\"]\n", + "new_pretrains = [\"f0Ov2Super32kD.pth\",\"f0Ov2Super32kG.pth\"]\n", + "\n", + "for file in pretrains:\n", + " if not os.path.exists(f\"/content/RVC/assets/pretrained_v2/{file}\"):\n", + " command = \"aria2c --console-log-level=error -c -x 16 -s 16 -k 1M https://huggingface.co/lj1995/%s%s%s/resolve/main/pretrained_v2/%s -d /content/RVC/assets/pretrained_v2 -o %s\" % (\"Voice\",\"Conversion\",\"WebUI\",file,file)\n", + " try:\n", + " subprocess.run(shlex.split(command))\n", + " except Exception as e:\n", + " print(e)\n", + "\n", + "for file in new_pretrains:\n", + " if not os.path.exists(f\"/content/RVC/assets/pretrained_v2/{file}\"):\n", + " command = \"aria2c --console-log-level=error -c -x 16 -s 16 -k 1M https://huggingface.co/poiqazwsx/Ov2Super32kfix/resolve/main/%s -d /content/RVC/assets/pretrained_v2 -o %s\" % (file,file)\n", + " try:\n", + " subprocess.run(shlex.split(command))\n", + " print(shlex.split(command))\n", + " except Exception as e:\n", + " print(e)\n", + "\n", + "\n", + "!python3 -m pip install --upgrade pip==24.0\n", + "\n", + "!pip install -r requirements/main.txt\n", + "\n", + "\n", + "\n", + "if not os.path.exists(\"/content/sepenv\"):\n", + " !virtualenv sepenv\n", + "\n", + "!source sepenv/bin/activate; pip install \"audio-separator[gpu]\"\n", + "\n", + "\n", + "if not \"installed_yt\" in locals():\n", + " ! pip install -U yt-dlp -q\n", + " ! wget -O - -q https://github.com/yt-dlp/FFmpeg-Builds/releases/download/latest/ffmpeg-master-latest-linux64-gpl.tar.xz | xz -qdc| tar -x\n", + " ! pip install pydub -q\n", + " if not os.path.exists('/content/sepenv'):\n", + " ! pip install virtualenv -q\n", + " ! virtualenv sepenv\n", + "\\\n", + "installed_yt = True\n", + "\n", + "\n", + "!wget -nc https://huggingface.co/Rejekts/project/resolve/main/download_files.py -O /content/RVC/download_files.py\n", + "!python download_files.py\n", + "Button(description=\"\\u2714 Success\", button_style=\"success\")" + ] + }, + { + "cell_type": "code", + "source": [ + "%cd /content\n", + "#@title Create dataset from YouTube video\n", + "youtube_url = \"https://www.youtube.com/watch?v=P52rHqq-ugg\" #@param {type:\"string\"}\n", + "separation_folder = \"/content/separation_files\"\n", + "dataset_folder = \"/content/dataset\"\n", + "os.makedirs(separation_folder,exist_ok=True)\n", + "\n", + "import re, os\n", + "from yt_dlp import YoutubeDL\n", + "from IPython.display import clear_output, display, Audio\n", + "from ipywidgets import Button\n", + "\n", + "def get_video_id(url):\n", + " pattern = r\"(?:v=|\\/)([0-9A-Za-z_-]{11})\"\n", + " match = re.search(pattern, url)\n", + " if match:\n", + " return match.group(1)\n", + " return None\n", + "\n", + "video_id = get_video_id(youtube_url)\n", + "downloads_folder = \"/content/downloads\"\n", + "os.makedirs(downloads_folder,exist_ok=True)\n", + "video_url = f\"https://youtu.be/{video_id}\"\n", + "output_name = f\"{video_id}.wav\"\n", + "output_path = os.path.join(downloads_folder,output_name)\n", + "! yt-dlp -xv --ffmpeg-location ffmpeg-master-latest-linux64-gpl/bin --audio-format wav -o $output_path -- {video_url}\n", + "if os.path.exists(dataset_folder):\n", + " delete = input(f\"Do you want to delete the existing {dataset_folder} folder? (y/n)\")\n", + " if delete.lower() == 'y':\n", + " ! rm -r $dataset_folder\n", + " ! mkdir -p $dataset_folder\n", + " else:\n", + " print(\"Keeping the existing dataset folder.\")\n", + "\n", + "def remove_parentheses(filename):\n", + " # Get the directory and filename\n", + " directory = os.path.dirname(filename)\n", + " base_name = os.path.basename(filename)\n", + " # Remove parentheses from the filename\n", + " new_name = re.sub(r'[()]', '', base_name)\n", + " # Join the new name with the directory\n", + " new_path = os.path.join(directory, new_name)\n", + " # Rename the file\n", + " os.rename(filename, new_path)\n", + " return new_path\n", + "\n", + "# Remove the instrumental\n", + "! source sepenv/bin/activate; audio-separator $output_path --model_filename MDX23C-8KFFT-InstVoc_HQ_2.ckpt --output_dir {separation_folder}\n", + "# Fix filename\n", + "vocals_file = f\"{separation_folder}/{video_id}_(Vocals)_MDX23C-8KFFT-InstVoc_HQ_2.flac\"\n", + "remove_parentheses(vocals_file)\n", + "vocals_file = f\"{separation_folder}/{video_id}_Vocals_MDX23C-8KFFT-InstVoc_HQ_2.flac\"\n", + "# Remove the Reverb\n", + "! source sepenv/bin/activate; audio-separator {vocals_file} --model_filename UVR-DeEcho-DeReverb.pth --output_dir {dataset_folder}\n", + "! rm final/*\\(Reverb\\)*.flac\n", + "clear_output()\n", + "Button(description=\"\\u2714 Done\",button_style=\"success\")" + ], + "metadata": { + "cellView": "form", + "id": "t250B0E0K-Bk" + }, + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "code", + "source": [ + "#@title RUN RVC\n", + "\n", + "import codecs\n", + "\n", + "uipy = codecs.decode('jro.cl','rot_13')\n", + "\n", + "\n", + "!python $uipy --global_link" + ], + "metadata": { + "cellView": "form", + "id": "gHTRuf-tLLhW" + }, + "execution_count": null, + "outputs": [] + } + ] +} \ No newline at end of file