daswer123 · abeiro · Jun 11, 2024 · Sep 2, 2024 · Sep 12, 2024 · Sep 12, 2024
diff --git a/.gitignore b/.gitignore
@@ -1,11 +1,10 @@
 dist
 venv
-speakers
 output
 test
 models
 xtts_api_server/models
 *.pyc
 xtts_api_server/RealtimeTTS/engines/coqui_engine_old.py
 xtts_models
-modules-xtts.txt
+modules-xtts.txt
diff --git a/XTTSv2_AIFF.ipynb b/XTTSv2_AIFF.ipynb
@@ -0,0 +1,116 @@
+{
+  "nbformat": 4,
+  "nbformat_minor": 0,
+  "metadata": {
+    "colab": {
+      "provenance": [],
+      "gpuType": "T4"
+    },
+    "kernelspec": {
+      "name": "python3",
+      "display_name": "Python 3"
+    },
+    "language_info": {
+      "name": "python"
+    },
+    "accelerator": "GPU"
+  },
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "source": [
+        "**Run the next block, restart the session when asked, and run the same block again until everything installs.**\n",
+        "\n",
+        "The last message should look like this (yes, ignore the ERROR):\n",
+        "\n",
+        "\n",
+        "```\n",
+        "ERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.\n",
+        "torchvision 0.19.0+cu121 requires torch==2.4.0, but you have torch 2.1.1+cu121 which is incompatible\n",
+        "Successfully installed torch-2.1.1+cu121 torchaudio-2.1.1+cu121 triton-2.1.0\n",
+        "\n",
+        "```\n",
+        "\n"
+      ],
+      "metadata": {
+        "id": "FmMMJppi2-Gh"
+      }
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {
+        "id": "lT4ieCTnr_L7"
+      },
+      "outputs": [],
+      "source": [
+        "!apt-get update && apt-get install --no-install-recommends -y sox libsox-fmt-all curl wget gcc git git-lfs build-essential libaio-dev libsndfile1 ssh ffmpeg sshpass portaudio19-dev libportaudio2\n",
+        "!git clone https://github.com/abeiro/xtts-api-server\n",
+        "%cd xtts-api-server\n",
+        "!python3 -m pip install --upgrade pip wheel ninja virtualenv\n",
+        "!pip install setuptools==68.1.2\n",
+        "!pip install deepspeed\n",
+        "!pip install -r requirements.txt\n",
+        "!pip install torch==2.1.1+cu121 torchaudio==2.1.1+cu121 --index-url https://download.pytorch.org/whl/cu121"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "source": [
+        "**Run this once to download the model and compile DeepSpeed. Once uvicorn starts, stop the cell and proceed to the next block.**\n",
+        "\n",
+        "\n",
+        "\n"
+      ],
+      "metadata": {
+        "id": "u1Ir_s5U3ZcT"
+      }
+    },
+    {
+      "cell_type": "code",
+      "source": [
+        "!python3 -m xtts_api_server --listen --deepspeed"
+      ],
+      "metadata": {
+        "id": "Xs5dXNL43VFB"
+      },
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "source": [
+        "**Run this block and note the Cloudflare address. Wait for this message:**\n",
+        "\n",
+        "```\n",
+        "INFO:     Uvicorn running on http://0.0.0.0:8020 (Press CTRL+C to quit)\n",
+        "\n",
+        "```\n",
+        "\n",
+        "Use http://generated-domain-name:80 in AI-FF conf.\n",
+        "\n"
+      ],
+      "metadata": {
+        "id": "xOowr61z3nT2"
+      }
+    },
+    {
+      "cell_type": "code",
+      "source": [
+        "#Run\n",
+        "!rm nohup.out\n",
+        "!wget -c https://github.com/cloudflare/cloudflared/releases/latest/download/cloudflared-linux-amd64 -O cloudflared-linux-amd64\n",
+        "!chmod +x cloudflared-linux-amd64\n",
+        "!nohup ./cloudflared-linux-amd64 tunnel --url http://localhost:8020 &\n",
+        "!sleep 8\n",
+        "!cat nohup.out\n",
+        "!python3 -m xtts_api_server --listen --deepspeed"
+      ],
+      "metadata": {
+        "id": "xuLmVnEW2PYM"
+      },
+      "execution_count": null,
+      "outputs": []
+    }
+  ]
+}
diff --git a/conf.sh b/conf.sh
@@ -0,0 +1,65 @@
+#!/bin/bash
+# Interactive configurator for CHIM XTTS: prints an overview of the start
+# modes, lists the start-*.sh launchers found under the server directory and
+# links the chosen one to start.sh.
+clear
+cat << EOF
+CHIM XTTS
+
+This will install CHIM XTTS. This is a high quality TTS service that works with Skyrim voices. 
+You can also generate your own voices.
+However it will require around 4GB of VRAM! 
+
+Options:
+* deepspeed = Uses more VRAM but faster
+* lowvram = Uses less VRAM but slower
+* regular = Middle ground of both options above
+
+If you are not sure use lowvram.
+
+EOF
+
+# Abort early when the /home/dwemer/python-tts environment directory is missing.
+# `exit` only accepts a numeric status, so the message is printed to stderr
+# first and the script then exits with status 1.
+if [ ! -d /home/dwemer/python-tts ]; then
+        echo "Error: XTTSv2 not installed" >&2
+        exit 1
+fi
+
+# Collect the available launcher scripts. The list is sorted so the menu
+# numbering stays the same between runs (find itself gives no ordering guarantee).
+mapfile -t files < <(find /home/dwemer/xtts-api-server/ -name "start-*.sh" | sort)
+
+# Check if any files were found
+if [ "${#files[@]}" -eq 0 ]; then
+    echo "No files found matching the pattern." >&2
+    exit 1
+fi
+
+# Display the files in a numbered list (menu numbers are 1-based; 0 is
+# reserved for disabling the service)
+echo -e "Select an option from the list:\n\n"
+for i in "${!files[@]}"; do
+    echo "$((i+1)). ${files[$i]}"
+done
+
+echo "0. Disable service"
+echo
+# Prompt the user to make a selection
+read -r -p "Select an option by picking the matching number: " selection
+
+# Validate the input: accept digits only, so the numeric tests below never
+# receive text (a non-numeric operand makes `[ ... -eq ... ]` raise an error)
+if ! [[ "$selection" =~ ^[0-9]+$ ]]; then
+    echo "Invalid selection."
+    exit 1
+fi
+
+# Force base 10 so an entry with leading zeros (e.g. "08") is not treated as
+# an invalid octal number in later arithmetic
+selection=$((10#$selection))
+
+# 0 removes the start.sh link, which disables the service
+if [ "$selection" -eq 0 ]; then
+    echo "Disabling service. Run this again to enable"
+    rm -f /home/dwemer/xtts-api-server/start.sh
+    exit 0
+fi
+
+# Anything above the number of listed launchers is out of range
+if [ "$selection" -gt "${#files[@]}" ]; then
+    echo "Invalid selection."
+    exit 1
+fi
+
+# Get the selected file (menu numbers are 1-based, the array is 0-based;
+# the 10# prefix keeps an entry such as "08" from being parsed as octal)
+selected_file="${files[$((10#$selection - 1))]}"
+
+echo "You selected: $selected_file"
+
+# Quote both paths so a launcher path containing spaces stays one argument
+ln -sf -- "$selected_file" "/home/dwemer/xtts-api-server/start.sh"
+
+
+
+
diff --git a/ddistro_install.sh b/ddistro_install.sh
@@ -0,0 +1,54 @@
+#!/bin/bash
+# Installs CHIM XTTS: creates the /home/dwemer/python-tts virtual environment,
+# installs the Python dependencies into it and starts the server once.
+
+# Everything below uses paths relative to the server checkout, so stop if it
+# cannot be entered.
+cd /home/dwemer/xtts-api-server || { echo "Error: cannot cd to xtts-api-server" >&2; exit 1; }
+
+# Without the environment the pip commands below would install elsewhere,
+# so a failed creation is fatal.
+python3 -m venv /home/dwemer/python-tts || { echo "Error: cannot create /home/dwemer/python-tts" >&2; exit 1; }
+source /home/dwemer/python-tts/bin/activate
+
+echo "This will take a while so please wait."
+
+# Ask user about GPU
+read -p "Are you using a GT10XX series GPU? (yes/no): " gpu_answer
+
+# "yes" or "y" in any letter case selects the cu118 wheels with torch 2.2.2;
+# every other answer selects the cu124 wheels with torch 2.4.0.
+case "$gpu_answer" in
+    [Yy][Ee][Ss] | [Yy])
+        cu_tag="cu118"
+        torch_ver="2.2.2"
+        ;;
+    *)
+        cu_tag="cu124"
+        torch_ver="2.4.0"
+        ;;
+esac
+
+# torchaudio uses the same version number as torch in both cases, and the
+# wheel index URL differs only by the CUDA tag.
+torchaudio_ver="$torch_ver"
+torch_url="https://download.pytorch.org/whl/${cu_tag}"
+
+# Upgrade pip, wheel, ninja and virtualenv before installing anything else
+python3 -m pip install --upgrade pip wheel ninja virtualenv
+# setuptools is pinned to an exact version
+# NOTE(review): the reason for this pin is not visible here -- confirm before changing it
+pip install setuptools==68.1.2
+# Install app requirements without auto-pulling torch/torchaudio from deps
+pip install --no-deps -r requirements.txt
+# Pin to stable, CUDA-tagged PyTorch/Torchaudio that do not require TorchCodec
+# (each "|| true" discards the exit status of a cleanup/check step)
+pip cache purge || true
+pip uninstall -y torch torchaudio torchcodec torchvision || true
+# --no-deps installs only the two pinned wheels, taken from the index in $torch_url
+pip install --no-deps --no-cache-dir --index-url "$torch_url" "torch==${torch_ver}+${cu_tag}" "torchaudio==${torchaudio_ver}+${cu_tag}"
+# Report dependency conflicts without acting on the result
+pip check || true
+# Ensure fallback audio loader is available
+pip install --no-cache-dir soundfile
+#pip install xtts-api-server #Fails
+
+# Patch the installed TTS package so the XTTS checkpoint is loaded with
+# weights_only=False. The file is located through the active interpreter's
+# site-packages directory instead of a hard-coded python3.11 path, so the
+# patch is also applied when the environment uses another Python version.
+xtts_py="$(python3 -c 'import sysconfig; print(sysconfig.get_paths()["purelib"])')/TTS/tts/models/xtts.py"
+if [ -f "$xtts_py" ]; then
+    sed -i 's/checkpoint = load_fsspec(model_path, map_location=torch.device("cpu"))\["model"\]/checkpoint = load_fsspec(model_path, map_location=torch.device("cpu"), weights_only=False)["model"]/' "$xtts_py"
+else
+    echo "Warning: $xtts_py not found, checkpoint loader was not patched" >&2
+fi
+
+# Provide the default narrator voice sample to the server's speakers folder
+cp /home/dwemer/TheNarrator.wav speakers/TheNarrator.wav
+
+source /home/dwemer/python-tts/bin/activate
+
+# Let the user choose which launcher start.sh should point to
+./conf.sh
+
+echo
+echo "This will start CHIM XTTS to download the selected model"
+echo "Wait for the message 'Uvicorn running on http://0.0.0.0:8020 (Press CTRL+C to quit)'"
+echo "Then close this window. Press ENTER to continue"
+read -r
+
+echo "please wait...."
+
+# Start the server once, using the same interpreter name (python3) as the
+# rest of this script
+python3 -m xtts_api_server --listen
+echo "Press Enter"