Explicitly add poetry export plugin; change docker compose example; speed up docker cache
Darwinkel · Feb 26, 2024 · 798956e · 798956e
1 parent 9f0cb3e
commit 798956e
Show file tree

Hide file tree

Showing 10 changed files with 22 additions and 18 deletions.
diff --git a/.github/workflows/build_docker_image.yml b/.github/workflows/build_docker_image.yml
@@ -23,6 +23,9 @@ jobs:
       - name: Install poetry
         run: curl -sSL https://install.python-poetry.org | python3 -
 
+      - name: Install poetry export plugin
+        run: poetry self add poetry-plugin-export
+
       - name: Export requirements
         run: poetry export -o requirements.txt --only main,deploy
 

diff --git a/Dockerfile b/Dockerfile
@@ -5,7 +5,7 @@ WORKDIR /usr/src/app
 RUN apt-get update && apt-get install -y ffmpeg
 
 COPY requirements.txt ./
-COPY code ./
 RUN pip install --no-cache-dir -r requirements.txt
 
+COPY code ./
 CMD [ "python", "./app.py" ]
diff --git a/README.md b/README.md
@@ -11,6 +11,9 @@ Most voices perform best when narrating medium-length sentences with medium-leng
 
 ![This paragraph is a good example of appropriate text input.](/examples/1708512151_ME2_f-player_f-Shepard.ogg)
 
+## Deployment
+GitHub Actions automatically builds a fresh image on every push to the `main` branch. See `docker-compose.example.yml` for an example of how to deploy it.
+
 ## History (and other experiments)
 I initially [fine-tuned SpeechT5](https://huggingface.co/learn/audio-course/chapter6/fine-tuning), but the results were disappointing. That model very frequently produced garbage and/or hallucinated output for most voices. Interestingly, it also had a very strong bias towards female speakers. 
 

diff --git a/code/app.py b/code/app.py
@@ -1,16 +1,14 @@
 """Gradio web interface for ShepardTTS."""
 
-import os
 import time
 from pathlib import Path
 
 import gradio as gr
 import numpy as np
-import torch
-from torchaudio.io import CodecConfig, StreamWriter
-
 import settings
+import torch
 from app_helpers import description, examples, links
+from torchaudio.io import CodecConfig, StreamWriter
 from utils import load_checkpoint, normalize_line
 
 model = load_checkpoint()
@@ -83,7 +81,7 @@ def predict(
     for sentence in out["wav"]:
         waveform = torch.cat((waveform, QUARTER_SECOND_PAUSE, sentence, QUARTER_SECOND_PAUSE))
 
-    base_filename = f"{os.environ['GRADIO_EXAMPLES_CACHE']}/{int(time.time())}_{character}"
+    base_filename = f"{settings.GRADIO_EXAMPLES_CACHE}/{int(time.time())}_{character}"
 
     if codec_format == "mp3":
         # Write compressed mp3
@@ -231,4 +229,4 @@ def predict(
     )
 
 demo.queue(max_size=10)
-demo.launch(debug=False, show_api=True, share=False, auth=("shepard", os.environ["SECRET_KEY"]))
+demo.launch(debug=False, show_api=True, share=False, auth=("shepard", settings.SECRET_KEY))
diff --git a/code/create_character_embeddings.py b/code/create_character_embeddings.py
@@ -3,7 +3,6 @@
 from pathlib import Path
 
 import torch
-
 from utils import load_checkpoint
 
 

diff --git a/code/create_dataset.py b/code/create_dataset.py
@@ -5,7 +5,6 @@
 import pandas as pd
 import soundfile
 from datasets import Audio, Dataset, concatenate_datasets
-
 from utils import normalize_line
 
 

diff --git a/code/inference.py b/code/inference.py
@@ -5,7 +5,6 @@
 import numpy as np
 import torch
 from torchaudio.io import StreamWriter
-
 from utils import load_checkpoint, normalize_line
 
 model = load_checkpoint()

diff --git a/code/settings.py b/code/settings.py
@@ -1,8 +1,12 @@
 """Contains some universal settings."""
+import os
 
 import torch
 
-CHECKPOINTS_CONFIG_JSON = "./current_model/config.json"
-CHECKPOINT_DIR = "./current_model"
-CHECKPOINT_VOCAB = "./current_model/vocab.json"
+CHECKPOINTS_CONFIG_JSON = "/xtts_model/config.json"
+CHECKPOINT_DIR = "/xtts_model/current_model"
+CHECKPOINT_VOCAB = "/xtts_model/current_model/vocab.json"
 DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
+
+GRADIO_EXAMPLES_CACHE = os.environ["GRADIO_EXAMPLES_CACHE"]
+SECRET_KEY = os.environ["SECRET_KEY"]
diff --git a/code/utils.py b/code/utils.py
@@ -2,12 +2,11 @@
 
 import re
 
+import settings
 from cleantext import clean
 from num2words import num2words
-from TTS.tts.configs.xtts_config import XttsConfig
-
-import settings
 from overrides import ShepardXtts
+from TTS.tts.configs.xtts_config import XttsConfig
 
 
 def load_checkpoint():

diff --git a/docker-compose.example.yml b/docker-compose.example.yml
@@ -2,11 +2,11 @@ version: '3.8'
 
 services:
   gradio:
-    build: .
+    image: "ghcr.io/darwinkel/shepardtts:main"
     ports:
       - "1337:1337"
     volumes:
-      - .:/usr/src/app
+      - ./current_model/:/xtts_model/:ro
     environment:
       GRADIO_EXAMPLES_CACHE: "/tmp/"
       GRADIO_ANALYTICS_ENABLED: False
Original file line number	Diff line number	Diff line change
Expand Up		@@ -3,7 +3,6 @@
		from pathlib import Path

		import torch

		from utils import load_checkpoint


Expand Down