Adding ffmpeg formatting

This commit is contained in:
Nik Afiq 2024-11-21 11:19:51 +09:00
parent 4a48507014
commit 2e64dc0b64
3 changed files with 16 additions and 21 deletions

10
.gitignore vendored
View File

@@ -1,2 +1,12 @@
app.log app.log
.DS_Store .DS_Store
__pycache__/commons.cpython-312.pyc
__pycache__/constant.cpython-312.pyc
models/__pycache__/attentions.cpython-312.pyc
models/__pycache__/models.cpython-312.pyc
models/__pycache__/modules.cpython-312.pyc
models/__pycache__/transforms.cpython-312.pyc
models/__pycache__/utils.cpython-312.pyc
monotonic_align/__pycache__/__init__.cpython-312.pyc
text/__pycache__/__init__.cpython-312.pyc
text/__pycache__/cleaners.cpython-312.pyc

12
app.py
View File

@@ -1,7 +1,6 @@
import torch import torch
from torch import LongTensor, no_grad from torch import LongTensor, no_grad
import soundfile as sf import soundfile as sf
import base64
import commons import commons
from models import utils from models import utils
from io import BytesIO from io import BytesIO
@@ -12,8 +11,9 @@ from flask import Flask, request, jsonify, send_file
import threading import threading
from constant import speakerList from constant import speakerList
import logging import logging
import imageio_ffmpeg
from pydub import AudioSegment from pydub import AudioSegment
from pydub.utils import which
app = Flask(__name__) app = Flask(__name__)
@@ -51,12 +51,8 @@ umas_name_to_id = {name: int(idx) for idx, name in umas.items()}
# Define a lock for thread-safe model inference # Define a lock for thread-safe model inference
model_lock = threading.Lock() model_lock = threading.Lock()
# Explicitly Set FFmpeg Path for Pydub # Set FFmpeg Path for Pydub
AudioSegment.converter = "/usr/bin/ffmpeg" AudioSegment.converter = imageio_ffmpeg.get_ffmpeg_exe()
# Debug: Print the resolved path of ffmpeg
print("FFmpeg path:", which("ffmpeg"))
def get_text(text, hps): def get_text(text, hps):
""" """

View File

@@ -5,25 +5,15 @@ Cython==3.0.11
filelock==3.16.1 filelock==3.16.1
Flask==3.1.0 Flask==3.1.0
fsspec==2024.10.0 fsspec==2024.10.0
imageio-ffmpeg==0.5.1
itsdangerous==2.2.0 itsdangerous==2.2.0
Jinja2==3.1.4 Jinja2==3.1.4
MarkupSafe==3.0.2 MarkupSafe==3.0.2
mpmath==1.3.0 mpmath==1.3.0
networkx==3.4.2 networkx==3.4.2
numpy==2.1.3 numpy==2.1.3
nvidia-cublas-cu12==12.4.5.8
nvidia-cuda-cupti-cu12==12.4.127
nvidia-cuda-nvrtc-cu12==12.4.127
nvidia-cuda-runtime-cu12==12.4.127
nvidia-cudnn-cu12==9.1.0.70
nvidia-cufft-cu12==11.2.1.3
nvidia-curand-cu12==10.3.5.147
nvidia-cusolver-cu12==11.6.1.9
nvidia-cusparse-cu12==12.3.1.170
nvidia-nccl-cu12==2.21.5
nvidia-nvjitlink-cu12==12.4.127
nvidia-nvtx-cu12==12.4.127
pycparser==2.22 pycparser==2.22
pydub==0.25.1
pyopenjtalk==0.3.4 pyopenjtalk==0.3.4
scipy==1.14.1 scipy==1.14.1
setuptools==75.5.0 setuptools==75.5.0
@@ -31,7 +21,6 @@ soundfile==0.12.1
sympy==1.13.1 sympy==1.13.1
torch==2.5.1 torch==2.5.1
tqdm==4.67.0 tqdm==4.67.0
triton==3.1.0
typing_extensions==4.12.2 typing_extensions==4.12.2
Unidecode==1.3.8 Unidecode==1.3.8
Werkzeug==3.1.3 Werkzeug==3.1.3