Spaces:

microhum
/

Nurse_LLM_Demo

Sleeping

App Files Files Community

Titihinan Sobking committed on Dec 11, 2024

Commit

5bf324a

unverified ·

2 Parent(s): 982f969 e05a344

Merge pull request #1 from Ohmmykung09/main

Browse files

Files changed (8) hide show

.env_template +3 -1
.gitignore +167 -2
__pycache__/main.cpython-311.pyc +0 -0
llm/__pycache__/basemodel.cpython-311.pyc +0 -0
llm/__pycache__/client.cpython-311.pyc +0 -0
llm/__pycache__/llm.cpython-311.pyc +0 -0
llm/__pycache__/prompt.cpython-311.pyc +0 -0
tts/tts.py +186 -0

.env_template CHANGED Viewed

@@ -1,2 +1,4 @@
 TYPHOON_CHAT_API = *
-OPENTHAIGPT_CHAT_API = *

 TYPHOON_CHAT_API = *
+OPENTHAIGPT_CHAT_API = *
+BOTNOI_API_TOKEN = *
+VAJA9_API_KEY = *

.gitignore CHANGED Viewed

@@ -1,3 +1,168 @@
-.venv
 .env
-__pycache__

+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+# C extensions
+*.so
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+share/python-wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+# PyInstaller
+#  Usually these files are written by a python script from a template
+#  before PyInstaller builds the exe, so as to inject date/other infos into it.
+*.manifest
+*.spec
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.nox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+*.py,cover
+.hypothesis/
+.pytest_cache/
+cover/
+# Translations
+*.mo
+*.pot
+# Django stuff:
+*.log
+local_settings.py
+db.sqlite3
+db.sqlite3-journal
+# Flask stuff:
+instance/
+.webassets-cache
+# Scrapy stuff:
+.scrapy
+# Sphinx documentation
+docs/_build/
+# PyBuilder
+.pybuilder/
+target/
+# Jupyter Notebook
+.ipynb_checkpoints
+# IPython
+profile_default/
+ipython_config.py
+# pyenv
+#   For a library or package, you might want to ignore these files since the code is
+#   intended to run in multiple environments; otherwise, check them in:
+# .python-version
+# pipenv
+#   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
+#   However, in case of collaboration, if having platform-specific dependencies or dependencies
+#   having no cross-platform support, pipenv may install dependencies that don't work, or not
+#   install all needed dependencies.
+#Pipfile.lock
+# UV
+#   Similar to Pipfile.lock, it is generally recommended to include uv.lock in version control.
+#   This is especially recommended for binary packages to ensure reproducibility, and is more
+#   commonly ignored for libraries.
+#uv.lock
+# poetry
+#   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
+#   This is especially recommended for binary packages to ensure reproducibility, and is more
+#   commonly ignored for libraries.
+#   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
+#poetry.lock
+# pdm
+#   Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
+#pdm.lock
+#   pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
+#   in version control.
+#   https://pdm.fming.dev/latest/usage/project/#working-with-version-control
+.pdm.toml
+.pdm-python
+.pdm-build/
+# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
+__pypackages__/
+# Celery stuff
+celerybeat-schedule
+celerybeat.pid
+# SageMath parsed files
+*.sage.py
+# Environments
 .env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+# Spyder project settings
+.spyderproject
+.spyproject
+# Rope project settings
+.ropeproject
+# mkdocs documentation
+/site
+# mypy
+.mypy_cache/
+.dmypy.json
+dmypy.json
+# Pyre type checker
+.pyre/
+# pytype static type analyzer
+.pytype/
+# Cython debug symbols
+cython_debug/
+# PyCharm
+#  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
+#  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
+#  and can be added to the global gitignore or merged into this file.  For a more nuclear
+#  option (not recommended) you can uncomment the following to ignore the entire idea folder.
+#.idea/

__pycache__/main.cpython-311.pyc DELETED Viewed

Binary file (2.97 kB)

llm/__pycache__/basemodel.cpython-311.pyc DELETED Viewed

Binary file (3.48 kB)

llm/__pycache__/client.cpython-311.pyc DELETED Viewed

Binary file (3.69 kB)

llm/__pycache__/llm.cpython-311.pyc DELETED Viewed

Binary file (9.32 kB)

llm/__pycache__/prompt.cpython-311.pyc DELETED Viewed

Binary file (22 kB)

tts/tts.py ADDED Viewed

	@@ -0,0 +1,186 @@

+from fastapi import FastAPI, HTTPException
+from pythainlp.tokenize import sent_tokenize
+from pydantic import BaseModel , Field
+import requests
+from fastapi.responses import FileResponse
+import uuid
+from dotenv import load_dotenv
+import os
+# Load environment variables (via python-dotenv) before the definitions below read them with os.getenv
+load_dotenv()
+# Application object that the @app.post endpoints in this module register on
+app = FastAPI()
+# Pydantic model for input validation
+class VoiceRequest(BaseModel):
+    """Request body accepted by the Botnoi voice-generation endpoint.
+
+    Only ``text`` is required. The remaining fields are passed through to
+    Botnoi's ``generate_voice`` API; their exact meaning is defined by that
+    API (NOTE(review): confirm the allowed values against the Botnoi docs).
+    """
+    # Text to synthesize.
+    text: str
+    audio_id: str = "EUOJF"
+    speaker: str = "52"
+    volume: int = 100
+    speed: float = 1
+    type_media: str = "mp3"
+    language: str = "th"
+    # The token falls back to the server's BOTNOI_API_TOKEN. A default_factory
+    # is used instead of a plain default so the secret is looked up per request
+    # and is not embedded as a static default in the generated OpenAPI schema.
+    token: str = Field(default_factory=lambda: os.getenv("BOTNOI_API_TOKEN"))
+# Function to split text for text delay
+def auto_generate_text_delay_with_pythainlp(text):
+    """Build the ``text_delay`` string for *text*.
+
+    The text is split into sentences with PyThaiNLP's ``sent_tokenize``
+    (``thaisum`` engine); the sentences are then re-joined with single spaces
+    and surrounding whitespace is stripped.
+    """
+    sentences = sent_tokenize(text, engine="thaisum")
+    return " ".join(sentences).strip()
+# Function to call Botnoi's API to generate voice
+def generate_voice(audio_id, text, text_delay, speaker, volume, speed, type_media, language, token):
+    """Ask Botnoi's voice API to synthesize *text* and return the audio URL.
+
+    All arguments are forwarded in the JSON payload (``volume`` and ``speed``
+    as strings); ``token`` is sent as a Bearer token.
+
+    Returns:
+        The value of the ``data`` key of the JSON response (the URL of the
+        generated audio).
+
+    Raises:
+        HTTPException: 504 on a read timeout, 502 on any other transport
+            error or a non-JSON reply, the upstream status code when it is
+            not 200, and 500 when the reply carries no ``data`` key.
+    """
+    url = "https://api-genvoice.botnoi.ai/voice/v1/generate_voice?provider=botnoivoice"
+    headers = {
+        "Accept": "application/json, text/plain, */*",
+        "Authorization": f"Bearer {token}",
+        "Content-Type": "application/json",
+    }
+    payload = {
+        "audio_id": audio_id,
+        "text": text,
+        "text_delay": text_delay,
+        "speaker": speaker,
+        "volume": str(volume),
+        "speed": str(speed),
+        "type_media": type_media,
+        "language": language,
+    }
+    # Without a timeout requests waits forever on a stalled upstream; use the
+    # same 60 s budget and error mapping as the VAJA9 helpers in this module.
+    try:
+        response = requests.post(url, headers=headers, json=payload, timeout=60)
+    except requests.exceptions.ReadTimeout as e:
+        raise HTTPException(status_code=504, detail="Gateway Timeout - The server took too long to respond") from e
+    except requests.exceptions.RequestException as e:
+        raise HTTPException(status_code=502, detail=f"Bad Gateway - Connection error: {str(e)}") from e
+    if response.status_code != 200:
+        raise HTTPException(status_code=response.status_code, detail="Voice generation failed")
+    try:
+        data = response.json()
+    except ValueError as e:
+        # A 200 reply whose body is not JSON is an upstream fault, not ours.
+        raise HTTPException(status_code=502, detail="Bad Gateway - Voice service returned a non-JSON response") from e
+    if isinstance(data, dict) and "data" in data:
+        return data["data"]  # URL of the generated audio
+    message = data.get("message", "Unknown error") if isinstance(data, dict) else "Unknown error"
+    raise HTTPException(status_code=500, detail=message)
+# Function to download MP3 from a URL
+def download_mp3(url, output_path):
+    """Stream the audio at *url* into the file *output_path*.
+
+    Raises:
+        HTTPException: 504 on a read timeout, 502 on any other transport
+            error, or the upstream status code when the download is refused.
+    """
+    headers = {
+        "Accept-Encoding": "identity;q=1, *;q=0",
+        "Range": "bytes=0-",
+        "Referer": "https://voice.botnoi.ai/",
+    }
+    try:
+        # The context manager releases the streamed connection even on errors.
+        with requests.get(url, headers=headers, stream=True, timeout=60) as response:
+            # The request carries "Range: bytes=0-", so a server that honours
+            # ranges answers 206 Partial Content with the complete body;
+            # treat it as success just like a plain 200.
+            if response.status_code not in (200, 206):
+                raise HTTPException(status_code=response.status_code, detail="Failed to download MP3")
+            with open(output_path, "wb") as file:
+                for chunk in response.iter_content(chunk_size=1024):
+                    if chunk:  # Filter out keep-alive chunks
+                        file.write(chunk)
+    except requests.exceptions.ReadTimeout as e:
+        raise HTTPException(status_code=504, detail="Gateway Timeout - The server took too long to respond") from e
+    except requests.exceptions.RequestException as e:
+        raise HTTPException(status_code=502, detail=f"Bad Gateway - Connection error: {str(e)}") from e
+# FastAPI endpoint to generate and download voice
+@app.post("/generate_voice_botnoi/")
+def generate_voice_endpoint(request: VoiceRequest):
+    """Synthesize ``request.text`` with Botnoi and return the audio as a download.
+
+    The audio is first saved to a uniquely named file in the working
+    directory; that file is deleted once the response has been sent (or
+    immediately if the download fails), so requests do not pile up files.
+
+    Raises:
+        HTTPException: propagated from ``generate_voice`` / ``download_mp3``.
+    """
+    from fastapi import BackgroundTasks
+
+    text_delay = auto_generate_text_delay_with_pythainlp(request.text)
+    audio_url = generate_voice(
+        audio_id=request.audio_id,
+        text=request.text,
+        text_delay=text_delay,
+        speaker=request.speaker,
+        volume=request.volume,
+        speed=request.speed,
+        type_media=request.type_media,
+        language=request.language,
+        token=request.token,
+    )
+    # Generate unique filename for the MP3
+    output_file = f"{uuid.uuid4()}.mp3"
+    try:
+        download_mp3(audio_url, output_file)
+    except Exception:
+        # Do not leave a partially written file behind on a failed download.
+        try:
+            os.remove(output_file)
+        except FileNotFoundError:
+            pass
+        raise
+    # Remove the temporary file after the response body has been streamed.
+    cleanup = BackgroundTasks()
+    cleanup.add_task(os.remove, output_file)
+    return FileResponse(output_file, media_type="audio/mpeg", filename="output.mp3", background=cleanup)
+# -----------------------------------------------------------VAJA9-----------------------------------------------------------
+# VAJA9 Voice Generation
+class Vaja9Request(BaseModel):
+    # Request body for the VAJA9 endpoint: only `text` is required, the other
+    # fields are passed to the VAJA9 synthesis API with the defaults below.
+    text: str
+    speaker: int = Field(default=1)
+    phrase_break: int = Field(default=0)
+    audiovisual: int = Field(default=0)
+def split_text_into_chunks(text: str, chunk_size: int = 20) -> list:
+    """Split *text* into chunks of at most *chunk_size* whitespace-separated words.
+
+    Words are re-joined with single spaces, so runs of whitespace are
+    normalized. Empty or whitespace-only text yields an empty list.
+
+    Raises:
+        ValueError: if *chunk_size* is smaller than 1.
+    """
+    # NOTE(review): str.split() only separates on whitespace, so text written
+    # without spaces between words (common in Thai) stays a single "word".
+    if chunk_size < 1:
+        # A zero step makes range() fail with an unrelated message, and a
+        # negative one would silently return [] and drop the whole text.
+        raise ValueError("chunk_size must be a positive integer")
+    words = text.split()
+    return [' '.join(words[start:start + chunk_size]) for start in range(0, len(words), chunk_size)]
+def generate_vaja9_voice(text: str, speaker: int, phrase_break: int, audiovisual: int):
+    """Request speech synthesis from the VAJA9 API and return the WAV URL.
+
+    The API key is read from the ``VAJA9_API_KEY`` environment variable.
+
+    Returns:
+        The ``wav_url`` value of the JSON response.
+
+    Raises:
+        HTTPException: 504 on a read timeout; 502 on any other transport
+            error, an upstream 502, or a 200 reply without a usable
+            ``wav_url``; otherwise the upstream status code.
+    """
+    url = 'https://api.aiforthai.in.th/vaja9/synth_audiovisual'
+    headers = {
+        'Apikey': os.getenv("VAJA9_API_KEY"),
+        'Content-Type': 'application/json'
+    }
+    data = {
+        'input_text': text,
+        'speaker': speaker,
+        'phrase_break': phrase_break,
+        'audiovisual': audiovisual
+    }
+    try:
+        response = requests.post(url, json=data, headers=headers, timeout=60)  # Increased timeout to 60 seconds
+    except requests.exceptions.ReadTimeout as e:
+        raise HTTPException(status_code=504, detail="Gateway Timeout - The server took too long to respond") from e
+    except requests.exceptions.RequestException as e:
+        raise HTTPException(status_code=502, detail=f"Bad Gateway - Connection error: {str(e)}") from e
+    if response.status_code == 502:
+        raise HTTPException(status_code=502, detail="Bad Gateway - The server received an invalid response from the upstream server")
+    if response.status_code != 200:
+        raise HTTPException(status_code=response.status_code, detail="Voice generation failed")
+    try:
+        return response.json()['wav_url']
+    except (ValueError, KeyError, TypeError) as e:
+        # A 200 reply that is not JSON, or lacks 'wav_url', is an upstream
+        # fault; report it explicitly instead of leaking a raw KeyError.
+        raise HTTPException(status_code=502, detail="Bad Gateway - VAJA9 response did not contain a wav_url") from e
+def download_vaja9_wav(url: str, output_path: str):
+    """Fetch the WAV at *url* (authenticated with ``VAJA9_API_KEY``) into *output_path*.
+
+    Raises:
+        HTTPException: 504 on a read timeout, 502 on other request errors or
+            an upstream 502, otherwise the upstream status code when the
+            download does not return 200.
+    """
+    auth_headers = {'Apikey': os.getenv("VAJA9_API_KEY")}
+    try:
+        response = requests.get(url, headers=auth_headers, timeout=60)  # Increased timeout to 60 seconds
+        status = response.status_code
+        # Guard clauses: reject every non-200 reply before touching the disk.
+        if status == 502:
+            raise HTTPException(status_code=502, detail="Bad Gateway - The server received an invalid response from the upstream server")
+        if status != 200:
+            raise HTTPException(status_code=status, detail="Failed to download WAV")
+        with open(output_path, 'wb') as wav_file:
+            wav_file.write(response.content)
+    except requests.exceptions.ReadTimeout:
+        raise HTTPException(status_code=504, detail="Gateway Timeout - The server took too long to respond")
+    except requests.exceptions.RequestException as e:
+        raise HTTPException(status_code=502, detail=f"Bad Gateway - Connection error: {str(e)}")
+def _remove_files(paths):
+    """Delete every file in *paths*; files that cannot be removed are skipped."""
+    for path in paths:
+        try:
+            os.remove(path)
+        except OSError:
+            # Best-effort cleanup of temporary audio; nothing useful to report.
+            pass
+def _concat_wav_files(input_paths, output_path):
+    """Concatenate the PCM WAV files *input_paths*, in order, into *output_path*.
+
+    Raises ``wave.Error`` when a file cannot be parsed or the files do not
+    share channel count, sample width and frame rate. No partial output file
+    is left behind on failure.
+    """
+    import wave
+
+    try:
+        with wave.open(output_path, "wb") as combined:
+            audio_format = None
+            for path in input_paths:
+                with wave.open(path, "rb") as part:
+                    part_format = (part.getnchannels(), part.getsampwidth(), part.getframerate())
+                    if audio_format is None:
+                        # The first chunk defines the format of the output.
+                        audio_format = part_format
+                        combined.setnchannels(part_format[0])
+                        combined.setsampwidth(part_format[1])
+                        combined.setframerate(part_format[2])
+                    elif part_format != audio_format:
+                        raise wave.Error("WAV chunks do not share one audio format")
+                    combined.writeframes(part.readframes(part.getnframes()))
+    except Exception:
+        _remove_files([output_path])
+        raise
+@app.post("/generate_voice_vaja9/")
+def generate_voice_vaja9_endpoint(request: Vaja9Request):
+    """Synthesize ``request.text`` with VAJA9 and return it as one WAV download.
+
+    The text is split into chunks of 20 words, each chunk is synthesized and
+    downloaded separately, and the resulting WAV files are concatenated. If
+    the chunks cannot be merged (unparsable or mismatched WAV data), the first
+    chunk alone is returned. Temporary files are removed once they are no
+    longer needed; the returned file is deleted after the response is sent.
+
+    Raises:
+        HTTPException: 400 when the text contains no words; errors from the
+            VAJA9 helpers are propagated; anything unexpected becomes a 502.
+    """
+    import wave
+    from fastapi import BackgroundTasks
+
+    # Split text into chunks of 20 words if needed
+    text_chunks = split_text_into_chunks(request.text)
+    if not text_chunks:
+        # Blank input used to surface as a 502 "list index out of range".
+        raise HTTPException(status_code=400, detail="Text must not be empty")
+    chunk_files = []
+    try:
+        # Process each chunk
+        for chunk in text_chunks:
+            audio_url = generate_vaja9_voice(
+                text=chunk,
+                speaker=request.speaker,
+                phrase_break=request.phrase_break,
+                audiovisual=request.audiovisual
+            )
+            # Generate unique filename for each chunk; register it before the
+            # download so a failed download is still cleaned up below.
+            chunk_file = f"{uuid.uuid4()}.wav"
+            chunk_files.append(chunk_file)
+            download_vaja9_wav(audio_url, chunk_file)
+        if len(chunk_files) == 1:
+            result_file = chunk_files.pop()
+        else:
+            result_file = f"{uuid.uuid4()}.wav"
+            try:
+                _concat_wav_files(chunk_files, result_file)
+            except (wave.Error, EOFError):
+                # Merging failed: fall back to returning only the first chunk.
+                result_file = chunk_files.pop(0)
+    except HTTPException:
+        raise
+    except Exception as e:
+        raise HTTPException(status_code=502, detail=f"Bad Gateway - Unexpected error: {str(e)}")
+    finally:
+        # Whatever is still listed here is not the file being returned.
+        _remove_files(chunk_files)
+    # Delete the returned file after the response body has been sent.
+    cleanup = BackgroundTasks()
+    cleanup.add_task(os.remove, result_file)
+    return FileResponse(result_file, media_type="audio/wav", filename="output.wav", background=cleanup)