-
Notifications
You must be signed in to change notification settings - Fork 205
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
整理: キャラクター情報機能を API Router でモジュール化 (#1159)
* refactor: キャラクター情報 APIs をモジュール化 * fix: lint * fix: `router` 名を明瞭化 * character->speaker --------- Co-authored-by: Hiroshiba Kazuyuki <[email protected]>
- Loading branch information
Showing
2 changed files
with
171 additions
and
153 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,167 @@ | ||
"""話者情報機能を提供する API Router""" | ||
|
||
import base64 | ||
import json | ||
from pathlib import Path | ||
from typing import Callable, Literal | ||
|
||
from fastapi import APIRouter, HTTPException | ||
from pydantic import parse_obj_as | ||
|
||
from voicevox_engine.core.core_adapter import CoreAdapter | ||
from voicevox_engine.metas.MetasStore import MetasStore, filter_speakers_and_styles | ||
from voicevox_engine.model import Speaker, SpeakerInfo | ||
|
||
|
||
def b64encode_str(s: bytes) -> str: | ||
return base64.b64encode(s).decode("utf-8") | ||
|
||
|
||
def generate_router( | ||
get_core: Callable[[str | None], CoreAdapter], | ||
metas_store: MetasStore, | ||
root_dir: Path, | ||
) -> APIRouter: | ||
"""話者情報 API Router を生成する""" | ||
router = APIRouter() | ||
|
||
@router.get("/speakers", response_model=list[Speaker], tags=["その他"]) | ||
def speakers( | ||
core_version: str | None = None, | ||
) -> list[Speaker]: | ||
speakers = metas_store.load_combined_metas(get_core(core_version)) | ||
return filter_speakers_and_styles(speakers, "speaker") | ||
|
||
@router.get("/speaker_info", response_model=SpeakerInfo, tags=["その他"]) | ||
def speaker_info( | ||
speaker_uuid: str, | ||
core_version: str | None = None, | ||
) -> SpeakerInfo: | ||
""" | ||
指定されたspeaker_uuidに関する情報をjson形式で返します。 | ||
画像や音声はbase64エンコードされたものが返されます。 | ||
""" | ||
return _speaker_info( | ||
speaker_uuid=speaker_uuid, | ||
speaker_or_singer="speaker", | ||
core_version=core_version, | ||
) | ||
|
||
# FIXME: この関数をどこかに切り出す | ||
def _speaker_info( | ||
speaker_uuid: str, | ||
speaker_or_singer: Literal["speaker", "singer"], | ||
core_version: str | None, | ||
) -> SpeakerInfo: | ||
# エンジンに含まれる話者メタ情報は、次のディレクトリ構造に従わなければならない: | ||
# {root_dir}/ | ||
# speaker_info/ | ||
# {speaker_uuid_0}/ | ||
# policy.md | ||
# portrait.png | ||
# icons/ | ||
# {id_0}.png | ||
# {id_1}.png | ||
# ... | ||
# portraits/ | ||
# {id_0}.png | ||
# {id_1}.png | ||
# ... | ||
# voice_samples/ | ||
# {id_0}_001.wav | ||
# {id_0}_002.wav | ||
# {id_0}_003.wav | ||
# {id_1}_001.wav | ||
# ... | ||
# {speaker_uuid_1}/ | ||
# ... | ||
|
||
# 該当話者の検索 | ||
speakers = parse_obj_as( | ||
list[Speaker], json.loads(get_core(core_version).speakers) | ||
) | ||
speakers = filter_speakers_and_styles(speakers, speaker_or_singer) | ||
for i in range(len(speakers)): | ||
if speakers[i].speaker_uuid == speaker_uuid: | ||
speaker = speakers[i] | ||
break | ||
else: | ||
raise HTTPException(status_code=404, detail="該当する話者が見つかりません") | ||
|
||
try: | ||
speaker_path = root_dir / "speaker_info" / speaker_uuid | ||
# 話者情報の取得 | ||
# speaker policy | ||
policy_path = speaker_path / "policy.md" | ||
policy = policy_path.read_text("utf-8") | ||
# speaker portrait | ||
portrait_path = speaker_path / "portrait.png" | ||
portrait = b64encode_str(portrait_path.read_bytes()) | ||
# スタイル情報の取得 | ||
style_infos = [] | ||
for style in speaker.styles: | ||
id = style.id | ||
# style icon | ||
style_icon_path = speaker_path / "icons" / f"{id}.png" | ||
icon = b64encode_str(style_icon_path.read_bytes()) | ||
# style portrait | ||
style_portrait_path = speaker_path / "portraits" / f"{id}.png" | ||
style_portrait = None | ||
if style_portrait_path.exists(): | ||
style_portrait = b64encode_str(style_portrait_path.read_bytes()) | ||
# voice samples | ||
voice_samples = [ | ||
b64encode_str( | ||
( | ||
speaker_path | ||
/ "voice_samples/{}_{}.wav".format(id, str(j + 1).zfill(3)) | ||
).read_bytes() | ||
) | ||
for j in range(3) | ||
] | ||
style_infos.append( | ||
{ | ||
"id": id, | ||
"icon": icon, | ||
"portrait": style_portrait, | ||
"voice_samples": voice_samples, | ||
} | ||
) | ||
except FileNotFoundError: | ||
import traceback | ||
|
||
traceback.print_exc() | ||
raise HTTPException( | ||
status_code=500, detail="追加情報が見つかりませんでした" | ||
) | ||
|
||
ret_data = SpeakerInfo( | ||
policy=policy, | ||
portrait=portrait, | ||
style_infos=style_infos, | ||
) | ||
return ret_data | ||
|
||
@router.get("/singers", response_model=list[Speaker], tags=["その他"]) | ||
def singers( | ||
core_version: str | None = None, | ||
) -> list[Speaker]: | ||
singers = metas_store.load_combined_metas(get_core(core_version)) | ||
return filter_speakers_and_styles(singers, "singer") | ||
|
||
@router.get("/singer_info", response_model=SpeakerInfo, tags=["その他"]) | ||
def singer_info( | ||
speaker_uuid: str, | ||
core_version: str | None = None, | ||
) -> SpeakerInfo: | ||
""" | ||
指定されたspeaker_uuidに関する情報をjson形式で返します。 | ||
画像や音声はbase64エンコードされたものが返されます。 | ||
""" | ||
return _speaker_info( | ||
speaker_uuid=speaker_uuid, | ||
speaker_or_singer="singer", | ||
core_version=core_version, | ||
) | ||
|
||
return router |