From 7beddd1398b27d428d4430df9a9d08b862b030d4 Mon Sep 17 00:00:00 2001 From: Sig <62321214+sigprogramming@users.noreply.github.com> Date: Tue, 5 Nov 2024 00:11:19 +0900 Subject: [PATCH 1/3] =?UTF-8?q?=E3=83=94=E3=83=83=E3=83=81=E7=94=9F?= =?UTF-8?q?=E6=88=90=E3=82=B9=E3=83=86=E3=83=BC=E3=82=B8=E3=82=92=E8=BF=BD?= =?UTF-8?q?=E5=8A=A0?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- src/store/singing.ts | 171 +++++++++++++++++++++++++++++++++++++++++-- src/store/type.ts | 30 ++++++++ 2 files changed, 193 insertions(+), 8 deletions(-) diff --git a/src/store/singing.ts b/src/store/singing.ts index 06fdc543f7..4089d96081 100644 --- a/src/store/singing.ts +++ b/src/store/singing.ts @@ -25,6 +25,8 @@ import { EditorFrameAudioQueryKey, EditorFrameAudioQuery, TrackParameters, + SingingPitchKey, + SingingPitch, } from "./type"; import { buildSongTrackAudioFileNameFromRawData, @@ -129,6 +131,7 @@ type PhraseRenderContext = Readonly<{ type PhraseRenderStageId = | "queryGeneration" + | "singingPitchGeneration" | "singingVolumeGeneration" | "singingVoiceSynthesis"; @@ -136,7 +139,7 @@ type PhraseRenderStageId = * フレーズレンダリングのステージのインターフェイス。 * フレーズレンダラー内で順に実行される。 */ -type PhraseRenderBaseStage = Readonly<{ +type PhraseRenderStage = Readonly<{ id: PhraseRenderStageId; /** @@ -172,6 +175,21 @@ type QuerySource = Readonly<{ keyRangeAdjustment: number; }>; +/** + * 歌唱ピッチの生成に必要なデータ + */ + +type SingingPitchSource = Readonly<{ + engineId: EngineId; + engineFrameRate: number; + tpqn: number; + tempos: Tempo[]; + firstRestDuration: number; + notes: Note[]; + keyRangeAdjustment: number; + queryForPitchGeneration: EditorFrameAudioQuery; +}>; + /** * 歌唱ボリュームの生成に必要なデータ */ @@ -381,6 +399,13 @@ const calculateQueryKey = async (querySource: QuerySource) => { return EditorFrameAudioQueryKey(hash); }; +const calculateSingingPitchKey = async ( + singingPitchSource: SingingPitchSource, +) => { + const hash = await calculateHash(singingPitchSource); + return SingingPitchKey(hash); +}; + const calculateSingingVolumeKey = async ( singingVolumeSource: SingingVolumeSource, ) => { @@ -545,6 +570,7 @@ const sequences = new Map(); const animationTimer = new AnimationTimer(); const queryCache = new Map(); +const singingPitchCache = new Map(); const singingVolumeCache = new Map(); const singingVoiceCache = new Map(); @@ -745,6 +771,7 @@ export const singingStoreState: SingingStoreState = { editorFrameRate: DEPRECATED_DEFAULT_EDITOR_FRAME_RATE, phrases: new Map(), phraseQueries: new Map(), + phraseSingingPitches: new Map(), phraseSingingVolumes: new Map(), sequencerZoomX: 0.5, sequencerZoomY: 0.75, @@ -1219,6 +1246,23 @@ export const singingStore = createPartialStore({ }, }, + SET_SINGING_PITCH_KEY_TO_PHRASE: { + mutation( + state, + { + phraseKey, + singingPitchKey, + }: { + phraseKey: PhraseKey; + singingPitchKey: SingingPitchKey | undefined; + }, + ) { + const phrase = getOrThrow(state.phrases, phraseKey); + + phrase.singingPitchKey = singingPitchKey; + }, + }, + SET_SINGING_VOLUME_KEY_TO_PHRASE: { mutation( state, @@ -1291,6 +1335,24 @@ export const singingStore = createPartialStore({ }, }, + SET_PHRASE_SINGING_PITCH: { + mutation( + state, + { + singingPitchKey, + singingPitch, + }: { singingPitchKey: SingingPitchKey; singingPitch: SingingPitch }, + ) { + state.phraseSingingPitches.set(singingPitchKey, singingPitch); + }, + }, + + DELETE_PHRASE_SINGING_PITCH: { + mutation(state, { singingPitchKey }: { singingPitchKey: SingingPitchKey }) { + state.phraseSingingPitches.delete(singingPitchKey); + }, + }, + SET_PHRASE_SINGING_VOLUME: { mutation( state, @@ -1809,9 +1871,7 @@ export const singingStore = createPartialStore({ } }; - const generateQuery = async ( - querySource: QuerySource, - ): Promise => { + const generateQuery = async (querySource: QuerySource) => { const notesForRequestToEngine = createNotesForRequestToEngine( querySource.firstRestDuration, lastRestDurationSeconds, @@ -1836,7 +1896,7 @@ export const singingStore = createPartialStore({ return query; }; - const queryGenerationStage: PhraseRenderBaseStage = { + const queryGenerationStage: PhraseRenderStage = { id: "queryGeneration", shouldBeExecuted: async (context: PhraseRenderContext) => { const track = getOrThrow(context.snapshot.tracks, context.trackId); @@ -1887,6 +1947,99 @@ export const singingStore = createPartialStore({ }, }; + const generateSingingPitchSource = ( + context: PhraseRenderContext, + ): SingingPitchSource => { + const track = getOrThrow(context.snapshot.tracks, context.trackId); + if (track.singer == undefined) { + throw new Error("track.singer is undefined."); + } + const phrase = getOrThrow(state.phrases, context.phraseKey); + const phraseQueryKey = phrase.queryKey; + if (phraseQueryKey == undefined) { + throw new Error("phraseQueryKey is undefined."); + } + const query = getOrThrow(state.phraseQueries, phraseQueryKey); + const clonedQuery = cloneWithUnwrapProxy(query); + // TODO: 音素タイミングの編集データの適用を行うようにする + return { + engineId: track.singer.engineId, + engineFrameRate: query.frameRate, + tpqn: context.snapshot.tpqn, + tempos: context.snapshot.tempos, + firstRestDuration: phrase.firstRestDuration, + notes: phrase.notes, + keyRangeAdjustment: track.keyRangeAdjustment, + queryForPitchGeneration: clonedQuery, + }; + }; + + const generateSingingPitch = async ( + singingPitchSource: SingingPitchSource, + ) => { + // TODO: ピッチ生成APIに対応する + return singingPitchSource.queryForPitchGeneration.f0; + }; + + const singingPitchGenerationStage: PhraseRenderStage = { + id: "singingPitchGeneration", + shouldBeExecuted: async (context: PhraseRenderContext) => { + const track = getOrThrow(context.snapshot.tracks, context.trackId); + if (track.singer == undefined) { + return false; + } + const phrase = getOrThrow(state.phrases, context.phraseKey); + const phraseSingingPitchKey = phrase.singingPitchKey; + const singingPitchSource = generateSingingPitchSource(context); + const singingPitchKey = + await calculateSingingPitchKey(singingPitchSource); + return ( + phraseSingingPitchKey == undefined || + phraseSingingPitchKey !== singingPitchKey + ); + }, + deleteExecutionResult: (context: PhraseRenderContext) => { + const phrase = getOrThrow(state.phrases, context.phraseKey); + const phraseSingingPitchKey = phrase.singingPitchKey; + if (phraseSingingPitchKey != undefined) { + mutations.DELETE_PHRASE_SINGING_PITCH({ + singingPitchKey: phraseSingingPitchKey, + }); + mutations.SET_SINGING_PITCH_KEY_TO_PHRASE({ + phraseKey: context.phraseKey, + singingPitchKey: undefined, + }); + } + }, + execute: async (context: PhraseRenderContext) => { + const singingPitchSource = generateSingingPitchSource(context); + const singingPitchKey = + await calculateSingingPitchKey(singingPitchSource); + + let singingPitch = singingPitchCache.get(singingPitchKey); + if (singingPitch != undefined) { + logger.info(`Loaded singing pitch from cache.`); + } else { + singingPitch = await generateSingingPitch(singingPitchSource); + logger.info(`Generated singing pitch.`); + singingPitchCache.set(singingPitchKey, singingPitch); + } + + const phrase = getOrThrow(state.phrases, context.phraseKey); + const phraseSingingPitchKey = phrase.singingPitchKey; + if (phraseSingingPitchKey != undefined) { + mutations.DELETE_PHRASE_SINGING_PITCH({ + singingPitchKey: phraseSingingPitchKey, + }); + } + mutations.SET_PHRASE_SINGING_PITCH({ singingPitchKey, singingPitch }); + mutations.SET_SINGING_PITCH_KEY_TO_PHRASE({ + phraseKey: context.phraseKey, + singingPitchKey, + }); + }, + }; + const generateSingingVolumeSource = ( context: PhraseRenderContext, ): SingingVolumeSource => { @@ -1899,6 +2052,7 @@ export const singingStore = createPartialStore({ if (phraseQueryKey == undefined) { throw new Error("phraseQueryKey is undefined."); } + // TODO: ピッチ生成ステージで生成したピッチを使用するようにする const query = getOrThrow(state.phraseQueries, phraseQueryKey); const clonedQuery = cloneWithUnwrapProxy(query); applyPitchEdit( @@ -1960,7 +2114,7 @@ export const singingStore = createPartialStore({ return singingVolume; }; - const singingVolumeGenerationStage: PhraseRenderBaseStage = { + const singingVolumeGenerationStage: PhraseRenderStage = { id: "singingVolumeGeneration", shouldBeExecuted: async (context: PhraseRenderContext) => { const track = getOrThrow(context.snapshot.tracks, context.trackId); @@ -2087,7 +2241,7 @@ export const singingStore = createPartialStore({ } }; - const singingVoiceSynthesisStage: PhraseRenderBaseStage = { + const singingVoiceSynthesisStage: PhraseRenderStage = { id: "singingVoiceSynthesis", shouldBeExecuted: async (context: PhraseRenderContext) => { const track = getOrThrow(context.snapshot.tracks, context.trackId); @@ -2142,8 +2296,9 @@ export const singingStore = createPartialStore({ }, }; - const stages: readonly PhraseRenderBaseStage[] = [ + const stages: readonly PhraseRenderStage[] = [ queryGenerationStage, + singingPitchGenerationStage, singingVolumeGenerationStage, singingVoiceSynthesisStage, ]; diff --git a/src/store/type.ts b/src/store/type.ts index 417b8e8329..53468402c6 100644 --- a/src/store/type.ts +++ b/src/store/type.ts @@ -750,6 +750,11 @@ export type PhraseState = */ export type EditorFrameAudioQuery = FrameAudioQuery & { frameRate: number }; +/** + * 歌唱ピッチ + */ +export type SingingPitch = number[]; + /** * 歌唱ボリューム */ @@ -770,6 +775,11 @@ export const EditorFrameAudioQueryKey = ( id: string, ): EditorFrameAudioQueryKey => editorFrameAudioQueryKeySchema.parse(id); +const singingPitchKeySchema = z.string().brand<"SingingPitchKey">(); +export type SingingPitchKey = z.infer; +export const SingingPitchKey = (id: string): SingingPitchKey => + singingPitchKeySchema.parse(id); + const singingVolumeKeySchema = z.string().brand<"SingingVolumeKey">(); export type SingingVolumeKey = z.infer; export const SingingVolumeKey = (id: string): SingingVolumeKey => @@ -794,6 +804,7 @@ export type Phrase = { startTime: number; state: PhraseState; queryKey?: EditorFrameAudioQueryKey; + singingPitchKey?: SingingPitchKey; singingVolumeKey?: SingingVolumeKey; singingVoiceKey?: SingingVoiceKey; sequenceId?: SequenceId; @@ -839,6 +850,7 @@ export type SingingStoreState = { editorFrameRate: number; phrases: Map; phraseQueries: Map; + phraseSingingPitches: Map; phraseSingingVolumes: Map; sequencerZoomX: number; sequencerZoomY: number; @@ -999,6 +1011,13 @@ export type SingingStoreTypes = { }; }; + SET_SINGING_PITCH_KEY_TO_PHRASE: { + mutation: { + phraseKey: PhraseKey; + singingPitchKey: SingingPitchKey | undefined; + }; + }; + SET_SINGING_VOLUME_KEY_TO_PHRASE: { mutation: { phraseKey: PhraseKey; @@ -1031,6 +1050,17 @@ export type SingingStoreTypes = { mutation: { queryKey: EditorFrameAudioQueryKey }; }; + SET_PHRASE_SINGING_PITCH: { + mutation: { + singingPitchKey: SingingPitchKey; + singingPitch: SingingPitch; + }; + }; + + DELETE_PHRASE_SINGING_PITCH: { + mutation: { singingPitchKey: SingingPitchKey }; + }; + SET_PHRASE_SINGING_VOLUME: { mutation: { singingVolumeKey: SingingVolumeKey; From 4badcb1883a0294b52b4e564d95576f489aad15c Mon Sep 17 00:00:00 2001 From: Hiroshiba Date: Tue, 5 Nov 2024 02:41:17 +0900 Subject: [PATCH 2/3] Apply suggestions from code review --- src/store/singing.ts | 1 - 1 file changed, 1 deletion(-) diff --git a/src/store/singing.ts b/src/store/singing.ts index 4089d96081..a198d6d0e7 100644 --- a/src/store/singing.ts +++ b/src/store/singing.ts @@ -178,7 +178,6 @@ type QuerySource = Readonly<{ /** * 歌唱ピッチの生成に必要なデータ */ - type SingingPitchSource = Readonly<{ engineId: EngineId; engineFrameRate: number; From 9e19a0994ac1050d7211fcc39b069be9b4781a2f Mon Sep 17 00:00:00 2001 From: Sig <62321214+sigprogramming@users.noreply.github.com> Date: Tue, 5 Nov 2024 21:38:28 +0900 Subject: [PATCH 3/3] =?UTF-8?q?=E3=82=A8=E3=83=A9=E3=83=BC=E3=82=92throw?= =?UTF-8?q?=E3=81=99=E3=82=8B=E3=82=88=E3=81=86=E3=81=AB=E3=81=97=E3=81=9F?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- src/store/singing.ts | 14 ++++++-------- 1 file changed, 6 insertions(+), 8 deletions(-) diff --git a/src/store/singing.ts b/src/store/singing.ts index a198d6d0e7..fe81e422ed 100644 --- a/src/store/singing.ts +++ b/src/store/singing.ts @@ -1936,7 +1936,7 @@ export const singingStore = createPartialStore({ const phrase = getOrThrow(state.phrases, context.phraseKey); const phraseQueryKey = phrase.queryKey; if (phraseQueryKey != undefined) { - mutations.DELETE_PHRASE_QUERY({ queryKey: phraseQueryKey }); + throw new Error("The previous query has not been removed."); } mutations.SET_PHRASE_QUERY({ queryKey, query }); mutations.SET_QUERY_KEY_TO_PHRASE({ @@ -2027,9 +2027,7 @@ export const singingStore = createPartialStore({ const phrase = getOrThrow(state.phrases, context.phraseKey); const phraseSingingPitchKey = phrase.singingPitchKey; if (phraseSingingPitchKey != undefined) { - mutations.DELETE_PHRASE_SINGING_PITCH({ - singingPitchKey: phraseSingingPitchKey, - }); + throw new Error("The previous singing pitch has not been removed."); } mutations.SET_PHRASE_SINGING_PITCH({ singingPitchKey, singingPitch }); mutations.SET_SINGING_PITCH_KEY_TO_PHRASE({ @@ -2160,9 +2158,9 @@ export const singingStore = createPartialStore({ const phrase = getOrThrow(state.phrases, context.phraseKey); const phraseSingingVolumeKey = phrase.singingVolumeKey; if (phraseSingingVolumeKey != undefined) { - mutations.DELETE_PHRASE_SINGING_VOLUME({ - singingVolumeKey: phraseSingingVolumeKey, - }); + throw new Error( + "The previous singing volume has not been removed.", + ); } mutations.SET_PHRASE_SINGING_VOLUME({ singingVolumeKey, @@ -2285,7 +2283,7 @@ export const singingStore = createPartialStore({ const phrase = getOrThrow(state.phrases, context.phraseKey); const phraseSingingVoiceKey = phrase.singingVoiceKey; if (phraseSingingVoiceKey != undefined) { - phraseSingingVoices.delete(phraseSingingVoiceKey); + throw new Error("The previous singing voice has not been removed."); } phraseSingingVoices.set(singingVoiceKey, singingVoice); mutations.SET_SINGING_VOICE_KEY_TO_PHRASE({