@comment{
  Technical report describing v.Connect, a singing synthesizer with
  user-controllable voice timbre (title and abstract are in Japanese,
  with an English abstract appended).

  Field notes:
  - author holds the three authors in Japanese script, family name first.
    author-romanized is not read by standard styles; it keeps the Latin
    spellings of the same three people, in the same order.
  - abstract holds the Japanese abstract followed by the English one.
    It is stored in abstract rather than note so that styles do not
    print it in the reference list.
  - number is the issue number supplied by the repository export.
  - TODO(review): institution is required for techreport entries but is
    not stated in this record. Presumably the Information Processing
    Society of Japan, judging by the OAI key; confirm before adding.
}
@techreport{oai:ipsj.ixsq.nii.ac.jp:00080366,
  author           = {小川, 真 and 矢崎, 俊志 and 阿部, 公輝},
  author-romanized = {Ogawa, Makoto and Yazaki, Syunji and Abe, Koki},
  title            = {{v.Connect}:ユーザが声色操作可能な歌声合成器},
  number           = {10},
  month            = jan,
  year             = {2012},
  abstract         = {VOCALOID 「初音ミク」 の発売以来,ユーザが自由に歌声ライブラリを制作できるフリーの歌声合成器 UTAU が開発されるなど,歌声合成への関心が高まっている.これら歌声合成器は主にアマチュアの音楽制作に使用されるが,ユーザが声色を任意時刻に混ぜて指定する機能がない.また,声色操作を行うことで処理時間やデータ量が大きくなる.本研究では音声合成分析系 WORLD を用い,メルケプストラムと Vorbis による励起信号からなるコーパスを声色別に収録し,各音素間を時間伸縮関数で接続することで,ユーザがモーフィング率を指定し声色を操作できる歌声合成器 v.Connect を開発した.提案手法を用いて歌声コーパス 「波音リツコネクト」 を制作した.このコーパスの容量は波形の 2 倍程度であった.合成速度は 1.7~2.2 倍と改善され,圧縮による劣化は主観的には感じられなかった., Since the release of Hatsune Miku, interets in singing synthesis increase. For example, a singing synthesis system, UTAU, has been developed as a freeware. Most of these systems, however, lack of the function that users can mix vocal tones at any times. Controling tonal changes in singing requires a large amount of time and data for synthesis. We have developed a singing synthesis system, v.Connect, which connects corresponding phonemes with a time-stretching function to enable users to control tonal changes in singing by specifying the rate of voice morphing. The system processes voice signals with WORLD, a voice synthesis and analysis system, and uses corpora of various tonal voices consisting of Mel cepstra and excitation signals compressed by Vorbis. We constructed a corpus, ”Namine Ritsu Connect”, using the proposed method. It was found that the size of the corpus was two times larger than that of raw waves, and that synthesis from the corpus was 1.7 to 2.2 times faster than that from raw waves. Degradation caused by compression was not sensed subjectively.},
}