% Technical report (2024) on generating multilayer dynamic band-noise voices
% with a modified WORLD vocoder, for experiments on voice pitch perception.
%
% Maintenance notes:
%   - The abstract (Japanese text followed by its English translation) is kept
%     in the `abstract` field so that bibliography styles do not print it, as
%     they would if it were stored in `note`.
%   - `number` holds the value that the repository export supplied as `issue`.
%     NOTE(review): confirm that 49 is the report/issue number of the series.
%   - NOTE(review): techreport entries require an `institution` field, which
%     the exported record does not provide. The citation key suggests the IPSJ
%     repository; confirm the publisher and add the field.
%   - The fields contain UTF-8 Japanese text; presumably this file is processed
%     with Biber or (u)pBibTeX rather than 8-bit BibTeX -- TODO confirm.
@techreport{oai:ipsj.ixsq.nii.ac.jp:00234736,
  author   = {内田, 照久 and 森勢, 将雅},
  title    = {「歌う雑音」:{Phantom Skeleton}方式による多層動的バンドノイズ音声},
  number   = {49},
  year     = {2024},
  month    = jun,
  abstract = {音の高さの知覚を説明するためのピッチ知覚の聴覚モデルが提案されている.そこでは,音の時間的な周期性が重要だとする時間説と,高調波成分を検出する感覚器に軸足を置く周波数説(場所説)とが,長年,議論を戦わせてきた.今回,本研究では声のピッチ知覚の研究のための実験用音声の生成を試みた.音声分析合成 vocoder: WORLD を改変し,通常音声から抽出したスペクトルを白色雑音で駆動した多層動的バンドノイズ音声を生成した.これは周期性が存在しない雑音であるが,調波構造状のスペクトルを備えた動的な帯域雑音となる.評価実験で素材に歌声を用いて,(1) 単純再合成音声,(2) スペクトル包絡を雑音駆動した疑似ささやき声,(3) 調波構造状の多層動的バンドノイズ音声,(4) 基本周波数を移調した歌声を元にした多層動的バンドノイズ音声を準備した.そして,聴覚実験によって調波構造状のエネルギーの集中からピッチを感じるかどうか検証した., An auditory model of pitch perception has been proposed to explain the perception of sound pitch. For decades, a significant debate has raged between the temporal theory, which asserts the temporal periodicity of sound as crucial, and the frequency theory (place theory), which is grounded in the sensory organs that detect harmonic components. In this study, we attempted to generate experimental voices to study voice pitch perception. A voice analysis synthesis vocoder, WORLD, was modified to generate a multilayer dynamic band noise voice with a spectrum extracted from ordinary speech and driven by white noise. This noise has no periodicity, but a dynamic band noise with a harmonic structure-like spectrum. In the evaluation experiment, we used singing voices as materials. We prepared (1) a simple resynthesized voice, (2) a pseudo-whispering voice with noise-vocoded spectral envelope, (3) a multilayered dynamic band noise voice with the harmonic structure preserved, and (4) a multilayered dynamic band noise voice based on singing voices transposed by a constant multiplication of the fundamental frequency. Subsequently, we conducted auditory experiments with the aim of confirming whether pitch perception is influenced by the concentration of energy in the harmonic structure.},
}