{"created":"2021-03-01T06:33:46.366111+00:00","id":25726,"links":{},"metadata":{"_buckets":{"deposit":"9b0e3a6c-73f6-44a0-8221-85f5711323ff"},"_deposit":{"id":"25726","owners":[],"pid":{"revision_id":0,"type":"depid","value":"25726"},"status":"published"},"_oai":{"id":"oai:nagoya.repo.nii.ac.jp:00025726","sets":["435:671:672"]},"author_link":["76249","76250","76251"],"item_10_biblio_info_6":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2017-11-23","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"12","bibliographicPageEnd":"2350","bibliographicPageStart":"2337","bibliographicVolumeNumber":"25","bibliographic_titles":[{"bibliographic_title":"IEEE/ACM Transactions on Audio, Speech, and Language Processing","bibliographic_titleLang":"en"}]}]},"item_10_description_4":{"attribute_name":"抄録","attribute_value_mlt":[{"subitem_description":"In this paper, we present an innovative way of utilizing the natural relationship between speech sounds and articulatory movements by developing an articulatory controllable speech modification system. Specifically, we employ statistical acoustic-to-articulatory inversion mapping and articulatory-to-acoustic production mapping based on a Gaussian mixture model, allowing flexible modification of the model parameters and the independence of the text input features. Modification of an input speech signal through manipulation of the unobserved articulatory movements is achievable through a sequence of inversion and production mappings. To ensure the naturalness of articulatory movement trajectories, we introduce a method for manipulating articulatory parameters by considering their intercorrelation. Moreover, to generate high-quality modified speech sounds, we avoid the use of vocoder-based excitation generation by presenting several implementations of direct waveform modification capable of directly filtering an input speech signal using the differences in spectral parameters. The experimental results demonstrate that: 1) higher accuracy in the estimation of spectral parameters is achieved by using sequential inversion and production mappings than for conventional production mapping using measured articulatory parameters, 2) the method for manipulating articulatory parameters by considering their intercorrelation makes it possible to generate more natural trajectories of modified articulatory movements; 3) the implementations of the direct waveform modification method significantly improve the quality of modified speech sounds, even under varying speaking conditions; and 4) the controllability of the system is ensured by its capability of producing modified vowel sounds through the manipulation of appropriate articulatory configurations.","subitem_description_language":"en","subitem_description_type":"Abstract"}]},"item_10_publisher_32":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"IEEE","subitem_publisher_language":"en"}]},"item_10_relation_11":{"attribute_name":"DOI","attribute_value_mlt":[{"subitem_relation_type":"isVersionOf","subitem_relation_type_id":{"subitem_relation_type_id_text":"https://doi.org/10.1109/TASLP.2017.2753583","subitem_relation_type_select":"DOI"}}]},"item_10_rights_12":{"attribute_name":"権利","attribute_value_mlt":[{"subitem_rights":"“(c) 2017 IEEE. Personal use of this material is permitted. Permission from IEEE must be obtained for all other uses, in any current or future media, including reprinting/republishing this material for advertising or promotional purposes, creating new collective works, for resale or redistribution to servers or lists, or reuse of any copyrighted component of this work in other works.” ","subitem_rights_language":"en"}]},"item_10_select_15":{"attribute_name":"著者版フラグ","attribute_value_mlt":[{"subitem_select_item":"author"}]},"item_10_source_id_7":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"2329-9290","subitem_source_identifier_type":"PISSN"}]},"item_1615787544753":{"attribute_name":"出版タイプ","attribute_value_mlt":[{"subitem_version_resource":"http://purl.org/coar/version/c_ab4af688f83e57aa","subitem_version_type":"AM"}]},"item_access_right":{"attribute_name":"アクセス権","attribute_value_mlt":[{"subitem_access_right":"open access","subitem_access_right_uri":"http://purl.org/coar/access_right/c_abf2"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Tobing, Patrick Lumban","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"76249","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"Kobayashi, Kazuhiro","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"76250","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"Toda, Tomoki","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"76251","nameIdentifierScheme":"WEKO"}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2018-04-24"}],"displaytype":"detail","filename":"artspmod.pdf","filesize":[{"value":"767.8 kB"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"artspmod","objectType":"fulltext","url":"https://nagoya.repo.nii.ac.jp/record/25726/files/artspmod.pdf"},"version_id":"9ec9c588-2e39-4855-beec-8ade8dfe3504"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"articulatory control","subitem_subject_scheme":"Other"},{"subitem_subject":"direct waveform modification","subitem_subject_scheme":"Other"},{"subitem_subject":"intercorrelation of articulators","subitem_subject_scheme":"Other"},{"subitem_subject":"Gaussian mixture model","subitem_subject_scheme":"Other"},{"subitem_subject":"speech modification","subitem_subject_scheme":"Other"},{"subitem_subject":"statistical inversion and production mappings","subitem_subject_scheme":"Other"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"eng"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"journal article","resourceuri":"http://purl.org/coar/resource_type/c_6501"}]},"item_title":"Articulatory Controllable Speech Modification Based on Statistical Inversion and Production Mappings","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"Articulatory Controllable Speech Modification Based on Statistical Inversion and Production Mappings","subitem_title_language":"en"}]},"item_type_id":"10","owner":"1","path":["672"],"pubdate":{"attribute_name":"PubDate","attribute_value":"2018-04-24"},"publish_date":"2018-04-24","publish_status":"0","recid":"25726","relation_version_is_last":true,"title":["Articulatory Controllable Speech Modification Based on Statistical Inversion and Production Mappings"],"weko_creator_id":"1","weko_shared_id":-1},"updated":"2023-01-16T03:51:45.550797+00:00"}