{"created":"2023-05-15T12:35:59.093225+00:00","id":5124,"links":{},"metadata":{"_buckets":{"deposit":"ededa5c2-f811-4eb3-b5a2-54d9e527b38c"},"_deposit":{"created_by":3,"id":"5124","owners":[3],"pid":{"revision_id":0,"type":"depid","value":"5124"},"status":"published"},"_oai":{"id":"oai:nitech.repo.nii.ac.jp:00005124","sets":["31"]},"author_link":["10746","17180","17179","17181","464"],"item_10001_biblio_info_28":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2003-03-01","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"3","bibliographicPageEnd":"542","bibliographicPageStart":"534","bibliographicVolumeNumber":"E86-D","bibliographic_titles":[{"bibliographic_title":"IEICE transactions on information and systems"}]}]},"item_10001_description_36":{"attribute_name":"内容記述","attribute_value_mlt":[{"subitem_description":"This paper describes a new context clustering technique for average voice model, which is a set of speaker independent speech synthesis units. In the technique, we first train speaker dependent models using multi-speaker speech database, and then construct a decision tree common to these speaker dependent models for context clustering. When a node of the decision tree is split, only the context related questions which are applicable to all speaker dependent models are adopted. As a result, every node of the decision tree always has training data of all speakers. After construction of the decision tree, all speaker dependent models are clustered using the common decision tree and a speaker independent model, i.e., an average voice model is obtained by combining speaker dependent models. From the results of subjective tests, we show that the average voice models trained using the proposed technique can generate more natural sounding speech than the conventional average voice models.","subitem_description_type":"Other"}]},"item_10001_description_38":{"attribute_name":"フォーマット","attribute_value_mlt":[{"subitem_description":"application/pdf","subitem_description_type":"Other"}]},"item_10001_full_name_27":{"attribute_name":"著者別名","attribute_value_mlt":[{"affiliations":[{"affiliationNames":[{"affiliationName":"","lang":"ja"}],"nameIdentifiers":[{"nameIdentifier":"","nameIdentifierScheme":"ISNI","nameIdentifierURI":"http://www.isni.org/isni/"}]}],"familyNames":[{},{},{}],"givenNames":[{},{},{}],"nameIdentifiers":[{},{}],"names":[{"name":"Tokuda, Keiichi","nameLang":"en"},{"name":"徳田, 恵一","nameLang":"ja"},{"name":"トクダ, ケイイチ","nameLang":"ja-Kana"}]}]},"item_10001_publisher_29":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"Institute of Electronics, Information and Communication Engineers"}]},"item_10001_source_id_30":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"09168532","subitem_source_identifier_type":"ISSN"}]},"item_10001_source_id_32":{"attribute_name":"書誌レコードID(NCID)","attribute_value_mlt":[{"subitem_source_identifier":"AA10826272","subitem_source_identifier_type":"NCID"}]},"item_10001_version_type_33":{"attribute_name":"著者版フラグ","attribute_value_mlt":[{"subitem_version_resource":"http://purl.org/coar/version/c_970fb48d4fbd8a85","subitem_version_type":"VoR"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Yamagishi, Junichi","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Tamura, Masatsune","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"Masuko, Takashi","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorAffiliations":[{"affiliationNameIdentifiers":[{"affiliationNameIdentifier":"","affiliationNameIdentifierScheme":"ISNI","affiliationNameIdentifierURI":"http://www.isni.org/isni/"}],"affiliationNames":[{"affiliationName":"","affiliationNameLang":"ja"}]}],"creatorNames":[{"creatorName":"Tokuda, Keiichi","creatorNameLang":"en"},{"creatorName":"徳田, 恵一","creatorNameLang":"ja"},{"creatorName":"トクダ, ケイイチ","creatorNameLang":"ja-Kana"}],"familyNames":[{},{},{}],"givenNames":[{},{},{}],"nameIdentifiers":[{},{}]},{"creatorNames":[{"creatorName":"Kobayashi, Takao","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2017-01-25"}],"displaytype":"detail","filename":"E86-D_534.pdf","filesize":[{"value":"773.0 kB"}],"format":"application/pdf","license_note":"Copyright (c) 2003 IEICE http://search.ieice.org/index.html","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"本文_fulltext","url":"https://nitech.repo.nii.ac.jp/record/5124/files/E86-D_534.pdf"},"version_id":"6d9cdd2c-68fc-4507-8df7-aee6a5d6065b"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"eng"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"journal article","resourceuri":"http://purl.org/coar/resource_type/c_6501"}]},"item_title":"A Context Clustering Technique for Average Voice Models","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"A Context Clustering Technique for Average Voice Models","subitem_title_language":"en"}]},"item_type_id":"10001","owner":"3","path":["31"],"pubdate":{"attribute_name":"公開日","attribute_value":"2012-05-24"},"publish_date":"2012-05-24","publish_status":"0","recid":"5124","relation_version_is_last":true,"title":["A Context Clustering Technique for Average Voice Models"],"weko_creator_id":"3","weko_shared_id":3},"updated":"2023-07-10T03:01:04.023800+00:00"}