WEKO3
アイテム
{"_buckets": {"deposit": "fc81f0aa-dfb1-4b12-bc9f-caa401df9692"}, "_deposit": {"created_by": 3, "id": "3411", "owners": [3], "pid": {"revision_id": 0, "type": "depid", "value": "3411"}, "status": "published"}, "_oai": {"id": "oai:nitech.repo.nii.ac.jp:00003411", "sets": ["31"]}, "author_link": ["471", "8555", "464", "8950", "462"], "item_5_biblio_info_5": {"attribute_name": "書誌情報", "attribute_value_mlt": [{"bibliographicIssueDates": {"bibliographicIssueDate": "2010", "bibliographicIssueDateType": "Issued"}, "bibliographic_titles": [{"bibliographic_title": "ICSP2010 Proceedings"}]}]}, "item_5_description_16": {"attribute_name": "フォーマット", "attribute_value_mlt": [{"subitem_description": "application/pdf", "subitem_description_type": "Other"}]}, "item_5_description_4": {"attribute_name": "内容記述", "attribute_value_mlt": [{"subitem_description": "This paper proposes an improved cross-lingual speaker adaptation technique with considering the differences between language-dependent average voices in a Speech-to-Speech Translation system. A state mapping based method had been introduced for cross-lingual speaker adaptation in HMM-based speech synthesis. In this method, the transforms estimated from the input language are applied to average voice models of the output language according to the state mapping information. However, the differences between average voices in the input and output language may degrade the adaptation performance. To reduce the differences, we apply a global linear transform to output average voice models, which minimizes the symmetric Kullback-Leibler divergence between two average voice models. From the experimental results, our approach could not obtain a better result than the original state mapping based method. This is because the global transform affects not only speaker characteristics but also language identity in acoustic features, and this degrades the synthetic speech quality. 
Therefore, it becomes clear that a technique which separate speaker and language identities is required.", "subitem_description_type": "Other"}, {"subitem_description": "Oct.24-28 2010 Beijing CHINA", "subitem_description_type": "Other"}]}, "item_5_full_name_3": {"attribute_name": "著者別名", "attribute_value_mlt": [{"affiliations": [{"affiliationNames": [{"affiliationName": "", "lang": "ja"}], "nameIdentifiers": [{"nameIdentifier": "", "nameIdentifierScheme": "ISNI", "nameIdentifierURI": "http://www.isni.org/isni/"}]}], "familyNames": [{"familyName": "Oura", "familyNameLang": "en"}, {"familyName": "大浦", "familyNameLang": "ja"}, {"familyName": "オオウラ", "familyNameLang": "ja-Kana"}], "givenNames": [{"givenName": "Keiichiro", "givenNameLang": "en"}, {"givenName": "圭一郎", "givenNameLang": "ja"}, {"givenName": "ケイイチロウ", "givenNameLang": "ja-Kana"}], "nameIdentifiers": [{"nameIdentifier": "471", "nameIdentifierScheme": "WEKO"}], "names": [{"name": "Oura, Keiichiro", "nameLang": "en"}, {"name": "大浦, 圭一郎", "nameLang": "ja"}, {"name": "オオウラ, ケイイチロウ", "nameLang": "ja-Kana"}]}, {"affiliations": [{"affiliationNames": [{"affiliationName": "", "lang": "ja"}], "nameIdentifiers": [{"nameIdentifier": "", "nameIdentifierScheme": "ISNI", "nameIdentifierURI": "http://www.isni.org/isni/"}]}], "familyNames": [{"familyName": "Nankaku", "familyNameLang": "en"}, {"familyName": "南角", "familyNameLang": "ja"}, {"familyName": "ナンカク", "familyNameLang": "ja-Kana"}], "givenNames": [{"givenName": "Yoshihiko", "givenNameLang": "en"}, {"givenName": "吉彦", "givenNameLang": "ja"}, {"givenName": "ヨシヒコ", "givenNameLang": "ja-Kana"}], "nameIdentifiers": [{"nameIdentifier": "8555", "nameIdentifierScheme": "WEKO"}, {"nameIdentifier": "1000080397497", "nameIdentifierScheme": "NRID", "nameIdentifierURI": "http://rns.nii.ac.jp/nr/1000080397497"}], "names": [{"name": "Nankaku, Yoshihiko", "nameLang": "en"}, {"name": "南角, 吉彦", "nameLang": "ja"}, {"name": "ナンカク, ヨシヒコ", "nameLang": "ja-Kana"}]}, {"affiliations": 
[{"affiliationNames": [{"affiliationName": "", "lang": "ja"}], "nameIdentifiers": [{"nameIdentifier": "", "nameIdentifierScheme": "ISNI", "nameIdentifierURI": "http://www.isni.org/isni/"}]}], "familyNames": [{"familyName": "Tokuda", "familyNameLang": "en"}, {"familyName": "徳田", "familyNameLang": "ja"}, {"familyName": "トクダ", "familyNameLang": "ja-Kana"}], "givenNames": [{"givenName": "Keiichi", "givenNameLang": "en"}, {"givenName": "恵一", "givenNameLang": "ja"}, {"givenName": "ケイイチ", "givenNameLang": "ja-Kana"}], "nameIdentifiers": [{"nameIdentifier": "464", "nameIdentifierScheme": "WEKO"}, {"nameIdentifier": "1000020217483", "nameIdentifierScheme": "NRID", "nameIdentifierURI": "http://rns.nii.ac.jp/nr/1000020217483"}], "names": [{"name": "Tokuda, Keiichi", "nameLang": "en"}, {"name": "徳田, 恵一", "nameLang": "ja"}, {"name": "トクダ, ケイイチ", "nameLang": "ja-Kana"}]}]}, "item_5_publisher_6": {"attribute_name": "出版者", "attribute_value_mlt": [{"subitem_publisher": "Institute of Electrical and Electronics Engineers"}]}, "item_5_version_type_13": {"attribute_name": "著者版フラグ", "attribute_value_mlt": [{"subitem_version_resource": "http://purl.org/coar/version/c_970fb48d4fbd8a85", "subitem_version_type": "VoR"}]}, "item_creator": {"attribute_name": "著者", "attribute_type": "creator", "attribute_value_mlt": [{"creatorNames": [{"creatorName": "Peng, Xianglin", "creatorNameLang": "en"}], "nameIdentifiers": [{"nameIdentifier": "8950", "nameIdentifierScheme": "WEKO"}]}, {"creatorAffiliations": [{"affiliationNameIdentifiers": [{"affiliationNameIdentifier": "", "affiliationNameIdentifierScheme": "ISNI", "affiliationNameIdentifierURI": "http://www.isni.org/isni/"}], "affiliationNames": [{"affiliationName": "", "affiliationNameLang": "ja"}]}], "creatorNames": [{"creatorName": "Oura, Keiichiro", "creatorNameLang": "en"}, {"creatorName": "大浦, 圭一郎", "creatorNameLang": "ja"}, {"creatorName": "オオウラ, ケイイチロウ", "creatorNameLang": "ja-Kana"}], "familyNames": [{"familyName": "Oura", "familyNameLang": 
"en"}, {"familyName": "大浦", "familyNameLang": "ja"}, {"familyName": "オオウラ", "familyNameLang": "ja-Kana"}], "givenNames": [{"givenName": "Keiichiro", "givenNameLang": "en"}, {"givenName": "圭一郎", "givenNameLang": "ja"}, {"givenName": "ケイイチロウ", "givenNameLang": "ja-Kana"}], "nameIdentifiers": [{"nameIdentifier": "471", "nameIdentifierScheme": "WEKO"}]}, {"creatorAffiliations": [{"affiliationNameIdentifiers": [{"affiliationNameIdentifier": "", "affiliationNameIdentifierScheme": "ISNI", "affiliationNameIdentifierURI": "http://www.isni.org/isni/"}], "affiliationNames": [{"affiliationName": "", "affiliationNameLang": "ja"}]}], "creatorNames": [{"creatorName": "Nankaku, Yoshihiko", "creatorNameLang": "en"}, {"creatorName": "南角, 吉彦", "creatorNameLang": "ja"}, {"creatorName": "ナンカク, ヨシヒコ", "creatorNameLang": "ja-Kana"}], "familyNames": [{"familyName": "Nankaku", "familyNameLang": "en"}, {"familyName": "南角", "familyNameLang": "ja"}, {"familyName": "ナンカク", "familyNameLang": "ja-Kana"}], "givenNames": [{"givenName": "Yoshihiko", "givenNameLang": "en"}, {"givenName": "吉彦", "givenNameLang": "ja"}, {"givenName": "ヨシヒコ", "givenNameLang": "ja-Kana"}], "nameIdentifiers": [{"nameIdentifier": "8555", "nameIdentifierScheme": "WEKO"}, {"nameIdentifier": "1000080397497", "nameIdentifierScheme": "NRID", "nameIdentifierURI": "http://rns.nii.ac.jp/nr/1000080397497"}]}, {"creatorNames": [{"creatorName": "Tokuda, Keiichi", "creatorNameLang": "en"}], "nameIdentifiers": [{"nameIdentifier": "462", "nameIdentifierScheme": "WEKO"}]}]}, "item_files": {"attribute_name": "ファイル情報", "attribute_type": "file", "attribute_value_mlt": [{"accessrole": "open_date", "date": [{"dateType": "Available", "dateValue": "2017-01-17"}], "displaytype": "detail", "download_preview_message": "", "file_order": 0, "filename": "icsp2010_peng.pdf", "filesize": [{"value": "113.0 kB"}], "format": "application/pdf", "future_date_message": "", "is_thumbnail": false, "licensefree": "c2010 IEEE. 
Personal use of this material is permitted. However, permission to reprint/republish this material for advertising or promotional purposes or for creating new collective works for resale or redistribution to servers or lists, or to reuse any copyrighted component of this work in other works must be obtained from the IEEE.", "licensetype": "license_free", "mimetype": "application/pdf", "size": 113000.0, "url": {"label": "本文_fulltext", "url": "https://nitech.repo.nii.ac.jp/record/3411/files/icsp2010_peng.pdf"}, "version_id": "ed9d1e69-059b-4e5f-b15c-d3a094752468"}]}, "item_language": {"attribute_name": "言語", "attribute_value_mlt": [{"subitem_language": "eng"}]}, "item_resource_type": {"attribute_name": "資源タイプ", "attribute_value_mlt": [{"resourcetype": "conference paper", "resourceuri": "http://purl.org/coar/resource_type/c_5794"}]}, "item_title": "Cross-lingual speaker adaptation for HMM-based speech synthesis considering differences between language-dependent average voices", "item_titles": {"attribute_name": "タイトル", "attribute_value_mlt": [{"subitem_title": "Cross-lingual speaker adaptation for HMM-based speech synthesis considering differences between language-dependent average voices", "subitem_title_language": "en"}]}, "item_type_id": "5", "owner": "3", "path": ["31"], "permalink_uri": "https://nitech.repo.nii.ac.jp/records/3411", "pubdate": {"attribute_name": "公開日", "attribute_value": "2012-11-07"}, "publish_date": "2012-11-07", "publish_status": "0", "recid": "3411", "relation": {}, "relation_version_is_last": true, "title": ["Cross-lingual speaker adaptation for HMM-based speech synthesis considering differences between language-dependent average voices"], "weko_shared_id": 3}
Cross-lingual speaker adaptation for HMM-based speech synthesis considering differences between language-dependent average voices
https://nitech.repo.nii.ac.jp/records/3411
https://nitech.repo.nii.ac.jp/records/3411b4e162ee-f596-4892-bc91-22845f063a7f
名前 / ファイル | ライセンス | アクション |
---|---|---|
本文_fulltext (113.0 kB)
|
© 2010 IEEE. Personal use of this material is permitted. However, permission to reprint/republish this material for advertising or promotional purposes or for creating new collective works for resale or redistribution to servers or lists, or to reuse any copyrighted component of this work in other works must be obtained from the IEEE.
|
Item type | 会議発表論文 / Conference Paper(1) | |||||
---|---|---|---|---|---|---|
公開日 | 2012-11-07 | |||||
タイトル | ||||||
言語 | en | |||||
タイトル | Cross-lingual speaker adaptation for HMM-based speech synthesis considering differences between language-dependent average voices | |||||
言語 | ||||||
言語 | eng | |||||
資源タイプ | ||||||
資源タイプ識別子 | http://purl.org/coar/resource_type/c_5794 | |||||
資源タイプ | conference paper | |||||
著者 |
Peng, Xianglin
× Peng, Xianglin× 大浦, 圭一郎× 南角, 吉彦× Tokuda, Keiichi |
|||||
著者別名 | ||||||
言語 | en | |||||
言語 | ja | |||||
言語 | ja-Kana | |||||
姓名 | Oura, Keiichiro | |||||
言語 | en | |||||
姓名 | 大浦, 圭一郎 | |||||
言語 | ja | |||||
姓名 | オオウラ, ケイイチロウ | |||||
言語 | ja-Kana | |||||
著者別名 | ||||||
言語 | en | |||||
言語 | ja | |||||
言語 | ja-Kana | |||||
姓名 | Nankaku, Yoshihiko | |||||
言語 | en | |||||
姓名 | 南角, 吉彦 | |||||
言語 | ja | |||||
姓名 | ナンカク, ヨシヒコ | |||||
言語 | ja-Kana | |||||
著者別名 | ||||||
言語 | en | |||||
言語 | ja | |||||
言語 | ja-Kana | |||||
姓名 | Tokuda, Keiichi | |||||
言語 | en | |||||
姓名 | 徳田, 恵一 | |||||
言語 | ja | |||||
姓名 | トクダ, ケイイチ | |||||
言語 | ja-Kana | |||||
書誌情報 |
ICSP2010 Proceedings 発行日 2010 |
|||||
出版者 | ||||||
出版者 | Institute of Electrical and Electronics Engineers | |||||
著者版フラグ | ||||||
出版タイプ | VoR | |||||
出版タイプResource | http://purl.org/coar/version/c_970fb48d4fbd8a85 | |||||
内容記述 | ||||||
内容記述タイプ | Other | |||||
内容記述 | This paper proposes an improved cross-lingual speaker adaptation technique with considering the differences between language-dependent average voices in a Speech-to-Speech Translation system. A state mapping based method had been introduced for cross-lingual speaker adaptation in HMM-based speech synthesis. In this method, the transforms estimated from the input language are applied to average voice models of the output language according to the state mapping information. However, the differences between average voices in the input and output language may degrade the adaptation performance. To reduce the differences, we apply a global linear transform to output average voice models, which minimizes the symmetric Kullback-Leibler divergence between two average voice models. From the experimental results, our approach could not obtain a better result than the original state mapping based method. This is because the global transform affects not only speaker characteristics but also language identity in acoustic features, and this degrades the synthetic speech quality. Therefore, it becomes clear that a technique which separate speaker and language identities is required. | |||||
内容記述 | ||||||
内容記述タイプ | Other | |||||
内容記述 | Oct.24-28 2010 Beijing CHINA | |||||
フォーマット | ||||||
内容記述タイプ | Other | |||||
内容記述 | application/pdf |