{"created":"2023-05-15T12:35:58.884847+00:00","id":5119,"links":{},"metadata":{"_buckets":{"deposit":"5140e14b-9294-4289-ad7f-cc44271b66bd"},"_deposit":{"created_by":3,"id":"5119","owners":[3],"pid":{"revision_id":0,"type":"depid","value":"5119"},"status":"published"},"_oai":{"id":"oai:nitech.repo.nii.ac.jp:00005119","sets":["31"]},"author_link":["3028","464","10746","8555"],"item_10001_alternative_title_24":{"attribute_name":"その他(別言語等)のタイトル","attribute_value_mlt":[{"subitem_alternative_title":"カクレ マルコフ モデル オモチイタ シカク オンセイ ニンシキ ノタメノ セイキカ ガクシュウ"},{"subitem_alternative_title":"Normalized Training for HMM-Based Visual Speech Recognition"}]},"item_10001_biblio_info_28":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2003-02-01","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"2","bibliographicPageEnd":"172","bibliographicPageStart":"163","bibliographicVolumeNumber":"J86-D2","bibliographic_titles":[{"bibliographic_title":"電子情報通信学会論文誌. D-2, 情報・システム. 2, パターン処理"}]}]},"item_10001_description_36":{"attribute_name":"内容記述","attribute_value_mlt":[{"subitem_description":"本論文では,視覚音声認識のための連続密度HMM(Hidden Markov Model)のパラメータ推定法について述べる.これまでの視覚音声認識の研究は,大きく画像ベース法とモデルベース法の二つに分類することができる.画像ベース法は,原画像の画素値にサブサンプリングや主成分分析などの何らかの前処理を施したものを特徴ベクトルとして用いる手法である.しかし,唇の位置や大きさ,照明条件などが認識率に直接的な影響を及ぼすため,これらの正規化が重要な要素技術となる.従来の正規化手法は,HMMとは独立に何らかの基準を設け,学習の前に正規化を行うのが一般的であった.本論文では,ML(Maximum Likelihood)基準による正規化を考え,唇の位置,大きさ,傾き,平均輝度,コントラストなどの正規化プロセスがモデルの学習と統合された正規化学習法を提案する.提案法は,EM(Expectation Maximization)アルゴリズムに基づいて定式化されており,正規化学習の繰返しにより学習データに関するゆう度が単調に増加することが保証されている.また,M2VTSデータベースを用いた単語認識実験により提案法の有効性を示す.","subitem_description_type":"Other"}]},"item_10001_description_38":{"attribute_name":"フォーマット","attribute_value_mlt":[{"subitem_description":"application/pdf","subitem_description_type":"Other"}]},"item_10001_full_name_27":{"attribute_name":"著者別名","attribute_value_mlt":[{"affiliations":[{"affiliationNames":[{"affiliationName":"","lang":"ja"}],"nameIdentifiers":[{"nameIdentifier":"","nameIdentifierScheme":"ISNI","nameIdentifierURI":"http://www.isni.org/isni/"}]}],"familyNames":[{},{},{}],"givenNames":[{},{},{}],"nameIdentifiers":[{},{}],"names":[{"name":"Nankaku, Yoshihiko","nameLang":"en"},{"name":"南角, 吉彦","nameLang":"ja"},{"name":"ナンカク, ヨシヒコ","nameLang":"ja-Kana"}]},{"affiliations":[{"affiliationNames":[{"affiliationName":"","lang":"ja"}],"nameIdentifiers":[{"nameIdentifier":"","nameIdentifierScheme":"ISNI","nameIdentifierURI":"http://www.isni.org/isni/"}]}],"familyNames":[{},{},{}],"givenNames":[{},{},{}],"nameIdentifiers":[{},{}],"names":[{"name":"Tokuda, Keiichi","nameLang":"en"},{"name":"徳田, 恵一","nameLang":"ja"},{"name":"トクダ, ケイイチ","nameLang":"ja-Kana"}]},{"nameIdentifiers":[{}],"names":[{"name":"Kitamura, Tadashi"}]}]},"item_10001_publisher_29":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"Institute of Electronics, Information and Communication Engineers"}]},"item_10001_source_id_30":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"09151923","subitem_source_identifier_type":"ISSN"}]},"item_10001_source_id_32":{"attribute_name":"書誌レコードID(NCID)","attribute_value_mlt":[{"subitem_source_identifier":"AA11340957","subitem_source_identifier_type":"NCID"}]},"item_10001_version_type_33":{"attribute_name":"著者版フラグ","attribute_value_mlt":[{"subitem_version_resource":"http://purl.org/coar/version/c_970fb48d4fbd8a85","subitem_version_type":"VoR"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorAffiliations":[{"affiliationNameIdentifiers":[{"affiliationNameIdentifier":"","affiliationNameIdentifierScheme":"ISNI","affiliationNameIdentifierURI":"http://www.isni.org/isni/"}],"affiliationNames":[{"affiliationName":"","affiliationNameLang":"ja"}]}],"creatorNames":[{"creatorName":"Nankaku, Yoshihiko","creatorNameLang":"en"},{"creatorName":"南角, 吉彦","creatorNameLang":"ja"},{"creatorName":"ナンカク, ヨシヒコ","creatorNameLang":"ja-Kana"}],"familyNames":[{},{},{}],"givenNames":[{},{},{}],"nameIdentifiers":[{},{}]},{"creatorAffiliations":[{"affiliationNameIdentifiers":[{"affiliationNameIdentifier":"","affiliationNameIdentifierScheme":"ISNI","affiliationNameIdentifierURI":"http://www.isni.org/isni/"}],"affiliationNames":[{"affiliationName":"","affiliationNameLang":"ja"}]}],"creatorNames":[{"creatorName":"Tokuda, Keiichi","creatorNameLang":"en"},{"creatorName":"徳田, 恵一","creatorNameLang":"ja"},{"creatorName":"トクダ, ケイイチ","creatorNameLang":"ja-Kana"}],"familyNames":[{},{},{}],"givenNames":[{},{},{}],"nameIdentifiers":[{},{}]},{"creatorNames":[{"creatorName":"北村, 正"},{"creatorName":"キタムラ, タダシ","creatorNameLang":"ja-Kana"}],"nameIdentifiers":[{}]},{"creatorNames":[{"creatorName":"小林, 隆夫"}],"nameIdentifiers":[{}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2017-01-25"}],"displaytype":"detail","filename":"J86-D2_163.pdf","filesize":[{"value":"1.5 MB"}],"format":"application/pdf","license_note":"Copyright(c)2003 IEICE http://search.ieice.org/index.html","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"本文_fulltext","url":"https://nitech.repo.nii.ac.jp/record/5119/files/J86-D2_163.pdf"},"version_id":"1b143de9-0849-43a0-94b1-74fe8634952f"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"journal article","resourceuri":"http://purl.org/coar/resource_type/c_6501"}]},"item_title":"隠れマルコフモデルを用いた視覚音声認識のための正規化学習","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"隠れマルコフモデルを用いた視覚音声認識のための正規化学習"}]},"item_type_id":"10001","owner":"3","path":["31"],"pubdate":{"attribute_name":"公開日","attribute_value":"2012-11-07"},"publish_date":"2012-11-07","publish_status":"0","recid":"5119","relation_version_is_last":true,"title":["隠れマルコフモデルを用いた視覚音声認識のための正規化学習"],"weko_creator_id":"3","weko_shared_id":3},"updated":"2023-07-10T05:30:55.400641+00:00"}