{"created":"2023-05-15T12:35:49.438101+00:00","id":4893,"links":{},"metadata":{"_buckets":{"deposit":"8f70b93a-ac12-47ef-87d4-03bff77ce289"},"_deposit":{"created_by":3,"id":"4893","owners":[3],"pid":{"revision_id":0,"type":"depid","value":"4893"},"status":"published"},"_oai":{"id":"oai:nitech.repo.nii.ac.jp:00004893","sets":["31"]},"author_link":["3028","464","16006"],"item_10001_biblio_info_28":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2000-11-20","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"11","bibliographicPageEnd":"1977","bibliographicPageStart":"1969","bibliographicVolumeNumber":"E83-D","bibliographic_titles":[{"bibliographic_title":"IEICE transactions on information and systems"}]}]},"item_10001_description_36":{"attribute_name":"内容記述","attribute_value_mlt":[{"subitem_description":"This paper describes a method to normalize the lip position for improving the performance of a visual-information-based speech recognition system. Basically, there are two types of information useful in speech recognition processes; the first one is the speech signal itself and the second one is the visual information from the lips in motion. This paper tries to solve some problems caused by using images from the lips in motion such as the effect produced by the variation of the lip location. The proposed lip location normalization method is based on a search algorithm of the lip position in which the location normalization is integrated into the model training. Experiments of speaker-independent isolated word recognition were carried out on the Tulips1 and M2VTS databases. Experiments showed a recognition rate of 74.5% and an error reduction rate of 35.7% for the ten digits word recognition M2VTS database.","subitem_description_type":"Other"}]},"item_10001_description_38":{"attribute_name":"フォーマット","attribute_value_mlt":[{"subitem_description":"application/pdf","subitem_description_type":"Other"}]},"item_10001_full_name_27":{"attribute_name":"著者別名","attribute_value_mlt":[{"affiliations":[{"affiliationNames":[{"affiliationName":"","lang":"ja"}],"nameIdentifiers":[{"nameIdentifier":"","nameIdentifierScheme":"ISNI","nameIdentifierURI":"http://www.isni.org/isni/"}]}],"familyNames":[{},{},{}],"givenNames":[{},{},{}],"nameIdentifiers":[{},{}],"names":[{"name":"Tokuda, Keiichi","nameLang":"en"},{"name":"徳田, 恵一","nameLang":"ja"},{"name":"トクダ, ケイイチ","nameLang":"ja-Kana"}]},{"nameIdentifiers":[{}],"names":[{"name":"北村, 正"}]}]},"item_10001_publisher_29":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"Institute of Electronics, Information and Communication Engineers"}]},"item_10001_source_id_30":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"09168532","subitem_source_identifier_type":"ISSN"}]},"item_10001_source_id_32":{"attribute_name":"書誌レコードID(NCID)","attribute_value_mlt":[{"subitem_source_identifier":"AA10826272","subitem_source_identifier_type":"NCID"}]},"item_10001_version_type_33":{"attribute_name":"著者版フラグ","attribute_value_mlt":[{"subitem_version_resource":"http://purl.org/coar/version/c_970fb48d4fbd8a85","subitem_version_type":"VoR"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"Vanegas, Oscar","creatorNameLang":"en"}],"nameIdentifiers":[{}]},{"creatorAffiliations":[{"affiliationNameIdentifiers":[{"affiliationNameIdentifier":"","affiliationNameIdentifierScheme":"ISNI","affiliationNameIdentifierURI":"http://www.isni.org/isni/"}],"affiliationNames":[{"affiliationName":"","affiliationNameLang":"ja"}]}],"creatorNames":[{"creatorName":"Tokuda, Keiichi","creatorNameLang":"en"},{"creatorName":"徳田, 恵一","creatorNameLang":"ja"},{"creatorName":"トクダ, ケイイチ","creatorNameLang":"ja-Kana"}],"familyNames":[{},{},{}],"givenNames":[{},{},{}],"nameIdentifiers":[{},{}]},{"creatorNames":[{"creatorName":"Kitamura, Tadashi","creatorNameLang":"en"}],"nameIdentifiers":[{}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2017-01-25"}],"displaytype":"detail","filename":"E83-D_1969.pdf","filesize":[{"value":"2.5 MB"}],"format":"application/pdf","license_note":"Copyright (c) 2000 IEICE http://search.ieice.org/index.html","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"本文_fulltext","url":"https://nitech.repo.nii.ac.jp/record/4893/files/E83-D_1969.pdf"},"version_id":"033189ee-d5cd-4b26-af72-537ef8c0101f"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"eng"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"journal article","resourceuri":"http://purl.org/coar/resource_type/c_6501"}]},"item_title":"Lip Location Normalized Training for Visual Speech Recognition","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"Lip Location Normalized Training for Visual Speech Recognition","subitem_title_language":"en"}]},"item_type_id":"10001","owner":"3","path":["31"],"pubdate":{"attribute_name":"公開日","attribute_value":"2012-11-07"},"publish_date":"2012-11-07","publish_status":"0","recid":"4893","relation_version_is_last":true,"title":["Lip Location Normalized Training for Visual Speech Recognition"],"weko_creator_id":"3","weko_shared_id":3},"updated":"2023-07-10T03:01:01.635325+00:00"}