{"created":"2021-03-01T06:29:22.621650+00:00","id":21684,"links":{},"metadata":{"_buckets":{"deposit":"bd8c7de9-560c-452e-b3da-57d71a8c2602"},"_deposit":{"id":"21684","owners":[],"pid":{"revision_id":0,"type":"depid","value":"21684"},"status":"published"},"_oai":{"id":"oai:nagoya.repo.nii.ac.jp:00021684","sets":["312:313:314"]},"author_link":["64139","64140","64141","64142","64143","64144","64145","64146","64147","64148","64149","64150"],"item_10_alternative_title_19":{"attribute_name":"その他のタイトル","attribute_value_mlt":[{"subitem_alternative_title":"Extraction of Speech Shots Focusing on Visual and Audio Features within and between Shots","subitem_alternative_title_language":"en"}]},"item_10_biblio_info_6":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2012-03","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"479","bibliographicPageEnd":"86","bibliographicPageStart":"81","bibliographicVolumeNumber":"111","bibliographic_titles":[{"bibliographic_title":"電子情報通信学会技術研究報告. MVE, マルチメディア・仮想環境基礎","bibliographic_titleLang":"ja"}]}]},"item_10_description_4":{"attribute_name":"抄録","attribute_value_mlt":[{"subitem_description":"本報告では,ショット内及びショット間の特徴に基づく被写体と話者の異同判定によるニュース映像からのスピーチショット抽出手法を提案する.スピーチショットはマルチメディア情報を豊富に含み,資料的価値が高い.そこで我々はこれまで,被写体の口唇動作と話者の声から得られる複数の音声特徴と画像特徴の相関に基づく被写体と話者の異同判定手法を提案してきた.この手法は,音声ノイズの少ないショットに対しては高精度な異同判定が可能であるが,多量の音声ノイズを含むショットに対しての異同判定は困難であった.そこで本報告では,2段階の処理による被写体と話者の異同判定手法を提案する.まず第1段階で,これまでに提案した手法により異同判定を行う.その後,第2段階で,ショット内及びその前後のショットとの間に表れる特徴的な画像・音声の性質に基づいて異同判定を行う.スピーチショット抽出実験の結果,提案手法の有効性を確認した.","subitem_description_language":"ja","subitem_description_type":"Abstract"},{"subitem_description":"We propose a method to extract speech shots from news videos using detecting the inconsisteny between a subject and the speaker focusing on features within and between shots. Speech shots in news videos contain a wealth of multimedia information, and are valuable as archived material. To extract speech shots, we have previously proposed a method to detect the inconsistency between a subject and the speaker based on the co-occurrence between a subject's lip motion and the speaker's voice. This previous method could detect the inconsistency in a shot with little audio noises. However, it is difficult to detect the inconsistency in a shot with significant amount of audio noises. In order to deal with this problem, the proposed method detects the inconsisteny between a subject and the speaker in two steps. The first step detects the inconsistency by our previous method, and the second step detects the inconsistency based on the intra- and inter- shot features. Experimental results showed the effectiveness of the proposed method.","subitem_description_language":"en","subitem_description_type":"Abstract"}]},"item_10_description_5":{"attribute_name":"内容記述","attribute_value_mlt":[{"subitem_description":"IEICE Technical Report;IE2011-147,IEICE Technical Report;MVE2011-109","subitem_description_language":"en","subitem_description_type":"Other"}]},"item_10_identifier_60":{"attribute_name":"URI","attribute_value_mlt":[{"subitem_identifier_type":"URI","subitem_identifier_uri":"http://ci.nii.ac.jp/naid/110009546402/"},{"subitem_identifier_type":"HDL","subitem_identifier_uri":"http://hdl.handle.net/2237/23832"}]},"item_10_publisher_32":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"一般社団法人電子情報通信学会","subitem_publisher_language":"ja"}]},"item_10_relation_40":{"attribute_name":"シリーズ","attribute_value_mlt":[{"subitem_relation_name":[{"subitem_relation_name_text":"IEICE Technical Report;IE2011-147"}]},{"subitem_relation_name":[{"subitem_relation_name_text":"IEICE Technical Report;MVE2011-109"}]}]},"item_10_relation_43":{"attribute_name":"関連情報","attribute_value_mlt":[{"subitem_relation_type":"isVersionOf","subitem_relation_type_id":{"subitem_relation_type_id_text":"http://ci.nii.ac.jp/naid/110009546402/","subitem_relation_type_select":"URI"}}]},"item_10_rights_12":{"attribute_name":"権利","attribute_value_mlt":[{"subitem_rights":"(c)一般社団法人電子情報通信学会 本文データは学協会の許諾に基づきCiNiiから複製したものである","subitem_rights_language":"ja"}]},"item_10_select_15":{"attribute_name":"著者版フラグ","attribute_value_mlt":[{"subitem_select_item":"publisher"}]},"item_10_source_id_7":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"0913-5685","subitem_source_identifier_type":"PISSN"}]},"item_1615787544753":{"attribute_name":"出版タイプ","attribute_value_mlt":[{"subitem_version_resource":"http://purl.org/coar/version/c_970fb48d4fbd8a85","subitem_version_type":"VoR"}]},"item_access_right":{"attribute_name":"アクセス権","attribute_value_mlt":[{"subitem_access_right":"open access","subitem_access_right_uri":"http://purl.org/coar/access_right/c_abf2"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"熊谷, 章吾","creatorNameLang":"ja"}],"nameIdentifiers":[{"nameIdentifier":"64139","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"道満, 恵介","creatorNameLang":"ja"}],"nameIdentifiers":[{"nameIdentifier":"64140","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"高橋, 友和","creatorNameLang":"ja"}],"nameIdentifiers":[{"nameIdentifier":"64141","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"出口, 大輔","creatorNameLang":"ja"}],"nameIdentifiers":[{"nameIdentifier":"64142","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"井手, 一郎","creatorNameLang":"ja"}],"nameIdentifiers":[{"nameIdentifier":"64143","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"村瀬, 洋","creatorNameLang":"ja"}],"nameIdentifiers":[{"nameIdentifier":"64144","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"KUMAGAI, Shogo","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"64145","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"DOMAN, Keisuke","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"64146","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"TAKAHASHI, Tomokazu","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"64147","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"DEGUCHI, Daisuke","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"64148","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"IDE, Ichiro","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"64149","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"MURASE, Hiroshi","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"64150","nameIdentifierScheme":"WEKO"}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2018-02-21"}],"displaytype":"detail","filename":"110009546402.pdf","filesize":[{"value":"923.2 kB"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"110009546402.pdf","objectType":"fulltext","url":"https://nagoya.repo.nii.ac.jp/record/21684/files/110009546402.pdf"},"version_id":"cb4361c8-7404-43b3-a9cf-caf1944fccc2"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"スピーチショット抽出","subitem_subject_scheme":"Other"},{"subitem_subject":"ニュース映像","subitem_subject_scheme":"Other"},{"subitem_subject":"映像検索","subitem_subject_scheme":"Other"},{"subitem_subject":"画像・音声特徴","subitem_subject_scheme":"Other"},{"subitem_subject":"Speech shot extraction","subitem_subject_scheme":"Other"},{"subitem_subject":"news video","subitem_subject_scheme":"Other"},{"subitem_subject":"video retrieval","subitem_subject_scheme":"Other"},{"subitem_subject":"audio−visual features","subitem_subject_scheme":"Other"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"journal article","resourceuri":"http://purl.org/coar/resource_type/c_6501"}]},"item_title":"ショット内及びショット間の画像・音声特徴に着目したスピーチショット抽出","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"ショット内及びショット間の画像・音声特徴に着目したスピーチショット抽出","subitem_title_language":"ja"}]},"item_type_id":"10","owner":"1","path":["314"],"pubdate":{"attribute_name":"PubDate","attribute_value":"2016-03-15"},"publish_date":"2016-03-15","publish_status":"0","recid":"21684","relation_version_is_last":true,"title":["ショット内及びショット間の画像・音声特徴に着目したスピーチショット抽出"],"weko_creator_id":"1","weko_shared_id":-1},"updated":"2023-01-16T04:10:57.692506+00:00"}