{"created":"2023-05-15T13:45:18.010402+00:00","id":886,"links":{},"metadata":{"_buckets":{"deposit":"942f2d25-001a-4370-af2b-e709766f40e4"},"_deposit":{"created_by":31,"id":"886","owners":[31],"pid":{"revision_id":0,"type":"depid","value":"886"},"status":"published"},"_oai":{"id":"oai:nichibun.repo.nii.ac.jp:00000886","sets":["192:234"]},"author_link":["18736","18735"],"item_5_alternative_title_20":{"attribute_name":"その他の言語のタイトル","attribute_value_mlt":[{"subitem_alternative_title":"A Computer Utilization on Humanities III : Improvement of OCR Recognition of Documents Printed in Old-fashioned Japanese Fonts","subitem_alternative_title_language":"en"}]},"item_5_biblio_info_7":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"1993-09-30","bibliographicIssueDateType":"Issued"},"bibliographicPageEnd":"173(10)","bibliographicPageStart":"182(1)","bibliographicVolumeNumber":"9","bibliographic_titles":[{"bibliographic_title":"日本研究","bibliographic_titleLang":"ja"}]}]},"item_5_description_4":{"attribute_name":"抄録","attribute_value_mlt":[{"subitem_description":" 旧字体で印刷された文書などをOCR(光学文字認識装置)で読み取った場合の誤認識を、人手の後編集の前に自動的に訂正するプログラムを開発した。\n 日本語の漢字かな交じり文の印刷文書を、現在のOCRは99%以上の精度で読み取るとされている。悪条件下でも、現代フォントの活字ならば95%は正確に読み取るが、旧字体の活字では正読率は80%に満たない。本プログラムはこの状況を改善することを目標としている。\n 本プログラムは、OCRの入力と、その人手による編集結果を比較して、どういう読み誤りをするかの知識を抽出集積して、それを自動的な訂正コマンドに作り上げるものである。実験によると、正読率80%弱のテキストに本プログラムが抽出した自動訂正コマンドをかけると、約10ポイントの向上があり、実質正読率90%に達することがわかった。","subitem_description_type":"Abstract"}]},"item_5_full_name_3":{"attribute_name":"著者別名","attribute_value_mlt":[{"nameIdentifiers":[{"nameIdentifier":"18736","nameIdentifierScheme":"WEKO"}],"names":[{"name":"ONO, Yoshihiko","nameLang":"en"}]}]},"item_5_identifier_registration":{"attribute_name":"ID登録","attribute_value_mlt":[{"subitem_identifier_reg_text":"10.15055/00000880","subitem_identifier_reg_type":"JaLC"}]},"item_5_publisher_33":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"国際日本文化研究センター","subitem_publisher_language":"ja"}]},"item_5_source_id_10":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10088118","subitem_source_identifier_type":"NCID"}]},"item_5_source_id_8":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"24343110","subitem_source_identifier_type":"EISSN"},{"subitem_source_identifier":"09150900","subitem_source_identifier_type":"PISSN"}]},"item_5_version_type_16":{"attribute_name":"著者版フラグ","attribute_value_mlt":[{"subitem_version_resource":"http://purl.org/coar/version/c_970fb48d4fbd8a85","subitem_version_type":"VoR"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"小野, 芳彦","creatorNameLang":"ja"}],"nameIdentifiers":[{"nameIdentifier":"18735","nameIdentifierScheme":"WEKO"}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2015-11-11"}],"displaytype":"detail","filename":"nk09008.pdf","filesize":[{"value":"8.0 MB"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"nk09008.pdf","objectType":"fulltext","url":"https://nichibun.repo.nii.ac.jp/record/886/files/nk09008.pdf"},"version_id":"26b0c6ff-418c-45a4-b6b3-a51f805be014"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"OCR","subitem_subject_language":"ja","subitem_subject_scheme":"Other"},{"subitem_subject":"旧字体","subitem_subject_language":"ja","subitem_subject_scheme":"Other"},{"subitem_subject":"SED","subitem_subject_language":"ja","subitem_subject_scheme":"Other"},{"subitem_subject":"文字列処理言語","subitem_subject_language":"ja","subitem_subject_scheme":"Other"},{"subitem_subject":"正読率","subitem_subject_language":"ja","subitem_subject_scheme":"Other"},{"subitem_subject":"後編集による改善","subitem_subject_language":"ja","subitem_subject_scheme":"Other"},{"subitem_subject":"自動差分検出","subitem_subject_language":"ja","subitem_subject_scheme":"Other"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"departmental bulletin paper","resourceuri":"http://purl.org/coar/resource_type/c_6501"}]},"item_title":"文化系の計算機利用III : 旧字体活字の文書の自動読み取りの改良","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"文化系の計算機利用III : 旧字体活字の文書の自動読み取りの改良","subitem_title_language":"ja"}]},"item_type_id":"5","owner":"31","path":["234"],"pubdate":{"attribute_name":"PubDate","attribute_value":"2012-04-01"},"publish_date":"2012-04-01","publish_status":"0","recid":"886","relation_version_is_last":true,"title":["文化系の計算機利用III : 旧字体活字の文書の自動読み取りの改良"],"weko_creator_id":"31","weko_shared_id":-1},"updated":"2024-04-24T06:13:46.580185+00:00"}