{"created":"2023-06-20T13:25:18.330355+00:00","id":2056,"links":{},"metadata":{"_buckets":{"deposit":"3b5f7bb6-60fe-4ac7-8589-2f8e199f0532"},"_deposit":{"created_by":11,"id":"2056","owners":[11],"pid":{"revision_id":0,"type":"depid","value":"2056"},"status":"published"},"_oai":{"id":"oai:kougei.repo.nii.ac.jp:00002056","sets":["12:17:266:270"]},"author_link":["3466","3464","3465","3463"],"item_10002_biblio_info_7":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2019-12-25","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"1","bibliographicPageEnd":"30","bibliographicPageStart":"25","bibliographicVolumeNumber":"42","bibliographic_titles":[{"bibliographic_title":"東京工芸大学工学部紀要"},{"bibliographic_title":"The Academic Reports, the Faculty of Engineering, Tokyo Polytechnic University","bibliographic_titleLang":"en"}]}]},"item_10002_description_5":{"attribute_name":"抄録","attribute_value_mlt":[{"subitem_description":"本論文では，強化学習における転移学習で使用される，転移率というパラメータの効果を検証する．転移率は，転移学習時の過学習状態を回避するために用いられるが，再利用方策の学習進度を疑似的にロールバックできると考えられている．本論文では実際の強化学習・転移学習シミュレーションから，学習進度をロールバックできるか効果を検証したので報告する．","subitem_description_type":"Abstract"},{"subitem_description":"In recent years, the robot systems with learning algorithms are deployed in the real world situation,for example, automatic driving car, warehouse robots and so on. A reinforcement learning (RL) can be contributed for increasing of intelligence of the robot system, and RL do not need the supervised data.\nAdditionally, RL can explore the optimal solution by itself. However, the robot with reinforcement learning(called RL-agent) has probability to encounter with over fitting caused by reusing obtained policy. A transfer rate has been proposed to reduce the utilization of the policy. Moreover, the transfer rate is thought to have the effect of rolling back the learning progress of the policy to be reused. However, this effectiveness is not validated based on actual reinforcement learning and transfer learning. In this paper, the transfer rate is validated with transfer surface which is visual and quantitative evaluation method of transfer, and the transfer rate is verified the contribution for rolling back of learning progress of reusing policy for transfer learning.","subitem_description_type":"Abstract"}]},"item_10002_publisher_8":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"東京工芸大学工学部"}]},"item_10002_source_id_9":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"03876055","subitem_source_identifier_type":"ISSN"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"河野, 仁"},{"creatorName":"コウノ, ヒトシ","creatorNameLang":"ja-Kana"}],"nameIdentifiers":[{"nameIdentifier":"3463","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"佐藤, 弘和"},{"creatorName":"サトウ, ヒロカズ","creatorNameLang":"ja-Kana"}],"nameIdentifiers":[{"nameIdentifier":"3464","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"Kono, Hitoshi","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"3465","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"Sato, Hirokazu","creatorNameLang":"en"}],"nameIdentifiers":[{"nameIdentifier":"3466","nameIdentifierScheme":"WEKO"}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2019-12-25"}],"displaytype":"detail","filename":"vol42-1-04.pdf","filesize":[{"value":"4.4 MB"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"vol42-1-04","url":"https://kougei.repo.nii.ac.jp/record/2056/files/vol42-1-04.pdf"},"version_id":"88036f76-3cef-4038-8d77-3235ebd932fd"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"強化学習","subitem_subject_scheme":"Other"},{"subitem_subject":"転移学習","subitem_subject_scheme":"Other"},{"subitem_subject":"転移率","subitem_subject_scheme":"Other"},{"subitem_subject":"転移曲面","subitem_subject_scheme":"Other"},{"subitem_subject":"Reinforcement learning","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"Transfer learning","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"Transfer rate","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"Transfer surface","subitem_subject_language":"en","subitem_subject_scheme":"Other"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"departmental bulletin paper","resourceuri":"http://purl.org/coar/resource_type/c_6501"}]},"item_title":"強化学習の転移学習における転移率を用いた再利用方策学習進度の可逆性","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"強化学習の転移学習における転移率を用いた再利用方策学習進度の可逆性"},{"subitem_title":"Reversibility Validation of Learning Progression Using Transfer Rate in Transfer Reinforcement Learning","subitem_title_language":"en"}]},"item_type_id":"10002","owner":"11","path":["270"],"pubdate":{"attribute_name":"公開日","attribute_value":"2019-12-25"},"publish_date":"2019-12-25","publish_status":"0","recid":"2056","relation_version_is_last":true,"title":["強化学習の転移学習における転移率を用いた再利用方策学習進度の可逆性"],"weko_creator_id":"11","weko_shared_id":-1},"updated":"2023-06-20T13:38:09.410365+00:00"}