{"created":"2023-05-15T12:30:51.048226+00:00","id":424,"links":{},"metadata":{"_buckets":{"deposit":"214fd401-8587-4e75-88ad-ddc401dc995e"},"_deposit":{"created_by":2,"id":"424","owners":[2],"pid":{"revision_id":0,"type":"depid","value":"424"},"status":"published"},"_oai":{"id":"oai:fit.repo.nii.ac.jp:00000424","sets":["256:257:279"]},"author_link":["1952","1950","1957","1951","1958","1954","1953","1956","1955"],"item_3_alternative_title_23":{"attribute_name":"タイトル(ヨミ)","attribute_value_mlt":[{"subitem_alternative_title":"ナッシュQ ガクシュウ ニ オケル キョウチョウ コウドウ ノ セイセイ"}]},"item_3_biblio_info_6":{"attribute_name":"書誌情報","attribute_value_mlt":[{"bibliographicIssueDates":{"bibliographicIssueDate":"2007-09-30","bibliographicIssueDateType":"Issued"},"bibliographicIssueNumber":"1","bibliographicPageEnd":"20","bibliographicPageStart":"15","bibliographicVolumeNumber":"40","bibliographic_titles":[{"bibliographic_title":"福岡工業大学研究論集"}]}]},"item_3_description_17":{"attribute_name":"フォーマット","attribute_value_mlt":[{"subitem_description":"application/pdf","subitem_description_type":"Other"}]},"item_3_description_47":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"subitem_description":"論文(Article)","subitem_description_type":"Other"}]},"item_3_description_5":{"attribute_name":"内容記述","attribute_value_mlt":[{"subitem_description":"The effect of Nash-Q learning algorithm has not yet been confirmed in multiple experiments. We adopted a 5×5 grid world in which two agents started from opposite lower corners and tried to reach their respective goal cell. Experiments showed performance differences between single agent Q-learning and Nash-Q learning. In the Nash-Q learning, both agents obtained similar accumulated rewards; however, in the Q learning, each agent accumulated his reward differently. 
Findings of this research confirmed that when agents adopt Nash Q-learning to predict the other agent’s behavior, not only is the performance of the agents better than their performance when using single-agent Q-learning, but the emergence of the cooperative action can also be observed.","subitem_description_type":"Other"}]},"item_3_full_name_2":{"attribute_name":"著者(ヨミ)","attribute_value_mlt":[{"nameIdentifiers":[{"nameIdentifier":"1953","nameIdentifierScheme":"WEKO"}],"names":[{"name":"キタハラ, ショウジ"}]},{"nameIdentifiers":[{"nameIdentifier":"1954","nameIdentifierScheme":"WEKO"}],"names":[{"name":"タニガワ, ユウイチ"}]},{"nameIdentifiers":[{"nameIdentifier":"1955","nameIdentifierScheme":"WEKO"}],"names":[{"name":"ツルオカ, ヒサシ"}]}]},"item_3_full_name_3":{"attribute_name":"別言語の著者","attribute_value_mlt":[{"nameIdentifiers":[{"nameIdentifier":"1956","nameIdentifierScheme":"WEKO"}],"names":[{"name":"KITAHARA, Shouji"}]},{"nameIdentifiers":[{"nameIdentifier":"1957","nameIdentifierScheme":"WEKO"}],"names":[{"name":"TANIGAWA, Yuichi"}]},{"nameIdentifiers":[{"nameIdentifier":"1958","nameIdentifierScheme":"WEKO"}],"names":[{"name":"TSURUOKA, Hisashi"}]}]},"item_3_publisher_37":{"attribute_name":"出版者","attribute_value_mlt":[{"subitem_publisher":"福岡工業大学"}]},"item_3_source_id_7":{"attribute_name":"ISSN","attribute_value_mlt":[{"subitem_source_identifier":"02876620","subitem_source_identifier_type":"ISSN"}]},"item_3_source_id_9":{"attribute_name":"書誌レコードID","attribute_value_mlt":[{"subitem_source_identifier":"AN10036974","subitem_source_identifier_type":"NCID"}]},"item_3_subject_20":{"attribute_name":"日本十進分類法","attribute_value_mlt":[{"subitem_subject":"007.1","subitem_subject_scheme":"NDC"}]},"item_3_text_18":{"attribute_name":"形態","attribute_value_mlt":[{"subitem_text_value":"843268 bytes"}]},"item_3_text_38":{"attribute_name":"出版者(ヨミ)","attribute_value_mlt":[{"subitem_text_value":"フクオカ コウギョウ 
ダイガク"}]},"item_3_text_39":{"attribute_name":"別言語の出版者","attribute_value_mlt":[{"subitem_text_value":"Fukuoka Institute of Technology"}]},"item_3_text_48":{"attribute_name":"資源タイプ・ローカル","attribute_value_mlt":[{"subitem_text_value":"紀要論文"}]},"item_3_text_49":{"attribute_name":"資源タイプ・NII","attribute_value_mlt":[{"subitem_text_value":"Departmental Bulletin Paper"}]},"item_3_text_50":{"attribute_name":"資源タイプ・DCMI","attribute_value_mlt":[{"subitem_text_value":"text"}]},"item_3_text_51":{"attribute_name":"資源タイプ・ローカル表示コード","attribute_value_mlt":[{"subitem_text_value":"02"}]},"item_3_version_type_19":{"attribute_name":"著者版フラグ","attribute_value_mlt":[{"subitem_version_resource":"http://purl.org/coar/version/c_970fb48d4fbd8a85","subitem_version_type":"VoR"}]},"item_creator":{"attribute_name":"著者","attribute_type":"creator","attribute_value_mlt":[{"creatorNames":[{"creatorName":"北原, 頌士"}],"nameIdentifiers":[{"nameIdentifier":"1950","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"谷川, 裕一"}],"nameIdentifiers":[{"nameIdentifier":"1951","nameIdentifierScheme":"WEKO"}]},{"creatorNames":[{"creatorName":"鶴岡, 久"}],"nameIdentifiers":[{"nameIdentifier":"1952","nameIdentifierScheme":"WEKO"}]}]},"item_files":{"attribute_name":"ファイル情報","attribute_type":"file","attribute_value_mlt":[{"accessrole":"open_date","date":[{"dateType":"Available","dateValue":"2020-09-14"}],"displaytype":"detail","filename":"11478-937_p15鶴岡 久.pdf","filesize":[{"value":"843.3 kB"}],"format":"application/pdf","licensetype":"license_note","mimetype":"application/pdf","url":{"label":"11478-937_p15鶴岡 久.pdf","url":"https://fit.repo.nii.ac.jp/record/424/files/11478-937_p15鶴岡 久.pdf"},"version_id":"e830ecc7-2cd5-477b-8c08-8488733963a3"}]},"item_keyword":{"attribute_name":"キーワード","attribute_value_mlt":[{"subitem_subject":"Q learning","subitem_subject_scheme":"Other"},{"subitem_subject":"Nash-Q learning","subitem_subject_scheme":"Other"},{"subitem_subject":"grid 
world","subitem_subject_scheme":"Other"},{"subitem_subject":"agent","subitem_subject_scheme":"Other"},{"subitem_subject":"reward","subitem_subject_scheme":"Other"},{"subitem_subject":"Q learning","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"Nash-Q learning","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"grid world","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"agent","subitem_subject_language":"en","subitem_subject_scheme":"Other"},{"subitem_subject":"reward","subitem_subject_language":"en","subitem_subject_scheme":"Other"}]},"item_language":{"attribute_name":"言語","attribute_value_mlt":[{"subitem_language":"jpn"}]},"item_resource_type":{"attribute_name":"資源タイプ","attribute_value_mlt":[{"resourcetype":"departmental bulletin paper","resourceuri":"http://purl.org/coar/resource_type/c_6501"}]},"item_title":"ナッシュQ学習における協調行動の生成","item_titles":{"attribute_name":"タイトル","attribute_value_mlt":[{"subitem_title":"ナッシュQ学習における協調行動の生成"},{"subitem_title":"Emergence of Cooperative Action in Nash-Q Learning","subitem_title_language":"en"}]},"item_type_id":"3","owner":"2","path":["279"],"pubdate":{"attribute_name":"公開日","attribute_value":"2018-06-13"},"publish_date":"2018-06-13","publish_status":"0","recid":"424","relation_version_is_last":true,"title":["ナッシュQ学習における協調行動の生成"],"weko_creator_id":"2","weko_shared_id":2},"updated":"2023-05-15T13:41:05.356655+00:00"}