<?xml version='1.0' encoding='UTF-8'?>
<OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd">
  <responseDate>2026-03-12T00:44:41Z</responseDate>
  <request metadataPrefix="jpcoar_1.0" identifier="oai:fit.repo.nii.ac.jp:00000424" verb="GetRecord">https://fit.repo.nii.ac.jp/oai</request>
  <GetRecord>
    <record>
      <header>
        <identifier>oai:fit.repo.nii.ac.jp:00000424</identifier>
        <datestamp>2023-05-15T13:41:05Z</datestamp>
        <setSpec>256:257:279</setSpec>
      </header>
      <metadata>
        <jpcoar:jpcoar xmlns:datacite="https://schema.datacite.org/meta/kernel-4/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dcndl="http://ndl.go.jp/dcndl/terms/" xmlns:dcterms="http://purl.org/dc/terms/" xmlns:jpcoar="https://github.com/JPCOAR/schema/blob/master/1.0/" xmlns:oaire="http://namespace.openaire.eu/schema/oaire/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:rioxxterms="http://www.rioxx.net/schema/v2.0/rioxxterms/" xmlns:xs="http://www.w3.org/2001/XMLSchema" xmlns="https://github.com/JPCOAR/schema/blob/master/1.0/" xsi:schemaLocation="https://github.com/JPCOAR/schema/blob/master/1.0/jpcoar_scm.xsd">
          <dc:title>ナッシュQ学習における協調行動の生成</dc:title>
          <dc:title xml:lang="en">Emergence of Cooperative Action in Nash-Q Learning</dc:title>
          <dcterms:alternative>ナッシュQ ガクシュウ ニ オケル キョウチョウ コウドウ ノ セイセイ</dcterms:alternative>
          <jpcoar:creator>
            <jpcoar:creatorName>北原, 頌士</jpcoar:creatorName>
          </jpcoar:creator>
          <jpcoar:creator>
            <jpcoar:creatorName>谷川, 裕一</jpcoar:creatorName>
          </jpcoar:creator>
          <jpcoar:creator>
            <jpcoar:creatorName>鶴岡, 久</jpcoar:creatorName>
          </jpcoar:creator>
          <jpcoar:subject subjectScheme="NDC">007.1</jpcoar:subject>
          <jpcoar:subject subjectScheme="Other">Q learning</jpcoar:subject>
          <jpcoar:subject subjectScheme="Other">Nash-Q learning</jpcoar:subject>
          <jpcoar:subject subjectScheme="Other">grid world</jpcoar:subject>
          <jpcoar:subject subjectScheme="Other">agent</jpcoar:subject>
          <jpcoar:subject subjectScheme="Other">reward</jpcoar:subject>
          <jpcoar:subject xml:lang="en" subjectScheme="Other">Q learning</jpcoar:subject>
          <jpcoar:subject xml:lang="en" subjectScheme="Other">Nash-Q learning</jpcoar:subject>
          <jpcoar:subject xml:lang="en" subjectScheme="Other">grid world</jpcoar:subject>
          <jpcoar:subject xml:lang="en" subjectScheme="Other">agent</jpcoar:subject>
          <jpcoar:subject xml:lang="en" subjectScheme="Other">reward</jpcoar:subject>
          <datacite:description descriptionType="Other">application/pdf</datacite:description>
          <datacite:description descriptionType="Other">論文(Article)</datacite:description>
          <datacite:description descriptionType="Other">The effect of Nash-Q learning algorithm has not yet been confirmed in multiple experiments. We adopted a 5×5 grid world in which two agents started from opposite lower corners and tried to reach their respective goal cell. Experiments showed performance differences between single agent Q-learning and Nash-Q learning. In the Nash-Q learning, both agents obtained similar accumulated re-wards; however, in the Q learning, each agent accumulated his reward differently. Findings of this re-search confirmed that when agents adopt Nash Q-learning to predict the other agent’s behavior, not only is the performance of the agents better than their performance when using single-agent Q-learning, but the emergence of the cooperative action can also be observed.</datacite:description>
          <dc:publisher>福岡工業大学</dc:publisher>
          <datacite:date dateType="Issued">2007-09-30</datacite:date>
          <dc:language>jpn</dc:language>
          <dc:type rdf:resource="http://purl.org/coar/resource_type/c_6501">departmental bulletin paper</dc:type>
          <oaire:version rdf:resource="http://purl.org/coar/version/c_970fb48d4fbd8a85">VoR</oaire:version>
          <jpcoar:identifier identifierType="HDL">http://hdl.handle.net/11478/937</jpcoar:identifier>
          <jpcoar:identifier identifierType="URI">https://fit.repo.nii.ac.jp/records/424</jpcoar:identifier>
          <jpcoar:sourceIdentifier identifierType="ISSN">02876620</jpcoar:sourceIdentifier>
          <jpcoar:sourceIdentifier identifierType="NCID">AN10036974</jpcoar:sourceIdentifier>
          <jpcoar:sourceTitle>福岡工業大学研究論集</jpcoar:sourceTitle>
          <jpcoar:volume>40</jpcoar:volume>
          <jpcoar:issue>1</jpcoar:issue>
          <jpcoar:pageStart>15</jpcoar:pageStart>
          <jpcoar:pageEnd>20</jpcoar:pageEnd>
          <jpcoar:file>
            <jpcoar:URI label="11478-937_p15鶴岡　久.pdf">https://fit.repo.nii.ac.jp/record/424/files/11478-937_p15鶴岡　久.pdf</jpcoar:URI>
            <jpcoar:mimeType>application/pdf</jpcoar:mimeType>
            <jpcoar:extent>843.3 kB</jpcoar:extent>
            <datacite:date dateType="Available">2020-09-14</datacite:date>
          </jpcoar:file>
        </jpcoar:jpcoar>
      </metadata>
    </record>
  </GetRecord>
</OAI-PMH>
