<?xml version="1.0" encoding="UTF-8"?>
<!--
  Front-matter metadata record for a single preprint. The document holds only
  a <front> section (journal/publisher identification plus article metadata);
  there is no <body> or <back> in this file.
  NOTE(review): the element names and dtd-version="1.1" look like the JATS
  article tag set; the schema is not named in this file, so confirm against
  the producing system before validating.
-->
<!--
  Namespace prefixes are declared once on the root. Within this file only
  xlink is actually used (on <self-uri>); the xsi and mml prefixes are
  declared but never referenced here.
-->
<article xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="1.1" xml:lang="en">
  <front>
    <!-- Hosting platform: identifier "authorea", publisher name "Authorea". -->
    <journal-meta>
      <journal-id>authorea</journal-id>
      <publisher>
        <publisher-name>Authorea</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <!-- DOI of this record; the same DOI is repeated as a URL in <self-uri> below. -->
      <article-id pub-id-type="doi">10.36227/techrxiv.171078237.77836600/v1</article-id>
      <title-group>
        <article-title>Multi-Discounting Reinforcement Learning Based on Reward Decomposition</article-title>
      </title-group>
      <!--
        Five authors, in document order. Only the first entry is flagged
        corresp="yes" and it is also the only one carrying an ORCID iD;
        the remaining four are corresp="no" with a name only.
      -->
      <contrib-group>
        <contrib contrib-type="author" corresp="yes">
          <contrib-id contrib-id-type="orcid">0009-0007-4307-5618</contrib-id>
          <name>
            <surname>Chen</surname>
            <given-names>Pengbin</given-names>
          </name>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name>
            <surname>Liu</surname>
            <given-names>Qi</given-names>
          </name>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name>
            <surname>Li</surname>
            <given-names>Yanjie</given-names>
          </name>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name>
            <surname>Yan</surname>
            <given-names>Kejian</given-names>
          </name>
        </contrib>
        <contrib contrib-type="author" corresp="no">
          <name>
            <surname>Ma</surname>
            <given-names>Shuaikang</given-names>
          </name>
        </contrib>
      </contrib-group>
      <!--
        Electronic preprint date, split into numeric day / month / year parts
        (18, 3, 2024). The month is not zero-padded, so consumers that build
        a date string from these parts must pad it themselves.
      -->
      <pub-date date-type="preprint" publication-format="electronic">
        <day>18</day>
        <month>3</month>
        <year>2024</year>
      </pub-date>
      <!--
        Link back to the record: xlink:href holds the DOI URL and the element
        text repeats that URL inside a human-readable sentence. Keep the two
        in sync if the DOI or version suffix ever changes.
      -->
      <self-uri xlink:href="https://doi.org/10.36227/techrxiv.171078237.77836600/v1">This preprint is available at https://doi.org/10.36227/techrxiv.171078237.77836600/v1</self-uri>
      <!-- Six keywords tagged as author-created; all lowercase and listed alphabetically. -->
      <kwd-group kwd-group-type="author-created">
        <kwd>computing and processing</kwd>
        <kwd>discount factor</kwd>
        <kwd>mdp</kwd>
        <kwd>reinforcement learning</kwd>
        <kwd>reward decomposition</kwd>
        <kwd>robotics and control systems</kwd>
      </kwd-group>
    </article-meta>
  </front>
</article>
