Automatically assigned DDC number: 00631

Manually assigned DDC number: 00631

Number of references: 31

Title: Solution of Delayed Reinforcement Learning Problems Having Continuous Action Spaces

Author:

Subject: B. Ravindran Solution of Delayed Reinforcement Learning Problems Having Continuous Action Spaces

Description: This work concerns the solution of delayed Reinforcement Learning problems having continuous action spaces. The problems associated with continuous action spaces are discussed and various existing algorithms for solving the problem are presented. An extension of Q-learning for solving delayed RL problems having continuous action spaces is proposed which overcomes drawbacks associated with existing methods. Simulation results are presented to demonstrate the working of the proposed algorithm.

Contributor: The Pennsylvania State University CiteSeer Archives

Publisher: unknown

Date: 2001-10-02

Pubyear: 1996

Format: ps

Identifier: http://citeseer.ist.psu.edu/537952.html

Source: http://www-anw.cs.umass.edu/~ravi/ms_thesis.ps.gz

Language: en

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Rights: unrestricted

Graph

<?xml   version="1.0"   encoding="UTF-8"?>

<references_metadata>

      <rec   ID="/311556.html"   Type="inproceedings"   CiteSeer_Book="Proceedings   of   the   Fourth   International   Workshop   on   Machine   Learning   Irvine   CA   June   1987"   CiteSeer_Volume=""   Title="Strategy   Learning   in   Multilayer   Connectionist   Representations,"   />

      <rec   ID="/35177.html"   Type="misc"   CiteSeer_Book=""   CiteSeer_Volume=""   Title="Advantage   updating,">

            <identifier   Org="ISBN:0131201158"   Paper_ID="/35177.html"   Extracted="0131201158"   DDC="658.8/27"   Normalized_DDC="658827"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:0262042061"   Paper_ID="/35177.html"   Extracted="0262042061"   />

            <identifier   Org="ISBN:0262194503"   Paper_ID="/35177.html"   Extracted="0262194503"   />

            <identifier   Org="ISBN:0262201046"   Paper_ID="/35177.html"   Extracted="0262201046"   />

            <identifier   Org="ISBN:0262201070"   Paper_ID="/35177.html"   Extracted="0262201070"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:0749415193"   Paper_ID="/35177.html"   Extracted="0749415193"   DDC="374.4"   Normalized_DDC="3744"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:0749426349"   Paper_ID="/35177.html"   Extracted="0749426349"   DDC="378.03"   Normalized_DDC="37803"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:078031901X"   Paper_ID="/35177.html"   Extracted="078031901X"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:0780332113"   Paper_ID="/35177.html"   Extracted="0780332113"   DDC="006.3/2"   Normalized_DDC="00632"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:0818624701"   Paper_ID="/35177.html"   Extracted="0818624701"   DDC="621.381"   Normalized_DDC="621381"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:155623550X"   Paper_ID="/35177.html"   Extracted="155623550X"   DDC="658.15/11/0285"   Normalized_DDC="65815110285"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:3540408045"   Paper_ID="/35177.html"   Extracted="3540408045"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:9051993986"   Paper_ID="/35177.html"   Extracted="9051993986"   />

      </rec>

      <rec   ID="/110654.html"   Type="incollection"   CiteSeer_Book="Learning   and   computational   neuroscience      foundations   of   adaptive   networks"   CiteSeer_Volume=""   Title="Learning   and   Sequential   Decision   Making,">

            <identifier   Org="ISBN:0123741769"   Paper_ID="/110654.html"   Extracted="0123741769"   DDC="330.019"   Normalized_DDC="330019"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:0262510901"   Paper_ID="/110654.html"   Extracted="0262510901"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:0262510952"   Paper_ID="/110654.html"   Extracted="0262510952"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:0262531224"   Paper_ID="/110654.html"   Extracted="0262531224"   DDC="591.51"   Normalized_DDC="59151"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:0262631490"   Paper_ID="/110654.html"   Extracted="0262631490"   DDC="591.51"   Normalized_DDC="59151"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:0792392345"   Paper_ID="/110654.html"   Extracted="0792392345"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:0805812911"   Paper_ID="/110654.html"   Extracted="0805812911"   />

            <identifier   Org="ISBN:0805814876"   Paper_ID="/110654.html"   Extracted="0805814876"   />

            <identifier   Org="ISBN:1558601414"   Paper_ID="/110654.html"   Extracted="1558601414"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:1558601643"   Paper_ID="/110654.html"   Extracted="1558601643"   DDC="658.5"   Normalized_DDC="6585"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:1558603778"   Paper_ID="/110654.html"   Extracted="1558603778"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:1586030132"   Paper_ID="/110654.html"   Extracted="1586030132"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:1852334452"   Paper_ID="/110654.html"   Extracted="1852334452"   DDC="005.3"   Normalized_DDC="0053"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540566678"   Paper_ID="/110654.html"   Extracted="3540566678"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540584838"   Paper_ID="/110654.html"   Extracted="3540584838"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540590528"   Paper_ID="/110654.html"   Extracted="3540590528"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540659072"   Paper_ID="/110654.html"   Extracted="3540659072"   DDC="003/.3"   Normalized_DDC="0033"   Normalized_Weight="0.06666666666666667"   />

      </rec>

      <rec   ID="/286243.html"   Type="inproceedings"   CiteSeer_Book="Advances   in   Neural   Information   Processing   Systems   5   Proceedings   of   the   IEEE   Conference   in   Denver   to   appear"   CiteSeer_Volume=""   Title="Reinforcement   Learning   Applied   to   Linear   Quadratic   Regulation,">

            <identifier   Org="ISBN:0262122413"   Paper_ID="/286243.html"   Extracted="0262122413"   />

            <identifier   Org="ISBN:0262193981"   Paper_ID="/286243.html"   Extracted="0262193981"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.125"   />

            <identifier   Org="ISBN:0262201046"   Paper_ID="/286243.html"   Extracted="0262201046"   />

            <identifier   Org="ISBN:0262201070"   Paper_ID="/286243.html"   Extracted="0262201070"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.125"   />

            <identifier   Org="ISBN:0262510901"   Paper_ID="/286243.html"   Extracted="0262510901"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.125"   />

            <identifier   Org="ISBN:078031901X"   Paper_ID="/286243.html"   Extracted="078031901X"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.125"   />

            <identifier   Org="ISBN:0792397169"   Paper_ID="/286243.html"   Extracted="0792397169"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.125"   />

            <identifier   Org="ISBN:0805815902"   Paper_ID="/286243.html"   Extracted="0805815902"   />

            <identifier   Org="ISBN:0805821252"   Paper_ID="/286243.html"   Extracted="0805821252"   />

            <identifier   Org="ISBN:1558603778"   Paper_ID="/286243.html"   Extracted="1558603778"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.125"   />

            <identifier   Org="ISBN:1558604804"   Paper_ID="/286243.html"   Extracted="1558604804"   />

            <identifier   Org="ISBN:3540240772"   Paper_ID="/286243.html"   Extracted="3540240772"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.125"   />

            <identifier   Org="ISBN:354079865X"   Paper_ID="/286243.html"   Extracted="354079865X"   DDC="006.31"   Normalized_DDC="00631"   Normalized_Weight="0.125"   />

            <identifier   Org="ISBN:9051993986"   Paper_ID="/286243.html"   Extracted="9051993986"   />

      </rec>

      <rec   ID="/165188.html"   Type="misc"   CiteSeer_Book=""   CiteSeer_Volume=""   Title="Incremental   Dynamic   Programming   for   On-line   Adaptive   Optimal   Control,">

            <identifier   Org="ISBN:0262133172"   Paper_ID="/165188.html"   Extracted="0262133172"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.3333333333333333"   />

            <identifier   Org="ISBN:0262193981"   Paper_ID="/165188.html"   Extracted="0262193981"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.3333333333333333"   />

            <identifier   Org="ISBN:0262201046"   Paper_ID="/165188.html"   Extracted="0262201046"   />

            <identifier   Org="ISBN:0780347560"   Paper_ID="/165188.html"   Extracted="0780347560"   DDC="621.381"   Normalized_DDC="621381"   Normalized_Weight="0.3333333333333333"   />

            <identifier   Org="ISBN:3211833641"   Paper_ID="/165188.html"   Extracted="3211833641"   />

      </rec>

      <rec   ID="/385953.html"   Type="inproceedings"   CiteSeer_Book="Advances   in   Neural   Information   Processing   Systems"   CiteSeer_Volume=""   Title="Reinforcement   Learning   Methods   for   Continuous-Time   {M}arkov   Decision   Problems,"   />

      <rec   ID="/343069.html"   Type="inproceedings"   CiteSeer_Book="Advances   in   Neural   Information   Processing   Systems   5   Proceedings   of   the   IEEE   Conference   in   Denver   to   appear"   CiteSeer_Volume=""   Title="Feudal   Reinforcement   Learning,">

            <identifier   Org="ISBN:0262112450"   Paper_ID="/343069.html"   Extracted="0262112450"   />

            <identifier   Org="ISBN:0262201046"   Paper_ID="/343069.html"   Extracted="0262201046"   />

            <identifier   Org="ISBN:0262661446"   Paper_ID="/343069.html"   Extracted="0262661446"   DDC="591.5/01/1"   Normalized_DDC="5915011"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:047166054X"   Paper_ID="/343069.html"   Extracted="047166054X"   DDC="519.7/03"   Normalized_DDC="519703"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:078035530X"   Paper_ID="/343069.html"   Extracted="078035530X"   DDC="006.3/2"   Normalized_DDC="00632"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:0805815902"   Paper_ID="/343069.html"   Extracted="0805815902"   />

            <identifier   Org="ISBN:1558603778"   Paper_ID="/343069.html"   Extracted="1558603778"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:1558607781"   Paper_ID="/343069.html"   Extracted="1558607781"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:1586034146"   Paper_ID="/343069.html"   Extracted="1586034146"   DDC="629.8/9263"   Normalized_DDC="62989263"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540206469"   Paper_ID="/343069.html"   Extracted="3540206469"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:354032688X"   Paper_ID="/343069.html"   Extracted="354032688X"   DDC="629.8/92"   Normalized_DDC="629892"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540590528"   Paper_ID="/343069.html"   Extracted="3540590528"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540644172"   Paper_ID="/343069.html"   Extracted="3540644172"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540654801"   Paper_ID="/343069.html"   Extracted="3540654801"   DDC="629.8/9263"   Normalized_DDC="62989263"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540676023"   Paper_ID="/343069.html"   Extracted="3540676023"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540678395"   Paper_ID="/343069.html"   Extracted="3540678395"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540699112"   Paper_ID="/343069.html"   Extracted="3540699112"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540747818"   Paper_ID="/343069.html"   Extracted="3540747818"   />

            <identifier   Org="ISBN:3540769269"   Paper_ID="/343069.html"   Extracted="3540769269"   />

            <identifier   Org="ISBN:427490525X"   Paper_ID="/343069.html"   Extracted="427490525X"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

      </rec>

      <rec   ID="/278302.html"   Type="article"   CiteSeer_Book="Machine   Learning"   CiteSeer_Volume="14"   Title="{TD}($\lambda$)   Converges   with   Probability   1,">

            <identifier   Org="ISBN:0525949828"   Paper_ID="/278302.html"   Extracted="0525949828"   DDC="153.8/3"   Normalized_DDC="15383"   Normalized_Weight="1.0"   />

            <identifier   Org="ISBN:0780378989"   Paper_ID="/278302.html"   Extracted="0780378989"   />

      </rec>

      <rec   ID="/300268.html"   Type="techreport"   CiteSeer_Book=""   CiteSeer_Volume=""   Title="Reinforcement   Learning   and   its   Application   to   Control,">

            <identifier   Org="ISBN:0080422365"   Paper_ID="/300268.html"   Extracted="0080422365"   DDC="629.8/9"   Normalized_DDC="62989"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:0444819312"   Paper_ID="/300268.html"   Extracted="0444819312"   DDC="612.8/2"   Normalized_DDC="61282"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:0780305469"   Paper_ID="/300268.html"   Extracted="0780305469"   DDC="006"   Normalized_DDC="006"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:0780363493"   Paper_ID="/300268.html"   Extracted="0780363493"   DDC="629.8/92"   Normalized_DDC="629892"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:0805813640"   Paper_ID="/300268.html"   Extracted="0805813640"   DDC="153"   Normalized_DDC="153"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:0805815902"   Paper_ID="/300268.html"   Extracted="0805815902"   />

            <identifier   Org="ISBN:0805821252"   Paper_ID="/300268.html"   Extracted="0805821252"   />

            <identifier   Org="ISBN:155860247X"   Paper_ID="/300268.html"   Extracted="155860247X"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:1558604197"   Paper_ID="/300268.html"   Extracted="1558604197"   />

            <identifier   Org="ISBN:1586036459"   Paper_ID="/300268.html"   Extracted="1586036459"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:1593701578"   Paper_ID="/300268.html"   Extracted="1593701578"   DDC="333.790285"   Normalized_DDC="333790285"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:354026549X"   Paper_ID="/300268.html"   Extracted="354026549X"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:3540427325"   Paper_ID="/300268.html"   Extracted="3540427325"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:3540590528"   Paper_ID="/300268.html"   Extracted="3540590528"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:3540628584"   Paper_ID="/300268.html"   Extracted="3540628584"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.08333333333333333"   />

      </rec>

      <rec   ID="/230083.html"   Type="inproceedings"   CiteSeer_Book="Proc   11th   International   Conference   on   Machine   Learning"   CiteSeer_Volume=""   Title="Consideration   of   risk   in   reinforcement   learning,">

            <identifier   Org="ISBN:0262195682"   Paper_ID="/230083.html"   Extracted="0262195682"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="1.0"   />

            <identifier   Org="ISBN:1558604197"   Paper_ID="/230083.html"   Extracted="1558604197"   />

      </rec>

      <rec   ID="/451869.html"   Type="inproceedings"   CiteSeer_Book="Advances   in   Neural   Information   Processing   Systems"   CiteSeer_Volume=""   Title="Convergence   of   Stochastic   Iterative   Dynamic   Programming   Algorithms,">

            <identifier   Org="ISBN:0262012111"   Paper_ID="/451869.html"   Extracted="0262012111"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.07692307692307693"   />

            <identifier   Org="ISBN:026204207X"   Paper_ID="/451869.html"   Extracted="026204207X"   />

            <identifier   Org="ISBN:0262193981"   Paper_ID="/451869.html"   Extracted="0262193981"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.07692307692307693"   />

            <identifier   Org="ISBN:0262201046"   Paper_ID="/451869.html"   Extracted="0262201046"   />

            <identifier   Org="ISBN:0262201070"   Paper_ID="/451869.html"   Extracted="0262201070"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07692307692307693"   />

            <identifier   Org="ISBN:047166054X"   Paper_ID="/451869.html"   Extracted="047166054X"   DDC="519.7/03"   Normalized_DDC="519703"   Normalized_Weight="0.07692307692307693"   />

            <identifier   Org="ISBN:0792369327"   Paper_ID="/451869.html"   Extracted="0792369327"   DDC="519.303"   Normalized_DDC="519303"   Normalized_Weight="0.07692307692307693"   />

            <identifier   Org="ISBN:0792374592"   Paper_ID="/451869.html"   Extracted="0792374592"   DDC="519.2/33"   Normalized_DDC="519233"   Normalized_Weight="0.07692307692307693"   />

            <identifier   Org="ISBN:0805815902"   Paper_ID="/451869.html"   Extracted="0805815902"   />

            <identifier   Org="ISBN:080581745X"   Paper_ID="/451869.html"   Extracted="080581745X"   />

            <identifier   Org="ISBN:1558603778"   Paper_ID="/451869.html"   Extracted="1558603778"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.07692307692307693"   />

            <identifier   Org="ISBN:1581131674"   Paper_ID="/451869.html"   Extracted="1581131674"   />

            <identifier   Org="ISBN:1586032399"   Paper_ID="/451869.html"   Extracted="1586032399"   DDC="629.8/9263"   Normalized_DDC="62989263"   Normalized_Weight="0.07692307692307693"   />

            <identifier   Org="ISBN:3540240772"   Paper_ID="/451869.html"   Extracted="3540240772"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07692307692307693"   />

            <identifier   Org="ISBN:3540654801"   Paper_ID="/451869.html"   Extracted="3540654801"   DDC="629.8/9263"   Normalized_DDC="62989263"   Normalized_Weight="0.07692307692307693"   />

            <identifier   Org="ISBN:3540657010"   Paper_ID="/451869.html"   Extracted="3540657010"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.07692307692307693"   />

            <identifier   Org="ISBN:3540712305"   Paper_ID="/451869.html"   Extracted="3540712305"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.07692307692307693"   />

            <identifier   Org="ISBN:427490525X"   Paper_ID="/451869.html"   Extracted="427490525X"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07692307692307693"   />

      </rec>

      <rec   ID="/84168.html"   Type="inproceedings"   CiteSeer_Book="Advances   in   Neural   Information   Processing   Systems"   CiteSeer_Volume=""   Title="Reinforcement   Learning   Algorithm   for   Partially   Observable   {M}arkov   Decision   Problems,"   />

      <rec   ID="/186946.html"   Type="techreport"   CiteSeer_Book=""   CiteSeer_Volume=""   Title="Approximate   Discounted   Dynamic   Programming   is   Unreliable,">

            <identifier   Org="ISBN:3540628584"   Paper_ID="/186946.html"   Extracted="3540628584"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="1.0"   />

      </rec>

      <rec   ID="/150059.html"   Type="article"   CiteSeer_Book="Cognitive   Science"   CiteSeer_Volume="16"   Title="Forward   models:   Supervised   learning   with   a   distal   teacher,">

            <identifier   Org="ISBN:0262071959"   Paper_ID="/150059.html"   Extracted="0262071959"   DDC="153"   Normalized_DDC="153"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:0262072548"   Paper_ID="/150059.html"   Extracted="0262072548"   DDC="612.8/2"   Normalized_DDC="61282"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:0262201046"   Paper_ID="/150059.html"   Extracted="0262201046"   />

            <identifier   Org="ISBN:0262661160"   Paper_ID="/150059.html"   Extracted="0262661160"   DDC="153"   Normalized_DDC="153"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:0444503153"   Paper_ID="/150059.html"   Extracted="0444503153"   DDC="616.89/8207"   Normalized_DDC="616898207"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:0444528768"   Paper_ID="/150059.html"   Extracted="0444528768"   />

            <identifier   Org="ISBN:0521845114"   Paper_ID="/150059.html"   Extracted="0521845114"   DDC="629.8/92"   Normalized_DDC="629892"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:080581258X"   Paper_ID="/150059.html"   Extracted="080581258X"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:0805812911"   Paper_ID="/150059.html"   Extracted="0805812911"   />

            <identifier   Org="ISBN:0805813640"   Paper_ID="/150059.html"   Extracted="0805813640"   DDC="153"   Normalized_DDC="153"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:0805815902"   Paper_ID="/150059.html"   Extracted="0805815902"   />

            <identifier   Org="ISBN:080581745X"   Paper_ID="/150059.html"   Extracted="080581745X"   />

            <identifier   Org="ISBN:0805821597"   Paper_ID="/150059.html"   Extracted="0805821597"   />

            <identifier   Org="ISBN:0863777864"   Paper_ID="/150059.html"   Extracted="0863777864"   DDC="153.4"   Normalized_DDC="1534"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:0907845096"   Paper_ID="/150059.html"   Extracted="0907845096"   />

            <identifier   Org="ISBN:3540287558"   Paper_ID="/150059.html"   Extracted="3540287558"   DDC="006.32"   Normalized_DDC="00632"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:3540733221"   Paper_ID="/150059.html"   Extracted="3540733221"   DDC="670.285/63"   Normalized_DDC="67028563"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:9812388052"   Paper_ID="/150059.html"   Extracted="9812388052"   DDC="006.32"   Normalized_DDC="00632"   Normalized_Weight="0.09090909090909091"   />

      </rec>

      <rec   ID="/222673.html"   Type="inproceedings"   CiteSeer_Book="Advances   in   Neural   Information   Processing   Systems"   CiteSeer_Volume=""   Title="The   Parti-Game   Algorithm   for   Variable   Resolution   Reinforcement   Learning   in   Multidimensional   State-Spaces,">

            <identifier   Org="ISBN:0262112450"   Paper_ID="/222673.html"   Extracted="0262112450"   />

            <identifier   Org="ISBN:0262201526"   Paper_ID="/222673.html"   Extracted="0262201526"   />

            <identifier   Org="ISBN:0262510952"   Paper_ID="/222673.html"   Extracted="0262510952"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:0262632004"   Paper_ID="/222673.html"   Extracted="0262632004"   DDC="591.50113"   Normalized_DDC="59150113"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:0262661446"   Paper_ID="/222673.html"   Extracted="0262661446"   DDC="591.5/01/1"   Normalized_DDC="5915011"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:0805829415"   Paper_ID="/222673.html"   Extracted="0805829415"   />

            <identifier   Org="ISBN:1558604170"   Paper_ID="/222673.html"   Extracted="1558604170"   />

            <identifier   Org="ISBN:1558604197"   Paper_ID="/222673.html"   Extracted="1558604197"   />

            <identifier   Org="ISBN:1558604952"   Paper_ID="/222673.html"   Extracted="1558604952"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:1558607072"   Paper_ID="/222673.html"   Extracted="1558607072"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:1586035959"   Paper_ID="/222673.html"   Extracted="1586035959"   />

            <identifier   Org="ISBN:3540201211"   Paper_ID="/222673.html"   Extracted="3540201211"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:354032688X"   Paper_ID="/222673.html"   Extracted="354032688X"   DDC="629.8/92"   Normalized_DDC="629892"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:3540408045"   Paper_ID="/222673.html"   Extracted="3540408045"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:3540590528"   Paper_ID="/222673.html"   Extracted="3540590528"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:3540654801"   Paper_ID="/222673.html"   Extracted="3540654801"   DDC="629.8/9263"   Normalized_DDC="62989263"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:3540679251"   Paper_ID="/222673.html"   Extracted="3540679251"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.09090909090909091"   />

            <identifier   Org="ISBN:3540723927"   Paper_ID="/222673.html"   Extracted="3540723927"   />

      </rec>

      <rec   ID="/86839.html"   Type="inproceedings"   CiteSeer_Book="Machine   Learning"   CiteSeer_Volume=""   Title="Transfer   of   Learning   Across   Compositions   of   Sequential   Tasks,"   />

      <rec   ID="/90919.html"   Type="inproceedings"   CiteSeer_Book="National   Conference   on   Artificial   Intelligence"   CiteSeer_Volume=""   Title="Reinforcement   Learning   with   a   Hierarchy   of   Abstract   Models,">

            <identifier   Org="ISBN:0262112450"   Paper_ID="/90919.html"   Extracted="0262112450"   />

            <identifier   Org="ISBN:0262122413"   Paper_ID="/90919.html"   Extracted="0262122413"   />

            <identifier   Org="ISBN:0262193981"   Paper_ID="/90919.html"   Extracted="0262193981"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:0262201046"   Paper_ID="/90919.html"   Extracted="0262201046"   />

            <identifier   Org="ISBN:0262201070"   Paper_ID="/90919.html"   Extracted="0262201070"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:0262510634"   Paper_ID="/90919.html"   Extracted="0262510634"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:0262631490"   Paper_ID="/90919.html"   Extracted="0262631490"   DDC="591.51"   Normalized_DDC="59151"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:047166054X"   Paper_ID="/90919.html"   Extracted="047166054X"   DDC="519.7/03"   Normalized_DDC="519703"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:0792376307"   Paper_ID="/90919.html"   Extracted="0792376307"   DDC="005.1"   Normalized_DDC="0051"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:155860247X"   Paper_ID="/90919.html"   Extracted="155860247X"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:1558603778"   Paper_ID="/90919.html"   Extracted="1558603778"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:1558604804"   Paper_ID="/90919.html"   Extracted="1558604804"   />

            <identifier   Org="ISBN:3540250468"   Paper_ID="/90919.html"   Extracted="3540250468"   DDC="629.8932"   Normalized_DDC="6298932"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540288961"   Paper_ID="/90919.html"   Extracted="3540288961"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540406662"   Paper_ID="/90919.html"   Extracted="3540406662"   DDC="629.8/92"   Normalized_DDC="629892"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540439412"   Paper_ID="/90919.html"   Extracted="3540439412"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540590528"   Paper_ID="/90919.html"   Extracted="3540590528"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540644172"   Paper_ID="/90919.html"   Extracted="3540644172"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540679251"   Paper_ID="/90919.html"   Extracted="3540679251"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.06666666666666667"   />

      </rec>

      <rec   ID="/134570.html"   Type="inproceedings"   CiteSeer_Book="MLC92"   CiteSeer_Volume=""   Title="Scaling   Reinforcement   Learning   Algorithms   by   Learning   Variable   Temporal   Resolution   Models,">

            <identifier   Org="ISBN:0262193981"   Paper_ID="/134570.html"   Extracted="0262193981"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.3333333333333333"   />

            <identifier   Org="ISBN:0262510634"   Paper_ID="/134570.html"   Extracted="0262510634"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.3333333333333333"   />

            <identifier   Org="ISBN:0791800512"   Paper_ID="/134570.html"   Extracted="0791800512"   />

            <identifier   Org="ISBN:155860247X"   Paper_ID="/134570.html"   Extracted="155860247X"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.3333333333333333"   />

            <identifier   Org="ISBN:1574730010"   Paper_ID="/134570.html"   Extracted="1574730010"   />

      </rec>

      <rec   ID="/10103.html"   Type="article"   CiteSeer_Book="Machine   Learning"   CiteSeer_Volume="8"   Title="Transfer   of   Learning   by   Composing   Solutions   of   Elemental   Sequential   Tasks,">

            <identifier   Org="ISBN:0262631490"   Paper_ID="/10103.html"   Extracted="0262631490"   DDC="591.51"   Normalized_DDC="59151"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:0262661446"   Paper_ID="/10103.html"   Extracted="0262661446"   DDC="591.5/01/1"   Normalized_DDC="5915011"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:0769515940"   Paper_ID="/10103.html"   Extracted="0769515940"   />

            <identifier   Org="ISBN:0780370783"   Paper_ID="/10103.html"   Extracted="0780370783"   />

            <identifier   Org="ISBN:0792380479"   Paper_ID="/10103.html"   Extracted="0792380479"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:0792392345"   Paper_ID="/10103.html"   Extracted="0792392345"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:0805815902"   Paper_ID="/10103.html"   Extracted="0805815902"   />

            <identifier   Org="ISBN:1558603352"   Paper_ID="/10103.html"   Extracted="1558603352"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:1558603700"   Paper_ID="/10103.html"   Extracted="1558603700"   DDC="005.1"   Normalized_DDC="0051"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:157735236X"   Paper_ID="/10103.html"   Extracted="157735236X"   />

            <identifier   Org="ISBN:1852334452"   Paper_ID="/10103.html"   Extracted="1852334452"   DDC="005.3"   Normalized_DDC="0053"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:3540590528"   Paper_ID="/10103.html"   Extracted="3540590528"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:3540678395"   Paper_ID="/10103.html"   Extracted="3540678395"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:3540688463"   Paper_ID="/10103.html"   Extracted="3540688463"   />

      </rec>

      <rec   ID="/169801.html"   Type="techreport"   CiteSeer_Book=""   CiteSeer_Volume=""   Title="Learning   to   Solve   Markovian   Decision   Processes,">

            <identifier   Org="ISBN:0262193981"   Paper_ID="/169801.html"   Extracted="0262193981"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:0262201070"   Paper_ID="/169801.html"   Extracted="0262201070"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:0262611023"   Paper_ID="/169801.html"   Extracted="0262611023"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:0262632004"   Paper_ID="/169801.html"   Extracted="0262632004"   DDC="591.50113"   Normalized_DDC="59150113"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:078035530X"   Paper_ID="/169801.html"   Extracted="078035530X"   DDC="006.3/2"   Normalized_DDC="00632"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:0780358007"   Paper_ID="/169801.html"   Extracted="0780358007"   DDC="629.8/36"   Normalized_DDC="629836"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:0792397169"   Paper_ID="/169801.html"   Extracted="0792397169"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:0805838805"   Paper_ID="/169801.html"   Extracted="0805838805"   DDC="153"   Normalized_DDC="153"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:1558603352"   Paper_ID="/169801.html"   Extracted="1558603352"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:1558607072"   Paper_ID="/169801.html"   Extracted="1558607072"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:3540415971"   Paper_ID="/169801.html"   Extracted="3540415971"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:3540657010"   Paper_ID="/169801.html"   Extracted="3540657010"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:3540673059"   Paper_ID="/169801.html"   Extracted="3540673059"   DDC="006.3/2"   Normalized_DDC="00632"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:3540762639"   Paper_ID="/169801.html"   Extracted="3540762639"   DDC="006.3/2"   Normalized_DDC="00632"   Normalized_Weight="0.07142857142857142"   />

      </rec>

      <rec   ID="/300248.html"   Type="inproceedings"   CiteSeer_Book="Advances   in   Neural   Information   Processing   Systems"   CiteSeer_Volume=""   Title="Robust   Reinforcement   Learning   in   Motion   Planning,">

            <identifier   Org="ISBN:0262201070"   Paper_ID="/300248.html"   Extracted="0262201070"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.16666666666666666"   />

            <identifier   Org="ISBN:0262631784"   Paper_ID="/300248.html"   Extracted="0262631784"   DDC="591.5"   Normalized_DDC="5915"   Normalized_Weight="0.16666666666666666"   />

            <identifier   Org="ISBN:0444819312"   Paper_ID="/300248.html"   Extracted="0444819312"   DDC="612.8/2"   Normalized_DDC="61282"   Normalized_Weight="0.16666666666666666"   />

            <identifier   Org="ISBN:0471544485"   Paper_ID="/300248.html"   Extracted="0471544485"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.16666666666666666"   />

            <identifier   Org="ISBN:1558604804"   Paper_ID="/300248.html"   Extracted="1558604804"   />

            <identifier   Org="ISBN:1558607781"   Paper_ID="/300248.html"   Extracted="1558607781"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.16666666666666666"   />

            <identifier   Org="ISBN:3790812129"   Paper_ID="/300248.html"   Extracted="3790812129"   DDC="629.8/9263"   Normalized_DDC="62989263"   Normalized_Weight="0.16666666666666666"   />

      </rec>

      <rec   ID="/144448.html"   Type="inproceedings"   CiteSeer_Book="International   Conference   on   Machine   Learning"   CiteSeer_Volume=""   Title="Learning   Without   State-Estimation   in   Partially   Observable   Markovian   Decision   Processes,">

            <identifier   Org="ISBN:0262201046"   Paper_ID="/144448.html"   Extracted="0262201046"   />

            <identifier   Org="ISBN:0262693410"   Paper_ID="/144448.html"   Extracted="0262693410"   DDC="591.50113"   Normalized_DDC="59150113"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:1402056257"   Paper_ID="/144448.html"   Extracted="1402056257"   DDC="629.8"   Normalized_DDC="6298"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:1558603352"   Paper_ID="/144448.html"   Extracted="1558603352"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:1558603778"   Paper_ID="/144448.html"   Extracted="1558603778"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:1558604863"   Paper_ID="/144448.html"   Extracted="1558604863"   />

            <identifier   Org="ISBN:1586030132"   Paper_ID="/144448.html"   Extracted="1586030132"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:1586035606"   Paper_ID="/144448.html"   Extracted="1586035606"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:1586035959"   Paper_ID="/144448.html"   Extracted="1586035959"   />

            <identifier   Org="ISBN:3540201211"   Paper_ID="/144448.html"   Extracted="3540201211"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:3540229590"   Paper_ID="/144448.html"   Extracted="3540229590"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:3540250735"   Paper_ID="/144448.html"   Extracted="3540250735"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:3540413855"   Paper_ID="/144448.html"   Extracted="3540413855"   DDC="510   s"   Normalized_DDC="51"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:3540654801"   Paper_ID="/144448.html"   Extracted="3540654801"   DDC="629.8/9263"   Normalized_DDC="62989263"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:3540752242"   Paper_ID="/144448.html"   Extracted="3540752242"   />

            <identifier   Org="ISBN:3540884386"   Paper_ID="/144448.html"   Extracted="3540884386"   />

            <identifier   Org="ISBN:427490525X"   Paper_ID="/144448.html"   Extracted="427490525X"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.08333333333333333"   />

            <identifier   Org="ISBN:9051993986"   Paper_ID="/144448.html"   Extracted="9051993986"   />

      </rec>

      <rec   ID="/10484.html"   Type="article"   CiteSeer_Book="Machine   Learning"   CiteSeer_Volume="16"   Title="An   Upper   Bound   on   the   Loss   from   Approximate   Optimal-Value   Functions,">

            <identifier   Org="ISBN:0262201046"   Paper_ID="/10484.html"   Extracted="0262201046"   />

            <identifier   Org="ISBN:0262510901"   Paper_ID="/10484.html"   Extracted="0262510901"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.25"   />

            <identifier   Org="ISBN:0805815902"   Paper_ID="/10484.html"   Extracted="0805815902"   />

            <identifier   Org="ISBN:1558603778"   Paper_ID="/10484.html"   Extracted="1558603778"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.25"   />

            <identifier   Org="ISBN:1558604197"   Paper_ID="/10484.html"   Extracted="1558604197"   />

            <identifier   Org="ISBN:1558607072"   Paper_ID="/10484.html"   Extracted="1558607072"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.25"   />

            <identifier   Org="ISBN:157735236X"   Paper_ID="/10484.html"   Extracted="157735236X"   />

            <identifier   Org="ISBN:3540749578"   Paper_ID="/10484.html"   Extracted="3540749578"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.25"   />

      </rec>

      <rec   ID="/195161.html"   Type="inproceedings"   CiteSeer_Book="Proceedings   of   the   Eighth   International   Workshop   on   Machine   Learning"   CiteSeer_Volume=""   Title="Planning   by   incremental   dynamic   programming,">

            <identifier   Org="ISBN:0126464901"   Paper_ID="/195161.html"   Extracted="0126464901"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0132610663"   Paper_ID="/195161.html"   Extracted="0132610663"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0201483696"   Paper_ID="/195161.html"   Extracted="0201483696"   DDC="591.5"   Normalized_DDC="5915"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0262193981"   Paper_ID="/195161.html"   Extracted="0262193981"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0262510634"   Paper_ID="/195161.html"   Extracted="0262510634"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0262510901"   Paper_ID="/195161.html"   Extracted="0262510901"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0262611023"   Paper_ID="/195161.html"   Extracted="0262611023"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0262631490"   Paper_ID="/195161.html"   Extracted="0262631490"   DDC="591.51"   Normalized_DDC="59151"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0780325648"   Paper_ID="/195161.html"   Extracted="0780325648"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:080581745X"   Paper_ID="/195161.html"   Extracted="080581745X"   />

            <identifier   Org="ISBN:140206263X"   Paper_ID="/195161.html"   Extracted="140206263X"   DDC="005.1"   Normalized_DDC="0051"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:155860250X"   Paper_ID="/195161.html"   Extracted="155860250X"   DDC="006.3/3"   Normalized_DDC="00633"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:1599047055"   Paper_ID="/195161.html"   Extracted="1599047055"   DDC="006.3/33"   Normalized_DDC="006333"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540200576"   Paper_ID="/195161.html"   Extracted="3540200576"   DDC="570/.1/13"   Normalized_DDC="570113"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540206469"   Paper_ID="/195161.html"   Extracted="3540206469"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540304622"   Paper_ID="/195161.html"   Extracted="3540304622"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540605983"   Paper_ID="/195161.html"   Extracted="3540605983"   DDC="006.3/3"   Normalized_DDC="00633"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540742611"   Paper_ID="/195161.html"   Extracted="3540742611"   />

      </rec>

      <rec   ID="/415821.html"   Type="inproceedings"   CiteSeer_Book="Proceedings   of   the   1991   American   Control   Conference"   CiteSeer_Volume=""   Title="Reinforcement   {L}earning   is   {D}irect   {A}daptive   {O}ptimal   {C}ontrol,"   />

      <rec   ID="/72887.html"   Type="inproceedings"   CiteSeer_Book="Advances   in   Neural   Information   Processing   Systems"   CiteSeer_Volume=""   Title="Active   Exploration   in   Dynamic   Environments,">

            <identifier   Org="ISBN:0195095227"   Paper_ID="/72887.html"   Extracted="0195095227"   DDC="006.3/7"   Normalized_DDC="00637"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0195098706"   Paper_ID="/72887.html"   Extracted="0195098706"   DDC="006.37"   Normalized_DDC="00637"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0262201046"   Paper_ID="/72887.html"   Extracted="0262201046"   />

            <identifier   Org="ISBN:0262510901"   Paper_ID="/72887.html"   Extracted="0262510901"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0262631490"   Paper_ID="/72887.html"   Extracted="0262631490"   DDC="591.51"   Normalized_DDC="59151"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0444819312"   Paper_ID="/72887.html"   Extracted="0444819312"   DDC="612.8/2"   Normalized_DDC="61282"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0780342577"   Paper_ID="/72887.html"   Extracted="0780342577"   />

            <identifier   Org="ISBN:0780355369"   Paper_ID="/72887.html"   Extracted="0780355369"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0792392345"   Paper_ID="/72887.html"   Extracted="0792392345"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0792397169"   Paper_ID="/72887.html"   Extracted="0792397169"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0792397452"   Paper_ID="/72887.html"   Extracted="0792397452"   DDC="629.8/92631"   Normalized_DDC="629892631"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:155860247X"   Paper_ID="/72887.html"   Extracted="155860247X"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:1558603778"   Paper_ID="/72887.html"   Extracted="1558603778"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:1558607781"   Paper_ID="/72887.html"   Extracted="1558607781"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540415971"   Paper_ID="/72887.html"   Extracted="3540415971"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540584838"   Paper_ID="/72887.html"   Extracted="3540584838"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540664521"   Paper_ID="/72887.html"   Extracted="3540664521"   DDC="570/.1/13"   Normalized_DDC="570113"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540730060"   Paper_ID="/72887.html"   Extracted="3540730060"   DDC="006.3/2"   Normalized_DDC="00632"   Normalized_Weight="0.0625"   />

      </rec>

      <rec   ID="/18014.html"   Type="inproceedings"   CiteSeer_Book="Proceedings   of   the   1993   Connectionist   Models   Summer   School"   CiteSeer_Volume=""   Title="{Issues   in   Using   Function   Approximation   for   Reinforcement   Learning},">

            <identifier   Org="ISBN:0262201046"   Paper_ID="/18014.html"   Extracted="0262201046"   />

            <identifier   Org="ISBN:078031901X"   Paper_ID="/18014.html"   Extracted="078031901X"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:0792397169"   Paper_ID="/18014.html"   Extracted="0792397169"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:0805815902"   Paper_ID="/18014.html"   Extracted="0805815902"   />

            <identifier   Org="ISBN:080581745X"   Paper_ID="/18014.html"   Extracted="080581745X"   />

            <identifier   Org="ISBN:1558603778"   Paper_ID="/18014.html"   Extracted="1558603778"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:1558607072"   Paper_ID="/18014.html"   Extracted="1558607072"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:1586032399"   Paper_ID="/18014.html"   Extracted="1586032399"   DDC="629.8/9263"   Normalized_DDC="62989263"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:1595930108"   Paper_ID="/18014.html"   Extracted="1595930108"   DDC="004/.35"   Normalized_DDC="00435"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:3527319069"   Paper_ID="/18014.html"   Extracted="3527319069"   DDC="658.5"   Normalized_DDC="6585"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:3540288961"   Paper_ID="/18014.html"   Extracted="3540288961"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:3540304622"   Paper_ID="/18014.html"   Extracted="3540304622"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:3930747332"   Paper_ID="/18014.html"   Extracted="3930747332"   />

      </rec>

      <rec   ID="/595322.html"   Type="article"   CiteSeer_Book="Machine   Learning"   CiteSeer_Volume="22"   Title="Feature-Based   Methods   for   Large   Scale   Dynamic   Programming,">

            <identifier   Org="ISBN:0262122413"   Paper_ID="/595322.html"   Extracted="0262122413"   />

            <identifier   Org="ISBN:0262194503"   Paper_ID="/595322.html"   Extracted="0262194503"   />

            <identifier   Org="ISBN:0262195348"   Paper_ID="/595322.html"   Extracted="0262195348"   />

            <identifier   Org="ISBN:0262201070"   Paper_ID="/595322.html"   Extracted="0262201070"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1"   />

            <identifier   Org="ISBN:0387301623"   Paper_ID="/595322.html"   Extracted="0387301623"   DDC="518.103"   Normalized_DDC="518103"   Normalized_Weight="0.1"   />

            <identifier   Org="ISBN:047166054X"   Paper_ID="/595322.html"   Extracted="047166054X"   DDC="519.7/03"   Normalized_DDC="519703"   Normalized_Weight="0.1"   />

            <identifier   Org="ISBN:0819463892"   Paper_ID="/595322.html"   Extracted="0819463892"   DDC="621.36/7"   Normalized_DDC="621367"   Normalized_Weight="0.1"   />

            <identifier   Org="ISBN:1558603778"   Paper_ID="/595322.html"   Extracted="1558603778"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.1"   />

            <identifier   Org="ISBN:3211833641"   Paper_ID="/595322.html"   Extracted="3211833641"   />

            <identifier   Org="ISBN:3540497196"   Paper_ID="/595322.html"   Extracted="3540497196"   DDC="629.8932"   Normalized_DDC="6298932"   Normalized_Weight="0.1"   />

            <identifier   Org="ISBN:3540657010"   Paper_ID="/595322.html"   Extracted="3540657010"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.1"   />

            <identifier   Org="ISBN:3540729259"   Paper_ID="/595322.html"   Extracted="3540729259"   />

            <identifier   Org="ISBN:3540732667"   Paper_ID="/595322.html"   Extracted="3540732667"   DDC="612.8/233"   Normalized_DDC="6128233"   Normalized_Weight="0.1"   />

            <identifier   Org="ISBN:3540735798"   Paper_ID="/595322.html"   Extracted="3540735798"   DDC="004"   Normalized_DDC="004"   Normalized_Weight="0.1"   />

            <identifier   Org="ISBN:3540779477"   Paper_ID="/595322.html"   Extracted="3540779477"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1"   />

      </rec>

      <rec   ID="/63796.html"   Type="techreport"   CiteSeer_Book=""   CiteSeer_Volume=""   Title="Analysis   of   Some   Incremental   Variants   of   Policy   Iteration:   First   Steps   Toward   Understanding   Actor-Critic   Learning   Systems,">

            <identifier   Org="ISBN:0262201046"   Paper_ID="/63796.html"   Extracted="0262201046"   />

            <identifier   Org="ISBN:047166054X"   Paper_ID="/63796.html"   Extracted="047166054X"   DDC="519.7/03"   Normalized_DDC="519703"   Normalized_Weight="0.25"   />

            <identifier   Org="ISBN:078031901X"   Paper_ID="/63796.html"   Extracted="078031901X"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.25"   />

            <identifier   Org="ISBN:1558603352"   Paper_ID="/63796.html"   Extracted="1558603352"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.25"   />

            <identifier   Org="ISBN:3790814369"   Paper_ID="/63796.html"   Extracted="3790814369"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.25"   />

      </rec>

      <rec   ID="/1671.html"   Type="misc"   CiteSeer_Book=""   CiteSeer_Volume=""   Title="Tight   Performance   Bounds   on   Greedy   Policies   Based   on   Imperfect   Value   Functions,">

            <identifier   Org="ISBN:026204207X"   Paper_ID="/1671.html"   Extracted="026204207X"   />

            <identifier   Org="ISBN:0262201046"   Paper_ID="/1671.html"   Extracted="0262201046"   />

            <identifier   Org="ISBN:0262510987"   Paper_ID="/1671.html"   Extracted="0262510987"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:0262511290"   Paper_ID="/1671.html"   Extracted="0262511290"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:0780359593"   Paper_ID="/1671.html"   Extracted="0780359593"   />

            <identifier   Org="ISBN:0780370783"   Paper_ID="/1671.html"   Extracted="0780370783"   />

            <identifier   Org="ISBN:0780383761"   Paper_ID="/1671.html"   Extracted="0780383761"   />

            <identifier   Org="ISBN:0792372867"   Paper_ID="/1671.html"   Extracted="0792372867"   DDC="004/.01/519"   Normalized_DDC="00401519"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:1558603778"   Paper_ID="/1671.html"   Extracted="1558603778"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:1558603859"   Paper_ID="/1671.html"   Extracted="1558603859"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:1558604952"   Paper_ID="/1671.html"   Extracted="1558604952"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:1586036424"   Paper_ID="/1671.html"   Extracted="1586036424"   />

            <identifier   Org="ISBN:3540250735"   Paper_ID="/1671.html"   Extracted="3540250735"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:3540278729"   Paper_ID="/1671.html"   Extracted="3540278729"   DDC="004"   Normalized_DDC="004"   Normalized_Weight="0.1111111111111111"   />

            <identifier   Org="ISBN:7302128294"   Paper_ID="/1671.html"   Extracted="7302128294"   />

            <identifier   Org="ISBN:8871922298"   Paper_ID="/1671.html"   Extracted="8871922298"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.1111111111111111"   />

      </rec>

      <rec   ID="/80588.html"   Type="inproceedings"   CiteSeer_Book="Proceedings   of   the   International   Joint   Conference   on   Artificial   Intellience"   CiteSeer_Volume=""   Title="A   reinforcement   learning   approach   to   Job-shop   Scheduling,">

            <identifier   Org="ISBN:0262201070"   Paper_ID="/80588.html"   Extracted="0262201070"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:026251091X"   Paper_ID="/80588.html"   Extracted="026251091X"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:0262510952"   Paper_ID="/80588.html"   Extracted="0262510952"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:026251107X"   Paper_ID="/80588.html"   Extracted="026251107X"   DDC="332/.0285"   Normalized_DDC="3320285"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:038709623X"   Paper_ID="/80588.html"   Extracted="038709623X"   />

            <identifier   Org="ISBN:038747319X"   Paper_ID="/80588.html"   Extracted="038747319X"   DDC="620.0042"   Normalized_DDC="6200042"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:0470061960"   Paper_ID="/80588.html"   Extracted="0470061960"   DDC="621.384"   Normalized_DDC="621384"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:0792374592"   Paper_ID="/80588.html"   Extracted="0792374592"   DDC="519.2/33"   Normalized_DDC="519233"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:0849309999"   Paper_ID="/80588.html"   Extracted="0849309999"   DDC="670/.285"   Normalized_DDC="670285"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:1558604197"   Paper_ID="/80588.html"   Extracted="1558604197"   />

            <identifier   Org="ISBN:1558607072"   Paper_ID="/80588.html"   Extracted="1558607072"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:1591404509"   Paper_ID="/80588.html"   Extracted="1591404509"   DDC="006.3/3"   Normalized_DDC="00633"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:3540000283"   Paper_ID="/80588.html"   Extracted="3540000283"   DDC="004"   Normalized_DDC="004"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:354029046X"   Paper_ID="/80588.html"   Extracted="354029046X"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:3540421440"   Paper_ID="/80588.html"   Extracted="3540421440"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:3540678395"   Paper_ID="/80588.html"   Extracted="3540678395"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:3540926941"   Paper_ID="/80588.html"   Extracted="3540926941"   />

      </rec>

      <rec   ID="SELF"   Type="SELF"   CiteSeer_Book="SELF"   CiteSeer_Volume="SELF"   Title="Solution   of   Delayed   Reinforcement   Learning   Problems   Having   Continuous   Action   Spaces"   />

</references_metadata>

www.000webhost.com