Automatically assigned DDC number: 00631
Manually assigned DDC number: 00631
Number of references: 31
Title: Solution of Delayed Reinforcement Learning Problems Having Continuous Action Spaces
Author:
Subject: B. Ravindran Solution of Delayed Reinforcement Learning Problems Having Continuous Action Spaces
Description: This work concerns the solution of delayed Reinforcement Learning problems having continuous action spaces. The problems associated with continuous action spaces are discussed and various existing algorithms for solving the problem are presented. An extension of Q-learning for solving delayed RL problems having continuous action spaces is proposed which overcomes drawbacks associated with existing methods. Simulation results are presented to demonstrate the working of the proposed algorithm.
Contributor: The Pennsylvania State University CiteSeer Archives
Publisher: unknown
Date: 2001-10-02
Pubyear: 1996
Format: ps
Identifier: http://citeseer.ist.psu.edu/537952.html
Source: http://www-anw.cs.umass.edu/~ravi/ms_thesis.ps.gz
Language: en
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Rights: unrestricted
<?xml version="1.0" encoding="UTF-8"?>
<references_metadata>
<rec ID="/311556.html" Type="inproceedings" CiteSeer_Book="Proceedings of the Fourth International Workshop on Machine Learning Irvine CA June 1987" CiteSeer_Volume="" Title="Strategy Learning in Multilayer Connectionist Representations," />
<rec ID="/35177.html" Type="misc" CiteSeer_Book="" CiteSeer_Volume="" Title="Advantage updating,">
<identifier Org="ISBN:0131201158" Paper_ID="/35177.html" Extracted="0131201158" DDC="658.8/27" Normalized_DDC="658827" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0262042061" Paper_ID="/35177.html" Extracted="0262042061" />
<identifier Org="ISBN:0262194503" Paper_ID="/35177.html" Extracted="0262194503" />
<identifier Org="ISBN:0262201046" Paper_ID="/35177.html" Extracted="0262201046" />
<identifier Org="ISBN:0262201070" Paper_ID="/35177.html" Extracted="0262201070" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0749415193" Paper_ID="/35177.html" Extracted="0749415193" DDC="374.4" Normalized_DDC="3744" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0749426349" Paper_ID="/35177.html" Extracted="0749426349" DDC="378.03" Normalized_DDC="37803" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:078031901X" Paper_ID="/35177.html" Extracted="078031901X" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0780332113" Paper_ID="/35177.html" Extracted="0780332113" DDC="006.3/2" Normalized_DDC="00632" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0818624701" Paper_ID="/35177.html" Extracted="0818624701" DDC="621.381" Normalized_DDC="621381" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:155623550X" Paper_ID="/35177.html" Extracted="155623550X" DDC="658.15/11/0285" Normalized_DDC="65815110285" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:3540408045" Paper_ID="/35177.html" Extracted="3540408045" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:9051993986" Paper_ID="/35177.html" Extracted="9051993986" />
</rec>
<rec ID="/110654.html" Type="incollection" CiteSeer_Book="Learning and computational neuroscience foundations of adaptive networks" CiteSeer_Volume="" Title="Learning and Sequential Decision Making,">
<identifier Org="ISBN:0123741769" Paper_ID="/110654.html" Extracted="0123741769" DDC="330.019" Normalized_DDC="330019" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:0262510901" Paper_ID="/110654.html" Extracted="0262510901" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:0262510952" Paper_ID="/110654.html" Extracted="0262510952" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:0262531224" Paper_ID="/110654.html" Extracted="0262531224" DDC="591.51" Normalized_DDC="59151" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:0262631490" Paper_ID="/110654.html" Extracted="0262631490" DDC="591.51" Normalized_DDC="59151" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:0792392345" Paper_ID="/110654.html" Extracted="0792392345" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:0805812911" Paper_ID="/110654.html" Extracted="0805812911" />
<identifier Org="ISBN:0805814876" Paper_ID="/110654.html" Extracted="0805814876" />
<identifier Org="ISBN:1558601414" Paper_ID="/110654.html" Extracted="1558601414" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:1558601643" Paper_ID="/110654.html" Extracted="1558601643" DDC="658.5" Normalized_DDC="6585" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:1558603778" Paper_ID="/110654.html" Extracted="1558603778" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:1586030132" Paper_ID="/110654.html" Extracted="1586030132" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:1852334452" Paper_ID="/110654.html" Extracted="1852334452" DDC="005.3" Normalized_DDC="0053" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540566678" Paper_ID="/110654.html" Extracted="3540566678" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540584838" Paper_ID="/110654.html" Extracted="3540584838" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540590528" Paper_ID="/110654.html" Extracted="3540590528" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540659072" Paper_ID="/110654.html" Extracted="3540659072" DDC="003/.3" Normalized_DDC="0033" Normalized_Weight="0.06666666666666667" />
</rec>
<rec ID="/286243.html" Type="inproceedings" CiteSeer_Book="Advances in Neural Information Processing Systems 5 Proceedings of the IEEE Conference in Denver to appear" CiteSeer_Volume="" Title="Reinforcement Learning Applied to Linear Quadratic Regulation,">
<identifier Org="ISBN:0262122413" Paper_ID="/286243.html" Extracted="0262122413" />
<identifier Org="ISBN:0262193981" Paper_ID="/286243.html" Extracted="0262193981" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.125" />
<identifier Org="ISBN:0262201046" Paper_ID="/286243.html" Extracted="0262201046" />
<identifier Org="ISBN:0262201070" Paper_ID="/286243.html" Extracted="0262201070" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.125" />
<identifier Org="ISBN:0262510901" Paper_ID="/286243.html" Extracted="0262510901" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.125" />
<identifier Org="ISBN:078031901X" Paper_ID="/286243.html" Extracted="078031901X" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.125" />
<identifier Org="ISBN:0792397169" Paper_ID="/286243.html" Extracted="0792397169" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.125" />
<identifier Org="ISBN:0805815902" Paper_ID="/286243.html" Extracted="0805815902" />
<identifier Org="ISBN:0805821252" Paper_ID="/286243.html" Extracted="0805821252" />
<identifier Org="ISBN:1558603778" Paper_ID="/286243.html" Extracted="1558603778" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.125" />
<identifier Org="ISBN:1558604804" Paper_ID="/286243.html" Extracted="1558604804" />
<identifier Org="ISBN:3540240772" Paper_ID="/286243.html" Extracted="3540240772" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.125" />
<identifier Org="ISBN:354079865X" Paper_ID="/286243.html" Extracted="354079865X" DDC="006.31" Normalized_DDC="00631" Normalized_Weight="0.125" />
<identifier Org="ISBN:9051993986" Paper_ID="/286243.html" Extracted="9051993986" />
</rec>
<rec ID="/165188.html" Type="misc" CiteSeer_Book="" CiteSeer_Volume="" Title="Incremental Dynamic Programming for On-line Adaptive Optimal Control,">
<identifier Org="ISBN:0262133172" Paper_ID="/165188.html" Extracted="0262133172" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.3333333333333333" />
<identifier Org="ISBN:0262193981" Paper_ID="/165188.html" Extracted="0262193981" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.3333333333333333" />
<identifier Org="ISBN:0262201046" Paper_ID="/165188.html" Extracted="0262201046" />
<identifier Org="ISBN:0780347560" Paper_ID="/165188.html" Extracted="0780347560" DDC="621.381" Normalized_DDC="621381" Normalized_Weight="0.3333333333333333" />
<identifier Org="ISBN:3211833641" Paper_ID="/165188.html" Extracted="3211833641" />
</rec>
<rec ID="/385953.html" Type="inproceedings" CiteSeer_Book="Advances in Neural Information Processing Systems" CiteSeer_Volume="" Title="Reinforcement Learning Methods for Continuous-Time {M}arkov Decision Problems," />
<rec ID="/343069.html" Type="inproceedings" CiteSeer_Book="Advances in Neural Information Processing Systems 5 Proceedings of the IEEE Conference in Denver to appear" CiteSeer_Volume="" Title="Feudal Reinforcement Learning,">
<identifier Org="ISBN:0262112450" Paper_ID="/343069.html" Extracted="0262112450" />
<identifier Org="ISBN:0262201046" Paper_ID="/343069.html" Extracted="0262201046" />
<identifier Org="ISBN:0262661446" Paper_ID="/343069.html" Extracted="0262661446" DDC="591.5/01/1" Normalized_DDC="5915011" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:047166054X" Paper_ID="/343069.html" Extracted="047166054X" DDC="519.7/03" Normalized_DDC="519703" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:078035530X" Paper_ID="/343069.html" Extracted="078035530X" DDC="006.3/2" Normalized_DDC="00632" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:0805815902" Paper_ID="/343069.html" Extracted="0805815902" />
<identifier Org="ISBN:1558603778" Paper_ID="/343069.html" Extracted="1558603778" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:1558607781" Paper_ID="/343069.html" Extracted="1558607781" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:1586034146" Paper_ID="/343069.html" Extracted="1586034146" DDC="629.8/9263" Normalized_DDC="62989263" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540206469" Paper_ID="/343069.html" Extracted="3540206469" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:354032688X" Paper_ID="/343069.html" Extracted="354032688X" DDC="629.8/92" Normalized_DDC="629892" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540590528" Paper_ID="/343069.html" Extracted="3540590528" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540644172" Paper_ID="/343069.html" Extracted="3540644172" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540654801" Paper_ID="/343069.html" Extracted="3540654801" DDC="629.8/9263" Normalized_DDC="62989263" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540676023" Paper_ID="/343069.html" Extracted="3540676023" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540678395" Paper_ID="/343069.html" Extracted="3540678395" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540699112" Paper_ID="/343069.html" Extracted="3540699112" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540747818" Paper_ID="/343069.html" Extracted="3540747818" />
<identifier Org="ISBN:3540769269" Paper_ID="/343069.html" Extracted="3540769269" />
<identifier Org="ISBN:427490525X" Paper_ID="/343069.html" Extracted="427490525X" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
</rec>
<rec ID="/278302.html" Type="article" CiteSeer_Book="Machine Learning" CiteSeer_Volume="14" Title="{TD}($\lambda$) Converges with Probability 1,">
<identifier Org="ISBN:0525949828" Paper_ID="/278302.html" Extracted="0525949828" DDC="153.8/3" Normalized_DDC="15383" Normalized_Weight="1.0" />
<identifier Org="ISBN:0780378989" Paper_ID="/278302.html" Extracted="0780378989" />
</rec>
<rec ID="/300268.html" Type="techreport" CiteSeer_Book="" CiteSeer_Volume="" Title="Reinforcement Learning and its Application to Control,">
<identifier Org="ISBN:0080422365" Paper_ID="/300268.html" Extracted="0080422365" DDC="629.8/9" Normalized_DDC="62989" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:0444819312" Paper_ID="/300268.html" Extracted="0444819312" DDC="612.8/2" Normalized_DDC="61282" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:0780305469" Paper_ID="/300268.html" Extracted="0780305469" DDC="006" Normalized_DDC="006" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:0780363493" Paper_ID="/300268.html" Extracted="0780363493" DDC="629.8/92" Normalized_DDC="629892" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:0805813640" Paper_ID="/300268.html" Extracted="0805813640" DDC="153" Normalized_DDC="153" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:0805815902" Paper_ID="/300268.html" Extracted="0805815902" />
<identifier Org="ISBN:0805821252" Paper_ID="/300268.html" Extracted="0805821252" />
<identifier Org="ISBN:155860247X" Paper_ID="/300268.html" Extracted="155860247X" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:1558604197" Paper_ID="/300268.html" Extracted="1558604197" />
<identifier Org="ISBN:1586036459" Paper_ID="/300268.html" Extracted="1586036459" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:1593701578" Paper_ID="/300268.html" Extracted="1593701578" DDC="333.790285" Normalized_DDC="333790285" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:354026549X" Paper_ID="/300268.html" Extracted="354026549X" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:3540427325" Paper_ID="/300268.html" Extracted="3540427325" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:3540590528" Paper_ID="/300268.html" Extracted="3540590528" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:3540628584" Paper_ID="/300268.html" Extracted="3540628584" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.08333333333333333" />
</rec>
<rec ID="/230083.html" Type="inproceedings" CiteSeer_Book="Proc 11th International Conference on Machine Learning" CiteSeer_Volume="" Title="Consideration of risk in reinforcement learning,">
<identifier Org="ISBN:0262195682" Paper_ID="/230083.html" Extracted="0262195682" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="1.0" />
<identifier Org="ISBN:1558604197" Paper_ID="/230083.html" Extracted="1558604197" />
</rec>
<rec ID="/451869.html" Type="inproceedings" CiteSeer_Book="Advances in Neural Information Processing Systems" CiteSeer_Volume="" Title="Convergence of Stochastic Iterative Dynamic Programming Algorithms,">
<identifier Org="ISBN:0262012111" Paper_ID="/451869.html" Extracted="0262012111" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:026204207X" Paper_ID="/451869.html" Extracted="026204207X" />
<identifier Org="ISBN:0262193981" Paper_ID="/451869.html" Extracted="0262193981" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:0262201046" Paper_ID="/451869.html" Extracted="0262201046" />
<identifier Org="ISBN:0262201070" Paper_ID="/451869.html" Extracted="0262201070" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:047166054X" Paper_ID="/451869.html" Extracted="047166054X" DDC="519.7/03" Normalized_DDC="519703" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:0792369327" Paper_ID="/451869.html" Extracted="0792369327" DDC="519.303" Normalized_DDC="519303" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:0792374592" Paper_ID="/451869.html" Extracted="0792374592" DDC="519.2/33" Normalized_DDC="519233" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:0805815902" Paper_ID="/451869.html" Extracted="0805815902" />
<identifier Org="ISBN:080581745X" Paper_ID="/451869.html" Extracted="080581745X" />
<identifier Org="ISBN:1558603778" Paper_ID="/451869.html" Extracted="1558603778" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:1581131674" Paper_ID="/451869.html" Extracted="1581131674" />
<identifier Org="ISBN:1586032399" Paper_ID="/451869.html" Extracted="1586032399" DDC="629.8/9263" Normalized_DDC="62989263" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:3540240772" Paper_ID="/451869.html" Extracted="3540240772" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:3540654801" Paper_ID="/451869.html" Extracted="3540654801" DDC="629.8/9263" Normalized_DDC="62989263" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:3540657010" Paper_ID="/451869.html" Extracted="3540657010" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:3540712305" Paper_ID="/451869.html" Extracted="3540712305" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.07692307692307693" />
<identifier Org="ISBN:427490525X" Paper_ID="/451869.html" Extracted="427490525X" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07692307692307693" />
</rec>
<rec ID="/84168.html" Type="inproceedings" CiteSeer_Book="Advances in Neural Information Processing Systems" CiteSeer_Volume="" Title="Reinforcement Learning Algorithm for Partially Observable {M}arkov Decision Problems," />
<rec ID="/186946.html" Type="techreport" CiteSeer_Book="" CiteSeer_Volume="" Title="Approximate Discounted Dynamic Programming is Unreliable,">
<identifier Org="ISBN:3540628584" Paper_ID="/186946.html" Extracted="3540628584" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="1.0" />
</rec>
<rec ID="/150059.html" Type="article" CiteSeer_Book="Cognitive Science" CiteSeer_Volume="16" Title="Forward models: Supervised learning with a distal teacher,">
<identifier Org="ISBN:0262071959" Paper_ID="/150059.html" Extracted="0262071959" DDC="153" Normalized_DDC="153" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0262072548" Paper_ID="/150059.html" Extracted="0262072548" DDC="612.8/2" Normalized_DDC="61282" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0262201046" Paper_ID="/150059.html" Extracted="0262201046" />
<identifier Org="ISBN:0262661160" Paper_ID="/150059.html" Extracted="0262661160" DDC="153" Normalized_DDC="153" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0444503153" Paper_ID="/150059.html" Extracted="0444503153" DDC="616.89/8207" Normalized_DDC="616898207" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0444528768" Paper_ID="/150059.html" Extracted="0444528768" />
<identifier Org="ISBN:0521845114" Paper_ID="/150059.html" Extracted="0521845114" DDC="629.8/92" Normalized_DDC="629892" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:080581258X" Paper_ID="/150059.html" Extracted="080581258X" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0805812911" Paper_ID="/150059.html" Extracted="0805812911" />
<identifier Org="ISBN:0805813640" Paper_ID="/150059.html" Extracted="0805813640" DDC="153" Normalized_DDC="153" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0805815902" Paper_ID="/150059.html" Extracted="0805815902" />
<identifier Org="ISBN:080581745X" Paper_ID="/150059.html" Extracted="080581745X" />
<identifier Org="ISBN:0805821597" Paper_ID="/150059.html" Extracted="0805821597" />
<identifier Org="ISBN:0863777864" Paper_ID="/150059.html" Extracted="0863777864" DDC="153.4" Normalized_DDC="1534" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0907845096" Paper_ID="/150059.html" Extracted="0907845096" />
<identifier Org="ISBN:3540287558" Paper_ID="/150059.html" Extracted="3540287558" DDC="006.32" Normalized_DDC="00632" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:3540733221" Paper_ID="/150059.html" Extracted="3540733221" DDC="670.285/63" Normalized_DDC="67028563" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:9812388052" Paper_ID="/150059.html" Extracted="9812388052" DDC="006.32" Normalized_DDC="00632" Normalized_Weight="0.09090909090909091" />
</rec>
<rec ID="/222673.html" Type="inproceedings" CiteSeer_Book="Advances in Neural Information Processing Systems" CiteSeer_Volume="" Title="The Parti-Game Algorithm for Variable Resolution Reinforcement Learning in Multidimensional State-Spaces,">
<identifier Org="ISBN:0262112450" Paper_ID="/222673.html" Extracted="0262112450" />
<identifier Org="ISBN:0262201526" Paper_ID="/222673.html" Extracted="0262201526" />
<identifier Org="ISBN:0262510952" Paper_ID="/222673.html" Extracted="0262510952" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0262632004" Paper_ID="/222673.html" Extracted="0262632004" DDC="591.50113" Normalized_DDC="59150113" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0262661446" Paper_ID="/222673.html" Extracted="0262661446" DDC="591.5/01/1" Normalized_DDC="5915011" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:0805829415" Paper_ID="/222673.html" Extracted="0805829415" />
<identifier Org="ISBN:1558604170" Paper_ID="/222673.html" Extracted="1558604170" />
<identifier Org="ISBN:1558604197" Paper_ID="/222673.html" Extracted="1558604197" />
<identifier Org="ISBN:1558604952" Paper_ID="/222673.html" Extracted="1558604952" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:1558607072" Paper_ID="/222673.html" Extracted="1558607072" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:1586035959" Paper_ID="/222673.html" Extracted="1586035959" />
<identifier Org="ISBN:3540201211" Paper_ID="/222673.html" Extracted="3540201211" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:354032688X" Paper_ID="/222673.html" Extracted="354032688X" DDC="629.8/92" Normalized_DDC="629892" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:3540408045" Paper_ID="/222673.html" Extracted="3540408045" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:3540590528" Paper_ID="/222673.html" Extracted="3540590528" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:3540654801" Paper_ID="/222673.html" Extracted="3540654801" DDC="629.8/9263" Normalized_DDC="62989263" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:3540679251" Paper_ID="/222673.html" Extracted="3540679251" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.09090909090909091" />
<identifier Org="ISBN:3540723927" Paper_ID="/222673.html" Extracted="3540723927" />
</rec>
<rec ID="/86839.html" Type="inproceedings" CiteSeer_Book="Machine Learning" CiteSeer_Volume="" Title="Transfer of Learning Across Compositions of Sequential Tasks," />
<rec ID="/90919.html" Type="inproceedings" CiteSeer_Book="National Conference on Artificial Intelligence" CiteSeer_Volume="" Title="Reinforcement Learning with a Hierarchy of Abstract Models,">
<identifier Org="ISBN:0262112450" Paper_ID="/90919.html" Extracted="0262112450" />
<identifier Org="ISBN:0262122413" Paper_ID="/90919.html" Extracted="0262122413" />
<identifier Org="ISBN:0262193981" Paper_ID="/90919.html" Extracted="0262193981" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:0262201046" Paper_ID="/90919.html" Extracted="0262201046" />
<identifier Org="ISBN:0262201070" Paper_ID="/90919.html" Extracted="0262201070" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:0262510634" Paper_ID="/90919.html" Extracted="0262510634" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:0262631490" Paper_ID="/90919.html" Extracted="0262631490" DDC="591.51" Normalized_DDC="59151" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:047166054X" Paper_ID="/90919.html" Extracted="047166054X" DDC="519.7/03" Normalized_DDC="519703" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:0792376307" Paper_ID="/90919.html" Extracted="0792376307" DDC="005.1" Normalized_DDC="0051" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:155860247X" Paper_ID="/90919.html" Extracted="155860247X" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:1558603778" Paper_ID="/90919.html" Extracted="1558603778" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:1558604804" Paper_ID="/90919.html" Extracted="1558604804" />
<identifier Org="ISBN:3540250468" Paper_ID="/90919.html" Extracted="3540250468" DDC="629.8932" Normalized_DDC="6298932" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540288961" Paper_ID="/90919.html" Extracted="3540288961" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540406662" Paper_ID="/90919.html" Extracted="3540406662" DDC="629.8/92" Normalized_DDC="629892" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540439412" Paper_ID="/90919.html" Extracted="3540439412" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540590528" Paper_ID="/90919.html" Extracted="3540590528" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540644172" Paper_ID="/90919.html" Extracted="3540644172" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540679251" Paper_ID="/90919.html" Extracted="3540679251" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.06666666666666667" />
</rec>
<rec ID="/134570.html" Type="inproceedings" CiteSeer_Book="MLC92" CiteSeer_Volume="" Title="Scaling Reinforcement Learning Algorithms by Learning Variable Temporal Resolution Models,">
<identifier Org="ISBN:0262193981" Paper_ID="/134570.html" Extracted="0262193981" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.3333333333333333" />
<identifier Org="ISBN:0262510634" Paper_ID="/134570.html" Extracted="0262510634" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.3333333333333333" />
<identifier Org="ISBN:0791800512" Paper_ID="/134570.html" Extracted="0791800512" />
<identifier Org="ISBN:155860247X" Paper_ID="/134570.html" Extracted="155860247X" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.3333333333333333" />
<identifier Org="ISBN:1574730010" Paper_ID="/134570.html" Extracted="1574730010" />
</rec>
<rec ID="/10103.html" Type="article" CiteSeer_Book="Machine Learning" CiteSeer_Volume="8" Title="Transfer of Learning by Composing Solutions of Elemental Sequential Tasks,">
<identifier Org="ISBN:0262631490" Paper_ID="/10103.html" Extracted="0262631490" DDC="591.51" Normalized_DDC="59151" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0262661446" Paper_ID="/10103.html" Extracted="0262661446" DDC="591.5/01/1" Normalized_DDC="5915011" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0769515940" Paper_ID="/10103.html" Extracted="0769515940" />
<identifier Org="ISBN:0780370783" Paper_ID="/10103.html" Extracted="0780370783" />
<identifier Org="ISBN:0792380479" Paper_ID="/10103.html" Extracted="0792380479" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0792392345" Paper_ID="/10103.html" Extracted="0792392345" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0805815902" Paper_ID="/10103.html" Extracted="0805815902" />
<identifier Org="ISBN:1558603352" Paper_ID="/10103.html" Extracted="1558603352" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:1558603700" Paper_ID="/10103.html" Extracted="1558603700" DDC="005.1" Normalized_DDC="0051" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:157735236X" Paper_ID="/10103.html" Extracted="157735236X" />
<identifier Org="ISBN:1852334452" Paper_ID="/10103.html" Extracted="1852334452" DDC="005.3" Normalized_DDC="0053" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:3540590528" Paper_ID="/10103.html" Extracted="3540590528" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:3540678395" Paper_ID="/10103.html" Extracted="3540678395" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:3540688463" Paper_ID="/10103.html" Extracted="3540688463" />
</rec>
<rec ID="/169801.html" Type="techreport" CiteSeer_Book="" CiteSeer_Volume="" Title="Learning to Solve Markovian Decision Processes,">
<identifier Org="ISBN:0262193981" Paper_ID="/169801.html" Extracted="0262193981" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:0262201070" Paper_ID="/169801.html" Extracted="0262201070" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:0262611023" Paper_ID="/169801.html" Extracted="0262611023" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:0262632004" Paper_ID="/169801.html" Extracted="0262632004" DDC="591.50113" Normalized_DDC="59150113" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:078035530X" Paper_ID="/169801.html" Extracted="078035530X" DDC="006.3/2" Normalized_DDC="00632" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:0780358007" Paper_ID="/169801.html" Extracted="0780358007" DDC="629.8/36" Normalized_DDC="629836" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:0792397169" Paper_ID="/169801.html" Extracted="0792397169" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:0805838805" Paper_ID="/169801.html" Extracted="0805838805" DDC="153" Normalized_DDC="153" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:1558603352" Paper_ID="/169801.html" Extracted="1558603352" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:1558607072" Paper_ID="/169801.html" Extracted="1558607072" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:3540415971" Paper_ID="/169801.html" Extracted="3540415971" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:3540657010" Paper_ID="/169801.html" Extracted="3540657010" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:3540673059" Paper_ID="/169801.html" Extracted="3540673059" DDC="006.3/2" Normalized_DDC="00632" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:3540762639" Paper_ID="/169801.html" Extracted="3540762639" DDC="006.3/2" Normalized_DDC="00632" Normalized_Weight="0.07142857142857142" />
</rec>
<rec ID="/300248.html" Type="inproceedings" CiteSeer_Book="Advances in Neural Information Processing Systems" CiteSeer_Volume="" Title="Robust Reinforcement Learning in Motion Planning,">
<identifier Org="ISBN:0262201070" Paper_ID="/300248.html" Extracted="0262201070" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.16666666666666666" />
<identifier Org="ISBN:0262631784" Paper_ID="/300248.html" Extracted="0262631784" DDC="591.5" Normalized_DDC="5915" Normalized_Weight="0.16666666666666666" />
<identifier Org="ISBN:0444819312" Paper_ID="/300248.html" Extracted="0444819312" DDC="612.8/2" Normalized_DDC="61282" Normalized_Weight="0.16666666666666666" />
<identifier Org="ISBN:0471544485" Paper_ID="/300248.html" Extracted="0471544485" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.16666666666666666" />
<identifier Org="ISBN:1558604804" Paper_ID="/300248.html" Extracted="1558604804" />
<identifier Org="ISBN:1558607781" Paper_ID="/300248.html" Extracted="1558607781" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.16666666666666666" />
<identifier Org="ISBN:3790812129" Paper_ID="/300248.html" Extracted="3790812129" DDC="629.8/9263" Normalized_DDC="62989263" Normalized_Weight="0.16666666666666666" />
</rec>
<rec ID="/144448.html" Type="inproceedings" CiteSeer_Book="International Conference on Machine Learning" CiteSeer_Volume="" Title="Learning Without State-Estimation in Partially Observable Markovian Decision Processes,">
<identifier Org="ISBN:0262201046" Paper_ID="/144448.html" Extracted="0262201046" />
<identifier Org="ISBN:0262693410" Paper_ID="/144448.html" Extracted="0262693410" DDC="591.50113" Normalized_DDC="59150113" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:1402056257" Paper_ID="/144448.html" Extracted="1402056257" DDC="629.8" Normalized_DDC="6298" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:1558603352" Paper_ID="/144448.html" Extracted="1558603352" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:1558603778" Paper_ID="/144448.html" Extracted="1558603778" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:1558604863" Paper_ID="/144448.html" Extracted="1558604863" />
<identifier Org="ISBN:1586030132" Paper_ID="/144448.html" Extracted="1586030132" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:1586035606" Paper_ID="/144448.html" Extracted="1586035606" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:1586035959" Paper_ID="/144448.html" Extracted="1586035959" />
<identifier Org="ISBN:3540201211" Paper_ID="/144448.html" Extracted="3540201211" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:3540229590" Paper_ID="/144448.html" Extracted="3540229590" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:3540250735" Paper_ID="/144448.html" Extracted="3540250735" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:3540413855" Paper_ID="/144448.html" Extracted="3540413855" DDC="510 s" Normalized_DDC="51" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:3540654801" Paper_ID="/144448.html" Extracted="3540654801" DDC="629.8/9263" Normalized_DDC="62989263" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:3540752242" Paper_ID="/144448.html" Extracted="3540752242" />
<identifier Org="ISBN:3540884386" Paper_ID="/144448.html" Extracted="3540884386" />
<identifier Org="ISBN:427490525X" Paper_ID="/144448.html" Extracted="427490525X" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.08333333333333333" />
<identifier Org="ISBN:9051993986" Paper_ID="/144448.html" Extracted="9051993986" />
</rec>
<rec ID="/10484.html" Type="article" CiteSeer_Book="Machine Learning" CiteSeer_Volume="16" Title="An Upper Bound on the Loss from Approximate Optimal-Value Functions,">
<identifier Org="ISBN:0262201046" Paper_ID="/10484.html" Extracted="0262201046" />
<identifier Org="ISBN:0262510901" Paper_ID="/10484.html" Extracted="0262510901" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.25" />
<identifier Org="ISBN:0805815902" Paper_ID="/10484.html" Extracted="0805815902" />
<identifier Org="ISBN:1558603778" Paper_ID="/10484.html" Extracted="1558603778" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.25" />
<identifier Org="ISBN:1558604197" Paper_ID="/10484.html" Extracted="1558604197" />
<identifier Org="ISBN:1558607072" Paper_ID="/10484.html" Extracted="1558607072" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.25" />
<identifier Org="ISBN:157735236X" Paper_ID="/10484.html" Extracted="157735236X" />
<identifier Org="ISBN:3540749578" Paper_ID="/10484.html" Extracted="3540749578" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.25" />
</rec>
<rec ID="/195161.html" Type="inproceedings" CiteSeer_Book="Proceedings of the Eighth International Workshop on Machine Learning" CiteSeer_Volume="" Title="Planning by incremental dynamic programming,">
<identifier Org="ISBN:0126464901" Paper_ID="/195161.html" Extracted="0126464901" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0132610663" Paper_ID="/195161.html" Extracted="0132610663" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0201483696" Paper_ID="/195161.html" Extracted="0201483696" DDC="591.5" Normalized_DDC="5915" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0262193981" Paper_ID="/195161.html" Extracted="0262193981" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0262510634" Paper_ID="/195161.html" Extracted="0262510634" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0262510901" Paper_ID="/195161.html" Extracted="0262510901" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0262611023" Paper_ID="/195161.html" Extracted="0262611023" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0262631490" Paper_ID="/195161.html" Extracted="0262631490" DDC="591.51" Normalized_DDC="59151" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0780325648" Paper_ID="/195161.html" Extracted="0780325648" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:080581745X" Paper_ID="/195161.html" Extracted="080581745X" />
<identifier Org="ISBN:140206263X" Paper_ID="/195161.html" Extracted="140206263X" DDC="005.1" Normalized_DDC="0051" Normalized_Weight="0.0625" />
<identifier Org="ISBN:155860250X" Paper_ID="/195161.html" Extracted="155860250X" DDC="006.3/3" Normalized_DDC="00633" Normalized_Weight="0.0625" />
<identifier Org="ISBN:1599047055" Paper_ID="/195161.html" Extracted="1599047055" DDC="006.3/33" Normalized_DDC="006333" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540200576" Paper_ID="/195161.html" Extracted="3540200576" DDC="570/.1/13" Normalized_DDC="570113" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540206469" Paper_ID="/195161.html" Extracted="3540206469" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540304622" Paper_ID="/195161.html" Extracted="3540304622" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540605983" Paper_ID="/195161.html" Extracted="3540605983" DDC="006.3/3" Normalized_DDC="00633" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540742611" Paper_ID="/195161.html" Extracted="3540742611" />
</rec>
<rec ID="/415821.html" Type="inproceedings" CiteSeer_Book="Proceedings of the 1991 American Control Conference" CiteSeer_Volume="" Title="Reinforcement {L}earning is {D}irect {A}daptive {O}ptimal {C}ontrol," />
<rec ID="/72887.html" Type="inproceedings" CiteSeer_Book="Advances in Neural Information Processing Systems" CiteSeer_Volume="" Title="Active Exploration in Dynamic Environments,">
<identifier Org="ISBN:0195095227" Paper_ID="/72887.html" Extracted="0195095227" DDC="006.3/7" Normalized_DDC="00637" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0195098706" Paper_ID="/72887.html" Extracted="0195098706" DDC="006.37" Normalized_DDC="00637" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0262201046" Paper_ID="/72887.html" Extracted="0262201046" />
<identifier Org="ISBN:0262510901" Paper_ID="/72887.html" Extracted="0262510901" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0262631490" Paper_ID="/72887.html" Extracted="0262631490" DDC="591.51" Normalized_DDC="59151" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0444819312" Paper_ID="/72887.html" Extracted="0444819312" DDC="612.8/2" Normalized_DDC="61282" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0780342577" Paper_ID="/72887.html" Extracted="0780342577" />
<identifier Org="ISBN:0780355369" Paper_ID="/72887.html" Extracted="0780355369" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0792392345" Paper_ID="/72887.html" Extracted="0792392345" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0792397169" Paper_ID="/72887.html" Extracted="0792397169" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0792397452" Paper_ID="/72887.html" Extracted="0792397452" DDC="629.8/92631" Normalized_DDC="629892631" Normalized_Weight="0.0625" />
<identifier Org="ISBN:155860247X" Paper_ID="/72887.html" Extracted="155860247X" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.0625" />
<identifier Org="ISBN:1558603778" Paper_ID="/72887.html" Extracted="1558603778" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.0625" />
<identifier Org="ISBN:1558607781" Paper_ID="/72887.html" Extracted="1558607781" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540415971" Paper_ID="/72887.html" Extracted="3540415971" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540584838" Paper_ID="/72887.html" Extracted="3540584838" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540664521" Paper_ID="/72887.html" Extracted="3540664521" DDC="570/.1/13" Normalized_DDC="570113" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540730060" Paper_ID="/72887.html" Extracted="3540730060" DDC="006.3/2" Normalized_DDC="00632" Normalized_Weight="0.0625" />
</rec>
<rec ID="/18014.html" Type="inproceedings" CiteSeer_Book="Proceedings of the 1993 Connectionist Models Summer School" CiteSeer_Volume="" Title="{Issues in Using Function Approximation for Reinforcement Learning},">
<identifier Org="ISBN:0262201046" Paper_ID="/18014.html" Extracted="0262201046" />
<identifier Org="ISBN:078031901X" Paper_ID="/18014.html" Extracted="078031901X" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0792397169" Paper_ID="/18014.html" Extracted="0792397169" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0805815902" Paper_ID="/18014.html" Extracted="0805815902" />
<identifier Org="ISBN:080581745X" Paper_ID="/18014.html" Extracted="080581745X" />
<identifier Org="ISBN:1558603778" Paper_ID="/18014.html" Extracted="1558603778" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:1558607072" Paper_ID="/18014.html" Extracted="1558607072" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:1586032399" Paper_ID="/18014.html" Extracted="1586032399" DDC="629.8/9263" Normalized_DDC="62989263" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:1595930108" Paper_ID="/18014.html" Extracted="1595930108" DDC="004/.35" Normalized_DDC="00435" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:3527319069" Paper_ID="/18014.html" Extracted="3527319069" DDC="658.5" Normalized_DDC="6585" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:3540288961" Paper_ID="/18014.html" Extracted="3540288961" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:3540304622" Paper_ID="/18014.html" Extracted="3540304622" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:3930747332" Paper_ID="/18014.html" Extracted="3930747332" />
</rec>
<rec ID="/595322.html" Type="article" CiteSeer_Book="Machine Learning" CiteSeer_Volume="22" Title="Feature-Based Methods for Large Scale Dynamic Programming,">
<identifier Org="ISBN:0262122413" Paper_ID="/595322.html" Extracted="0262122413" />
<identifier Org="ISBN:0262194503" Paper_ID="/595322.html" Extracted="0262194503" />
<identifier Org="ISBN:0262195348" Paper_ID="/595322.html" Extracted="0262195348" />
<identifier Org="ISBN:0262201070" Paper_ID="/595322.html" Extracted="0262201070" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1" />
<identifier Org="ISBN:0387301623" Paper_ID="/595322.html" Extracted="0387301623" DDC="518.103" Normalized_DDC="518103" Normalized_Weight="0.1" />
<identifier Org="ISBN:047166054X" Paper_ID="/595322.html" Extracted="047166054X" DDC="519.7/03" Normalized_DDC="519703" Normalized_Weight="0.1" />
<identifier Org="ISBN:0819463892" Paper_ID="/595322.html" Extracted="0819463892" DDC="621.36/7" Normalized_DDC="621367" Normalized_Weight="0.1" />
<identifier Org="ISBN:1558603778" Paper_ID="/595322.html" Extracted="1558603778" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.1" />
<identifier Org="ISBN:3211833641" Paper_ID="/595322.html" Extracted="3211833641" />
<identifier Org="ISBN:3540497196" Paper_ID="/595322.html" Extracted="3540497196" DDC="629.8932" Normalized_DDC="6298932" Normalized_Weight="0.1" />
<identifier Org="ISBN:3540657010" Paper_ID="/595322.html" Extracted="3540657010" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.1" />
<identifier Org="ISBN:3540729259" Paper_ID="/595322.html" Extracted="3540729259" />
<identifier Org="ISBN:3540732667" Paper_ID="/595322.html" Extracted="3540732667" DDC="612.8/233" Normalized_DDC="6128233" Normalized_Weight="0.1" />
<identifier Org="ISBN:3540735798" Paper_ID="/595322.html" Extracted="3540735798" DDC="004" Normalized_DDC="004" Normalized_Weight="0.1" />
<identifier Org="ISBN:3540779477" Paper_ID="/595322.html" Extracted="3540779477" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1" />
</rec>
<rec ID="/63796.html" Type="techreport" CiteSeer_Book="" CiteSeer_Volume="" Title="Analysis of Some Incremental Variants of Policy Iteration: First Steps Toward Understanding Actor-Critic Learning Systems,">
<identifier Org="ISBN:0262201046" Paper_ID="/63796.html" Extracted="0262201046" />
<identifier Org="ISBN:047166054X" Paper_ID="/63796.html" Extracted="047166054X" DDC="519.7/03" Normalized_DDC="519703" Normalized_Weight="0.25" />
<identifier Org="ISBN:078031901X" Paper_ID="/63796.html" Extracted="078031901X" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.25" />
<identifier Org="ISBN:1558603352" Paper_ID="/63796.html" Extracted="1558603352" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.25" />
<identifier Org="ISBN:3790814369" Paper_ID="/63796.html" Extracted="3790814369" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.25" />
</rec>
<rec ID="/1671.html" Type="misc" CiteSeer_Book="" CiteSeer_Volume="" Title="Tight Performance Bounds on Greedy Policies Based on Imperfect Value Functions,">
<identifier Org="ISBN:026204207X" Paper_ID="/1671.html" Extracted="026204207X" />
<identifier Org="ISBN:0262201046" Paper_ID="/1671.html" Extracted="0262201046" />
<identifier Org="ISBN:0262510987" Paper_ID="/1671.html" Extracted="0262510987" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0262511290" Paper_ID="/1671.html" Extracted="0262511290" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:0780359593" Paper_ID="/1671.html" Extracted="0780359593" />
<identifier Org="ISBN:0780370783" Paper_ID="/1671.html" Extracted="0780370783" />
<identifier Org="ISBN:0780383761" Paper_ID="/1671.html" Extracted="0780383761" />
<identifier Org="ISBN:0792372867" Paper_ID="/1671.html" Extracted="0792372867" DDC="004/.01/519" Normalized_DDC="00401519" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:1558603778" Paper_ID="/1671.html" Extracted="1558603778" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:1558603859" Paper_ID="/1671.html" Extracted="1558603859" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:1558604952" Paper_ID="/1671.html" Extracted="1558604952" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:1586036424" Paper_ID="/1671.html" Extracted="1586036424" />
<identifier Org="ISBN:3540250735" Paper_ID="/1671.html" Extracted="3540250735" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:3540278729" Paper_ID="/1671.html" Extracted="3540278729" DDC="004" Normalized_DDC="004" Normalized_Weight="0.1111111111111111" />
<identifier Org="ISBN:7302128294" Paper_ID="/1671.html" Extracted="7302128294" />
<identifier Org="ISBN:8871922298" Paper_ID="/1671.html" Extracted="8871922298" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.1111111111111111" />
</rec>
<rec ID="/80588.html" Type="inproceedings" CiteSeer_Book="Proceedings of the International Joint Conference on Artificial Intellience" CiteSeer_Volume="" Title="A reinforcement learning approach to Job-shop Scheduling,">
<identifier Org="ISBN:0262201070" Paper_ID="/80588.html" Extracted="0262201070" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:026251091X" Paper_ID="/80588.html" Extracted="026251091X" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:0262510952" Paper_ID="/80588.html" Extracted="0262510952" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:026251107X" Paper_ID="/80588.html" Extracted="026251107X" DDC="332/.0285" Normalized_DDC="3320285" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:038709623X" Paper_ID="/80588.html" Extracted="038709623X" />
<identifier Org="ISBN:038747319X" Paper_ID="/80588.html" Extracted="038747319X" DDC="620.0042" Normalized_DDC="6200042" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:0470061960" Paper_ID="/80588.html" Extracted="0470061960" DDC="621.384" Normalized_DDC="621384" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:0792374592" Paper_ID="/80588.html" Extracted="0792374592" DDC="519.2/33" Normalized_DDC="519233" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:0849309999" Paper_ID="/80588.html" Extracted="0849309999" DDC="670/.285" Normalized_DDC="670285" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:1558604197" Paper_ID="/80588.html" Extracted="1558604197" />
<identifier Org="ISBN:1558607072" Paper_ID="/80588.html" Extracted="1558607072" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:1591404509" Paper_ID="/80588.html" Extracted="1591404509" DDC="006.3/3" Normalized_DDC="00633" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:3540000283" Paper_ID="/80588.html" Extracted="3540000283" DDC="004" Normalized_DDC="004" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:354029046X" Paper_ID="/80588.html" Extracted="354029046X" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:3540421440" Paper_ID="/80588.html" Extracted="3540421440" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:3540678395" Paper_ID="/80588.html" Extracted="3540678395" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:3540926941" Paper_ID="/80588.html" Extracted="3540926941" />
</rec>
<rec ID="SELF" Type="SELF" CiteSeer_Book="SELF" CiteSeer_Volume="SELF" Title="Solution of Delayed Reinforcement Learning Problems Having Continuous Action Spaces" />
</references_metadata>