#include "Random.h"
#include <vector>
#include <map>

Include dependency graph for core.hh (graph image not reproduced in this text; the directly included headers are listed above):

This graph shows which files directly or indirectly include this file (graph image not reproduced in this text):

Classes
class	Agent
class	Classifier
struct	classPair
class	Environment
struct	experience
class	MDPModel
class	Model
struct	modelPair
class	Planner
struct	StateActionInfo
Defines
#define	ALLM5TYPES 12
#define	AVERAGE 1
#define	BEST 3
#define	C45TREE 2
#define	CMAC_PLANNER 7
#define	CONTINUOUS_BONUS 3
#define	CONTINUOUS_BONUS_R 5
#define	DIFF_AND_NOVEL_BONUS 19
#define	DIFF_AND_VISIT_BONUS 16
#define	EPSILON 1e-5
#define	EPSILONGREEDY 8
#define	ET_UCT 4
#define	ET_UCT_ACTUAL 14
#define	ET_UCT_CORNERS 15
#define	ET_UCT_L1 10
#define	ET_UCT_WITH_ENV 5
#define	EXPLORE_UNKNOWN 0
#define	GPREGRESS 13
#define	GPTREE 14
#define	GREEDY 7
#define	LSTMULTI 10
#define	LSTSINGLE 11
#define	M5ALLMULTI 8
#define	M5ALLSINGLE 9
#define	M5MULTI 6
#define	M5SINGLE 7
#define	MBS_VI 20
#define	MOD_PRI_SWEEPING 9
#define	NN_PLANNER 8
#define	NO_EXPLORE 7
#define	NOVEL_STATE_BONUS 18
#define	PAR_ETUCT_ACTUAL 16
#define	PAR_ETUCT_CORNERS 17
#define	PARALLEL_ET_UCT 13
#define	POLICY_ITERATION 1
#define	POMDP_ETUCT 18
#define	POMDP_PAR_ETUCT 19
#define	PRI_SWEEPING 2
#define	RMAX 0
#define	SEPARATE 4
#define	SINGLETREE 3
#define	SLF 1
#define	STUMP 5
#define	SVM 4
#define	SWEEPING_UCT_HYBRID 6
#define	TABULAR 0
#define	THRESHOLD_BONUS 4
#define	THRESHOLD_BONUS_R 6
#define	TWO_MODE 1
#define	TWO_MODE_PLUS_R 2
#define	UCT 3
#define	UCT_WITH_ENV 12
#define	UCT_WITH_L 11
#define	UNVISITED_ACT_BONUS 13
#define	UNVISITED_BONUS 11
#define	VALUE_ITERATION 0
#define	VISITS_CONF 9
#define	WEIGHTAVG 2
Variables
const std::string	comboNames []
const std::string	exploreNames []
const std::string	modelNames []
const std::string	plannerNames []

Detailed Description

Fundamental declarations for the universal concepts in the reinforcement learning framework.

Authors: Nick Jong, Todd Hester

Definition in file core.hh.

Define Documentation

#define ALLM5TYPES 12

Definition at line 31 of file core.hh.

#define AVERAGE 1

Definition at line 54 of file core.hh.

#define BEST 3

Definition at line 56 of file core.hh.

#define C45TREE 2

Definition at line 21 of file core.hh.

#define CMAC_PLANNER 7

Definition at line 115 of file core.hh.

#define CONTINUOUS_BONUS 3

Definition at line 70 of file core.hh.

#define CONTINUOUS_BONUS_R 5

Definition at line 72 of file core.hh.

#define DIFF_AND_NOVEL_BONUS 19

Definition at line 82 of file core.hh.

#define DIFF_AND_VISIT_BONUS 16

Definition at line 80 of file core.hh.

#define EPSILON 1e-5

Definition at line 156 of file core.hh.

#define EPSILONGREEDY 8

Definition at line 76 of file core.hh.

#define ET_UCT 4

Definition at line 112 of file core.hh.

#define ET_UCT_ACTUAL 14

Definition at line 122 of file core.hh.

#define ET_UCT_CORNERS 15

Definition at line 123 of file core.hh.

#define ET_UCT_L1 10

Definition at line 118 of file core.hh.

#define ET_UCT_WITH_ENV 5

Definition at line 113 of file core.hh.

#define EXPLORE_UNKNOWN 0

Definition at line 67 of file core.hh.

#define GPREGRESS 13

Definition at line 32 of file core.hh.

#define GPTREE 14

Definition at line 33 of file core.hh.

#define GREEDY 7

Definition at line 75 of file core.hh.

#define LSTMULTI 10

Definition at line 29 of file core.hh.

#define LSTSINGLE 11

Definition at line 30 of file core.hh.

#define M5ALLMULTI 8

Definition at line 27 of file core.hh.

#define M5ALLSINGLE 9

Definition at line 28 of file core.hh.

#define M5MULTI 6

Definition at line 25 of file core.hh.

#define M5SINGLE 7

Definition at line 26 of file core.hh.

#define MBS_VI 20

Definition at line 128 of file core.hh.

#define MOD_PRI_SWEEPING 9

Definition at line 117 of file core.hh.

#define NN_PLANNER 8

Definition at line 116 of file core.hh.

#define NO_EXPLORE 7

Definition at line 74 of file core.hh.

#define NOVEL_STATE_BONUS 18

Definition at line 81 of file core.hh.

#define PAR_ETUCT_ACTUAL 16

Definition at line 124 of file core.hh.

#define PAR_ETUCT_CORNERS 17

Definition at line 125 of file core.hh.

#define PARALLEL_ET_UCT 13

Definition at line 121 of file core.hh.

#define POLICY_ITERATION 1

Definition at line 109 of file core.hh.

#define POMDP_ETUCT 18

Definition at line 126 of file core.hh.

#define POMDP_PAR_ETUCT 19

Definition at line 127 of file core.hh.

#define PRI_SWEEPING 2

Definition at line 110 of file core.hh.

#define RMAX 0

Definition at line 18 of file core.hh.

#define SEPARATE 4

Definition at line 57 of file core.hh.

#define SINGLETREE 3

Definition at line 22 of file core.hh.

#define SLF 1

Definition at line 20 of file core.hh.

#define STUMP 5

Definition at line 24 of file core.hh.

#define SVM 4

Definition at line 23 of file core.hh.

#define SWEEPING_UCT_HYBRID 6

Definition at line 114 of file core.hh.

#define TABULAR 0

Definition at line 19 of file core.hh.

#define THRESHOLD_BONUS 4

Definition at line 71 of file core.hh.

#define THRESHOLD_BONUS_R 6

Definition at line 73 of file core.hh.

#define TWO_MODE 1

Definition at line 68 of file core.hh.

#define TWO_MODE_PLUS_R 2

Definition at line 69 of file core.hh.

#define UCT 3

Definition at line 111 of file core.hh.

#define UCT_WITH_ENV 12

Definition at line 120 of file core.hh.

#define UCT_WITH_L 11

Definition at line 119 of file core.hh.

#define UNVISITED_ACT_BONUS 13

Definition at line 79 of file core.hh.

#define UNVISITED_BONUS 11

Definition at line 78 of file core.hh.

#define VALUE_ITERATION 0

Definition at line 108 of file core.hh.

#define VISITS_CONF 9

Definition at line 77 of file core.hh.

#define WEIGHTAVG 2

Definition at line 55 of file core.hh.

Variable Documentation

const std::string comboNames[]

Initial value:

 {
  "Average",
  "Weighted Average",
  "Best",
  "Separate"
}

Definition at line 59 of file core.hh.

const std::string exploreNames[]

Initial value:

 {
  "Explore Unknowns",
  "Two Modes",
  "Two Models +R",
  "Continuous Bonus",
  "Threshold Bonus",
  "Continuous Bonus +R",
  "Threshold Bonus +R",
  "Greedy",
  "Epsilon-Greedy",
  "Visits Confidence",
  "Type 10",
  "Unvisited State Bonus",
  "Type 12", 
  "Unvisited Action Bonus",
  "Type 14",
  "Type 15",
  "Model Diff & Visit Bonus",
  "Type 17",
  "FeatDist Bonus",
  "Model Diff & FeatDist Bonus"
}

Definition at line 84 of file core.hh.

const std::string modelNames[]

Initial value:

 {
  "Tabular",
  "SLF",
  "C4.5 Tree",
  "Single Tree",
  "SVM",
  "Stump",
  "M5 Tree",
  "M5 Tree",
  "M5 Tree",
  "M5 Tree",
  "LS Tree",
  "LS Tree",
  "M5 Combo",
  "GP Regression",
  "GP Tree"
}

Definition at line 35 of file core.hh.

const std::string plannerNames[]

Initial value:

 {
  "Value Iteration",
  "Policy Iteration",
  "Prioritized Sweeping",
  "UCT",
  "UCT",
  "UCT",
  "Sweeping UCT Hybrid",
  "CMACs",
  "NN",
  "Mod. Pri Sweeping",
  "UCT L=1",
  "UCT L",
  "UCT Env",
  "Parallel UCT",
  "Real-Valued UCT",
  "Corner UCT",
  "Parallel Real-Valued UCT",
  "Parallel Corner UCT",
  "Delayed UCT",
  "Parallel Delayed UCT",
  "Model Based Simulation - VI"
}

Definition at line 130 of file core.hh.

Classes

Defines

Variables

Detailed Description

Define Documentation

Variable Documentation