State switching. Needs refactoring

development
Ugo Finnendahl 5 years ago
parent 088bb10805
commit 12a5cb383e
  1. 32
      css/src/style.scss
  2. 77
      css/style.css
  3. 2
      css/style.min.css
  4. 58
      index.html
  5. 2
      js/controls.js
  6. 30
      js/rl.js
  7. 851
      js/view.js

@ -3,6 +3,8 @@
padding: 0; padding: 0;
} }
body{ body{
margin: 0;
padding: 0;
// background-color: ; // background-color: ;
font-family: sans-serif; font-family: sans-serif;
} }
@ -13,11 +15,13 @@ body{
#canvas{ #canvas{
height: 100%; height: 100%;
} }
nav{ nav{
position: absolute; position: absolute;
top: 10px; top: 10px;
left: 10px; left: 10px;
} }
.absolute{ .absolute{
position: absolute; position: absolute;
top:0; top:0;
@ -34,13 +38,37 @@ nav{
.sliders{ .sliders{
position: absolute; position: absolute;
top: 7vh; top: 20vh;
left: 2vw; left: 2vw;
width: 20vw; width: 20vw;
} }
#formula{ #formula{
position: absolute; position: absolute;
top: -5vh; top: 71.5vh;
width: 90vw; width: 90vw;
} }
.score{
position: absolute;
top: 7vh;
left: 2vw;
width: 20vw;
}
.lightbox{
padding: 2em;
position: absolute;
top:0;
left: 50%;
transform: translateX(-50%) translateY(-100%);
z-index: 10;
width: 50%;
height: 40%;
background-color: #BBB;
transition: all 1s;
&.active{
top:50%;
transform: translateX(-50%) translateY(-50%);
}
}

@ -0,0 +1,77 @@
* {
margin: 0;
padding: 0;
}
body {
margin: 0;
padding: 0;
font-family: sans-serif;
}
#container {
height: 100vh;
position: relative;
}
#canvas {
height: 100%;
}
nav {
position: absolute;
top: 10px;
left: 10px;
}
.absolute {
position: absolute;
top: 0;
left: 0;
}
.plot {
position: absolute;
top: 2vh;
right: 2vw;
width: 20vw;
height: 10vw;
}
.sliders {
position: absolute;
top: 20vh;
left: 2vw;
width: 20vw;
}
#formula {
position: absolute;
top: 71.5vh;
width: 90vw;
}
.score {
position: absolute;
top: 7vh;
left: 2vw;
width: 20vw;
}
.lightbox {
padding: 2em;
position: absolute;
top: 0;
left: 50%;
transform: translateX(-50%) translateY(-100%);
z-index: 10;
width: 50%;
height: 40%;
background-color: #BBB;
transition: all 1s;
}
.lightbox.active {
top: 50%;
transform: translateX(-50%) translateY(-50%);
}

2
css/style.min.css vendored

@ -1 +1 @@
*{margin:0;padding:0}body{font-family:sans-serif}#container{height:100vh;position:relative}#canvas{height:100%}nav{position:absolute;top:10px;left:10px}.absolute{position:absolute;top:0;left:0}.plot{position:absolute;top:2vh;right:2vw;width:20vw;height:10vw}.sliders{position:absolute;top:7vh;left:2vw;width:20vw}#formula{position:absolute;top:-5vh;width:90vw} *{margin:0;padding:0}body{margin:0;padding:0;font-family:sans-serif}#container{height:100vh;position:relative}#canvas{height:100%}nav{position:absolute;top:10px;left:10px}.absolute{position:absolute;top:0;left:0}.plot{position:absolute;top:2vh;right:2vw;width:20vw;height:10vw}.sliders{position:absolute;top:20vh;left:2vw;width:20vw}#formula{position:absolute;top:71.5vh;width:90vw}.score{position:absolute;top:7vh;left:2vw;width:20vw}.lightbox{padding:2em;position:absolute;top:0;left:50%;transform:translateX(-50%) translateY(-100%);z-index:10;width:50%;height:40%;background-color:#BBB;transition:all 1s}.lightbox.active{top:50%;transform:translateX(-50%) translateY(-50%)}

@ -16,47 +16,45 @@
<!-- The loading of KaTeX is deferred to speed up page rendering --> <!-- The loading of KaTeX is deferred to speed up page rendering -->
<script src="https://cdn.jsdelivr.net/npm/katex@0.11.1/dist/katex.min.js" integrity="sha384-y23I5Q6l+B6vatafAwxRu/0oK/79VlbSz7Q9aiSZUvyWYIYsd+qj+o24G5ZU2zJz" crossorigin="anonymous"></script> <script src="https://cdn.jsdelivr.net/npm/katex@0.11.1/dist/katex.min.js" integrity="sha384-y23I5Q6l+B6vatafAwxRu/0oK/79VlbSz7Q9aiSZUvyWYIYsd+qj+o24G5ZU2zJz" crossorigin="anonymous"></script>
<title>RL exhibit - prototype</title> <title>RL exhibit - prototype</title>
<link rel="stylesheet" href="https://gitcdn.xyz/cdn/jzilg/embellish.css/fff9961c5fec2d1c8ff53c87b12e18d5c8db7761/embellish.min.css">
<link rel="stylesheet" href="css/style.min.css"> <link rel="stylesheet" href="css/style.min.css">
</head> </head>
<body> <body>
<div id="app"> <div id="app">
<v-stage ref="stage" :config="stage_config"> <light-box :content="lightText" :options="lightOptions" :active="lightpopup"></light-box>
<v-layer ref="map_layer"> <v-stage ref="stage" :config="stage_config" v-show="isActive('global')">
<v-group ref="mini_map_group" :config="mini_map_config"> <rl-map :machine="machine" :maze="maze" :config="map_config"></rl-map>
<v-group v-for="(t_type, idx) in maze.map.flat()" :config="get_field_config(idx)"> </v-stage>
<v-rect :config="get_tile_config(idx, t_type)"></v-rect>
<v-image :config="energy_config" v-if="t_type==tile"></v-image> <v-stage ref="stage" :config="stage_config" v-show="isActive('local')">
</v-group> <rl-local :machine="machine" :maze="maze" :config="map_config"></rl-local>
<v-group v-for="(action,idx) in q_table" :config="get_field_config(idx)">
<v-shape v-for="(value, key) in action" :config="get_triangle_config(value, key)"></v-shape>
<v-text v-for="i in 4" :config="get_q_text_config(action,i)"></v-text>
</v-group>
<v-image :config="robot_config"></v-image>
</v-group>
</v-layer>
</v-stage> </v-stage>
<line-chart css-classes="plot" :chart-data="datacollection" :options="plot_options"></line-chart> <line-chart css-classes="plot" :chart-data="datacollection" :options="plot_options" v-show="isActive('plot')"></line-chart>
<div class="sliders"> <div class="sliders" v-show="isActive('sliders')">
<h1>Learning Rate {{learning_rate}}</h1> <h1>Learning Rate {{machine.learning_rate}}</h1>
<vue-slider v-model="learning_rate" :drag-on-click="true" v-bind="slider_config"></vue-slider> <vue-slider v-model="machine.learning_rate" :drag-on-click="true" v-bind="slider_config"></vue-slider>
<h1>Discount Factor {{discount_factor}}</h1> <h1>Discount Factor {{machine.discount_factor}}</h1>
<vue-slider v-model="discount_factor" :drag-on-click="true" v-bind="slider_config"></vue-slider> <vue-slider v-model="machine.discount_factor" :drag-on-click="true" v-bind="slider_config"></vue-slider>
<h1>Epsilon {{epsilon}}</h1> <h1>Epsilon {{machine.epsilon}}</h1>
<vue-slider v-model="epsilon" :drag-on-click="true" v-bind="slider_config"></vue-slider> <vue-slider v-model="machine.epsilon" :drag-on-click="true" v-bind="slider_config"></vue-slider>
<h1>Current Score</h1>
<h2>{{score}}</h2>
<div id="formula"></div> <div id="formula"></div>
</div> </div>
<div class="score" v-show="isActive('score')">
<h1>Current Score</h1>
<h2>{{machine.score}}</h2>
</div> </div>
<nav>
<button class="button" onclick="machine.run(1)">run 1 episode!</button> <nav class="navi" v-show="isActive('navi')">
<button class="button" onclick="machine.run(100)">run 100 episodes!</button> <button v-for="(item, key) in navigation" v-on:click="item">{{ key }}</button>
<button class="button" onclick="machine.auto_step();">auto step!</button>
<button class="button" onclick="machine.greedy_step();">greedy step!</button>
<button class="button" onclick="machine.reset_machine()">reset machine</button>
</nav> </nav>
</div>
<script> <script>
var map = [ var map = [
[0, 0, 1, 8, 0, 0, 0, 0, 0, 0], [0, 0, 1, 8, 0, 0, 0, 0, 0, 0],

2
js/controls.js vendored

@ -27,7 +27,7 @@ function key_callback(e) {
break; break;
} }
var ret = 1; var ret = 1;
if (tmp != undefined){ if (tmp != undefined && document.querySelector(".lightbox.active") == null){
ret = machine.step(tmp); ret = machine.step(tmp);
} }
// show_q_table(); // show_q_table();

@ -4,6 +4,7 @@ class RL_machine {
rewards, rewards,
start_state, start_state,
end_states, end_states,
start_score,
end_score, end_score,
learning_rate, learning_rate,
discount_factor, discount_factor,
@ -14,6 +15,7 @@ class RL_machine {
this.lr = learning_rate; this.lr = learning_rate;
this.df = discount_factor; this.df = discount_factor;
this.start_state = start_state; this.start_state = start_state;
this.start_score = start_score;
this.end_score = end_score; this.end_score = end_score;
this.end_states = end_states; this.end_states = end_states;
this.epsilon = epsilon; this.epsilon = epsilon;
@ -27,17 +29,17 @@ class RL_machine {
} }
} }
this.episode = 0; this.episode = 0;
this.state = this.start_state;
this.score = 0;
this.running = false; this.running = false;
this.score_history = []; this.score_history = [];
this.state = this.start_state;
this.score = this.start_score;
} }
new_episode(){ new_episode(){
// add_new_episode_callback // add_new_episode_callback
this.episode++; this.episode++;
this.state = this.start_state;
this.score_history.push(this.score); this.score_history.push(this.score);
this.score = 0; this.state = this.start_state;
this.score = this.start_score;
} }
auto_step(){ auto_step(){
if (Math.random() < this.epsilon){ if (Math.random() < this.epsilon){
@ -52,7 +54,23 @@ class RL_machine {
step(action){ step(action){
this.state = this.update_q_table(this.state, action); this.state = this.update_q_table(this.state, action);
// add_new_step_callback // add_new_step_callback
if (this.end_states.indexOf(this.state) >= 0 || this.score < this.end_score){ if (this.end_states.indexOf(this.state) >= 0) {
var succ_event = new CustomEvent("episode",{
detail: "success"
});
if (!this.running) {
window.dispatchEvent(succ_event);
}
this.new_episode();
return 2
}
if (this.score <= this.end_score){
var fail_event = new CustomEvent("episode",{
detail: "failed"
});
if (!this.running) {
window.dispatchEvent(fail_event);
}
this.new_episode(); this.new_episode();
return 2 return 2
} }
@ -191,4 +209,4 @@ var maze = new Maze(map, reward);
var learning_rate = 0.75; var learning_rate = 0.75;
var discount_factor = 0.8; var discount_factor = 0.8;
var machine = new RL_machine(maze.actions, maze.transactions, maze.rewards, maze.start_state, maze.end_states, -999, learning_rate, discount_factor, 0.2); var machine = new RL_machine(maze.actions, maze.transactions, maze.rewards, maze.start_state, maze.end_states, 50, 0, learning_rate, discount_factor, 0.2);

@ -1,31 +1,6 @@
Vue.component('line-chart', { // ----------------------------------------------------------------------------
extends: VueChartJs.Line, // -------------------------------- Plot --------------------------------------
mixins: [VueChartJs.mixins.reactiveProp], // ----------------------------------------------------------------------------
props: ['options'],
// mixins: [VueChartJs.mixins.reactiveData],
// props: ['options','labels', 'datasets'],
// watch: {
// 'labels': function(new_val) {
// this.chartData = {
// 'labels': new_val,
// 'datasets': this.datasets};
// },
// 'datasets': {
// deep:true,
// handler: function(new_val) {
// this.chartData = {
// 'labels': this.labels,
// 'datasets': new_val};
// }
// }
// },
mounted() {
this.renderChart(this.chartData, this.options);
},
})
var palette = ['#d2000d', '#d30512', '#d40a17', '#d50f1c', '#d61420', '#d71a25', '#d71f2a', '#d8242f', '#d92934', '#da2e39', '#db333d', '#dc3842', '#dd3d47', '#de424c', '#df4751', '#e04d56', '#e0525a', '#e1575f', '#e25c64', '#e36169', '#e4666e', '#e56b73', '#e67077', '#e7757c', '#e87a81', '#e98086', '#e9858b', '#ea8a90', '#eb8f95', '#ec9499', '#ed999e', '#ee9ea3', '#efa3a8', '#f0a8ad', '#f1adb2', '#f2b3b6', '#f2b8bb', '#f3bdc0', '#f4c2c5', '#f5c7ca', '#f6cccf', '#f7d1d3', '#f8d6d8', '#f9dbdd', '#fae0e2', '#fbe6e7', '#fbebec', '#fcf0f0', '#fdf5f5', '#fefafa', '#ffffff', '#fafcfa', '#f5f9f5', '#f0f6f0', '#ebf3ec', '#e6f1e7', '#e1eee2', '#dcebdd', '#d7e8d8', '#d3e5d3', '#cee2cf', '#c9dfca', '#c4dcc5', '#bfd9c0', '#bad6bb', '#b5d4b6', '#b0d1b2', '#abcead', '#a6cba8', '#a1c8a3', '#9cc59e', '#97c299', '#92bf95', '#8dbc90', '#88b98b', '#84b786', '#7fb481', '#7ab17c', '#75ae77', '#70ab73', '#6ba86e', '#66a569', '#61a264', '#5c9f5f', '#579c5a', '#529a56', '#4d9751', '#48944c', '#439147', '#3e8e42', '#398b3d', '#348839', '#308534', '#2b822f', '#267f2a', '#217d25', '#1c7a20', '#17771c', '#127417', '#0d7112', '#086e0d']
Array.prototype.simpleSMA = function(N) { Array.prototype.simpleSMA = function(N) {
return this.map( return this.map(
@ -55,201 +30,66 @@ Array.prototype.max = function() {
}); });
}; };
app = new Vue({ Vue.component('line-chart', {
el: '#app', extends: VueChartJs.Line,
components: { mixins: [VueChartJs.mixins.reactiveProp],
VueSlider: window['vue-slider-component'] props: ['options'],
}, mounted() {
data: { this.renderChart(this.chartData, this.options);
width: 0,
height: 0,
q_table: machine.q_table,
maze: maze,
state: {
x: 0,
y: 0
},
state_tween: new TimelineLite(),
score: machine.score,
score_history: machine.score_history,
labels: [],
learning_rate: machine.lr,
discount_factor: machine.df,
epsilon: machine.epsilon,
slider_config: {
min: 0,
max: 1,
duration: 0,
interval: 0.01,
tooltip: 'none'
},
robot_image: null,
energy_image: null,
},
created() {
// Resize handler
window.addEventListener('resize', this.handleResize)
this.handleResize();
// State wrapper
var s = machine.state;
var $this = this;
this.state = this.s2p(s);
Object.defineProperty(machine, 'state', {
get: function() {
return this._state
},
set: function(ne) {
this._state = ne;
$this.handleState(this._state);
}
});
machine.state = s;
// Score wrapper
var s = machine.score;
var $this = this;
this.score = s;
Object.defineProperty(machine, 'score', {
get: function() {
return this._score
},
set: function(ne) {
this._score = ne;
$this.score = ne
}
});
machine.score = s;
// Score history wrapper
var s = machine.score_history;
var $this = this;
this.score_history = s;
Object.defineProperty(machine, 'score_history', {
get: function() {
return this._score_history
}, },
set: function(ne) {
this._score_history = ne;
$this.score_history = ne
}
});
machine.score_history = s;
})
// ----------------------------------------------------------------------------
// --------------------------------- Map --------------------------------------
// ----------------------------------------------------------------------------
function set_images($this){
const robot_image = new window.Image(); const robot_image = new window.Image();
robot_image.src = "img/robot.png"; robot_image.src = "img/robot.png";
// robot_image.src = "https://konvajs.org/assets/yoda.jpg"; // robot_image.src = "https://konvajs.org/assets/yoda.jpg";
robot_image.onload = () => { robot_image.onload = () => {
// set image only when it is loaded // set image only when it is loaded
this.robot_image = robot_image; $this.robot_image = robot_image;
}; };
const energy_image = new window.Image(); const energy_image = new window.Image();
energy_image.src = "img/station.png"; energy_image.src = "img/station.png";
// energy_image.src = "https://konvajs.org/assets/yoda.jpg"; // energy_image.src = "https://konvajs.org/assets/yoda.jpg";
energy_image.onload = () => { energy_image.onload = () => {
// set image only when it is loaded // set image only when it is loaded
this.energy_image = energy_image; $this.energy_image = energy_image;
}; };
}, }
destroyed() {
window.removeEventListener('resize', this.handleResize) var palette = ['#d2000d', '#d30512', '#d40a17', '#d50f1c', '#d61420', '#d71a25', '#d71f2a', '#d8242f', '#d92934', '#da2e39', '#db333d', '#dc3842', '#dd3d47', '#de424c', '#df4751', '#e04d56', '#e0525a', '#e1575f', '#e25c64', '#e36169', '#e4666e', '#e56b73', '#e67077', '#e7757c', '#e87a81', '#e98086', '#e9858b', '#ea8a90', '#eb8f95', '#ec9499', '#ed999e', '#ee9ea3', '#efa3a8', '#f0a8ad', '#f1adb2', '#f2b3b6', '#f2b8bb', '#f3bdc0', '#f4c2c5', '#f5c7ca', '#f6cccf', '#f7d1d3', '#f8d6d8', '#f9dbdd', '#fae0e2', '#fbe6e7', '#fbebec', '#fcf0f0', '#fdf5f5', '#fefafa', '#ffffff', '#fafcfa', '#f5f9f5', '#f0f6f0', '#ebf3ec', '#e6f1e7', '#e1eee2', '#dcebdd', '#d7e8d8', '#d3e5d3', '#cee2cf', '#c9dfca', '#c4dcc5', '#bfd9c0', '#bad6bb', '#b5d4b6', '#b0d1b2', '#abcead', '#a6cba8', '#a1c8a3', '#9cc59e', '#97c299', '#92bf95', '#8dbc90', '#88b98b', '#84b786', '#7fb481', '#7ab17c', '#75ae77', '#70ab73', '#6ba86e', '#66a569', '#61a264', '#5c9f5f', '#579c5a', '#529a56', '#4d9751', '#48944c', '#439147', '#3e8e42', '#398b3d', '#348839', '#308534', '#2b822f', '#267f2a', '#217d25', '#1c7a20', '#17771c', '#127417', '#0d7112', '#086e0d']
},
computed: { Vue.component('rl-map', {
datacollection: function() { props: ['machine', 'maze', 'config'],
return { data: function () {
labels: Array.from(Array(this.score_history.length).keys()),
datasets: [{
label: 'Data One',
backgroundColor: 'rgb(0,0,0,0)',
data: this.score_history,//.simpleSMA(Math.round(50)),
fill: false,
borderColor: 'rgb(255, 159, 64)',
pointRadius: 1,
},
// {
// label: 'Data One',
// backgroundColor: 'rgb(0,0,0,0)',
// data: this.score_history.max(),
// fill: false,
// borderColor: 'rgb(64, 159, 255)',
// pointRadius: 1,
// },
]
}
},
plot_options: function() {
var $this = this;
return {
responsive: true,
maintainAspectRatio: false,
scales: {
xAxes: [{
// type: 'linear',
ticks: {
maxTicksLimit: 8,
maxRotation: 0,
}
}]
},
legend: {
display: false
}
}
},
stage_config: function() {
return {
width: this.width,
height: this.height,
}
},
mini_map_config: function() {
return { return {
x: this.width / 2 - (this.base_size * (this.maze.width) / 2), robot_image: null,
y: this.height / 2 - (this.base_size * (this.maze.height) / 2), energy_image: null,
scale: {
x: 1,
y: 1
}
} }
}, },
local_layer: function() { created() {
return { set_images(this);
x: this.width / 2,
y: this.height / 2,
scale: {
x: 2,
y: 2
}
}
}, },
map_config: function() { computed: {
main_config: function(){
return { return {
x: this.base_size * (this.maze.width - this.state.x), ...this.config,
y: this.base_size * (this.maze.height - this.state.y),
offset: { offset: {
x: this.base_size * this.maze.width + this.base_size / 2, x: -(this.config.width-this.base_size*this.maze.width)/2,
y: this.base_size * this.maze.height + this.base_size / 2, y: -(this.config.height-this.base_size*this.maze.height)/2,
}
} }
},
agent_config: function() {
return {
sides: 5,
radius: this.base_size / 3,
fill: '#00D2FF',
stroke: 'black',
strokeWidth: this.strokeW,
offset: {
x: -this.base_size / 2,
y: -this.base_size / 2
},
x: this.base_size * this.state.x,
y: this.base_size * this.state.y,
} }
}, },
robot_config: function() { robot_config: function() {
return { return {
height: this.base_size, height: this.base_size,
width: this.base_size, width: this.base_size,
x: this.base_size * this.state.x, x: this.base_size * this.machine.state.x,
y: this.base_size * this.state.y, y: this.base_size * this.machine.state.y,
image: this.robot_image, image: this.robot_image,
} }
}, },
@ -265,7 +105,7 @@ app = new Vue({
} }
}, },
base_size: function() { base_size: function() {
return Math.min(this.stage_config.height * 0.8 / this.maze.height, this.stage_config.width * 0.5 / this.maze.width); return Math.min(this.config.height/this.maze.height, this.config.width/this.maze.width);
}, },
strokeW: function() { strokeW: function() {
return this.base_size / 50; return this.base_size / 50;
@ -286,45 +126,8 @@ app = new Vue({
} }
}, },
methods: { methods: {
s2p: function(state) {
return {
x: (state % this.maze.width),
y: Math.floor(state / this.maze.width),
}
},
p2s: function(x, y) {
return x + y * this.maze.width;
},
handleResize: function() {
this.width = window.innerWidth;
this.height = window.innerHeight;
},
handleState: function(s) {
if (!machine.running) {
this.state_tween.to(this.state, 0.2, {
x: this.s2p(s).x,
y: this.s2p(s).y
});
} else {
this.state = this.s2p(s);
}
// this.hidden_state = s;
},
get_grid_line_config: function(idx, y = false) {
var offset = this.strokeW / 2;
if (y) {
var points = [-offset, Math.round(idx * this.base_size), this.base_size * this.maze.width + offset, Math.round(idx * this.base_size)];
} else {
var points = [Math.round(idx * this.base_size), -offset, Math.round(idx * this.base_size), this.base_size * this.maze.height + offset];
}
return {
points: points,
stroke: '#ddd',
strokeWidth: this.strokeW,
}
},
get_tile_type: function(state) { get_tile_type: function(state) {
var pos = this.s2p(state); var pos = this.machine.s2p(state);
if (pos.y > maze.height) { if (pos.y > maze.height) {
return null; return null;
} else if (pos.x > maze.width) { } else if (pos.x > maze.width) {
@ -333,14 +136,8 @@ app = new Vue({
return maze.map[pos.y][pos.x]; return maze.map[pos.y][pos.x];
} }
}, },
in_plus: function(pos1, pos2) {
if (Math.abs(pos1.x - pos2.x) + Math.abs(pos1.y - pos2.y) < 2) {
return true;
}
return false;
},
get_field_config: function(state) { get_field_config: function(state) {
var pos = this.s2p(state); var pos = this.machine.s2p(state);
return { return {
x: this.base_size * pos.x+this.base_size/2, x: this.base_size * pos.x+this.base_size/2,
y: this.base_size * pos.y+this.base_size/2, y: this.base_size * pos.y+this.base_size/2,
@ -443,20 +240,20 @@ app = new Vue({
} }
}, },
get_tile_config: function(i, t_type, local = false) { get_tile_config: function(i, t_type, local = false) {
var pos = this.s2p(i); // var pos = this.s2p(i);
var over = {}; var over = {};
// not in plus // not in plus
if (local) { if (local) {
if (!this.in_plus(this.s2p(i), { if (!this.in_plus(this.machine.s2p(i), {
x: Math.round(this.state.x), x: Math.round(this.machine.state.x),
y: Math.round(this.state.y) y: Math.round(this.machine.state.y)
})) { })) {
over = { over = {
opacity: 0, opacity: 0,
fill: "#eee" fill: "#eee"
}; };
} else if (i != this.p2s(Math.round(this.state.x), Math.round(this.state.y))) { } else if (i != this.p2s(Math.round(this.machine.state.x), Math.round(this.machine.state.y))) {
over = { over = {
opacity: 1, opacity: 1,
fill: "#eee" fill: "#eee"
@ -510,25 +307,553 @@ app = new Vue({
...over, ...over,
} }
} }
},
},
template:
`<v-layer ref="map_layer">
<v-group ref="map_group" :config="main_config">
<v-group v-for="(t_type, idx) in maze.map.flat()" :config="get_field_config(idx)">
<v-rect :config="get_tile_config(idx, t_type)"></v-rect>
<v-image :config="energy_config" v-if="t_type==8"></v-image>
</v-group>
<v-group v-for="(action,idx) in machine.q_table" :config="get_field_config(idx)">
<v-shape v-for="(value, key) in action" :config="get_triangle_config(value, key)"></v-shape>
<v-text v-for="i in 4" :config="get_q_text_config(action,i)"></v-text>
</v-group>
<v-image :config="robot_config"></v-image>
</v-group>
</v-layer>`
})
// ----------------------------------------------------------------------------
// -------------------------------- Local -------------------------------------
// ----------------------------------------------------------------------------
Vue.component('rl-local', {
props: ['machine', 'maze', 'config'],
data: function () {
return {
robot_image: null,
energy_image: null,
} }
}, },
watch: { created() {
learning_rate: function(new_val) { set_images(this);
machine.lr = new_val;
render_latex();
}, },
discount_factor: function(new_val) { computed: {
machine.df = new_val; main_config: function(){
render_latex(); return {
...this.config,
offset: {
x: -(this.config.width-this.base_size*3)/2,
y: -(this.config.height-this.base_size*3)/2,
}
}
}, },
epsilon: function(new_val) { map_config: function() {
machine.epsilon = new_val; return {
x: -(this.machine.state.x)*this.base_size,
y: -(this.machine.state.y)*this.base_size,
offset: {
x: -this.base_size,
y: -this.base_size,
} }
} }
}) },
robot_config: function() {
function render_latex() { return {
// (1-lr) * Q[state, action] + lr * (reward + gamma * np.max(Q[new_state, :]) height: this.base_size,
katex.render(`Q(s,a)\\leftarrow${(1-machine.lr).toFixed(2)}Q(s,a)+${machine.lr.toFixed(2)}(reward + ${machine.df.toFixed(2)}\\max_{a'}(Q(s_{new}, a'))`, document.getElementById('formula'),{displayMode: true,}); width: this.base_size,
} x: this.center,
render_latex(); y: this.center,
image: this.robot_image,
offset:{
x: this.base_size/2,
y: this.base_size/2,
}
}
},
energy_config: function() {
return {
height: this.base_size,
width: this.base_size,
offset: {
x: this.base_size/2,
y: this.base_size/2
},
image: this.energy_image,
}
},
base_size: function() {
return Math.min(this.config.height/3, this.config.width/3);
},
center: function() {
return 3*this.base_size / 2;
},
strokeW: function() {
return this.base_size / 50;
},
},
methods: {
get_tile_type: function(state) {
var pos = this.machine.s2p(state);
if (pos.y > maze.height) {
return null;
} else if (pos.x > maze.width) {
return null;
} else {
return maze.map[pos.y][pos.x];
}
},
in_plus: function(pos1, pos2) {
if (Math.abs(pos1.x - pos2.x) + Math.abs(pos1.y - pos2.y) < 2) {
return true;
}
return false;
},
get_field_config: function(state) {
var pos = this.machine.s2p(state);
return {
x: this.base_size * pos.x+this.base_size/2,
y: this.base_size * pos.y+this.base_size/2,
}
},
get_tile_config: function(i, t_type, local = true) {
// var pos = this.s2p(i);
var over = {};
// not in plus
if (local) {
if (!this.in_plus(this.machine.s2p(i), {
x: Math.round(this.machine.state.x),
y: Math.round(this.machine.state.y)
})) {
over = {
opacity: 0,
fill: "#eee"
};
} else if (i != this.machine.p2s(Math.round(this.machine.state.x), Math.round(this.machine.state.y))) {
over = {
opacity: 1,
fill: "#eee"
};
}
}
const layout = {
width: this.base_size,
height: this.base_size,
stroke: '#ddd',
strokeWidth: this.strokeW,
offset: {
x: this.base_size/2,
y: this.base_size/2,
}
};
switch (t_type) {
case tile.regular:
return {
...layout,
fill: '#fff',
opacity: 1,
...over,
}
case tile.end:
return {
...layout,
fill: '#0eb500',
opacity: 1,
...over,
}
case tile.start:
return {
...layout,
fill: '#ff0008',
opacity: 1,
...over,
}
case tile.dangerous:
return {
...layout,
fill: '#FF7B17',
opacity: 1,
...over,
}
case tile.wall:
return {
...layout,
opacity: 1,
...over,
fill: '#000000',
}
}
},
},
template:
`<v-layer ref="map_layer" :config="main_config">
<v-group ref="map_group" :config="map_config">
<v-group v-for="(t_type, idx) in maze.map.flat()" :config="get_field_config(idx)">
<v-rect :config="get_tile_config(idx, t_type)"></v-rect>
<v-image :config="energy_config" v-if="t_type==8 && idx==Math.round(machine.state.x)+maze.width*Math.round(machine.state.y)"></v-image>
</v-group>
</v-group>
<v-image :config="robot_config"></v-image>
</v-layer>`
})
// ----------------------------------------------------------------------------
// ------------------------------ lightbox ------------------------------------
// ----------------------------------------------------------------------------
// Modal-style text box with a row of option buttons.
// The component keeps no state of its own: the parent decides through the
// `active` prop whether the box carries the `active` CSS class.
Vue.component('light-box', {
// content: text rendered inside the box (interpolated as plain text).
// options: object iterated by v-for; each key becomes a button label and
//          each value is used as that button's click handler.
// active:  truthy adds the `active` class to the root element.
props: ['content', 'options', 'active'],
template: `
<div class="lightbox" v-bind:class="{ active: active }">{{ content }}
<div class="options">
<button v-for="(item, key) in options" v-on:click="item">{{ key }}</button>
</div>
</div>`
})
// ----------------------------------------------------------------------------
// -------------------------------- Main --------------------------------------
// ----------------------------------------------------------------------------
/**
 * Wires the plain RL machine to the Vue instance so that writes to the
 * machine show up in the reactive `th.machine` mirror.
 *
 * - `score` and `score_history` are copied to `th.machine` on every write.
 * - `state` writes are forwarded to `th.handleState`.
 * - `th.s2p` / `th.p2s` are exposed on `th.machine`.
 * - A window-level "episode" listener fills and opens the lightbox.
 *
 * @param {object} th - Vue instance; must provide `machine`, `s2p`, `p2s`,
 *   `handleState`, `lightText`, `lightOptions` and `lightpopup`.
 * @param {object} machine - object whose `score`, `score_history` and
 *   `state` properties get replaced by accessors.
 */
function make_machine_reactive(th, machine) {
  // Turns machine[prop] into an accessor stored under "_<prop>" and re-assigns
  // the current value through the new setter so `afterWrite` runs once.
  const mirror = (prop, afterWrite) => {
    const slot = `_${prop}`;
    const current = machine[prop];
    Object.defineProperty(machine, prop, {
      get() {
        return this[slot];
      },
      set(value) {
        this[slot] = value;
        afterWrite(value, this);
      },
    });
    machine[prop] = current;
  };

  // Score
  th.machine.score = machine.score;
  mirror("score", (value) => {
    th.machine.score = value;
  });

  // Score history
  th.machine.score_history = machine.score_history;
  mirror("score_history", (value) => {
    th.machine.score_history = value;
  });

  // State: the mirror holds an {x, y} position, the machine keeps the index.
  th.machine.state = th.s2p(machine.state);
  mirror("state", (value, self) => {
    th.handleState(self._state);
  });

  // Coordinate helpers for the child components.
  th.machine.s2p = th.s2p;
  th.machine.p2s = th.p2s;

  // Episode outcome -> lightbox message with a single dismiss button.
  const onEpisode = (ev) => {
    if (ev.detail == "failed") {
      th.lightText = "Out of battery. The robot will be resetted.";
    } else if (ev.detail == "success") {
      th.lightText = "You reached the goal. The robot will be resetted.";
    }
    th.lightOptions = {
      "ok": () => {
        th.lightpopup = false;
      },
    };
    th.lightpopup = true;
  };
  window.addEventListener("episode", onEpisode);
}
// Root Vue instance of the exhibit.
// It owns the window-sized stage dimensions, a reactive mirror of the global
// RL `machine`, and the current exhibit state (a key of StateMgr). Entering a
// state copies that StateMgr entry onto the instance, which decides which UI
// parts are visible (`components`), which buttons exist (`navigation`) and
// what the lightbox shows.
var app = new Vue({
  el: '#app',
  components: {
    VueSlider: window['vue-slider-component'],
  },
  data: {
    maze: maze,
    // Reactive view of `machine`; make_machine_reactive() keeps score,
    // score_history and state up to date and fills in s2p / p2s.
    machine: {
      object: machine,
      q_table: machine.q_table,
      // Robot position as grid coordinates; animated through state_tween.
      state: {
        x: 0,
        y: 0,
      },
      state_tween: new TimelineLite(),
      learning_rate: machine.lr,
      discount_factor: machine.df,
      epsilon: machine.epsilon,
      score: machine.score,
      score_history: machine.score_history,
      s2p: null,
      p2s: null,
    },
    width: 0,
    height: 0,
    // Key of the active StateMgr entry; set to "init" in created().
    state: null,
    // Names of the UI parts that isActive() reports as visible.
    components: [],
    lightText: "",
    // Label -> click handler map for the lightbox buttons.
    lightOptions: {},
    lightpopup: false,
    // Label -> click handler map for the <nav> buttons.
    navigation: {},
    onEnterState: function() {},
    onLeaveState: function() {},
  },
  created() {
    // Track the window size for the stage.
    window.addEventListener('resize', this.handleResize);
    this.handleResize();
    make_machine_reactive(this, machine);
    this.state = "init";
  },
  destroyed() {
    window.removeEventListener('resize', this.handleResize);
  },
  computed: {
    // Konva stage fills the whole window.
    stage_config: function() {
      return {
        width: this.width,
        height: this.height,
      };
    },
    // Area handed to the map components: centred, 50% wide and 80% high.
    map_config: function() {
      return {
        x: this.width * 0.25,
        y: this.height * 0.1,
        width: this.width * 0.5,
        height: this.height * 0.8,
      };
    },
    slider_config: function() {
      return {
        min: 0,
        max: 1,
        duration: 0,
        interval: 0.01,
        tooltip: 'none',
      };
    },
    // Chart data: one point per entry of the score history, labelled by index.
    datacollection: function() {
      return {
        labels: Array.from(Array(this.machine.score_history.length).keys()),
        datasets: [{
          label: 'Data One',
          backgroundColor: 'rgb(0,0,0,0)',
          data: this.machine.score_history,
          fill: false,
          borderColor: 'rgb(255, 159, 64)',
          pointRadius: 1,
        }],
      };
    },
    plot_options: function() {
      return {
        responsive: true,
        maintainAspectRatio: false,
        scales: {
          xAxes: [{
            ticks: {
              maxTicksLimit: 8,
              maxRotation: 0,
            },
          }],
        },
        legend: {
          display: false,
        },
      };
    },
  },
  methods: {
    // Flat state index -> {x, y} grid position.
    s2p: function(state) {
      return {
        x: (state % this.maze.width),
        y: Math.floor(state / this.maze.width),
      };
    },
    // {x, y} grid position -> flat state index.
    p2s: function(x, y) {
      return x + y * this.maze.width;
    },
    // Called whenever the machine's state is written: tween to the new
    // position for single steps, jump directly while the machine is running.
    handleState: function(s) {
      if (!this.machine.object.running) {
        this.machine.state_tween.to(this.machine.state, 0.2, {
          x: this.s2p(s).x,
          y: this.s2p(s).y,
        });
      } else {
        this.machine.state = this.s2p(s);
      }
    },
    handleResize: function() {
      this.width = window.innerWidth;
      this.height = window.innerHeight;
    },
    // True when the named UI part belongs to the current state.
    isActive: function(what) {
      return this.components.indexOf(what) >= 0;
    },
    // Switches the exhibit to another StateMgr entry.
    changeState: function(state) {
      // Re-entering the active state would wipe the UI below without the
      // `state` watcher firing to repopulate it.
      if (state === this.state) {
        return;
      }
      // Run the leave hook while it is still installed; the reset below
      // replaces it with a no-op before the watcher gets to call it.
      this.onLeaveState();
      this.components = [];
      this.lightText = "";
      this.lightOptions = {};
      this.lightpopup = false;
      this.navigation = {};
      this.onEnterState = function() {};
      this.onLeaveState = function() {};
      this.state = state;
    },
  },
  watch: {
    // Slider changes are pushed back into the real machine.
    'machine.learning_rate': function(new_val) {
      machine.lr = new_val;
      render_latex();
    },
    'machine.discount_factor': function(new_val) {
      machine.df = new_val;
      render_latex();
    },
    'machine.epsilon': function(new_val) {
      machine.epsilon = new_val;
    },
    // Applies the StateMgr entry for the new state. After changeState() the
    // leave hook is already a no-op here; it only does work when `state` was
    // assigned directly.
    state: function(state) {
      this.onLeaveState();
      Object.assign(this, StateMgr[state]);
      this.onEnterState();
    },
  },
});
/**
 * Renders the Q-learning update rule into the #formula element, with the
 * machine's current learning rate (`machine.lr`) and discount factor
 * (`machine.df`) substituted in, each formatted to two decimals.
 */
function render_latex() {
  // Q[s, a] <- (1 - lr) * Q[s, a] + lr * (reward + gamma * max(Q[s_new, :]))
  const keep = (1 - machine.lr).toFixed(2);
  const rate = machine.lr.toFixed(2);
  const gamma = machine.df.toFixed(2);
  // The trailing ")))" closes "(s_{new}", "(Q" and "(reward"; the last one
  // was missing before, leaving the displayed formula unbalanced.
  const formula = `Q(s,a)\\leftarrow${keep}Q(s,a)+${rate}(reward + ${gamma}\\max_{a'}(Q(s_{new}, a')))`;
  katex.render(formula, document.getElementById('formula'), { displayMode: true });
}
render_latex();
// ----------------------------------------------------------------------------
// ------------------------------ StateMgr ------------------------------------
// ----------------------------------------------------------------------------
// Exhibit states, keyed by name. The root Vue instance copies the selected
// entry onto itself (Object.assign) when its `state` changes, so every key
// below overrides the instance property of the same name:
//   components   - names of the UI parts that are shown
//   navigation   - label -> handler map for the <nav> buttons
//   lightText    - text shown in the lightbox
//   lightOptions - label -> handler map for the lightbox buttons
//   onEnterState / onLeaveState - hooks invoked with the Vue instance as `this`
var StateMgr = {
  // Introduction text only; "next" moves on to the local view.
  init: {
    lightText: `Reinforcement learning (RL) is an area of machine learning concerned with how software agents ought to take actions in an environment so as to maximize some notion of cumulative reward. Reinforcement learning is one of three basic machine learning paradigms, alongside supervised learning and unsupervised learning. (wikipedia)
This exhibit explains how a robot can learn to navigate through a maze in order to reach its destination, before running out of power. At first the robot knows nothing, and learns from each new action (movement) and state (location reached). Slowly it starts to develop an understanding of the maze that will allow it to reach the charging station before it runs out of power. Eventually, it should learn to avoid any detour and reach the charging station in the optimal number of steps.`,
    lightOptions: {
      "next": () => app.changeState("local"),
    },
    onEnterState() {
      this.lightpopup = true;
    },
    onLeaveState() {
      this.lightpopup = false;
    },
  },

  // Local view, navigation buttons and score.
  local: {
    components: ["local", "navi", "score"],
    navigation: {
      "reset robot": () => machine.reset_machine(),
      "continue": () => app.changeState("global"),
    },
    lightText: "But there is a problem! The robot cannot see the whole maze, it only knows where it is and in which direction it can move. Can you reach the charging station in those conditions? Use the arrows to move",
    lightOptions: {
      "next": () => {
        app.lightpopup = false;
      },
    },
    onEnterState() {
      this.lightpopup = true;
    },
    onLeaveState() {
      this.lightpopup = false;
    },
  },

  // Global view with sliders, plot, navigation buttons and score.
  // This entry defines no leave hook.
  global: {
    components: ["global", "sliders", "plot", "navi", "score"],
    navigation: {
      "run 1 episode!": () => machine.run(1),
      "run 100 episodes!": () => machine.run(100),
      "auto step!": () => machine.auto_step(),
      "greedy step!": () => machine.greedy_step(),
      "reset machine": () => machine.reset_machine(),
    },
    lightText: `As a human, you keep track of where you are and how you got there without thinking, which helps you think about what actions you should take next to reach your destination. And you can also just look around! How can then the robot 'think' of the maze, to know which action is the best at every moment? And how can it learn that? It must somehow keep track of where it is, and remember how good or bad was each action at each place in the maze, try new things, and update it's "mental image" of what was a good decision and what not.
Reinforcement Learning uses the concept of a "Q-function", which keeps track of how "good" it expects it to be to take a specific action 'a' from a specific location 's'. This is written as Q(s, a). It also uses a "policy", which determines the best action to take in a given state, and is written as π(s). The robot must learn those functions while it navigates the maze. With each step, the functions are modified by a little bit, until eventually they give it the best strategy to solve the maze.`,
    lightOptions: {
      "continue": () => {
        app.lightpopup = false;
      },
    },
    onEnterState() {
      this.lightpopup = true;
    },
  },
};
// ----------------------------------------------------------------------------
// ------------------------------- Dummy --------------------------------------
// ----------------------------------------------------------------------------
// Vue.component('dummy', {
// props: ['config'],
// data: function () {
// return {
// robot_image: null,
// }
// },
// created() {
//
// },
// mounted() {
//
// },
// computed: {
// fun: function() {
// return
// },
// },
// methods: {
// fun: function(arg) {
// },
// },
// template: ``
// })

Loading…
Cancel
Save