Commit 071e16a9 authored by Daniel Lukats

final push

parent 439bdc7c
......@@ -61,7 +61,8 @@
name = {episode reward graph},
description = {TODO}
description = {a graph that plots time steps on the x axis and the cumulative rewards of terminated episodes on the y
......@@ -169,6 +170,11 @@
description = {an objective that approximates the true objective, e.g., by posing a lower bound on improvement}
name = {tensor},
description = {in this thesis, a tensor is a multi-dimensional vector (or array, in computer science terms)}
name = {terminal state},
description = {an absorbing state that the agent cannot leave. Transitioning to a terminal state marks the end of an
