Fix typo in the Q-learning pseudocode preconditions: "Sates" -> "States".
NOTE(review): line breaks were reconstructed from a whitespace-collapsed copy of this patch.
The original indentation of the hunk lines is not recoverable from that copy, so apply with
`git apply --ignore-whitespace` (or `patch -l`), or regenerate the patch from the commit.

diff --git a/source-code/Pseudocode/q-learning/q-learning.tex b/source-code/Pseudocode/q-learning/q-learning.tex
index bd69241..24356e7 100644
--- a/source-code/Pseudocode/q-learning/q-learning.tex
+++ b/source-code/Pseudocode/q-learning/q-learning.tex
@@ -20,7 +20,7 @@
 \begin{algorithm}[H]
 \begin{algorithmic}
 \Require
- \Statex Sates $\mathcal{X} = \{1, \dots, n_x\}$
+ \Statex States $\mathcal{X} = \{1, \dots, n_x\}$
  \Statex Actions $\mathcal{A} = \{1, \dots, n_a\},\qquad A: \mathcal{X} \Rightarrow \mathcal{A}$
  \Statex Reward function $R: \mathcal{X} \times \mathcal{A} \rightarrow \mathbb{R}$
  \Statex Black-box (probabilistic) transition function $T: \mathcal{X} \times \mathcal{A} \rightarrow \mathcal{X}$