Skip to content

Commit f44f017

Browse files
committed
examples moved
1 parent 2d8ca56 commit f44f017

File tree

5 files changed

+2
-14
lines changed

5 files changed

+2
-14
lines changed
File renamed without changes.
File renamed without changes.

src/model_free.py

Lines changed: 0 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -71,14 +71,6 @@ class ModelFree:
7171
transition.
7272
'''
7373

74-
SOLVERS = {
75-
'first_visit_mc': first_visit_monte_carlo,
76-
'every_visit_mc': every_visit_monte_carlo,
77-
'off_policy_first_visit': off_policy_first_visit,
78-
'off_policy_every_visit': off_policy_every_visit,
79-
'temporal_difference': tdn,
80-
}
81-
8274
def __init__(
8375
self,
8476
states: Sequence[Any],

src/solvers.py

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -546,6 +546,4 @@ def _tdn(MF, n, alpha, n_episodes, max_steps, optimize, sample_step):
546546
return v, q, samples
547547

548548

549-
# temporal difference control: SARSA, Q-learning, and some others
550-
551-
549+
# temporal difference control: SARSA, Q-learning, and some others

src/utils.py

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,8 @@
11
from abc import ABC, abstractmethod
22
from typing import (
33
Any,
4-
Union,
54
Sequence,
65
List,
7-
Dict,
86
Tuple,
97
Callable,
108
NewType
@@ -18,7 +16,6 @@
1816
TOL = 1E-6
1917
MEAN_ITERS = int(1E4)
2018

21-
2219
class Policy(ABC):
2320
def __init__(self):
2421
pass
@@ -80,6 +77,7 @@ class Vpi(_TabularValues):
8077
class Qpi(_TabularValues):
8178
pass
8279

80+
8381

8482
VQPi = NewType('VQPi', Tuple[Vpi, Qpi, Policy])
8583
Samples = NewType('Samples', Tuple[int, List[Vpi], List[Qpi], List[np.ndarray]])

0 commit comments

Comments
 (0)