You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
16 lines
436 B
Python
16 lines
436 B
Python
10 years ago
|
"""Reinforcement Learning (Chapter 21)
|
||
|
"""
|
||
|
|
||
|
from utils import *
|
||
|
import agents
|
||
|
|
||
|
class PassiveADPAgent(agents.Agent):
    """Passive (non-learning) adaptive dynamic programming agent. [Fig. 21.2]

    Meant to apply adaptive dynamic programming to a given MDP and policy.
    Not implemented yet: the class body defines nothing of its own, so all
    attributes and methods are inherited unchanged from agents.Agent.
    """

    # TODO: implement the algorithm.  This placeholder deliberately raises
    # nothing, so defining the class has no side effects.
    pass
|
||
|
|
||
|
class PassiveTDAgent(agents.Agent):
    """Passive (non-learning) temporal-difference agent. [Fig. 21.4]

    Meant to learn utility estimates using temporal differences.
    Not implemented yet: the class body defines nothing of its own, so all
    attributes and methods are inherited unchanged from agents.Agent.
    """

    # TODO: implement the algorithm.  This placeholder deliberately raises
    # nothing, so defining the class has no side effects.
    pass
|