000 | 00695 a2200253 4500 | ||
---|---|---|---|
005 | 20240613143609.0 | ||
008 | 240613b |||||||| |||| 00| 0 eng d | ||
020 | _a9780262039246 | ||
041 | _aeng | ||
082 | _a006.31 Su871r2 | ||
100 | _aSutton, Richard S. | ||
245 |
_aReinforcement learning _ban introduction |
||
250 | _a2nd ed. | ||
260 |
_bMIT Press _aCambridge _c2020 |
||
300 | _axxii, 526p. | ||
440 | _aAdaptive Computation and Machine Learning | ||
490 | _aBach, Francis | ||
650 | _aReinforcement learning | ||
650 |
_aDynamic programming _xPolicy |
||
650 |
_aMemory control _xCase studies |
||
700 | _aBarto, Andrew G. | ||
942 | _cREF | ||
960 | _aa | ||
999 |
_c28205 _d28205 |