Last update: Fri Mar 23 02:20:06 MDT 2018
%%% Hoffman, Lazaric, Ghavamzadeh, and Munos (2012): pages 102--114 of
%%% Lecture Notes in Computer Science volume 7188, recorded as an Article
%%% entry with the series as the journal.  The bare names
%%% j-LECT-NOTES-COMP-SCI and ack-nhfb are string macros that are not
%%% defined in this span and must be declared before this entry is read.
@Article{Hoffman:2012:RLS,
  author          = "Matthew W. Hoffman and Alessandro Lazaric and Mohammad Ghavamzadeh and R{\'e}mi Munos",
  title           = "Regularized Least Squares Temporal Difference Learning with Nested $ \ell_2 $ and $ \ell_1 $ Penalization",
  journal         = j-LECT-NOTES-COMP-SCI,
  volume          = "7188",
  pages           = "102--114",
  year            = "2012",
  CODEN           = "LNCSD9",
  DOI             = "https://doi.org/10.1007/978-3-642-29946-9_13",
  ISSN            = "0302-9743 (print), 1611-3349 (electronic)",
  ISSN-L          = "0302-9743",
  bibdate         = "Wed Dec 19 15:25:54 MST 2012",
  bibsource       = "http://www.math.utah.edu/pub/tex/bib/lncs2012b.bib",
  URL             = "http://link.springer.com/chapter/10.1007/978-3-642-29946-9_13/",
  acknowledgement = ack-nhfb,
  book-DOI        = "https://doi.org/10.1007/978-3-642-29946-9",
  book-URL        = "http://www.springerlink.com/content/978-3-642-29946-9",
  fjournal        = "Lecture Notes in Computer Science",
}