BibTeX record journals/mor/KarmakarB18

download as .bib file

% Journal article by Karmakar and Bhatnagar, 2018 (volume 43, issue 1).
% Record exported from the dblp computer science bibliography; the citation
% key is kept as exported so existing \cite commands keep resolving.
% The proper noun in the title is brace-protected so that sentence-casing
% bibliography styles do not lowercase it.
@article{DBLP:journals/mor/KarmakarB18,
  author       = {Karmakar, Prasenjit and
                  Bhatnagar, Shalabh},
  title        = {Two Time-Scale Stochastic Approximation with Controlled {Markov} Noise
                  and Off-Policy Temporal-Difference Learning},
  journal      = {Mathematics of Operations Research},
  volume       = {43},
  number       = {1},
  pages        = {130--151},
  year         = {2018},
  url          = {https://doi.org/10.1287/moor.2017.0855},
  doi          = {10.1287/moor.2017.0855},
  timestamp    = {Sat, 09 Apr 2022 12:21:56 +0200},
  biburl       = {https://dblp.org/rec/journals/mor/KarmakarB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
A service of Schloss Dagstuhl - Leibniz Center for Informatics