BibTeX records: Alexander L. Strehl

download as .bib file

% Encyclopedia chapter (Springer, 2017), pages 71-73.
@incollection{DBLP:reference/ml/Strehl17,
  author = {Strehl, Alexander L.},
  editor = {Sammut, Claude and Webb, Geoffrey I.},
  title = {Associative Reinforcement Learning},
  booktitle = {Encyclopedia of Machine Learning and Data Mining},
  pages = {71--73},
  publisher = {Springer},
  year = {2017},
  url = {https://doi.org/10.1007/978-1-4899-7687-1\_40},
  doi = {10.1007/978-1-4899-7687-1\_40},
  timestamp = {Wed, 12 Jul 2017 01:00:00 +0200},
  biburl = {https://dblp.org/rec/reference/ml/Strehl17.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv e-print 1408.2031, recorded with journal CoRR (2014).
@article{DBLP:journals/corr/BeygelzimerLLSS14,
  author = {Beygelzimer, Alina and Langford, John and Lifshits, Yury and Sorkin, Gregory B. and Strehl, Alexander L.},
  title = {Conditional Probability Tree Estimation Analysis and Algorithms},
  journal = {CoRR},
  volume = {abs/1408.2031},
  year = {2014},
  url = {http://arxiv.org/abs/1408.2031},
  eprinttype = {arXiv},
  eprint = {1408.2031},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/BeygelzimerLLSS14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv e-print 1206.6870, recorded with journal CoRR (2012).
@article{DBLP:journals/corr/StrehlLL12,
  author = {Strehl, Alexander L. and Li, Lihong and Littman, Michael L.},
  title = {Incremental Model-based Learners With Formal Learning-Time Guarantees},
  journal = {CoRR},
  volume = {abs/1206.6870},
  year = {2012},
  url = {http://arxiv.org/abs/1206.6870},
  eprinttype = {arXiv},
  eprint = {1206.6870},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/StrehlLL12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Mach. Learn., volume 82, number 3 (2011).
@article{DBLP:journals/ml/LiLWS11,
  author = {Li, Lihong and Littman, Michael L. and Walsh, Thomas J. and Strehl, Alexander L.},
  title = {Knows what it knows: a framework for self-aware learning},
  journal = {Mach. Learn.},
  volume = {82},
  number = {3},
  pages = {399--443},
  year = {2011},
  url = {https://doi.org/10.1007/s10994-010-5225-4},
  doi = {10.1007/S10994-010-5225-4},
  timestamp = {Tue, 15 Nov 2022 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/ml/LiLWS11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in Advances in Neural Information Processing Systems 23 (2010).
@inproceedings{DBLP:conf/nips/StrehlLLK10,
  author = {Strehl, Alexander L. and Langford, John and Li, Lihong and Kakade, Sham M.},
  editor = {Lafferty, John D. and Williams, Christopher K. I. and Shawe{-}Taylor, John and Zemel, Richard S. and Culotta, Aron},
  title = {Learning from Logged Implicit Exploration Data},
  booktitle = {Advances in Neural Information Processing Systems 23: 24th Annual Conference on Neural Information Processing Systems 2010. Proceedings of a meeting held 6-9 December 2010, Vancouver, British Columbia, Canada},
  pages = {2217--2225},
  publisher = {Curran Associates, Inc.},
  year = {2010},
  url = {https://proceedings.neurips.cc/paper/2010/hash/c0f168ce8900fa56e57789e2a2f2c9d0-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl = {https://dblp.org/rec/conf/nips/StrehlLLK10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Encyclopedia chapter (Springer, 2010), pages 49-51.
@incollection{DBLP:reference/ml/Strehl10,
  author = {Strehl, Alexander L.},
  editor = {Sammut, Claude and Webb, Geoffrey I.},
  title = {Associative Reinforcement Learning},
  booktitle = {Encyclopedia of Machine Learning},
  pages = {49--51},
  publisher = {Springer},
  year = {2010},
  url = {https://doi.org/10.1007/978-0-387-30164-8\_40},
  doi = {10.1007/978-0-387-30164-8\_40},
  timestamp = {Wed, 14 Nov 2018 10:51:34 +0100},
  biburl = {https://dblp.org/rec/reference/ml/Strehl10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv e-print 1003.0120, recorded with journal CoRR (2010).
@article{DBLP:journals/corr/abs-1003-0120,
  author = {Strehl, Alexander L. and Langford, John and Kakade, Sham M.},
  title = {Learning from Logged Implicit Exploration Data},
  journal = {CoRR},
  volume = {abs/1003.0120},
  year = {2010},
  url = {http://arxiv.org/abs/1003.0120},
  eprinttype = {arXiv},
  eprint = {1003.0120},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-1003-0120.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: J. Mach. Learn. Res., volume 10 (2009).
% Both acronyms in the title are brace-protected so that styles which
% sentence-case titles keep their capital letters.
@article{DBLP:journals/jmlr/StrehlLL09,
  author = {Strehl, Alexander L. and Li, Lihong and Littman, Michael L.},
  title = {Reinforcement Learning in Finite {MDPs}: {PAC} Analysis},
  journal = {J. Mach. Learn. Res.},
  volume = {10},
  pages = {2413--2444},
  year = {2009},
  url = {https://dl.acm.org/doi/10.5555/1577069.1755867},
  doi = {10.5555/1577069.1755867},
  timestamp = {Thu, 02 Jun 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/jmlr/StrehlLL09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in the UAI 2009 proceedings, pages 51-58.
@inproceedings{DBLP:conf/uai/BeygelzimerLLSS09,
  author = {Beygelzimer, Alina and Langford, John and Lifshits, Yury and Sorkin, Gregory B. and Strehl, Alexander L.},
  editor = {Bilmes, Jeff A. and Ng, Andrew Y.},
  title = {Conditional Probability Tree Estimation Analysis and Algorithms},
  booktitle = {{UAI} 2009, Proceedings of the Twenty-Fifth Conference on Uncertainty in Artificial Intelligence, Montreal, QC, Canada, June 18-21, 2009},
  pages = {51--58},
  publisher = {{AUAI} Press},
  year = {2009},
  url = {https://www.auai.org/uai2009/papers/UAI2009\_0203\_204f4f08e911ef8031953205360416f9.pdf},
  timestamp = {Tue, 25 Oct 2022 12:03:45 +0200},
  biburl = {https://dblp.org/rec/conf/uai/BeygelzimerLLSS09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in the AISTATS 2009 proceedings (JMLR Proceedings, volume 5).
% Names are written in "Last, First" form. This matters for the first editor:
% in "First Last" order BibTeX reads a capitalised particle as a given name,
% so the two-word surname must be placed before the comma to stay intact.
@inproceedings{DBLP:journals/jmlr/ShiPDLSSV09,
  author = {Shi, Qinfeng and Petterson, James and Dror, Gideon and Langford, John and Smola, Alexander J. and Strehl, Alexander L. and Vishwanathan, Vishy},
  editor = {Van Dyk, David A. and Welling, Max},
  title = {Hash Kernels},
  booktitle = {Proceedings of the Twelfth International Conference on Artificial Intelligence and Statistics, {AISTATS} 2009, Clearwater Beach, Florida, USA, April 16-18, 2009},
  series = {{JMLR} Proceedings},
  volume = {5},
  pages = {496--503},
  publisher = {JMLR.org},
  year = {2009},
  url = {http://proceedings.mlr.press/v5/shi09a.html},
  timestamp = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/jmlr/ShiPDLSSV09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv e-print 0903.4217, recorded with journal CoRR (2009).
@article{DBLP:journals/corr/abs-0903-4217,
  author = {Beygelzimer, Alina and Langford, John and Lifshits, Yury and Sorkin, Gregory B. and Strehl, Alexander L.},
  title = {Conditional Probability Tree Estimation Analysis and Algorithms},
  journal = {CoRR},
  volume = {abs/0903.4217},
  year = {2009},
  url = {http://arxiv.org/abs/0903.4217},
  eprinttype = {arXiv},
  eprint = {0903.4217},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/abs-0903-4217.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: J. Comput. Syst. Sci., volume 74, number 8 (2008).
% The proper noun in the title is brace-protected so that styles which
% sentence-case titles do not lowercase it.
@article{DBLP:journals/jcss/StrehlL08,
  author = {Strehl, Alexander L. and Littman, Michael L.},
  title = {An analysis of model-based Interval Estimation for {Markov} Decision Processes},
  journal = {J. Comput. Syst. Sci.},
  volume = {74},
  number = {8},
  pages = {1309--1331},
  year = {2008},
  url = {https://doi.org/10.1016/j.jcss.2007.08.009},
  doi = {10.1016/J.JCSS.2007.08.009},
  timestamp = {Tue, 16 Feb 2021 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/jcss/StrehlL08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in the AAMAS 2008 proceedings, Volume 3, pages 1325-1328.
@inproceedings{DBLP:conf/atal/DaiSG08,
  author = {Dai, Peng and Strehl, Alexander L. and Goldsmith, Judy},
  editor = {Padgham, Lin and Parkes, David C. and M{\"{u}}ller, J{\"{o}}rg P. and Parsons, Simon},
  title = {Expediting {RL} by using graphical structures},
  booktitle = {7th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2008), Estoril, Portugal, May 12-16, 2008, Volume 3},
  pages = {1325--1328},
  publisher = {{IFAAMAS}},
  year = {2008},
  url = {https://dl.acm.org/citation.cfm?id=1402863},
  timestamp = {Tue, 02 Feb 2021 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/atal/DaiSG08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in the ICML 2008 proceedings (ACM ICPS volume 307).
@inproceedings{DBLP:conf/icml/LangfordSW08,
  author = {Langford, John and Strehl, Alexander L. and Wortman, Jennifer},
  editor = {Cohen, William W. and McCallum, Andrew and Roweis, Sam T.},
  title = {Exploration scavenging},
  booktitle = {Machine Learning, Proceedings of the Twenty-Fifth International Conference {(ICML} 2008), Helsinki, Finland, June 5-9, 2008},
  series = {{ACM} International Conference Proceeding Series},
  volume = {307},
  pages = {528--535},
  publisher = {{ACM}},
  year = {2008},
  url = {https://doi.org/10.1145/1390156.1390223},
  doi = {10.1145/1390156.1390223},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/icml/LangfordSW08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper at ISAIM 2008; the record carries no pages or publisher.
@inproceedings{DBLP:conf/isaim/Strehl08,
  author = {Strehl, Alexander L.},
  title = {Probably Approximately Correct {(PAC)} Exploration in Reinforcement Learning},
  booktitle = {International Symposium on Artificial Intelligence and Mathematics, {ISAIM} 2008, Fort Lauderdale, Florida, USA, January 2-4, 2008},
  year = {2008},
  url = {http://isaim2008.unl.edu/PAPERS/SS3-ActiveLearning/isaim08-alex-strehl.pdf},
  timestamp = {Thu, 12 Mar 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/isaim/Strehl08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in Advances in Neural Information Processing Systems 21 (2008).
@inproceedings{DBLP:conf/nips/GoelLS08,
  author = {Goel, Sharad and Langford, John and Strehl, Alexander L.},
  editor = {Koller, Daphne and Schuurmans, Dale and Bengio, Yoshua and Bottou, L{\'{e}}on},
  title = {Predictive Indexing for Fast Search},
  booktitle = {Advances in Neural Information Processing Systems 21, Proceedings of the Twenty-Second Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 8-11, 2008},
  pages = {505--512},
  publisher = {Curran Associates, Inc.},
  year = {2008},
  url = {https://proceedings.neurips.cc/paper/2008/hash/fa83a11a198d5a7f0bf77a1987bcd006-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl = {https://dblp.org/rec/conf/nips/GoelLS08.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in the AAAI 2007 proceedings, pages 645-650.
% The acronym in the title is brace-protected so that styles which
% sentence-case titles keep its capital letters.
@inproceedings{DBLP:conf/aaai/StrehlDL07,
  author = {Strehl, Alexander L. and Diuk, Carlos and Littman, Michael L.},
  title = {Efficient Structure Learning in Factored-State {MDPs}},
  booktitle = {Proceedings of the Twenty-Second {AAAI} Conference on Artificial Intelligence, July 22-26, 2007, Vancouver, British Columbia, Canada},
  pages = {645--650},
  publisher = {{AAAI} Press},
  year = {2007},
  url = {http://www.aaai.org/Library/AAAI/2007/aaai07-102.php},
  timestamp = {Tue, 05 Sep 2023 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/aaai/StrehlDL07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in Advances in Neural Information Processing Systems 20 (2007).
@inproceedings{DBLP:conf/nips/StrehlL07,
  author = {Strehl, Alexander L. and Littman, Michael L.},
  editor = {Platt, John C. and Koller, Daphne and Singer, Yoram and Roweis, Sam T.},
  title = {Online Linear Regression and Its Application to Model-Based Reinforcement Learning},
  booktitle = {Advances in Neural Information Processing Systems 20, Proceedings of the Twenty-First Annual Conference on Neural Information Processing Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  pages = {1417--1424},
  publisher = {Curran Associates, Inc.},
  year = {2007},
  url = {https://proceedings.neurips.cc/paper/2007/hash/b7bb35b9c6ca2aee2df08cf09d7016c2-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl = {https://dblp.org/rec/conf/nips/StrehlL07.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in the AAMAS 2006 proceedings, pages 313-319.
@inproceedings{DBLP:conf/atal/DiukSL06,
  author = {Diuk, Carlos and Strehl, Alexander L. and Littman, Michael L.},
  editor = {Nakashima, Hideyuki and Wellman, Michael P. and Weiss, Gerhard and Stone, Peter},
  title = {A hierarchical approach to efficient reinforcement learning in deterministic domains},
  booktitle = {5th International Joint Conference on Autonomous Agents and Multiagent Systems {(AAMAS} 2006), Hakodate, Japan, May 8-12, 2006},
  pages = {313--319},
  publisher = {{ACM}},
  year = {2006},
  url = {https://doi.org/10.1145/1160633.1160686},
  doi = {10.1145/1160633.1160686},
  timestamp = {Tue, 08 Mar 2022 10:12:47 +0100},
  biburl = {https://dblp.org/rec/conf/atal/DiukSL06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in the ICML 2006 proceedings (ACM ICPS volume 148), pages 881-888.
@inproceedings{DBLP:conf/icml/StrehlLWLL06,
  author = {Strehl, Alexander L. and Li, Lihong and Wiewiora, Eric and Langford, John and Littman, Michael L.},
  editor = {Cohen, William W. and Moore, Andrew W.},
  title = {{PAC} model-free reinforcement learning},
  booktitle = {Machine Learning, Proceedings of the Twenty-Third International Conference {(ICML} 2006), Pittsburgh, Pennsylvania, USA, June 25-29, 2006},
  series = {{ACM} International Conference Proceeding Series},
  volume = {148},
  pages = {881--888},
  publisher = {{ACM}},
  year = {2006},
  url = {https://doi.org/10.1145/1143844.1143955},
  doi = {10.1145/1143844.1143955},
  timestamp = {Tue, 19 Nov 2019 09:25:06 +0100},
  biburl = {https://dblp.org/rec/conf/icml/StrehlLWLL06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in the ICML 2006 proceedings (ACM ICPS volume 148), pages 889-896.
@inproceedings{DBLP:conf/icml/StrehlMLH06,
  author = {Strehl, Alexander L. and Mesterharm, Chris and Littman, Michael L. and Hirsh, Haym},
  editor = {Cohen, William W. and Moore, Andrew W.},
  title = {Experience-efficient learning in associative bandit problems},
  booktitle = {Machine Learning, Proceedings of the Twenty-Third International Conference {(ICML} 2006), Pittsburgh, Pennsylvania, USA, June 25-29, 2006},
  series = {{ACM} International Conference Proceeding Series},
  volume = {148},
  pages = {889--896},
  publisher = {{ACM}},
  year = {2006},
  url = {https://doi.org/10.1145/1143844.1143956},
  doi = {10.1145/1143844.1143956},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/icml/StrehlMLH06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in the UAI 2006 proceedings; the record carries no pages.
% The url's query parameters are separated by a single LaTeX-escaped
% ampersand each; the HTML numeric character reference for the ampersand
% that had been appended after every separator is not part of the address.
@inproceedings{DBLP:conf/uai/StrehlLL06,
  author = {Strehl, Alexander L. and Li, Lihong and Littman, Michael L.},
  title = {Incremental Model-based Learners With Formal Learning-Time Guarantees},
  booktitle = {{UAI} '06, Proceedings of the 22nd Conference in Uncertainty in Artificial Intelligence, Cambridge, MA, USA, July 13-16, 2006},
  publisher = {{AUAI} Press},
  year = {2006},
  url = {https://dslpitt.org/uai/displayArticleDetails.jsp?mmnu=1\&smnu=2\&article\_id=1288\&proceeding\_id=22},
  timestamp = {Wed, 03 Feb 2021 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/uai/StrehlLL06.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in the ICML 2005 proceedings (ACM ICPS volume 119), pages 856-863.
% Names are written in "Last, First" form. This matters for the first editor:
% in "First Last" order BibTeX reads a capitalised particle as a given name,
% so the two-word surname must be placed before the comma to stay intact.
@inproceedings{DBLP:conf/icml/StrehlL05,
  author = {Strehl, Alexander L. and Littman, Michael L.},
  editor = {De Raedt, Luc and Wrobel, Stefan},
  title = {A theoretical analysis of Model-Based Interval Estimation},
  booktitle = {Machine Learning, Proceedings of the Twenty-Second International Conference {(ICML} 2005), Bonn, Germany, August 7-11, 2005},
  series = {{ACM} International Conference Proceeding Series},
  volume = {119},
  pages = {856--863},
  publisher = {{ACM}},
  year = {2005},
  url = {https://doi.org/10.1145/1102351.1102459},
  doi = {10.1145/1102351.1102459},
  timestamp = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/icml/StrehlL05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in Robotics: Science and Systems I (2005), pages 81-88.
@inproceedings{DBLP:conf/rss/LefflerLSW05,
  author = {Leffler, Bethany R. and Littman, Michael L. and Strehl, Alexander L. and Walsh, Thomas J.},
  editor = {Thrun, Sebastian and Sukhatme, Gaurav S. and Schaal, Stefan},
  title = {Efficient Exploration With Latent Structure},
  booktitle = {Robotics: Science and Systems I, June 8-11, 2005, Massachusetts Institute of Technology, Cambridge, Massachusetts, {USA}},
  pages = {81--88},
  publisher = {The {MIT} Press},
  year = {2005},
  url = {http://www.roboticsproceedings.org/rss01/p11.html},
  doi = {10.15607/RSS.2005.I.011},
  timestamp = {Tue, 15 Nov 2022 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/rss/LefflerLSW05.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Australas. J Comb., volume 30 (2004), pages 21-30.
@article{DBLP:journals/ajc/Strehl04,
  author = {Strehl, Alexander L.},
  title = {Ternary codes through ternary designs},
  journal = {Australas. {J} Comb.},
  volume = {30},
  pages = {21--30},
  year = {2004},
  url = {http://ajc.maths.uq.edu.au/pdf/30/ajc\_v30\_p021.pdf},
  timestamp = {Wed, 11 Mar 2020 00:00:00 +0100},
  biburl = {https://dblp.org/rec/journals/ajc/Strehl04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper in the ICTAI 2004 proceedings, pages 128-135.
% The proper noun in the title is brace-protected so that styles which
% sentence-case titles do not lowercase it.
@inproceedings{DBLP:conf/ictai/StrehlL04,
  author = {Strehl, Alexander L. and Littman, Michael L.},
  title = {An Empirical Evaluation of Interval Estimation for {Markov} Decision Processes},
  booktitle = {16th {IEEE} International Conference on Tools with Artificial Intelligence {(ICTAI} 2004), 15-17 November 2004, Boca Raton, FL, {USA}},
  pages = {128--135},
  publisher = {{IEEE} Computer Society},
  year = {2004},
  url = {https://doi.org/10.1109/ICTAI.2004.28},
  doi = {10.1109/ICTAI.2004.28},
  timestamp = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl = {https://dblp.org/rec/conf/ictai/StrehlL04.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics