BibTeX records: Prashanth L. A.

download as .bib file

% Journal article: Oper. Res. Lett. 47(1), 2019.
% Title and author list match the CoRR record DBLP:journals/corr/abs-1808-01739.
@article{DBLP:journals/orl/KollaABJ19,
  author        = {Ravi Kumar Kolla and Prashanth L. A. and Sanjay P. Bhat and Krishna P. Jagannathan},
  title         = {Concentration bounds for empirical conditional value-at-risk: The unbounded case},
  journal       = {Oper. Res. Lett.},
  volume        = {47},
  number        = {1},
  pages         = {16--20},
  year          = {2019},
  doi           = {10.1016/j.orl.2018.11.005},
  url           = {https://doi.org/10.1016/j.orl.2018.11.005},
  timestamp     = {Wed, 13 Feb 2019 00:00:00 +0100},
  biburl        = {https://dblp.org/rec/bib/journals/orl/KollaABJ19},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1901.00997 (CoRR, 2019).
@article{DBLP:journals/corr/abs-1901-00997,
  author        = {Ravi Kumar Kolla and Prashanth L. A. and Krishna P. Jagannathan},
  title         = {Risk-aware Multi-armed Bandits Using Conditional Value-at-Risk},
  journal       = {CoRR},
  volume        = {abs/1901.00997},
  year          = {2019},
  archivePrefix = {arXiv},
  eprint        = {1901.00997},
  url           = {http://arxiv.org/abs/1901.00997},
  timestamp     = {Thu, 31 Jan 2019 00:00:00 +0100},
  biburl        = {https://dblp.org/rec/bib/journals/corr/abs-1901-00997},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1902.02953 (CoRR, 2019).
@article{DBLP:journals/corr/abs-1902-02953,
  author        = {Vinay Praneeth Boda and Prashanth L. A.},
  title         = {Correlated bandits or: How to minimize mean-squared error online},
  journal       = {CoRR},
  volume        = {abs/1902.02953},
  year          = {2019},
  archivePrefix = {arXiv},
  eprint        = {1902.02953},
  url           = {http://arxiv.org/abs/1902.02953},
  timestamp     = {Fri, 01 Mar 2019 00:00:00 +0100},
  biburl        = {https://dblp.org/rec/bib/journals/corr/abs-1902-02953},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1902.10709 (CoRR, 2019).
% The proper noun "Wasserstein" is brace-protected so that styles which
% sentence-case titles do not lowercase it.
@article{DBLP:journals/corr/abs-1902-10709,
  author    = {Sanjay P. Bhat and
               Prashanth L. A.},
  title     = {Improved Concentration Bounds for Conditional Value-at-Risk and Cumulative
               Prospect Theory using {Wasserstein} distance},
  journal   = {CoRR},
  volume    = {abs/1902.10709},
  year      = {2019},
  url       = {http://arxiv.org/abs/1902.10709},
  archivePrefix = {arXiv},
  eprint    = {1902.10709},
  timestamp = {Mon, 04 Mar 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/bib/journals/corr/abs-1902-10709},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Trans. Automat. Contr. 63(9), 2018.
@article{DBLP:journals/tac/JieAFMS18,
  author        = {Cheng Jie and Prashanth L. A. and Michael C. Fu and Steven I. Marcus and Csaba Szepesv{\'{a}}ri},
  title         = {Stochastic Optimization in a Cumulative Prospect Theory Framework},
  journal       = {{IEEE} Trans. Automat. Contr.},
  volume        = {63},
  number        = {9},
  pages         = {2867--2882},
  year          = {2018},
  doi           = {10.1109/TAC.2018.2822658},
  url           = {https://doi.org/10.1109/TAC.2018.2822658},
  timestamp     = {Thu, 13 Sep 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/tac/JieAFMS18},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1808.01739 (CoRR, 2018).
% Title and author list match the journal record DBLP:journals/orl/KollaABJ19.
@article{DBLP:journals/corr/abs-1808-01739,
  author        = {Ravi Kumar Kolla and Prashanth L. A. and Sanjay P. Bhat and Krishna P. Jagannathan},
  title         = {Concentration bounds for empirical conditional value-at-risk: The unbounded case},
  journal       = {CoRR},
  volume        = {abs/1808.01739},
  year          = {2018},
  archivePrefix = {arXiv},
  eprint        = {1808.01739},
  url           = {http://arxiv.org/abs/1808.01739},
  timestamp     = {Sun, 02 Sep 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/abs-1808-01739},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1808.02871 (CoRR, 2018).
@article{DBLP:journals/corr/abs-1808-02871,
  author        = {Prashanth L. A. and Shalabh Bhatnagar and Nirav Bhavsar and Michael C. Fu and Steven I. Marcus},
  title         = {Random directions stochastic approximation with deterministic perturbations},
  journal       = {CoRR},
  volume        = {abs/1808.02871},
  year          = {2018},
  archivePrefix = {arXiv},
  eprint        = {1808.02871},
  url           = {http://arxiv.org/abs/1808.02871},
  timestamp     = {Sun, 02 Sep 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/abs-1808-02871},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1810.09126 (CoRR, 2018).
@article{DBLP:journals/corr/abs-1810-09126,
  author        = {Prashanth L. A. and Michael C. Fu},
  title         = {Risk-Sensitive Reinforcement Learning: {A} Constrained Optimization Viewpoint},
  journal       = {CoRR},
  volume        = {abs/1810.09126},
  year          = {2018},
  archivePrefix = {arXiv},
  eprint        = {1810.09126},
  url           = {http://arxiv.org/abs/1810.09126},
  timestamp     = {Wed, 31 Oct 2018 00:00:00 +0100},
  biburl        = {https://dblp.org/rec/bib/journals/corr/abs-1810-09126},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Journal article: IEEE Trans. Automat. Contr. 62(5), 2017.
@article{DBLP:journals/tac/ABFM17,
  author        = {Prashanth L. A. and Shalabh Bhatnagar and Michael C. Fu and Steven I. Marcus},
  title         = {Adaptive System Optimization Using Random Directions Stochastic Approximation},
  journal       = {{IEEE} Trans. Automat. Contr.},
  volume        = {62},
  number        = {5},
  pages         = {2223--2238},
  year          = {2017},
  doi           = {10.1109/TAC.2016.2600643},
  url           = {https://doi.org/10.1109/TAC.2016.2600643},
  timestamp     = {Wed, 26 Jul 2017 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/tac/ABFM17},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper: AAAI 2017; cross-references DBLP:conf/aaai/2017.
% The booktitle ends in {USA} with no trailing period (matching the parent
% proceedings title), so styles that append their own punctuation do not
% print "USA.," or "USA..".
@inproceedings{DBLP:conf/aaai/GopalanAFM17,
  author    = {Aditya Gopalan and
               Prashanth L. A. and
               Michael C. Fu and
               Steven I. Marcus},
  title     = {Weighted Bandits or: How Bandits Learn Distorted Values That Are Not
               Expected},
  booktitle = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence,
               February 4-9, 2017, San Francisco, California, {USA}},
  pages     = {1941--1947},
  year      = {2017},
  crossref  = {DBLP:conf/aaai/2017},
  url       = {http://aaai.org/ocs/index.php/AAAI/AAAI17/paper/view/14896},
  timestamp = {Sat, 13 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/bib/conf/aaai/GopalanAFM17},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Machine Learning 105(3), 2016.
% The acronym "MDPs" is brace-protected so that styles which sentence-case
% titles do not render it as "mdps".
@article{DBLP:journals/ml/AG16,
  author    = {Prashanth L. A. and
               Mohammad Ghavamzadeh},
  title     = {Variance-constrained actor-critic algorithms for discounted and average
               reward {MDPs}},
  journal   = {Machine Learning},
  volume    = {105},
  number    = {3},
  pages     = {367--417},
  year      = {2016},
  url       = {https://doi.org/10.1007/s10994-016-5569-5},
  doi       = {10.1007/s10994-016-5569-5},
  timestamp = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/bib/journals/ml/AG16},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Systems & Control Letters 92, 2016 (the record has no issue number).
@article{DBLP:journals/scl/APBC16,
  author        = {Prashanth L. A. and H. L. Prasad and Shalabh Bhatnagar and Prakash Chandra},
  title         = {A constrained optimization perspective on actor-critic algorithms and application to network routing},
  journal       = {Systems {\&} Control Letters},
  volume        = {92},
  pages         = {46--51},
  year          = {2016},
  doi           = {10.1016/j.sysconle.2016.02.020},
  url           = {https://doi.org/10.1016/j.sysconle.2016.02.020},
  timestamp     = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl        = {https://dblp.org/rec/bib/journals/scl/APBC16},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper: AISTATS 2016; cross-references DBLP:conf/aistats/2016.
% Title and author list match the CoRR record DBLP:journals/corr/HuAGS16.
@inproceedings{DBLP:conf/aistats/HuAGS16,
  author        = {Xiaowei Hu and Prashanth L. A. and Andr{\'{a}}s Gy{\"{o}}rgy and Csaba Szepesv{\'{a}}ri},
  title         = {(Bandit) Convex Optimization with Biased Noisy Gradient Oracles},
  booktitle     = {Proceedings of the 19th International Conference on Artificial Intelligence and Statistics, {AISTATS} 2016, Cadiz, Spain, May 9-11, 2016},
  crossref      = {DBLP:conf/aistats/2016},
  pages         = {819--828},
  year          = {2016},
  url           = {http://jmlr.org/proceedings/papers/v51/hu16b.html},
  timestamp     = {Wed, 03 Apr 2019 18:02:00 +0200},
  biburl        = {https://dblp.org/rec/bib/conf/aistats/HuAGS16},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper: IEEE CDC 2016; cross-references DBLP:conf/cdc/2016.
% "Hessian" (derived from a proper name) is brace-protected so that styles
% which sentence-case titles keep the capital.
@inproceedings{DBLP:conf/cdc/ReddyAB16,
  author    = {D. Sai Koti Reddy and
               Prashanth L. A. and
               Shalabh Bhatnagar},
  title     = {Improved {Hessian} estimation for adaptive random directions stochastic
               approximation},
  booktitle = {55th {IEEE} Conference on Decision and Control, {CDC} 2016, Las Vegas,
               NV, USA, December 12-14, 2016},
  pages     = {3682--3687},
  year      = {2016},
  crossref  = {DBLP:conf/cdc/2016},
  url       = {https://doi.org/10.1109/CDC.2016.7798823},
  doi       = {10.1109/CDC.2016.7798823},
  timestamp = {Fri, 02 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/bib/conf/cdc/ReddyAB16},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: ICML 2016; cross-references DBLP:conf/icml/2016.
% NOTE: the DBLP export spells the ordinal "33nd"; it is corrected to "33rd"
% here, so a fresh DBLP download will differ on the booktitle line.
@inproceedings{DBLP:conf/icml/AJFMS16,
  author    = {Prashanth L. A. and
               Cheng Jie and
               Michael C. Fu and
               Steven I. Marcus and
               Csaba Szepesv{\'{a}}ri},
  title     = {Cumulative Prospect Theory Meets Reinforcement Learning: Prediction
               and Control},
  booktitle = {Proceedings of the 33rd International Conference on Machine Learning,
               {ICML} 2016, New York City, NY, USA, June 19-24, 2016},
  pages     = {1406--1415},
  year      = {2016},
  crossref  = {DBLP:conf/icml/2016},
  url       = {http://jmlr.org/proceedings/papers/v48/la16.html},
  timestamp = {Wed, 03 Apr 2019 18:02:22 +0200},
  biburl    = {https://dblp.org/rec/bib/conf/icml/AJFMS16},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1609.07087 (CoRR, 2016).
% Title and author list match the conference record DBLP:conf/aistats/HuAGS16.
@article{DBLP:journals/corr/HuAGS16,
  author        = {Xiaowei Hu and Prashanth L. A. and Andr{\'{a}}s Gy{\"{o}}rgy and Csaba Szepesv{\'{a}}ri},
  title         = {(Bandit) Convex Optimization with Biased Noisy Gradient Oracles},
  journal       = {CoRR},
  volume        = {abs/1609.07087},
  year          = {2016},
  archivePrefix = {arXiv},
  eprint        = {1609.07087},
  url           = {http://arxiv.org/abs/1609.07087},
  timestamp     = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/HuAGS16},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1611.10283 (CoRR, 2016).
% Same authors and, up to capitalisation, same title as DBLP:conf/aaai/GopalanAFM17.
@article{DBLP:journals/corr/GopalanAFM16,
  author        = {Aditya Gopalan and Prashanth L. A. and Michael C. Fu and Steven I. Marcus},
  title         = {Weighted bandits or: How bandits learn distorted values that are not expected},
  journal       = {CoRR},
  volume        = {abs/1611.10283},
  year          = {2016},
  archivePrefix = {arXiv},
  eprint        = {1611.10283},
  url           = {http://arxiv.org/abs/1611.10283},
  timestamp     = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/GopalanAFM16},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Journal article: J. Optimization Theory and Applications 164(2), 2015.
% The proper noun "Newton" is brace-protected so that styles which
% sentence-case titles do not lowercase it.
@article{DBLP:journals/jota/BhatnagarA15,
  author    = {Shalabh Bhatnagar and
               Prashanth L. A.},
  title     = {Simultaneous Perturbation {Newton} Algorithms for Simulation Optimization},
  journal   = {J. Optimization Theory and Applications},
  volume    = {164},
  number    = {2},
  pages     = {621--643},
  year      = {2015},
  url       = {https://doi.org/10.1007/s10957-013-0507-1},
  doi       = {10.1007/s10957-013-0507-1},
  timestamp = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/bib/journals/jota/BhatnagarA15},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Simulation 91(5), 2015.
% Same authors and, up to capitalisation, same title as DBLP:journals/corr/PrashanthPDBD13.
@article{DBLP:journals/simulation/APDBD15,
  author        = {Prashanth L. A. and H. L. Prasad and Nirmit Desai and Shalabh Bhatnagar and Gargi Dasgupta},
  title         = {Simultaneous perturbation methods for adaptive labor staffing in service systems},
  journal       = {Simulation},
  volume        = {91},
  number        = {5},
  pages         = {432--455},
  year          = {2015},
  doi           = {10.1177/0037549715581198},
  url           = {https://doi.org/10.1177/0037549715581198},
  timestamp     = {Fri, 02 Nov 2018 00:00:00 +0100},
  biburl        = {https://dblp.org/rec/bib/journals/simulation/APDBD15},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper: AAAI 2015; cross-references DBLP:conf/aaai/2015.
% The booktitle ends in {USA} with no trailing period, so styles that append
% their own punctuation do not print "USA.," or "USA..".
@inproceedings{DBLP:conf/aaai/KordaAM15,
  author    = {Nathaniel Korda and
               Prashanth L. A. and
               R{\'{e}}mi Munos},
  title     = {Fast Gradient Descent for Drifting Least Squares Regression, with
               Application to Bandits},
  booktitle = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence,
               January 25-30, 2015, Austin, Texas, {USA}},
  pages     = {2708--2714},
  year      = {2015},
  crossref  = {DBLP:conf/aaai/2015},
  url       = {http://www.aaai.org/ocs/index.php/AAAI/AAAI15/paper/view/9820},
  timestamp = {Sun, 12 Apr 2015 12:16:43 +0200},
  biburl    = {https://dblp.org/rec/bib/conf/aaai/KordaAM15},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: AAMAS 2015; cross-references DBLP:conf/atal/2015.
% The proper noun "Nash" is brace-protected so that styles which
% sentence-case titles do not lowercase it.
@inproceedings{DBLP:conf/atal/PrasadAB15,
  author    = {H. L. Prasad and
               Prashanth L. A. and
               Shalabh Bhatnagar},
  title     = {Two-Timescale Algorithms for Learning {Nash} Equilibria in General-Sum
               Stochastic Games},
  booktitle = {Proceedings of the 2015 International Conference on Autonomous Agents
               and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages     = {1371--1379},
  year      = {2015},
  crossref  = {DBLP:conf/atal/2015},
  url       = {http://dl.acm.org/citation.cfm?id=2773328},
  timestamp = {Fri, 15 May 2015 16:18:42 +0200},
  biburl    = {https://dblp.org/rec/bib/conf/atal/PrasadAB15},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: ICML 2015; cross-references DBLP:conf/icml/2015.
% Title and author list match the CoRR record DBLP:journals/corr/KordaP14.
@inproceedings{DBLP:conf/icml/KordaA15,
  author        = {Nathaniel Korda and Prashanth L. A.},
  title         = {On {TD(0)} with function approximation: Concentration bounds and a centered variant with exponential convergence},
  booktitle     = {Proceedings of the 32nd International Conference on Machine Learning, {ICML} 2015, Lille, France, 6-11 July 2015},
  crossref      = {DBLP:conf/icml/2015},
  pages         = {626--634},
  year          = {2015},
  url           = {http://jmlr.org/proceedings/papers/v37/korda15.html},
  timestamp     = {Wed, 03 Apr 2019 18:02:12 +0200},
  biburl        = {https://dblp.org/rec/bib/conf/icml/KordaA15},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1502.05577 (CoRR, 2015).
@article{DBLP:journals/corr/AB15,
  author        = {Prashanth L. A. and Shalabh Bhatnagar},
  title         = {Adaptive system optimization using (simultaneous) random directions stochastic approximation},
  journal       = {CoRR},
  volume        = {abs/1502.05577},
  year          = {2015},
  archivePrefix = {arXiv},
  eprint        = {1502.05577},
  url           = {http://arxiv.org/abs/1502.05577},
  timestamp     = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/AB15},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1506.02632 (CoRR, 2015).
@article{DBLP:journals/corr/ACFM15,
  author        = {Prashanth L. A. and Cheng Jie and Michael C. Fu and Steven I. Marcus},
  title         = {Cumulative Prospect Theory Meets Reinforcement Learning: Estimation and Control},
  journal       = {CoRR},
  volume        = {abs/1506.02632},
  year          = {2015},
  archivePrefix = {arXiv},
  eprint        = {1506.02632},
  url           = {http://arxiv.org/abs/1506.02632},
  timestamp     = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/ACFM15},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1507.07984 (CoRR, 2015).
@article{DBLP:journals/corr/APBC15,
  author        = {Prashanth L. A. and H. L. Prasad and Shalabh Bhatnagar and Prakash Chandra},
  title         = {A constrained optimization perspective on actor critic algorithms and application to network routing},
  journal       = {CoRR},
  volume        = {abs/1507.07984},
  year          = {2015},
  archivePrefix = {arXiv},
  eprint        = {1507.07984},
  url           = {http://arxiv.org/abs/1507.07984},
  timestamp     = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/APBC15},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Journal article: Wireless Networks 20(8), 2014.
% The "Q" of "Q-learning" is brace-protected so that styles which
% sentence-case titles do not render it as "q-learning".
@article{DBLP:journals/winet/ACB14,
  author    = {Prashanth L. A. and
               Abhranil Chatterjee and
               Shalabh Bhatnagar},
  title     = {Two timescale convergent {Q}-learning for sleep-scheduling in wireless
               sensor networks},
  journal   = {Wireless Networks},
  volume    = {20},
  number    = {8},
  pages     = {2589--2604},
  year      = {2014},
  url       = {https://doi.org/10.1007/s11276-014-0762-6},
  doi       = {10.1007/s11276-014-0762-6},
  timestamp = {Fri, 30 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/bib/journals/winet/ACB14},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: ALT 2014; cross-references DBLP:conf/alt/2014.
% "CVaR" and "MDPs" are brace-protected so that styles which sentence-case
% titles keep the acronym casing.
% The doi and url hold the raw identifier (plain "_", not "\_"): url-aware
% styles and biblatex typeset these fields verbatim, so a backslash would end
% up inside the link target.
@inproceedings{DBLP:conf/alt/A14,
  author    = {Prashanth L. A.},
  title     = {Policy Gradients for {CVaR}-Constrained {MDPs}},
  booktitle = {Algorithmic Learning Theory - 25th International Conference, {ALT}
               2014, Bled, Slovenia, October 8-10, 2014. Proceedings},
  pages     = {155--169},
  year      = {2014},
  crossref  = {DBLP:conf/alt/2014},
  url       = {https://doi.org/10.1007/978-3-319-11662-4_12},
  doi       = {10.1007/978-3-319-11662-4_12},
  timestamp = {Fri, 26 May 2017 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/bib/conf/alt/A14},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: IEEE CDC 2014; cross-references DBLP:conf/cdc/2014.
% Same authors and, up to capitalisation, same title as DBLP:journals/corr/FonteneauA14.
@inproceedings{DBLP:conf/cdc/FonteneauA14,
  author        = {Raphael Fonteneau and Prashanth L. A.},
  title         = {Simultaneous perturbation algorithms for batch off-policy search},
  booktitle     = {53rd {IEEE} Conference on Decision and Control, {CDC} 2014, Los Angeles, CA, USA, December 15-17, 2014},
  crossref      = {DBLP:conf/cdc/2014},
  pages         = {2622--2627},
  year          = {2014},
  doi           = {10.1109/CDC.2014.7039790},
  url           = {https://doi.org/10.1109/CDC.2014.7039790},
  timestamp     = {Fri, 19 May 2017 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/conf/cdc/FonteneauA14},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper: COMSNETS 2014; cross-references DBLP:conf/comsnets/2014.
@inproceedings{DBLP:conf/comsnets/ACB14,
  author        = {Prashanth L. A. and Abhranil Chatterjee and Shalabh Bhatnagar},
  title         = {Adaptive sleep-wake control using reinforcement learning in sensor networks},
  booktitle     = {Sixth International Conference on Communication Systems and Networks, {COMSNETS} 2014, Bangalore, India, January 6-10, 2014},
  crossref      = {DBLP:conf/comsnets/2014},
  pages         = {1--8},
  year          = {2014},
  doi           = {10.1109/COMSNETS.2014.6734874},
  url           = {https://doi.org/10.1109/COMSNETS.2014.6734874},
  timestamp     = {Fri, 02 Nov 2018 00:00:00 +0100},
  biburl        = {https://dblp.org/rec/bib/conf/comsnets/ACB14},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper: ECML PKDD 2014, Part II; cross-references DBLP:conf/pkdd/2014-2.
% The doi and url hold the raw identifier (plain "_", not "\_"): url-aware
% styles and biblatex typeset these fields verbatim, so a backslash would end
% up inside the link target.
@inproceedings{DBLP:conf/pkdd/AKM14,
  author    = {Prashanth L. A. and
               Nathaniel Korda and
               R{\'{e}}mi Munos},
  title     = {Fast {LSTD} Using Stochastic Approximation: Finite Time Analysis and
               Application to Traffic Control},
  booktitle = {Machine Learning and Knowledge Discovery in Databases - European Conference,
               {ECML} {PKDD} 2014, Nancy, France, September 15-19, 2014. Proceedings,
               Part {II}},
  pages     = {66--81},
  year      = {2014},
  crossref  = {DBLP:conf/pkdd/2014-2},
  url       = {https://doi.org/10.1007/978-3-662-44851-9_5},
  doi       = {10.1007/978-3-662-44851-9_5},
  timestamp = {Fri, 02 Nov 2018 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/bib/conf/pkdd/AKM14},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1401.2086 (CoRR, 2014).
% The proper noun "Nash" is brace-protected so that styles which
% sentence-case titles do not lowercase it.
@article{DBLP:journals/corr/PrasadAB14,
  author    = {H. L. Prasad and
               Prashanth L. A. and
               Shalabh Bhatnagar},
  title     = {Algorithms for {Nash} Equilibria in General-Sum Stochastic Games},
  journal   = {CoRR},
  volume    = {abs/1401.2086},
  year      = {2014},
  url       = {http://arxiv.org/abs/1401.2086},
  archivePrefix = {arXiv},
  eprint    = {1401.2086},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/bib/journals/corr/PrasadAB14},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1403.4514 (CoRR, 2014).
% Same authors and, up to capitalisation, same title as DBLP:conf/cdc/FonteneauA14.
@article{DBLP:journals/corr/FonteneauA14,
  author        = {Raphael Fonteneau and Prashanth L. A.},
  title         = {Simultaneous Perturbation Algorithms for Batch Off-Policy Search},
  journal       = {CoRR},
  volume        = {abs/1403.4514},
  year          = {2014},
  archivePrefix = {arXiv},
  eprint        = {1403.4514},
  url           = {http://arxiv.org/abs/1403.4514},
  timestamp     = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/FonteneauA14},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1403.6530 (CoRR, 2014).
@article{DBLP:journals/corr/AG14,
  author        = {Prashanth L. A. and Mohammad Ghavamzadeh},
  title         = {Actor-Critic Algorithms for Risk-Sensitive Reinforcement Learning},
  journal       = {CoRR},
  volume        = {abs/1403.6530},
  year          = {2014},
  archivePrefix = {arXiv},
  eprint        = {1403.6530},
  url           = {http://arxiv.org/abs/1403.6530},
  timestamp     = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/AG14},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1405.2690 (CoRR, 2014).
% Title and author match the conference record DBLP:conf/alt/A14.
% "CVaR" and "MDPs" are brace-protected so that styles which sentence-case
% titles keep the acronym casing.
@article{DBLP:journals/corr/A14a,
  author    = {Prashanth L. A.},
  title     = {Policy Gradients for {CVaR}-Constrained {MDPs}},
  journal   = {CoRR},
  volume    = {abs/1405.2690},
  year      = {2014},
  url       = {http://arxiv.org/abs/1405.2690},
  archivePrefix = {arXiv},
  eprint    = {1405.2690},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/bib/journals/corr/A14a},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1411.3224 (CoRR, 2014).
% Title and author list match the conference record DBLP:conf/icml/KordaA15.
@article{DBLP:journals/corr/KordaP14,
  author        = {Nathaniel Korda and Prashanth L. A.},
  title         = {On {TD(0)} with function approximation: Concentration bounds and a centered variant with exponential convergence},
  journal       = {CoRR},
  volume        = {abs/1411.3224},
  year          = {2014},
  archivePrefix = {arXiv},
  eprint        = {1411.3224},
  url           = {http://arxiv.org/abs/1411.3224},
  timestamp     = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/KordaP14},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper: AAMAS '13; cross-references DBLP:conf/atal/2013.
% This record spells the first two author names out in full.
@inproceedings{DBLP:conf/atal/AnanthapadmanabharaoPDB13,
  author        = {Prashanth Lakshmanrao Ananthapadmanabharao and Horabailu Laxminarayana Prasad and Nirmit Desai and Shalabh Bhatnagar},
  title         = {Mechanisms for hostile agents with capacity constraints},
  booktitle     = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  crossref      = {DBLP:conf/atal/2013},
  pages         = {659--666},
  year          = {2013},
  url           = {http://dl.acm.org/citation.cfm?id=2485024},
  timestamp     = {Fri, 28 Jun 2013 12:19:40 +0200},
  biburl        = {https://dblp.org/rec/bib/conf/atal/AnanthapadmanabharaoPDB13},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper: NIPS 2013; cross-references DBLP:conf/nips/2013.
% "MDPs" is brace-protected so that styles which sentence-case titles keep the
% acronym casing. The booktitle has no trailing period, so styles that append
% their own punctuation do not print doubled punctuation.
@inproceedings{DBLP:conf/nips/LAG13,
  author    = {Prashanth L. A. and
               Mohammad Ghavamzadeh},
  title     = {Actor-Critic Algorithms for Risk-Sensitive {MDPs}},
  booktitle = {Advances in Neural Information Processing Systems 26: 27th Annual
               Conference on Neural Information Processing Systems 2013. Proceedings
               of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  pages     = {252--260},
  year      = {2013},
  crossref  = {DBLP:conf/nips/2013},
  url       = {http://papers.nips.cc/paper/4917-actor-critic-algorithms-for-risk-sensitive-mdps},
  timestamp = {Fri, 31 Jan 2014 12:11:40 +0100},
  biburl    = {https://dblp.org/rec/bib/conf/nips/LAG13},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint 1306.2557 (CoRR, 2013).
@article{DBLP:journals/corr/PrashanthKM13,
  author        = {Prashanth L. A. and Nathaniel Korda and R{\'{e}}mi Munos},
  title         = {Analysis of stochastic approximation for efficient least squares regression and {LSTD}},
  journal       = {CoRR},
  volume        = {abs/1306.2557},
  year          = {2013},
  archivePrefix = {arXiv},
  eprint        = {1306.2557},
  url           = {http://arxiv.org/abs/1306.2557},
  timestamp     = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/PrashanthKM13},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1307.3176 (CoRR, 2013).
@article{DBLP:journals/corr/KordaPM13,
  author        = {Nathaniel Korda and Prashanth L. A. and R{\'{e}}mi Munos},
  title         = {Online gradient descent for least squares regression: Non-asymptotic bounds and application to bandits},
  journal       = {CoRR},
  volume        = {abs/1307.3176},
  year          = {2013},
  archivePrefix = {arXiv},
  eprint        = {1307.3176},
  url           = {http://arxiv.org/abs/1307.3176},
  timestamp     = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/KordaPM13},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1312.7292 (CoRR, 2013).
% This record spells the first author's name out in full.
@article{DBLP:journals/corr/AnanthapadmanabharaoCB13,
  author        = {Prashanth Lakshmanrao Ananthapadmanabharao and Abhranil Chatterjee and Shalabh Bhatnagar},
  title         = {Reinforcement Learning for Sleep-Wake Scheduling in Sensor Networks},
  journal       = {CoRR},
  volume        = {abs/1312.7292},
  year          = {2013},
  archivePrefix = {arXiv},
  eprint        = {1312.7292},
  url           = {http://arxiv.org/abs/1312.7292},
  timestamp     = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/AnanthapadmanabharaoCB13},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% arXiv preprint 1312.7430 (CoRR, 2013).
% Same authors and, up to capitalisation, same title as DBLP:journals/simulation/APDBD15.
@article{DBLP:journals/corr/PrashanthPDBD13,
  author        = {Prashanth L. A. and H. L. Prasad and Nirmit Desai and Shalabh Bhatnagar and Gargi Dasgupta},
  title         = {Simultaneous Perturbation Methods for Adaptive Labor Staffing in Service Systems},
  journal       = {CoRR},
  volume        = {abs/1312.7430},
  year          = {2013},
  archivePrefix = {arXiv},
  eprint        = {1312.7430},
  url           = {http://arxiv.org/abs/1312.7430},
  timestamp     = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/PrashanthPDBD13},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Journal article: IEEE Trans. Vehicular Technology 61(9), 2012.
@article{DBLP:journals/tvt/PrashanthB12,
  author        = {Prashanth L. A. and Shalabh Bhatnagar},
  title         = {Threshold Tuning Using Stochastic Optimization for Graded Signal Control},
  journal       = {{IEEE} Trans. Vehicular Technology},
  volume        = {61},
  number        = {9},
  pages         = {3865--3880},
  year          = {2012},
  doi           = {10.1109/TVT.2012.2209904},
  url           = {https://doi.org/10.1109/TVT.2012.2209904},
  timestamp     = {Fri, 02 Nov 2018 00:00:00 +0100},
  biburl        = {https://dblp.org/rec/bib/journals/tvt/PrashanthB12},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Journal article: IEEE Trans. Intelligent Transportation Systems 12(2), 2011.
@article{DBLP:journals/tits/PrashanthB11,
  author        = {Prashanth L. A. and Shalabh Bhatnagar},
  title         = {Reinforcement Learning With Function Approximation for Traffic Signal Control},
  journal       = {{IEEE} Trans. Intelligent Transportation Systems},
  volume        = {12},
  number        = {2},
  pages         = {412--421},
  year          = {2011},
  doi           = {10.1109/TITS.2010.2091408},
  url           = {https://doi.org/10.1109/TITS.2010.2091408},
  timestamp     = {Fri, 02 Nov 2018 00:00:00 +0100},
  biburl        = {https://dblp.org/rec/bib/journals/tits/PrashanthB11},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper: ICSOC 2011; cross-references DBLP:conf/icsoc/2011.
% The doi and url hold the raw identifier (plain "_", not "\_"): url-aware
% styles and biblatex typeset these fields verbatim, so a backslash would end
% up inside the link target.
@inproceedings{DBLP:conf/icsoc/PrashanthPDBD11,
  author    = {Prashanth L. A. and
               H. L. Prasad and
               Nirmit Desai and
               Shalabh Bhatnagar and
               Gargi Banerjee Dasgupta},
  title     = {Stochastic Optimization for Adaptive Labor Staffing in Service Systems},
  booktitle = {Service-Oriented Computing - 9th International Conference, {ICSOC}
               2011, Paphos, Cyprus, December 5-8, 2011 Proceedings},
  pages     = {487--494},
  year      = {2011},
  crossref  = {DBLP:conf/icsoc/2011},
  url       = {https://doi.org/10.1007/978-3-642-25535-9_33},
  doi       = {10.1007/978-3-642-25535-9_33},
  timestamp = {Wed, 13 Feb 2019 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/bib/conf/icsoc/PrashanthPDBD11},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Conference paper: IEEE ITSC 2011; cross-references DBLP:conf/itsc/2011.
@inproceedings{DBLP:conf/itsc/AB11,
  author        = {Prashanth L. A. and Shalabh Bhatnagar},
  title         = {Reinforcement learning with average cost for adaptive control of traffic lights at intersections},
  booktitle     = {14th International {IEEE} Conference on Intelligent Transportation Systems, {ITSC} 2011, Washington, DC, USA, October 5-7, 2011},
  crossref      = {DBLP:conf/itsc/2011},
  pages         = {1640--1645},
  year          = {2011},
  doi           = {10.1109/ITSC.2011.6082823},
  url           = {https://doi.org/10.1109/ITSC.2011.6082823},
  timestamp     = {Fri, 02 Nov 2018 00:00:00 +0100},
  biburl        = {https://dblp.org/rec/bib/conf/itsc/AB11},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Conference paper: COMSWARE 2008; cross-references DBLP:conf/comsware/2008.
@inproceedings{DBLP:conf/comsware/PrashanthG08,
  author        = {Prashanth L. A. and K. Gopinath},
  title         = {{OFDM-MAC} algorithms and their impact on {TCP} performance in next generation mobile networks},
  booktitle     = {Proceedings of the Third International Conference on COMmunication System softWAre and MiddlewaRE {(COMSWARE} 2008), January 5-10, 2008, Bangalore, India},
  crossref      = {DBLP:conf/comsware/2008},
  pages         = {133--140},
  year          = {2008},
  doi           = {10.1109/COMSWA.2008.4554395},
  url           = {https://doi.org/10.1109/COMSWA.2008.4554395},
  timestamp     = {Fri, 02 Nov 2018 00:00:00 +0100},
  biburl        = {https://dblp.org/rec/bib/conf/comsware/PrashanthG08},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Proceedings volume: AAAI 2017. Crossref parent of DBLP:conf/aaai/GopalanAFM17.
@proceedings{DBLP:conf/aaai/2017,
  editor        = {Satinder P. Singh and Shaul Markovitch},
  title         = {Proceedings of the Thirty-First {AAAI} Conference on Artificial Intelligence, February 4-9, 2017, San Francisco, California, {USA}},
  year          = {2017},
  publisher     = {{AAAI} Press},
  url           = {http://www.aaai.org/Library/AAAI/aaai17contents.php},
  timestamp     = {Mon, 06 Mar 2017 08:17:31 +0100},
  biburl        = {https://dblp.org/rec/bib/conf/aaai/2017},
  bibsource     = {dblp computer science bibliography, https://dblp.org},
}
% Proceedings volume of AISTATS 2016 (JMLR Workshop and Conference Proceedings, volume 51).
@proceedings{DBLP:conf/aistats/2016,
  title = {Proceedings of the 19th International Conference on Artificial Intelligence and Statistics, {AISTATS} 2016, Cadiz, Spain, May 9-11, 2016},
  editor = {Arthur Gretton and Christian C. Robert},
  series = {{JMLR} Workshop and Conference Proceedings},
  volume = {51},
  publisher = {JMLR.org},
  year = {2016},
  url = {http://jmlr.org/proceedings/papers/v51/},
  timestamp = {Wed, 03 Apr 2019 18:02:00 +0200},
  biburl = {https://dblp.org/rec/bib/conf/aistats/2016},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of the 55th IEEE CDC (2016); no editor field is recorded.
@proceedings{DBLP:conf/cdc/2016,
  title = {55th {IEEE} Conference on Decision and Control, {CDC} 2016, Las Vegas, NV, USA, December 12-14, 2016},
  publisher = {{IEEE}},
  year = {2016},
  isbn = {978-1-5090-1837-6},
  url = {http://ieeexplore.ieee.org/xpl/mostRecentIssue.jsp?punumber=7786694},
  timestamp = {Tue, 03 Jan 2017 12:13:39 +0100},
  biburl = {https://dblp.org/rec/bib/conf/cdc/2016},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of ICML 2016 (JMLR Workshop and Conference Proceedings, volume 48).
@proceedings{DBLP:conf/icml/2016,
  editor    = {Maria{-}Florina Balcan and
               Kilian Q. Weinberger},
  title     = {Proceedings of the 33rd International Conference on Machine Learning,
               {ICML} 2016, New York City, NY, USA, June 19-24, 2016},
  series    = {{JMLR} Workshop and Conference Proceedings},
  volume    = {48},
  publisher = {JMLR.org},
  year      = {2016},
  url       = {http://jmlr.org/proceedings/papers/v48/},
  timestamp = {Wed, 03 Apr 2019 18:02:22 +0200},
  biburl    = {https://dblp.org/rec/bib/conf/icml/2016},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of the Twenty-Ninth AAAI Conference (2015), published by AAAI Press.
@proceedings{DBLP:conf/aaai/2015,
  title = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence, January 25-30, 2015, Austin, Texas, {USA}},
  editor = {Blai Bonet and Sven Koenig},
  publisher = {{AAAI} Press},
  year = {2015},
  isbn = {978-1-57735-698-1},
  url = {http://www.aaai.org/Library/AAAI/aaai15contents.php},
  timestamp = {Sun, 12 Apr 2015 12:16:43 +0200},
  biburl = {https://dblp.org/rec/bib/conf/aaai/2015},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of AAMAS 2015, published by ACM.
@proceedings{DBLP:conf/atal/2015,
  title = {Proceedings of the 2015 International Conference on Autonomous Agents and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  editor = {Gerhard Weiss and Pinar Yolum and Rafael H. Bordini and Edith Elkind},
  publisher = {{ACM}},
  year = {2015},
  isbn = {978-1-4503-3413-6},
  url = {http://dl.acm.org/citation.cfm?id=2772879},
  timestamp = {Fri, 15 May 2015 16:18:42 +0200},
  biburl = {https://dblp.org/rec/bib/conf/atal/2015},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of ICML 2015 (JMLR Workshop and Conference Proceedings, volume 37).
@proceedings{DBLP:conf/icml/2015,
  title = {Proceedings of the 32nd International Conference on Machine Learning, {ICML} 2015, Lille, France, 6-11 July 2015},
  editor = {Francis R. Bach and David M. Blei},
  series = {{JMLR} Workshop and Conference Proceedings},
  volume = {37},
  publisher = {JMLR.org},
  year = {2015},
  url = {http://jmlr.org/proceedings/papers/v37/},
  timestamp = {Wed, 03 Apr 2019 18:02:12 +0200},
  biburl = {https://dblp.org/rec/bib/conf/icml/2015},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of ALT 2014 (Springer LNCS volume 8776).
@proceedings{DBLP:conf/alt/2014,
  title = {Algorithmic Learning Theory - 25th International Conference, {ALT} 2014, Bled, Slovenia, October 8-10, 2014. Proceedings},
  editor = {Peter Auer and Alexander Clark and Thomas Zeugmann and Sandra Zilles},
  series = {Lecture Notes in Computer Science},
  volume = {8776},
  publisher = {Springer},
  year = {2014},
  isbn = {978-3-319-11661-7},
  doi = {10.1007/978-3-319-11662-4},
  url = {https://doi.org/10.1007/978-3-319-11662-4},
  timestamp = {Fri, 26 May 2017 00:48:26 +0200},
  biburl = {https://dblp.org/rec/bib/conf/alt/2014},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of the 53rd IEEE CDC (2014); no editor field is recorded.
@proceedings{DBLP:conf/cdc/2014,
  title = {53rd {IEEE} Conference on Decision and Control, {CDC} 2014, Los Angeles, CA, USA, December 15-17, 2014},
  publisher = {{IEEE}},
  year = {2014},
  isbn = {978-1-4799-7746-8},
  url = {http://ieeexplore.ieee.org/xpl/mostRecentIssue.jsp?punumber=7027307},
  timestamp = {Wed, 18 Feb 2015 19:58:28 +0100},
  biburl = {https://dblp.org/rec/bib/conf/cdc/2014},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of COMSNETS 2014, published by IEEE; no editor or isbn field is recorded.
@proceedings{DBLP:conf/comsnets/2014,
  title = {Sixth International Conference on Communication Systems and Networks, {COMSNETS} 2014, Bangalore, India, January 6-10, 2014},
  publisher = {{IEEE}},
  year = {2014},
  url = {http://ieeexplore.ieee.org/xpl/mostRecentIssue.jsp?punumber=6720258},
  timestamp = {Wed, 12 Feb 2014 15:46:04 +0100},
  biburl = {https://dblp.org/rec/bib/conf/comsnets/2014},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of ECML PKDD 2014, Part II (Springer LNCS volume 8725).
@proceedings{DBLP:conf/pkdd/2014-2,
  title = {Machine Learning and Knowledge Discovery in Databases - European Conference, {ECML} {PKDD} 2014, Nancy, France, September 15-19, 2014. Proceedings, Part {II}},
  editor = {Toon Calders and Floriana Esposito and Eyke H{\"{u}}llermeier and Rosa Meo},
  series = {Lecture Notes in Computer Science},
  volume = {8725},
  publisher = {Springer},
  year = {2014},
  isbn = {978-3-662-44850-2},
  doi = {10.1007/978-3-662-44851-9},
  url = {https://doi.org/10.1007/978-3-662-44851-9},
  timestamp = {Mon, 22 May 2017 17:11:17 +0200},
  biburl = {https://dblp.org/rec/bib/conf/pkdd/2014-2},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of AAMAS '13, published by IFAAMAS.
@proceedings{DBLP:conf/atal/2013,
  title = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  editor = {Maria L. Gini and Onn Shehory and Takayuki Ito and Catholijn M. Jonker},
  publisher = {{IFAAMAS}},
  year = {2013},
  isbn = {978-1-4503-1993-5},
  url = {http://dl.acm.org/citation.cfm?id=2484920},
  timestamp = {Fri, 28 Jun 2013 12:19:40 +0200},
  biburl = {https://dblp.org/rec/bib/conf/atal/2013},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of NIPS 2013 (Advances in Neural Information Processing Systems 26);
% no publisher field is recorded.
@proceedings{DBLP:conf/nips/2013,
  title = {Advances in Neural Information Processing Systems 26: 27th Annual Conference on Neural Information Processing Systems 2013. Proceedings of a meeting held December 5-8, 2013, Lake Tahoe, Nevada, United States},
  editor = {Christopher J. C. Burges and L{\'{e}}on Bottou and Zoubin Ghahramani and Kilian Q. Weinberger},
  year = {2013},
  url = {http://papers.nips.cc/book/advances-in-neural-information-processing-systems-26-2013},
  timestamp = {Fri, 31 Jan 2014 12:11:40 +0100},
  biburl = {https://dblp.org/rec/bib/conf/nips/2013},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of ICSOC 2011 (Springer LNCS volume 7084).
% The third editor is written in "Last, First" form so that the two-word surname
% "Motahari Nezhad" is not split by BibTeX's name parser.
@proceedings{DBLP:conf/icsoc/2011,
  editor    = {Gerti Kappel and
               Zakaria Maamar and
               Motahari Nezhad, Hamid R.},
  title     = {Service-Oriented Computing - 9th International Conference, {ICSOC}
               2011, Paphos, Cyprus, December 5-8, 2011. Proceedings},
  series    = {Lecture Notes in Computer Science},
  volume    = {7084},
  publisher = {Springer},
  year      = {2011},
  url       = {https://doi.org/10.1007/978-3-642-25535-9},
  doi       = {10.1007/978-3-642-25535-9},
  isbn      = {978-3-642-25534-2},
  timestamp = {Fri, 19 May 2017 01:25:50 +0200},
  biburl    = {https://dblp.org/rec/bib/conf/icsoc/2011},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of IEEE ITSC 2011; used as a crossref target by an inproceedings
% entry earlier in this file, so it must stay after that entry for classic BibTeX.
@proceedings{DBLP:conf/itsc/2011,
  title = {14th International {IEEE} Conference on Intelligent Transportation Systems, {ITSC} 2011, Washington, DC, USA, October 5-7, 2011},
  publisher = {{IEEE}},
  year = {2011},
  isbn = {978-1-4577-2198-4},
  url = {http://ieeexplore.ieee.org/xpl/mostRecentIssue.jsp?punumber=6069628},
  timestamp = {Mon, 21 Nov 2016 12:16:55 +0100},
  biburl = {https://dblp.org/rec/bib/conf/itsc/2011},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of COMSWARE 2008; crossref target of DBLP:conf/comsware/PrashanthG08,
% so it must stay after that entry for classic BibTeX.
@proceedings{DBLP:conf/comsware/2008,
  editor    = {Sunghyun Choi and
               Jim Kurose and
               Krithi Ramamritham},
  title     = {Proceedings of the Third International Conference on COMmunication
               System softWAre and MiddlewaRE ({COMSWARE} 2008), January 5-10, 2008,
               Bangalore, India},
  publisher = {{IEEE}},
  year      = {2008},
  url       = {http://ieeexplore.ieee.org/xpl/mostRecentIssue.jsp?punumber=4545865},
  isbn      = {978-1-4244-1797-1},
  timestamp = {Tue, 24 Mar 2015 18:02:55 +0100},
  biburl    = {https://dblp.org/rec/bib/conf/comsware/2008},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
maintained by Schloss Dagstuhl LZI, founded at University of Trier