Stop the war!

Остановите войну!

for scientists:

default search action

combined dblp search
author search
venue search
publication search

ask others

BibTeX records: Shalabh Bhatnagar

Name: dblp XML data dump
Creator: Schloss Dagstuhl - Leibniz Center for Informatics
Published: 1993
License: https://creativecommons.org/publicdomain/zero/1.0/
Keywords: dblp, XML, computer science, scholarly publications, metadata

> Home > Persons > Shalabh Bhatnagar

download as .bib file

% Authors are in "Last, First" form: written as "Prabuchandran K. J.", BibTeX
% would take the trailing initial "J." as the surname.
% NOTE(review): assumes "K. J." are initials and Prabuchandran is the sorting name.
% Shares title and authors with DBLP:journals/corr/abs-2310-05911.
@article{DBLP:journals/icl/BaratJB24,
  author       = {Barat, Arghyadeep and
                  Prabuchandran, K. J. and
                  Bhatnagar, Shalabh},
  title        = {Energy Management in a Cooperative Energy Harvesting Wireless Sensor
                  Network},
  journal      = {{IEEE} Commun. Lett.},
  volume       = {28},
  number       = {1},
  pages        = {243--247},
  year         = {2024},
  url          = {https://doi.org/10.1109/LCOMM.2023.3335143},
  doi          = {10.1109/LCOMM.2023.3335143},
  timestamp    = {Fri, 26 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/icl/BaratJB24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper in the ISGT 2024 proceedings.
@inproceedings{DBLP:conf/isgt/VivekDB24,
  author       = {Vivek, V. P. and Diddigi, Raghuram Bharadwaj and Bhatnagar, Shalabh},
  title        = {Dynamic Energy Management in Competing Microgrids using Reinforcement Learning},
  booktitle    = {{IEEE} Power {\&} Energy Society Innovative Smart Grid Technologies Conference, {ISGT} 2024, Washington, DC, USA, February 19-22, 2024},
  pages        = {1--5},
  publisher    = {{IEEE}},
  year         = {2024},
  url          = {https://doi.org/10.1109/ISGT59692.2024.10454198},
  doi          = {10.1109/ISGT59692.2024.10454198},
  timestamp    = {Wed, 13 Mar 2024 18:04:53 +0100},
  biburl       = {https://dblp.org/rec/conf/isgt/VivekDB24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% {MDPs} is braced so sentence-casing bibliography styles keep the acronym's capitals.
@article{DBLP:journals/corr/abs-2402-01371,
  author       = {Prashansa Panda and
                  Shalabh Bhatnagar},
  title        = {Critic-Actor for Average Reward {MDPs} with Function Approximation:
                  {A} Finite-Time Analysis},
  journal      = {CoRR},
  volume       = {abs/2402.01371},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.01371},
  doi          = {10.48550/ARXIV.2402.01371},
  eprinttype    = {arXiv},
  eprint       = {2402.01371},
  timestamp    = {Fri, 09 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-01371.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article; shares title and authors with DBLP:journals/corr/abs-2210-04470.
@article{DBLP:journals/csysl/BhatnagarBG23,
  author       = {Bhatnagar, Shalabh and Borkar, Vivek S. and Guin, Soumyajit},
  title        = {Actor-Critic or Critic-Actor? {A} Tale of Two Time Scales},
  journal      = {{IEEE} Control. Syst. Lett.},
  volume       = {7},
  pages        = {2671--2676},
  year         = {2023},
  url          = {https://doi.org/10.1109/LCSYS.2023.3288931},
  doi          = {10.1109/LCSYS.2023.3288931},
  timestamp    = {Fri, 21 Jul 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/csysl/BhatnagarBG23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% {Markov} is braced so sentence-casing bibliography styles keep the proper noun capitalised.
% Shares authors and (up to letter case) title with DBLP:journals/corr/abs-2210-04527.
@inproceedings{DBLP:conf/cdc/GuinB23,
  author       = {Soumyajit Guin and
                  Shalabh Bhatnagar},
  title        = {A Policy Gradient Approach for Finite Horizon Constrained {Markov} Decision
                  Processes},
  booktitle    = {62nd {IEEE} Conference on Decision and Control, {CDC} 2023, Singapore,
                  December 13-15, 2023},
  pages        = {3353--3359},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/CDC49753.2023.10383413},
  doi          = {10.1109/CDC49753.2023.10383413},
  timestamp    = {Mon, 29 Jan 2024 17:30:32 +0100},
  biburl       = {https://dblp.org/rec/conf/cdc/GuinB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Authors are in "Last, First" form: written as "Prashanth L. A.", BibTeX would
% take the trailing initial "A." as the surname.
% NOTE(review): assumes "L. A." are initials and Prashanth is the sorting name.
% Shares title and authors with DBLP:journals/corr/abs-2212-10477.
@inproceedings{DBLP:conf/ciss/BhatnagarA23,
  author       = {Bhatnagar, Shalabh and
                  Prashanth, L. A.},
  title        = {Generalized Simultaneous Perturbation Stochastic Approximation with
                  Reduced Estimator Bias},
  booktitle    = {57th Annual Conference on Information Sciences and Systems, {CISS}
                  2023, Baltimore, MD, USA, March 22-24, 2023},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/CISS56502.2023.10089720},
  doi          = {10.1109/CISS56502.2023.10089720},
  timestamp    = {Sat, 22 Apr 2023 16:25:53 +0200},
  biburl       = {https://dblp.org/rec/conf/ciss/BhatnagarA23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% ICML 2023 paper (PMLR volume 202); shares title and authors with
% DBLP:journals/corr/abs-2305-12239.
@inproceedings{DBLP:conf/icml/SaxenaKKB23,
  author       = {Saxena, Naman and Khastagir, Subhojyoti and Kolathaya, Shishir and Bhatnagar, Shalabh},
  editor       = {Krause, Andreas and Brunskill, Emma and Cho, Kyunghyun and Engelhardt, Barbara and Sabato, Sivan and Scarlett, Jonathan},
  title        = {Off-Policy Average Reward Actor-Critic with Deterministic Policy Search},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July 2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {30130--30203},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/saxena23a.html},
  timestamp    = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/SaxenaKKB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Authors are in "Last, First" form: written as "Prabuchandran K. J.", BibTeX
% would take the trailing initial "J." as the surname.
% NOTE(review): assumes "K. J." are initials and Prabuchandran is the sorting name.
@inproceedings{DBLP:conf/ro-man/KarumanchiDJB23,
  author       = {Karumanchi, Sambhu H. and
                  Diddigi, Raghuram Bharadwaj and
                  Prabuchandran, K. J. and
                  Bhatnagar, Shalabh},
  title        = {Autonomous {UAV} Navigation in Complex Environments using Human Feedback},
  booktitle    = {32nd {IEEE} International Conference on Robot and Human Interactive
                  Communication, {RO-MAN} 2023, Busan, Republic of Korea, August 28-31,
                  2023},
  pages        = {499--506},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/RO-MAN57019.2023.10309494},
  doi          = {10.1109/RO-MAN57019.2023.10309494},
  timestamp    = {Thu, 23 Nov 2023 21:16:36 +0100},
  biburl       = {https://dblp.org/rec/conf/ro-man/KarumanchiDJB23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% CoRR (arXiv) preprint 2303.07068.
@article{DBLP:journals/corr/abs-2303-07068,
  author       = {Mandal, Lakshmi and Bhatnagar, Shalabh},
  title        = {n-Step Temporal Difference Learning with Optimal n},
  journal      = {CoRR},
  volume       = {abs/2303.07068},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2303.07068},
  doi          = {10.48550/ARXIV.2303.07068},
  eprinttype   = {arXiv},
  eprint       = {2303.07068},
  timestamp    = {Thu, 16 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2303-07068.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% {Newton} is braced so sentence-casing styles keep the proper noun capitalised.
% Authors are in "Last, First" form: written as "Prashanth L. A.", BibTeX would
% take the trailing initial "A." as the surname.
% NOTE(review): assumes "L. A." are initials and Prashanth is the sorting name.
@article{DBLP:journals/corr/abs-2304-10951,
  author       = {Maniyar, Mizhaan Prajit and
                  Mondal, Akash and
                  Prashanth, L. A. and
                  Bhatnagar, Shalabh},
  title        = {A Cubic-regularized Policy {Newton} Algorithm for Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2304.10951},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2304.10951},
  doi          = {10.48550/ARXIV.2304.10951},
  eprinttype    = {arXiv},
  eprint       = {2304.10951},
  timestamp    = {Tue, 02 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2304-10951.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% CoRR (arXiv) preprint 2305.12125.
@article{DBLP:journals/corr/abs-2305-12125,
  author       = {Ramaswamy, Arunselvan and Bhatnagar, Shalabh and Saxena, Naman},
  title        = {A Framework for Provably Stable and Consistent Training of Deep Feedforward Networks},
  journal      = {CoRR},
  volume       = {abs/2305.12125},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.12125},
  doi          = {10.48550/ARXIV.2305.12125},
  eprinttype   = {arXiv},
  eprint       = {2305.12125},
  timestamp    = {Fri, 26 May 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-12125.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% CoRR (arXiv) preprint 2305.12239; shares title and authors with
% DBLP:conf/icml/SaxenaKKB23.
@article{DBLP:journals/corr/abs-2305-12239,
  author       = {Saxena, Naman and Khastagir, Subhojyoti and Kolathaya, Shishir and Bhatnagar, Shalabh},
  title        = {Off-Policy Average Reward Actor-Critic with Deterministic Policy Search},
  journal      = {CoRR},
  volume       = {abs/2305.12239},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.12239},
  doi          = {10.48550/ARXIV.2305.12239},
  eprinttype   = {arXiv},
  eprint       = {2305.12239},
  timestamp    = {Thu, 17 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-12239.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% CoRR (arXiv) preprint 2310.05000; single-author entry.
@article{DBLP:journals/corr/abs-2310-05000,
  author       = {Bhatnagar, Shalabh},
  title        = {The Reinforce Policy Gradient Algorithm Revisited},
  journal      = {CoRR},
  volume       = {abs/2310.05000},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.05000},
  doi          = {10.48550/ARXIV.2310.05000},
  eprinttype   = {arXiv},
  eprint       = {2310.05000},
  timestamp    = {Fri, 20 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-05000.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Authors are in "Last, First" form: written as "Prabuchandran K. J.", BibTeX
% would take the trailing initial "J." as the surname.
% NOTE(review): assumes "K. J." are initials and Prabuchandran is the sorting name.
% Shares title and authors with DBLP:journals/icl/BaratJB24.
@article{DBLP:journals/corr/abs-2310-05911,
  author       = {Barat, Arghyadeep and
                  Prabuchandran, K. J. and
                  Bhatnagar, Shalabh},
  title        = {Energy Management in a Cooperative Energy Harvesting Wireless Sensor
                  Network},
  journal      = {CoRR},
  volume       = {abs/2310.05911},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.05911},
  doi          = {10.48550/ARXIV.2310.05911},
  eprinttype    = {arXiv},
  eprint       = {2310.05911},
  timestamp    = {Thu, 23 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-05911.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% CoRR (arXiv) preprint 2310.16363.
@article{DBLP:journals/corr/abs-2310-16363,
  author       = {Panda, Prashansa and Bhatnagar, Shalabh},
  title        = {Finite Time Analysis of Constrained Actor Critic and Constrained Natural Actor Critic Algorithms},
  journal      = {CoRR},
  volume       = {abs/2310.16363},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2310.16363},
  doi          = {10.48550/ARXIV.2310.16363},
  eprinttype   = {arXiv},
  eprint       = {2310.16363},
  timestamp    = {Tue, 31 Oct 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2310-16363.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% {Markov} is braced so sentence-casing bibliography styles keep the proper noun capitalised.
@article{DBLP:journals/corr/abs-2311-11789,
  author       = {Lakshmi Mandal and
                  Chandrashekar Lakshminarayanan and
                  Shalabh Bhatnagar},
  title        = {Approximate Linear Programming and Decentralized Policy Improvement
                  in Cooperative Multi-agent {Markov} Decision Processes},
  journal      = {CoRR},
  volume       = {abs/2311.11789},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2311.11789},
  doi          = {10.48550/ARXIV.2311.11789},
  eprinttype    = {arXiv},
  eprint       = {2311.11789},
  timestamp    = {Thu, 23 Nov 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2311-11789.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Math. Oper. Res. 47(3).
@article{DBLP:journals/mor/RamaswamyB22,
  author       = {Ramaswamy, Arunselvan and Bhatnagar, Shalabh},
  title        = {Analyzing Approximate Value Iteration Algorithms},
  journal      = {Math. Oper. Res.},
  volume       = {47},
  number       = {3},
  pages        = {2138--2159},
  year         = {2022},
  url          = {https://doi.org/10.1287/moor.2021.1202},
  doi          = {10.1287/MOOR.2021.1202},
  timestamp    = {Mon, 05 Dec 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/mor/RamaswamyB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% {Markov} is braced so sentence-casing bibliography styles keep the proper noun capitalised.
@article{DBLP:journals/tac/KamanchiDB22,
  author       = {Chandramouli Kamanchi and
                  Raghuram Bharadwaj Diddigi and
                  Shalabh Bhatnagar},
  title        = {Generalized Second-Order Value Iteration in {Markov} Decision Processes},
  journal      = {{IEEE} Trans. Autom. Control.},
  volume       = {67},
  number       = {8},
  pages        = {4241--4247},
  year         = {2022},
  url          = {https://doi.org/10.1109/TAC.2021.3112851},
  doi          = {10.1109/TAC.2021.3112851},
  timestamp    = {Mon, 08 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tac/KamanchiDB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% {Q-Learning} is braced so sentence-casing styles do not lowercase the "Q"
% of the algorithm name.
@article{DBLP:journals/tac/DiddigiKB22,
  author       = {Raghuram Bharadwaj Diddigi and
                  Chandramouli Kamanchi and
                  Shalabh Bhatnagar},
  title        = {A Generalized Minimax {Q-Learning} Algorithm for Two-Player Zero-Sum
                  Stochastic Games},
  journal      = {{IEEE} Trans. Autom. Control.},
  volume       = {67},
  number       = {9},
  pages        = {4816--4823},
  year         = {2022},
  url          = {https://doi.org/10.1109/TAC.2022.3159453},
  doi          = {10.1109/TAC.2022.3159453},
  timestamp    = {Sat, 10 Sep 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tac/DiddigiKB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% booktitle: spelling corrected from "Twelveth" to "Twelfth".
% Shares title and authors with DBLP:journals/corr/abs-2111-11004.
@inproceedings{DBLP:conf/aaai/DebB22,
  author       = {Rohan Deb and
                  Shalabh Bhatnagar},
  title        = {Gradient Temporal Difference with Momentum: Stability and Convergence},
  booktitle    = {Thirty-Sixth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2022, Thirty-Fourth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2022, The Twelfth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2022 Virtual Event, February 22
                  - March 1, 2022},
  pages        = {6488--6496},
  publisher    = {{AAAI} Press},
  year         = {2022},
  url          = {https://doi.org/10.1609/aaai.v36i6.20601},
  doi          = {10.1609/AAAI.V36I6.20601},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/DebB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper in the Allerton 2022 proceedings.
@inproceedings{DBLP:conf/allerton/DebGB22,
  author       = {Deb, Rohan and Gandhi, Meet and Bhatnagar, Shalabh},
  title        = {Schedule Based Temporal Difference Algorithms},
  booktitle    = {58th Annual Allerton Conference on Communication, Control, and Computing, Allerton 2022, Monticello, IL, USA, September 27-30, 2022},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/Allerton49937.2022.9929388},
  doi          = {10.1109/ALLERTON49937.2022.9929388},
  timestamp    = {Fri, 11 Nov 2022 16:53:12 +0100},
  biburl       = {https://dblp.org/rec/conf/allerton/DebGB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% doi/url hold the bare identifier with a plain underscore: a LaTeX escape
% (\_) would be treated as part of the identifier wherever these fields are
% read verbatim, yielding a link that does not resolve.
% NOTE(review): if a legacy style prints these fields as ordinary text, load a
% url-aware package rather than re-escaping the underscore here.
@inproceedings{DBLP:conf/icaart/Shanmugasundaram22a,
  author       = {Priya Shanmugasundaram and
                  Shalabh Bhatnagar},
  editor       = {Ana Paula Rocha and
                  Luc Steels and
                  H. Jaap van den Herik},
  title        = {Co-operative Multi-agent Twin Delayed {DDPG} for Robust Phase Duration
                  Optimization of Large Road Networks},
  booktitle    = {Agents and Artificial Intelligence - 14th International Conference,
                  {ICAART} 2022, Virtual Event, February 3-5, 2022, Revised Selected
                  Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {13786},
  pages        = {122--142},
  publisher    = {Springer},
  year         = {2022},
  url          = {https://doi.org/10.1007/978-3-031-22953-4_6},
  doi          = {10.1007/978-3-031-22953-4_6},
  timestamp    = {Mon, 26 Jun 2023 20:44:19 +0200},
  biburl       = {https://dblp.org/rec/conf/icaart/Shanmugasundaram22a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper in the ICAART 2022 proceedings (Volume 2).
@inproceedings{DBLP:conf/icaart/Shanmugasundaram22,
  author       = {Shanmugasundaram, Priya and Bhatnagar, Shalabh},
  editor       = {Rocha, Ana Paula and Steels, Luc and van den Herik, H. Jaap},
  title        = {Robust Traffic Signal Timing Control using Multiagent Twin Delayed Deep Deterministic Policy Gradients},
  booktitle    = {Proceedings of the 14th International Conference on Agents and Artificial Intelligence, {ICAART} 2022, Volume 2, Online Streaming, February 3-5, 2022},
  pages        = {477--485},
  publisher    = {{SCITEPRESS}},
  year         = {2022},
  url          = {https://doi.org/10.5220/0010889300003116},
  doi          = {10.5220/0010889300003116},
  timestamp    = {Tue, 06 Jun 2023 14:58:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icaart/Shanmugasundaram22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper in the ICRA 2022 proceedings.
@inproceedings{DBLP:conf/icra/MishraSGKLSSBK22,
  author       = {Mishra, Utkarsh A. and Samineni, Soumya R. and Goel, Prakhar and Kunjeti, Chandravaran and Lodha, Himanshu and Singh, Aman and Sagi, Aditya and Bhatnagar, Shalabh and Kolathaya, Shishir},
  title        = {Dynamic Mirror Descent based Model Predictive Control for Accelerating Robot Learning},
  booktitle    = {2022 International Conference on Robotics and Automation, {ICRA} 2022, Philadelphia, PA, USA, May 23-27, 2022},
  pages        = {1631--1637},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/ICRA46639.2022.9812089},
  doi          = {10.1109/ICRA46639.2022.9812089},
  timestamp    = {Wed, 20 Jul 2022 18:22:23 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/MishraSGKLSSBK22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Authors are in "Last, First" form: written as "Prabuchandran K. J.", BibTeX
% would take the trailing initial "J." as the surname.
% NOTE(review): assumes "K. J." are initials and Prabuchandran is the sorting name.
% Shares title and authors with DBLP:journals/corr/abs-2110-10017.
@inproceedings{DBLP:conf/ijcnn/DiddigiJJB22,
  author       = {Diddigi, Raghuram Bharadwaj and
                  Jain, Prateek and
                  Prabuchandran, K. J. and
                  Bhatnagar, Shalabh},
  title        = {Neural Network Compatible Off-Policy Natural Actor-Critic Algorithm},
  booktitle    = {International Joint Conference on Neural Networks, {IJCNN} 2022, Padua,
                  Italy, July 18-23, 2022},
  pages        = {1--10},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/IJCNN55064.2022.9892303},
  doi          = {10.1109/IJCNN55064.2022.9892303},
  timestamp    = {Mon, 10 Oct 2022 17:40:09 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcnn/DiddigiJJB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% url holds the raw address with a plain underscore in "paper_files": a LaTeX
% escape (\_) would become part of the address wherever the field is read
% verbatim, yielding a link that does not resolve.
% Shares title and authors with DBLP:journals/corr/abs-2210-07573.
@inproceedings{DBLP:conf/nips/JayantB22,
  author       = {Ashish Kumar Jayant and
                  Shalabh Bhatnagar},
  editor       = {Sanmi Koyejo and
                  S. Mohamed and
                  A. Agarwal and
                  Danielle Belgrave and
                  K. Cho and
                  A. Oh},
  title        = {Model-based Safe Deep Reinforcement Learning via a Constrained Proximal
                  Policy Optimization Algorithm},
  booktitle    = {Advances in Neural Information Processing Systems 35: Annual Conference
                  on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans,
                  LA, USA, November 28 - December 9, 2022},
  year         = {2022},
  url          = {http://papers.nips.cc/paper_files/paper/2022/hash/9a8eb202c060b7d81f5889631cbcd47e-Abstract-Conference.html},
  timestamp    = {Mon, 08 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/JayantB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Authors are in "Last, First" form: written as "Prabuchandran K. J.", BibTeX
% would take the trailing initial "J." as the surname.
% NOTE(review): assumes "K. J." are initials and Prabuchandran is the sorting name.
@inproceedings{DBLP:conf/smc/PadakandlaJGB22,
  author       = {Padakandla, Sindhu and
                  Prabuchandran, K. J. and
                  Ganguly, Sourav and
                  Bhatnagar, Shalabh},
  title        = {Data Efficient Safe Reinforcement Learning},
  booktitle    = {{IEEE} International Conference on Systems, Man, and Cybernetics,
                  {SMC} 2022, Prague, Czech Republic, October 9-12, 2022},
  pages        = {1167--1172},
  publisher    = {{IEEE}},
  year         = {2022},
  url          = {https://doi.org/10.1109/SMC53654.2022.9945313},
  doi          = {10.1109/SMC53654.2022.9945313},
  timestamp    = {Thu, 01 Dec 2022 15:59:35 +0100},
  biburl       = {https://dblp.org/rec/conf/smc/PadakandlaJGB22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% CoRR (arXiv) preprint 2201.00286; the record carries no doi field.
@article{DBLP:journals/corr/abs-2201-00286,
  author       = {Raman, Arun and Shagrithaya, Keerthan and Bhatnagar, Shalabh},
  title        = {Reinforcement Learning for Task Specifications with Action-Constraints},
  journal      = {CoRR},
  volume       = {abs/2201.00286},
  year         = {2022},
  url          = {https://arxiv.org/abs/2201.00286},
  eprinttype   = {arXiv},
  eprint       = {2201.00286},
  timestamp    = {Mon, 10 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2201-00286.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% {Cauchy} is braced so sentence-casing styles keep the proper noun capitalised.
% Authors are in "Last, First" form: written as "Prashanth L. A.", BibTeX would
% take the trailing initial "A." as the surname.
% NOTE(review): assumes "L. A." are initials and Prashanth is the sorting name.
@article{DBLP:journals/corr/abs-2208-00290,
  author       = {Mondal, Akash and
                  Prashanth, L. A. and
                  Bhatnagar, Shalabh},
  title        = {A Gradient Smoothed Functional Algorithm with Truncated {Cauchy} Random
                  Perturbations for Stochastic Optimization},
  journal      = {CoRR},
  volume       = {abs/2208.00290},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2208.00290},
  doi          = {10.48550/ARXIV.2208.00290},
  eprinttype    = {arXiv},
  eprint       = {2208.00290},
  timestamp    = {Wed, 10 Aug 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2208-00290.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% CoRR (arXiv) preprint 2210.04470; shares title and authors with
% DBLP:journals/csysl/BhatnagarBG23.
@article{DBLP:journals/corr/abs-2210-04470,
  author       = {Bhatnagar, Shalabh and Borkar, Vivek S. and Guin, Soumyajit},
  title        = {Actor-Critic or Critic-Actor? {A} Tale of Two Time Scales},
  journal      = {CoRR},
  volume       = {abs/2210.04470},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.04470},
  doi          = {10.48550/ARXIV.2210.04470},
  eprinttype   = {arXiv},
  eprint       = {2210.04470},
  timestamp    = {Wed, 12 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-04470.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% {Markov} is braced so sentence-casing bibliography styles keep the proper noun capitalised.
% Shares authors and (up to letter case) title with DBLP:conf/cdc/GuinB23.
@article{DBLP:journals/corr/abs-2210-04527,
  author       = {Soumyajit Guin and
                  Shalabh Bhatnagar},
  title        = {A policy gradient approach for Finite Horizon Constrained {Markov} Decision
                  Processes},
  journal      = {CoRR},
  volume       = {abs/2210.04527},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.04527},
  doi          = {10.48550/ARXIV.2210.04527},
  eprinttype    = {arXiv},
  eprint       = {2210.04527},
  timestamp    = {Thu, 13 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-04527.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% CoRR (arXiv) preprint 2210.07573; shares title and authors with
% DBLP:conf/nips/JayantB22.
@article{DBLP:journals/corr/abs-2210-07573,
  author       = {Jayant, Ashish Kumar and Bhatnagar, Shalabh},
  title        = {Model-based Safe Deep Reinforcement Learning via a Constrained Proximal Policy Optimization Algorithm},
  journal      = {CoRR},
  volume       = {abs/2210.07573},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2210.07573},
  doi          = {10.48550/ARXIV.2210.07573},
  eprinttype   = {arXiv},
  eprint       = {2210.07573},
  timestamp    = {Tue, 18 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2210-07573.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Authors are in "Last, First" form: written as "Prashanth L. A.", BibTeX would
% take the trailing initial "A." as the surname.
% NOTE(review): assumes "L. A." are initials and Prashanth is the sorting name.
% Shares title and authors with DBLP:conf/ciss/BhatnagarA23.
@article{DBLP:journals/corr/abs-2212-10477,
  author       = {Bhatnagar, Shalabh and
                  Prashanth, L. A.},
  title        = {Generalized Simultaneous Perturbation Stochastic Approximation with
                  Reduced Estimator Bias},
  journal      = {CoRR},
  volume       = {abs/2212.10477},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2212.10477},
  doi          = {10.48550/ARXIV.2212.10477},
  eprinttype    = {arXiv},
  eprint       = {2212.10477},
  timestamp    = {Wed, 04 Jan 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2212-10477.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% {Bayesian} is braced so sentence-casing styles keep the proper adjective capitalised.
% Authors are in "Last, First" form: written as "Prabuchandran K. J.", BibTeX
% would take the trailing initial "J." as the surname.
% NOTE(review): assumes "K. J." are initials and Prabuchandran is the sorting name.
@article{DBLP:journals/apin/JPKB21,
  author       = {Prabuchandran, K. J. and
                  Penubothula, Santosh and
                  Kamanchi, Chandramouli and
                  Bhatnagar, Shalabh},
  title        = {Novel First Order {Bayesian} Optimization with an Application to Reinforcement
                  Learning},
  journal      = {Appl. Intell.},
  volume       = {51},
  number       = {3},
  pages        = {1565--1579},
  year         = {2021},
  url          = {https://doi.org/10.1007/s10489-020-01896-w},
  doi          = {10.1007/S10489-020-01896-W},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/apin/JPKB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Syst. Control. Lett. 150; the pages field holds a single
% number rather than a range.
@article{DBLP:journals/scl/KarmakarB21,
  author       = {Karmakar, Prasenjit and Bhatnagar, Shalabh},
  title        = {On tight bounds for function approximation error in risk-sensitive reinforcement learning},
  journal      = {Syst. Control. Lett.},
  volume       = {150},
  pages        = {104899},
  year         = {2021},
  url          = {https://doi.org/10.1016/j.sysconle.2021.104899},
  doi          = {10.1016/J.SYSCONLE.2021.104899},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/scl/KarmakarB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, IEEE Trans. Autom. Control 66(9).
@article{DBLP:journals/tac/RamaswamyBQ21,
  author       = {Ramaswamy, Arunselvan and Bhatnagar, Shalabh and Quevedo, Daniel E.},
  title        = {Asynchronous Stochastic Approximations With Asymptotically Biased Errors and Deep Multiagent Learning},
  journal      = {{IEEE} Trans. Autom. Control.},
  volume       = {66},
  number       = {9},
  pages        = {3969--3983},
  year         = {2021},
  url          = {https://doi.org/10.1109/TAC.2020.3026269},
  doi          = {10.1109/TAC.2020.3026269},
  timestamp    = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tac/RamaswamyBQ21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% {Markov} is braced so sentence-casing bibliography styles keep the proper noun capitalised.
@article{DBLP:journals/tac/KarmakarB21,
  author       = {Prasenjit Karmakar and
                  Shalabh Bhatnagar},
  title        = {Stochastic Approximation With Iterate-Dependent {Markov} Noise Under
                  Verifiable Conditions in Compact State Space With the Stability of
                  Iterates Not Ensured},
  journal      = {{IEEE} Trans. Autom. Control.},
  volume       = {66},
  number       = {12},
  pages        = {5941--5954},
  year         = {2021},
  url          = {https://doi.org/10.1109/TAC.2021.3057299},
  doi          = {10.1109/TAC.2021.3057299},
  timestamp    = {Wed, 15 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tac/KarmakarB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, IEEE Trans. Intell. Transp. Syst. 22(1).
@article{DBLP:journals/tits/SinglaPB21,
  author       = {Singla, Abhik and Padakandla, Sindhu and Bhatnagar, Shalabh},
  title        = {Memory-Based Deep Reinforcement Learning for Obstacle Avoidance in {UAV} With Limited Environment Knowledge},
  journal      = {{IEEE} Trans. Intell. Transp. Syst.},
  volume       = {22},
  number       = {1},
  pages        = {107--118},
  year         = {2021},
  url          = {https://doi.org/10.1109/TITS.2019.2954952},
  doi          = {10.1109/TITS.2019.2954952},
  timestamp    = {Tue, 02 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tits/SinglaPB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% AAMAS '21 paper; shares authors and (up to letter case) title with
% DBLP:journals/corr/abs-2101-02349.
@inproceedings{DBLP:conf/atal/ParnikaDDB21,
  author       = {Parnika, P. and Diddigi, Raghuram Bharadwaj and Danda, Sai Koti Reddy and Bhatnagar, Shalabh},
  editor       = {Dignum, Frank and Lomuscio, Alessio and Endriss, Ulle and Now{\'{e}}, Ann},
  title        = {Attention Actor-Critic Algorithm for Multi-Agent Constrained Co-operative Reinforcement Learning},
  booktitle    = {{AAMAS} '21: 20th International Conference on Autonomous Agents and Multiagent Systems, Virtual Event, United Kingdom, May 3-7, 2021},
  pages        = {1616--1618},
  publisher    = {{ACM}},
  year         = {2021},
  url          = {https://www.ifaamas.org/Proceedings/aamas2021/pdfs/p1616.pdf},
  doi          = {10.5555/3463952.3464178},
  timestamp    = {Wed, 20 Jul 2022 17:03:47 +0200},
  biburl       = {https://dblp.org/rec/conf/atal/ParnikaDDB21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% CoRR (arXiv) preprint 2101.02349; shares authors and (up to letter case)
% title with DBLP:conf/atal/ParnikaDDB21.
@article{DBLP:journals/corr/abs-2101-02349,
  author       = {Parnika, P. and Diddigi, Raghuram Bharadwaj and Danda, Sai Koti Reddy and Bhatnagar, Shalabh},
  title        = {Attention Actor-Critic algorithm for Multi-Agent Constrained Co-operative Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2101.02349},
  year         = {2021},
  url          = {https://arxiv.org/abs/2101.02349},
  eprinttype   = {arXiv},
  eprint       = {2101.02349},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2101-02349.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 2110.10017 (CoRR).
% Name fix: in "First Last" form BibTeX reads "Prabuchandran K. J." as
% surname "J."; the comma form makes "Prabuchandran" the sorting name and
% "K. J." the initials.
@article{DBLP:journals/corr/abs-2110-10017,
  author       = {Diddigi, Raghuram Bharadwaj and
                  Jain, Prateek and
                  Prabuchandran, K. J. and
                  Bhatnagar, Shalabh},
  title        = {Neural Network Compatible Off-Policy Natural Actor-Critic Algorithm},
  journal      = {CoRR},
  volume       = {abs/2110.10017},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.10017},
  eprinttype   = {arXiv},
  eprint       = {2110.10017},
  timestamp    = {Mon, 25 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-10017.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 2110.15093 (CoRR).
% Name fix: "Vivek VP" was parsed with surname "VP"; written here as
% "Vivek, V. P.", matching the "V. P. Vivek" spelling used by the ISGT 2024
% entry in this file.
% Title fix: the letter Q is brace-protected so sentence-casing styles do
% not lowercase it.
@article{DBLP:journals/corr/abs-2110-15093,
  author       = {Vivek, V. P. and
                  Bhatnagar, Shalabh},
  title        = {Finite Horizon {Q}-learning: Stability, Convergence and Simulations},
  journal      = {CoRR},
  volume       = {abs/2110.15093},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.15093},
  eprinttype   = {arXiv},
  eprint       = {2110.15093},
  timestamp    = {Tue, 02 Nov 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-15093.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 2111.11004 (CoRR). Names use the "Last, First" form;
% the eprinttype field is aligned with its neighbours.
@article{DBLP:journals/corr/abs-2111-11004,
  author       = {Deb, Rohan and
                  Bhatnagar, Shalabh},
  title        = {Gradient Temporal Difference with Momentum: Stability and Convergence},
  journal      = {CoRR},
  volume       = {abs/2111.11004},
  year         = {2021},
  url          = {https://arxiv.org/abs/2111.11004},
  eprinttype   = {arXiv},
  eprint       = {2111.11004},
  timestamp    = {Fri, 26 Nov 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2111-11004.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 2111.11768 (CoRR). Names use the "Last, First" form;
% the eprinttype field is aligned with its neighbours.
@article{DBLP:journals/corr/abs-2111-11768,
  author       = {Deb, Rohan and
                  Gandhi, Meet and
                  Bhatnagar, Shalabh},
  title        = {Schedule Based Temporal Difference Algorithms},
  journal      = {CoRR},
  volume       = {abs/2111.11768},
  year         = {2021},
  url          = {https://arxiv.org/abs/2111.11768},
  eprinttype   = {arXiv},
  eprint       = {2111.11768},
  timestamp    = {Fri, 26 Nov 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2111-11768.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 2112.02999 (CoRR). Names use the "Last, First" form;
% the eprinttype field is aligned with its neighbours.
@article{DBLP:journals/corr/abs-2112-02999,
  author       = {Mishra, Utkarsh A. and
                  Samineni, Soumya R. and
                  Goel, Prakhar and
                  Kunjeti, Chandravaran and
                  Lodha, Himanshu and
                  Singh, Aman and
                  Sagi, Aditya and
                  Bhatnagar, Shalabh and
                  Kolathaya, Shishir},
  title        = {Dynamic Mirror Descent based Model Predictive Control for Accelerating
                  Robot Learning},
  journal      = {CoRR},
  volume       = {abs/2112.02999},
  year         = {2021},
  url          = {https://arxiv.org/abs/2112.02999},
  eprinttype   = {arXiv},
  eprint       = {2112.02999},
  timestamp    = {Wed, 08 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2112-02999.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 2112.03515 (CoRR). Names use the "Last, First" form;
% the eprinttype field is aligned with its neighbours.
@article{DBLP:journals/corr/abs-2112-03515,
  author       = {Deb, Rohan and
                  Bhatnagar, Shalabh},
  title        = {N-Timescale Stochastic Approximation: Stability and Convergence},
  journal      = {CoRR},
  volume       = {abs/2112.03515},
  year         = {2021},
  url          = {https://arxiv.org/abs/2112.03515},
  eprinttype   = {arXiv},
  eprint       = {2112.03515},
  timestamp    = {Mon, 13 Dec 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2112-03515.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Applied Intelligence 50(11), 2020.
% Name fix: in "First Last" form BibTeX reads "Prabuchandran K. J." as
% surname "J."; the comma form makes "Prabuchandran" the sorting name and
% "K. J." the initials.
@article{DBLP:journals/apin/PadakandlaJB20,
  author       = {Padakandla, Sindhu and
                  Prabuchandran, K. J. and
                  Bhatnagar, Shalabh},
  title        = {Reinforcement learning algorithm for non-stationary environments},
  journal      = {Appl. Intell.},
  volume       = {50},
  number       = {11},
  pages        = {3590--3606},
  year         = {2020},
  url          = {https://doi.org/10.1007/s10489-020-01758-5},
  doi          = {10.1007/S10489-020-01758-5},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/apin/PadakandlaJB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, IEEE Control Systems Letters 4(1), 2020.
% Title fix: the exported title carried escaped math delimiters
% (\textdollar, \{Q\}) that typeset as literal dollar signs and braces plus
% a stray space before "-Learning". It is restored to inline math,
% brace-protected against recasing.
@article{DBLP:journals/csysl/KamanchiDB20,
  author       = {Kamanchi, Chandramouli and
                  Diddigi, Raghuram Bharadwaj and
                  Bhatnagar, Shalabh},
  title        = {Successive Over-Relaxation {$Q$}-Learning},
  journal      = {{IEEE} Control. Syst. Lett.},
  volume       = {4},
  number       = {1},
  pages        = {55--60},
  year         = {2020},
  url          = {https://doi.org/10.1109/LCSYS.2019.2921158},
  doi          = {10.1109/LCSYS.2019.2921158},
  timestamp    = {Tue, 24 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/csysl/KamanchiDB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, IEEE Control Systems Letters 4(3), 2020.
% Title fix: the letter Q is brace-protected so sentence-casing styles do
% not turn "Q-Learning" into "q-learning".
@article{DBLP:journals/csysl/JohnKB20,
  author       = {John, Indu and
                  Kamanchi, Chandramouli and
                  Bhatnagar, Shalabh},
  title        = {Generalized Speedy {Q}-Learning},
  journal      = {{IEEE} Control. Syst. Lett.},
  volume       = {4},
  number       = {3},
  pages        = {524--529},
  year         = {2020},
  url          = {https://doi.org/10.1109/LCSYS.2020.2970555},
  doi          = {10.1109/LCSYS.2020.2970555},
  timestamp    = {Tue, 16 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/csysl/JohnKB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Mathematics of Operations Research 45(4), 2020.
% Title fix: the proper noun "Markov" is brace-protected so sentence-casing
% styles keep its capital.
@article{DBLP:journals/mor/YajiB20,
  author       = {Yaji, Vinayaka G. and
                  Bhatnagar, Shalabh},
  title        = {Stochastic Recursive Inclusions in Two Timescales with Nonadditive
                  Iterate-Dependent {Markov} Noise},
  journal      = {Math. Oper. Res.},
  volume       = {45},
  number       = {4},
  pages        = {1405--1444},
  year         = {2020},
  url          = {https://doi.org/10.1287/moor.2019.1037},
  doi          = {10.1287/MOOR.2019.1037},
  timestamp    = {Thu, 16 Sep 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/mor/YajiB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, IEEE Transactions on Automatic Control 65(3), 2020.
% Author names use the "Last, First" form.
@article{DBLP:journals/tac/YajiB20,
  author       = {Yaji, Vinayaka G. and
                  Bhatnagar, Shalabh},
  title        = {Analysis of Stochastic Approximation Schemes With Set-Valued Maps
                  in the Absence of a Stability Guarantee and Their Stabilization},
  journal      = {{IEEE} Trans. Autom. Control.},
  volume       = {65},
  number       = {3},
  pages        = {1100--1115},
  year         = {2020},
  url          = {https://doi.org/10.1109/TAC.2019.2916688},
  doi          = {10.1109/TAC.2019.2916688},
  timestamp    = {Wed, 20 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tac/YajiB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, IEEE Transactions on Automatic Control 65(6), 2020.
% Name fix: in "First Last" form BibTeX reads "Prashanth L. A." as surname
% "A."; the comma form makes "Prashanth" the sorting name and "L. A." the
% initials.
@article{DBLP:journals/tac/ABBFM20,
  author       = {Prashanth, L. A. and
                  Bhatnagar, Shalabh and
                  Bhavsar, Nirav and
                  Fu, Michael C. and
                  Marcus, Steven I.},
  title        = {Random Directions Stochastic Approximation With Deterministic Perturbations},
  journal      = {{IEEE} Trans. Autom. Control.},
  volume       = {65},
  number       = {6},
  pages        = {2450--2465},
  year         = {2020},
  url          = {https://doi.org/10.1109/TAC.2019.2930821},
  doi          = {10.1109/TAC.2019.2930821},
  timestamp    = {Tue, 16 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tac/ABBFM20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, AAAI 2020. Author names use the "Last, First" form.
@inproceedings{DBLP:conf/aaai/DharmavaramRB20,
  author       = {Dharmavaram, Akshay and
                  Riemer, Matthew and
                  Bhatnagar, Shalabh},
  title        = {Hierarchical Average Reward Policy Gradient Algorithms (Student Abstract)},
  booktitle    = {The Thirty-Fourth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2020, The Thirty-Second Innovative Applications of Artificial Intelligence
                  Conference, {IAAI} 2020, The Tenth {AAAI} Symposium on Educational
                  Advances in Artificial Intelligence, {EAAI} 2020, New York, NY, USA,
                  February 7-12, 2020},
  pages        = {13777--13778},
  publisher    = {{AAAI} Press},
  year         = {2020},
  url          = {https://doi.org/10.1609/aaai.v34i10.7160},
  doi          = {10.1609/AAAI.V34I10.7160},
  timestamp    = {Sat, 21 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/DharmavaramRB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, CoRL 2020 (PMLR volume 155).
% Booktitle fix: the acronym "CoRL" is brace-protected, as the other
% booktitles in this file do for their acronyms, so a recasing style cannot
% alter it.
@inproceedings{DBLP:conf/corl/PaigwarKTKVJBGA20,
  author       = {Paigwar, Kartik and
                  Krishna, Lokesh and
                  Tirumala, Sashank and
                  Khetan, Naman and
                  Varma, Aditya and
                  Joglekar, Ashish and
                  Bhatnagar, Shalabh and
                  Ghosal, Ashitava and
                  Amrutur, Bharadwaj and
                  Kolathaya, Shishir},
  editor       = {Kober, Jens and
                  Ramos, Fabio and
                  Tomlin, Claire J.},
  title        = {Robust Quadrupedal Locomotion on Sloped Terrains: {A} Linear Policy
                  Approach},
  booktitle    = {4th Conference on Robot Learning, {CoRL} 2020, 16-18 November 2020,
                  Virtual Event / Cambridge, MA, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {155},
  pages        = {2257--2267},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {https://proceedings.mlr.press/v155/paigwar21a.html},
  timestamp    = {Tue, 18 Oct 2022 08:35:37 +0200},
  biburl       = {https://dblp.org/rec/conf/corl/PaigwarKTKVJBGA20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, ECAI 2020 (Frontiers in AI and Applications, vol. 325).
% Editor fix: "Giuseppe De Giacomo" in "First Last" form was parsed with
% surname "Giacomo" (a capitalised "De" is not treated as a particle); the
% comma form keeps the compound surname "De Giacomo" together.
% Booktitle fix: the protective braces now wrap only the acronym PAIS, not
% the opening parenthesis.
@inproceedings{DBLP:conf/ecai/DiddigiKB20,
  author       = {Diddigi, Raghuram Bharadwaj and
                  Kamanchi, Chandramouli and
                  Bhatnagar, Shalabh},
  editor       = {De Giacomo, Giuseppe and
                  Catal{\'{a}}, Alejandro and
                  Dilkina, Bistra and
                  Milano, Michela and
                  Barro, Sen{\'{e}}n and
                  Bugar{\'{\i}}n, Alberto and
                  Lang, J{\'{e}}r{\^{o}}me},
  title        = {A Convergent Off-Policy Temporal Difference Algorithm},
  booktitle    = {{ECAI} 2020 - 24th European Conference on Artificial Intelligence,
                  29 August-8 September 2020, Santiago de Compostela, Spain, August
                  29 - September 8, 2020 - Including 10th Conference on Prestigious
                  Applications of Artificial Intelligence ({PAIS} 2020)},
  series       = {Frontiers in Artificial Intelligence and Applications},
  volume       = {325},
  pages        = {1103--1110},
  publisher    = {{IOS} Press},
  year         = {2020},
  url          = {https://doi.org/10.3233/FAIA200207},
  doi          = {10.3233/FAIA200207},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ecai/DiddigiKB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, IJCNN 2020. Author names use the "Last, First" form.
@inproceedings{DBLP:conf/ijcnn/JohnB20,
  author       = {John, Indu and
                  Bhatnagar, Shalabh},
  title        = {Deep Reinforcement Learning with Successive Over-Relaxation and its
                  Application in Autoscaling Cloud Resources},
  booktitle    = {2020 International Joint Conference on Neural Networks, {IJCNN} 2020,
                  Glasgow, United Kingdom, July 19-24, 2020},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/IJCNN48605.2020.9206598},
  doi          = {10.1109/IJCNN48605.2020.9206598},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcnn/JohnB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, ISGT Europe 2020. Author names use the "Last, First"
% form.
@inproceedings{DBLP:conf/isgteurope/NayakECDRSDB20,
  author       = {Nayak, Shravan and
                  Ekbote, Chanakya Ajit and
                  Chauhan, Annanya Pratap Singh and
                  Diddigi, Raghuram Bharadwaj and
                  Ray, Prishita and
                  Sikdar, Abhinava and
                  Danda, Sai Koti Reddy and
                  Bhatnagar, Shalabh},
  title        = {Stochastic Game Frameworks for Efficient Energy Management in Microgrid
                  Networks},
  booktitle    = {{IEEE} {PES} Innovative Smart Grid Technologies Europe, {ISGT} Europe
                  2020, Delft, The Netherlands, October 26-28, 2020},
  pages        = {116--120},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/ISGT-Europe47291.2020.9248952},
  doi          = {10.1109/ISGT-EUROPE47291.2020.9248952},
  timestamp    = {Tue, 21 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/isgteurope/NayakECDRSDB20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, PIMRC 2020.
% Title fix: the mixed-case acronym "IoT" is brace-protected so
% sentence-casing styles do not render it as "iot".
@inproceedings{DBLP:conf/pimrc/Padakandla0B20,
  author       = {Padakandla, Sindhu and
                  Rao, Shilpa and
                  Bhatnagar, Shalabh},
  title        = {Learning-Based Resource Allocation in Industrial {IoT} Systems},
  booktitle    = {31st {IEEE} Annual International Symposium on Personal, Indoor and
                  Mobile Radio Communications, {PIMRC} 2020, London, United Kingdom,
                  August 31 - September 3, 2020},
  pages        = {1--7},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/PIMRC48278.2020.9217170},
  doi          = {10.1109/PIMRC48278.2020.9217170},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/pimrc/Padakandla0B20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, RO-MAN 2020. Author names use the "Last, First" form.
@inproceedings{DBLP:conf/ro-man/TirumalaGPSJBGA20,
  author       = {Tirumala, Sashank and
                  Gubbi, Sagar Venkatesh and
                  Paigwar, Kartik and
                  Sagi, Aditya and
                  Joglekar, Ashish and
                  Bhatnagar, Shalabh and
                  Ghosal, Ashitava and
                  Amrutur, Bharadwaj and
                  Kolathaya, Shishir},
  title        = {Learning Stable Manoeuvres in Quadruped Robots from Expert Demonstrations},
  booktitle    = {29th {IEEE} International Conference on Robot and Human Interactive
                  Communication, {RO-MAN} 2020, Naples, Italy, August 31 - September
                  4, 2020},
  pages        = {1107--1112},
  publisher    = {{IEEE}},
  year         = {2020},
  url          = {https://doi.org/10.1109/RO-MAN47096.2020.9223511},
  doi          = {10.1109/RO-MAN47096.2020.9223511},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ro-man/TirumalaGPSJBGA20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 2002.02084 (CoRR). Names use the "Last, First" form;
% the eprinttype field is aligned with its neighbours.
@article{DBLP:journals/corr/abs-2002-02084,
  author       = {Nayak, Shravan and
                  Ekbote, Chanakya Ajit and
                  Chauhan, Annanya Pratap Singh and
                  Diddigi, Raghuram Bharadwaj and
                  Ray, Prishita and
                  Sikdar, Abhinava and
                  Danda, Sai Koti Reddy and
                  Bhatnagar, Shalabh},
  title        = {A Stochastic Game Framework for Efficient Energy Management in Microgrid
                  Networks},
  journal      = {CoRR},
  volume       = {abs/2002.02084},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.02084},
  eprinttype   = {arXiv},
  eprint       = {2002.02084},
  timestamp    = {Mon, 10 Feb 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-02084.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 2007.14290 (CoRR). Names use the "Last, First" form;
% the eprinttype field is aligned with its neighbours.
@article{DBLP:journals/corr/abs-2007-14290,
  author       = {Tirumala, Sashank and
                  Gubbi, Sagar Venkatesh and
                  Paigwar, Kartik and
                  Sagi, Aditya and
                  Joglekar, Ashish and
                  Bhatnagar, Shalabh and
                  Ghosal, Ashitava and
                  Amrutur, Bharadwaj and
                  Kolathaya, Shishir},
  title        = {Learning Stable Manoeuvres in Quadruped Robots from Expert Demonstrations},
  journal      = {CoRR},
  volume       = {abs/2007.14290},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.14290},
  eprinttype   = {arXiv},
  eprint       = {2007.14290},
  timestamp    = {Mon, 03 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-14290.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 2009.00821 (CoRR). Names use the "Last, First" form;
% the eprinttype field is aligned with its neighbours.
@article{DBLP:journals/corr/abs-2009-00821,
  author       = {Gandhi, Meet and
                  Kundu, Atreyee and
                  Bhatnagar, Shalabh},
  title        = {A reinforcement learning approach to hybrid control design},
  journal      = {CoRR},
  volume       = {abs/2009.00821},
  year         = {2020},
  url          = {https://arxiv.org/abs/2009.00821},
  eprinttype   = {arXiv},
  eprint       = {2009.00821},
  timestamp    = {Wed, 16 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2009-00821.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 2010.06142 (CoRR).
% Name fix: "Dhuruva Priyan G. M" in "First Last" form was parsed with
% surname "M"; the comma form treats "Dhuruva Priyan" as the sorting name
% and "G. M." as initials. NOTE(review): confirm the author's preferred
% name order.
% Title fix: the proper noun "Kronecker" is brace-protected against
% sentence-casing.
@article{DBLP:journals/corr/abs-2010-06142,
  author       = {Dhuruva Priyan, G. M. and
                  Singla, Abhik and
                  Bhatnagar, Shalabh},
  title        = {Hindsight Experience Replay with {Kronecker} Product Approximate Curvature},
  journal      = {CoRR},
  volume       = {abs/2010.06142},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.06142},
  eprinttype   = {arXiv},
  eprint       = {2010.06142},
  timestamp    = {Tue, 20 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-06142.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 2010.16342 (CoRR). Names use the "Last, First" form;
% the eprinttype field is aligned with its neighbours.
@article{DBLP:journals/corr/abs-2010-16342,
  author       = {Paigwar, Kartik and
                  Krishna, Lokesh and
                  Tirumala, Sashank and
                  Khetan, Naman and
                  Sagi, Aditya and
                  Joglekar, Ashish and
                  Bhatnagar, Shalabh and
                  Ghosal, Ashitava and
                  Amrutur, Bharadwaj and
                  Kolathaya, Shishir},
  title        = {Robust Quadrupedal Locomotion on Sloped Terrains: {A} Linear Policy
                  Approach},
  journal      = {CoRR},
  volume       = {abs/2010.16342},
  year         = {2020},
  url          = {https://arxiv.org/abs/2010.16342},
  eprinttype   = {arXiv},
  eprint       = {2010.16342},
  timestamp    = {Tue, 03 Nov 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2010-16342.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, IEEE Control Systems Letters 3(3), 2019.
% Name fix: in "First Last" form BibTeX reads "Prabuchandran K. J." as
% surname "J."; the comma form makes "Prabuchandran" the sorting name and
% "K. J." the initials.
@article{DBLP:journals/csysl/KamanchiDJB19,
  author       = {Kamanchi, Chandramouli and
                  Diddigi, Raghuram Bharadwaj and
                  Prabuchandran, K. J. and
                  Bhatnagar, Shalabh},
  title        = {An Online Sample-Based Method for Mode Estimation Using {ODE} Analysis
                  of Stochastic Approximation Algorithms},
  journal      = {{IEEE} Control. Syst. Lett.},
  volume       = {3},
  number       = {3},
  pages        = {697--702},
  year         = {2019},
  url          = {https://doi.org/10.1109/LCSYS.2019.2916467},
  doi          = {10.1109/LCSYS.2019.2916467},
  timestamp    = {Tue, 24 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/csysl/KamanchiDJB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, IEEE Transactions on Automatic Control 64(6), 2019.
% Title fix: straight double quotes typeset as two closing quotes in LaTeX
% and clash with babel shorthands; they are replaced by TeX opening and
% closing quote ligatures. The proper noun "Markov" is brace-protected
% against sentence-casing.
@article{DBLP:journals/tac/RamaswamyB19,
  author       = {Ramaswamy, Arunselvan and
                  Bhatnagar, Shalabh},
  title        = {Stability of Stochastic Approximations With ``Controlled {Markov}''
                  Noise and Temporal Difference Learning},
  journal      = {{IEEE} Trans. Autom. Control.},
  volume       = {64},
  number       = {6},
  pages        = {2614--2620},
  year         = {2019},
  url          = {https://doi.org/10.1109/TAC.2018.2874687},
  doi          = {10.1109/TAC.2018.2874687},
  timestamp    = {Wed, 20 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tac/RamaswamyB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, Allerton 2019. Author names use the "Last, First" form.
@inproceedings{DBLP:conf/allerton/JosephB19,
  author       = {Joseph, Ajin George and
                  Bhatnagar, Shalabh},
  title        = {Stochastic Approximation Trackers for Model-Based Search},
  booktitle    = {57th Annual Allerton Conference on Communication, Control, and Computing,
                  Allerton 2019, Monticello, IL, USA, September 24-27, 2019},
  pages        = {741--748},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ALLERTON.2019.8919816},
  doi          = {10.1109/ALLERTON.2019.8919816},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/allerton/JosephB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, AAMAS 2019.
% Name fix: in "First Last" form BibTeX reads "Prabuchandran K. J." as
% surname "J."; the comma form makes "Prabuchandran" the sorting name and
% "K. J." the initials.
% URL fix: the ACM Digital Library link uses https, like the other
% publisher links in this file.
@inproceedings{DBLP:conf/atal/DiddigiRJB19,
  author       = {Diddigi, Raghuram Bharadwaj and
                  Danda, Sai Koti Reddy and
                  Prabuchandran, K. J. and
                  Bhatnagar, Shalabh},
  editor       = {Elkind, Edith and
                  Veloso, Manuela and
                  Agmon, Noa and
                  Taylor, Matthew E.},
  title        = {Actor-Critic Algorithms for Constrained Multi-agent Reinforcement
                  Learning},
  booktitle    = {Proceedings of the 18th International Conference on Autonomous Agents
                  and MultiAgent Systems, {AAMAS} '19, Montreal, QC, Canada, May 13-17,
                  2019},
  pages        = {1931--1933},
  publisher    = {International Foundation for Autonomous Agents and Multiagent Systems},
  year         = {2019},
  url          = {https://dl.acm.org/citation.cfm?id=3331967},
  timestamp    = {Mon, 18 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/DiddigiRJB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, CDC 2019. Author names use the "Last, First" form.
@inproceedings{DBLP:conf/cdc/JosephB19,
  author       = {Joseph, Ajin George and
                  Bhatnagar, Shalabh},
  title        = {An Adaptive and Incremental Approach to Quantile Estimation},
  booktitle    = {58th {IEEE} Conference on Decision and Control, {CDC} 2019, Nice,
                  France, December 11-13, 2019},
  pages        = {6025--6031},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/CDC40024.2019.9029803},
  doi          = {10.1109/CDC40024.2019.9029803},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cdc/JosephB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, COMAD/CODS 2019. Author and editor names use the
% "Last, First" form.
@inproceedings{DBLP:conf/comad/JohnB19,
  author       = {John, Indu and
                  Bhatnagar, Shalabh},
  editor       = {Krishnapuram, Raghu and
                  Singla, Parag},
  title        = {Efficient Budget Allocation and Task Assignment in Crowdsourcing},
  booktitle    = {Proceedings of the {ACM} India Joint International Conference on Data
                  Science and Management of Data, {COMAD/CODS} 2019, Kolkata, India,
                  January 3-5, 2019},
  pages        = {318--321},
  publisher    = {{ACM}},
  year         = {2019},
  url          = {https://doi.org/10.1145/3297001.3297050},
  doi          = {10.1145/3297001.3297050},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/comad/JohnB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, ICMLA 2019. Author and editor names use the
% "Last, First" form.
@inproceedings{DBLP:conf/icmla/JohnKB19,
  author       = {John, Indu and
                  Karumanchi, Ravikumar and
                  Bhatnagar, Shalabh},
  editor       = {Wani, M. Arif and
                  Khoshgoftaar, Taghi M. and
                  Wang, Dingding and
                  Wang, Huanjing and
                  Seliya, Naeem},
  title        = {Predictive and Prescriptive Analytics for Performance Optimization:
                  Framework and a Case Study on a Large-Scale Enterprise System},
  booktitle    = {18th {IEEE} International Conference On Machine Learning And Applications,
                  {ICMLA} 2019, Boca Raton, FL, USA, December 16-19, 2019},
  pages        = {876--881},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICMLA.2019.00152},
  doi          = {10.1109/ICMLA.2019.00152},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icmla/JohnKB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, ICRA 2019. Author names use the "Last, First" form.
@inproceedings{DBLP:conf/icra/SinglaBDBGAK19,
  author       = {Singla, Abhik and
                  Bhattacharya, Shounak and
                  Dholakiya, Dhaivat and
                  Bhatnagar, Shalabh and
                  Ghosal, Ashitava and
                  Amrutur, Bharadwaj and
                  Kolathaya, Shishir},
  title        = {Realizing Learned Quadruped Locomotion Behaviors through Kinematic
                  Motion Primitives},
  booktitle    = {International Conference on Robotics and Automation, {ICRA} 2019,
                  Montreal, QC, Canada, May 20-24, 2019},
  pages        = {7434--7440},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICRA.2019.8794179},
  doi          = {10.1109/ICRA.2019.8794179},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/SinglaBDBGAK19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, RO-MAN 2019. Author names use the "Last, First" form;
% the single-word name "Abhimanyu" is kept as given.
@inproceedings{DBLP:conf/ro-man/BhattacharyaSAD19,
  author       = {Bhattacharya, Shounak and
                  Singla, Abhik and
                  Abhimanyu and
                  Dholakiya, Dhaivat and
                  Bhatnagar, Shalabh and
                  Amrutur, Bharadwaj and
                  Ghosal, Ashitava and
                  Kolathaya, Shishir},
  title        = {Learning Active Spine Behaviors for Dynamic and Efficient Locomotion
                  in Quadruped Robots},
  booktitle    = {28th {IEEE} International Conference on Robot and Human Interactive
                  Communication, {RO-MAN} 2019, New Delhi, India, October 14-18, 2019},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/RO-MAN46459.2019.8956332},
  doi          = {10.1109/RO-MAN46459.2019.8956332},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ro-man/BhattacharyaSAD19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, RO-MAN 2019. Author names use the "Last, First" form;
% the single-word name "Abhimanyu" is kept as given.
@inproceedings{DBLP:conf/ro-man/KolathayaGAJSDA19,
  author       = {Kolathaya, Shishir and
                  Ghosal, Ashitava and
                  Amrutur, Bharadwaj and
                  Joglekar, Ashish and
                  Shetty, Suhan and
                  Dholakiya, Dhaivat and
                  Abhimanyu and
                  Sagi, Aditya and
                  Bhattacharya, Shounak and
                  Singla, Abhik and
                  Bhatnagar, Shalabh},
  title        = {Trajectory based Deep Policy Search for Quadrupedal Walking},
  booktitle    = {28th {IEEE} International Conference on Robot and Human Interactive
                  Communication, {RO-MAN} 2019, New Delhi, India, October 14-18, 2019},
  pages        = {1--6},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/RO-MAN46459.2019.8956369},
  doi          = {10.1109/RO-MAN46459.2019.8956369},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ro-man/KolathayaGAJSDA19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Workshop paper, FAS*W at SASO/ICCAC 2019.
% Booktitle fixes: the city name is spelled with its ring accent via a
% LaTeX escape, and the workshop acronym is brace-protected like the other
% acronyms in this file.
@inproceedings{DBLP:conf/saso/JohnSB19,
  author       = {John, Indu and
                  Sreekantan, Aiswarya and
                  Bhatnagar, Shalabh},
  title        = {Efficient Adaptive Resource Provisioning for Cloud Applications using
                  Reinforcement Learning},
  booktitle    = {{IEEE} 4th International Workshops on Foundations and Applications
                  of Self* Systems, {FAS*W@SASO/ICCAC} 2019, Ume{\aa}, Sweden, June 16-20,
                  2019},
  pages        = {271--272},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/FAS-W.2019.00077},
  doi          = {10.1109/FAS-W.2019.00077},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/saso/JohnSB19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 1901.00697 (CoRR).
% URL fix: the arXiv link uses https, consistent with the 2020 and later
% arXiv entries in this file. The eprinttype field is aligned with its
% neighbours.
@article{DBLP:journals/corr/abs-1901-00697,
  author       = {Dholakiya, Dhaivat and
                  Bhattacharya, Shounak and
                  Gunalan, Ajay and
                  Singla, Abhik and
                  Bhatnagar, Shalabh and
                  Amrutur, Bharadwaj and
                  Ghosal, Ashitava and
                  Kolathaya, Shishir},
  title        = {Design, Development and Experimental Realization of a Quadrupedal
                  Research Platform: Stoch},
  journal      = {CoRR},
  volume       = {abs/1901.00697},
  year         = {2019},
  url          = {https://arxiv.org/abs/1901.00697},
  eprinttype   = {arXiv},
  eprint       = {1901.00697},
  timestamp    = {Thu, 31 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-00697.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 1902.03806 (CoRR).
% Name fixes: "Chandramouli K" was parsed with surname "K"; it is expanded
% to "Kamanchi, Chandramouli", the spelling used by the journal record
% DBLP:journals/csysl/KamanchiDJB19, which has a near-identical title and
% the same co-authors. NOTE(review): confirm this is the same author.
% "Prabuchandran K. J." was parsed with surname "J." and is written in
% comma form.
% URL fix: the arXiv link uses https, as the newer arXiv entries do.
@article{DBLP:journals/corr/abs-1902-03806,
  author       = {Kamanchi, Chandramouli and
                  Diddigi, Raghuram Bharadwaj and
                  Prabuchandran, K. J. and
                  Bhatnagar, Shalabh},
  title        = {An Online Sample Based Method for Mode Estimation using {ODE} Analysis
                  of Stochastic Approximation Algorithms},
  journal      = {CoRR},
  volume       = {abs/1902.03806},
  year         = {2019},
  url          = {https://arxiv.org/abs/1902.03806},
  eprinttype   = {arXiv},
  eprint       = {1902.03806},
  timestamp    = {Tue, 21 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1902-03806.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint 1903.03812 (CoRR).
% Title fix: the letter Q is brace-protected so sentence-casing styles do
% not turn "Q-Learning" into "q-learning".
% URL fix: the arXiv link uses https, as the newer arXiv entries do.
@article{DBLP:journals/corr/abs-1903-03812,
  author       = {Kamanchi, Chandramouli and
                  Diddigi, Raghuram Bharadwaj and
                  Bhatnagar, Shalabh},
  title        = {Successive Over Relaxation {Q}-Learning},
  journal      = {CoRR},
  volume       = {abs/1903.03812},
  year         = {2019},
  url          = {https://arxiv.org/abs/1903.03812},
  eprinttype   = {arXiv},
  eprint       = {1903.03812},
  timestamp    = {Sun, 31 Mar 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1903-03812.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1905.02907, 2019). "Prabuchandran K. J." is kept
% in its exported token order.
@article{DBLP:journals/corr/abs-1905-02907,
  author       = {Diddigi, Raghuram Bharadwaj and
                  Danda, Sai Koti Reddy and
                  Prabuchandran K. J. and
                  Bhatnagar, Shalabh},
  title        = {Actor-Critic Algorithms for Constrained Multi-agent Reinforcement
                  Learning},
  journal      = {CoRR},
  volume       = {abs/1905.02907},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.02907},
  eprinttype   = {arXiv},
  eprint       = {1905.02907},
  timestamp    = {Mon, 27 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-02907.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1905.03927, 2019).
@article{DBLP:journals/corr/abs-1905-03927,
  author       = {Kamanchi, Chandramouli and
                  Diddigi, Raghuram Bharadwaj and
                  Bhatnagar, Shalabh},
  title        = {Second Order Value Iteration in Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/1905.03927},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.03927},
  eprinttype   = {arXiv},
  eprint       = {1905.03927},
  timestamp    = {Mon, 27 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-03927.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1905.03970, 2019). "Prabuchandran K. J." is kept
% in its exported token order.
@article{DBLP:journals/corr/abs-1905-03970,
  author       = {Padakandla, Sindhu and
                  Prabuchandran K. J. and
                  Bhatnagar, Shalabh},
  title        = {Reinforcement Learning in Non-Stationary Environments},
  journal      = {CoRR},
  volume       = {abs/1905.03970},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.03970},
  eprinttype   = {arXiv},
  eprint       = {1905.03970},
  timestamp    = {Mon, 27 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-03970.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1905.06077, 2019). "Abhimanyu" is a single-token
% name and is left unchanged.
@article{DBLP:journals/corr/abs-1905-06077,
  author       = {Bhattacharya, Shounak and
                  Singla, Abhik and
                  Abhimanyu and
                  Dholakiya, Dhaivat and
                  Bhatnagar, Shalabh and
                  Amrutur, Bharadwaj and
                  Ghosal, Ashitava and
                  Kolathaya, Shishir},
  title        = {Learning Active Spine Behaviors for Dynamic and Efficient Locomotion
                  in Quadruped Robots},
  journal      = {CoRR},
  volume       = {abs/1905.06077},
  year         = {2019},
  url          = {http://arxiv.org/abs/1905.06077},
  eprinttype   = {arXiv},
  eprint       = {1905.06077},
  timestamp    = {Tue, 28 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1905-06077.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1906.06659, 2019).
@article{DBLP:journals/corr/abs-1906-06659,
  author       = {Diddigi, Raghuram Bharadwaj and
                  Kamanchi, Chandramouli and
                  Bhatnagar, Shalabh},
  title        = {Solution of Two-Player Zero-Sum Game by Successive Relaxation},
  journal      = {CoRR},
  volume       = {abs/1906.06659},
  year         = {2019},
  url          = {http://arxiv.org/abs/1906.06659},
  eprinttype   = {arXiv},
  eprint       = {1906.06659},
  timestamp    = {Mon, 24 Jun 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1906-06659.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1911.00397, 2019). The "Q" in the title is
% brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-1911-00397,
  author       = {John, Indu and
                  Kamanchi, Chandramouli and
                  Bhatnagar, Shalabh},
  title        = {Generalized Speedy {Q}-learning},
  journal      = {CoRR},
  volume       = {abs/1911.00397},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.00397},
  eprinttype   = {arXiv},
  eprint       = {1911.00397},
  timestamp    = {Mon, 11 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-00397.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1911.05697, 2019).
@article{DBLP:journals/corr/abs-1911-05697,
  author       = {Diddigi, Raghuram Bharadwaj and
                  Kamanchi, Chandramouli and
                  Bhatnagar, Shalabh},
  title        = {A Convergent Off-Policy Temporal Difference Algorithm},
  journal      = {CoRR},
  volume       = {abs/1911.05697},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.05697},
  eprinttype   = {arXiv},
  eprint       = {1911.05697},
  timestamp    = {Mon, 02 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-05697.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1911.08826, 2019).
@article{DBLP:journals/corr/abs-1911-08826,
  author       = {Dharmavaram, Akshay and
                  Riemer, Matthew and
                  Bhatnagar, Shalabh},
  title        = {Hierarchical Average Reward Policy Gradient Algorithms},
  journal      = {CoRR},
  volume       = {abs/1911.08826},
  year         = {2019},
  url          = {http://arxiv.org/abs/1911.08826},
  eprinttype   = {arXiv},
  eprint       = {1911.08826},
  timestamp    = {Tue, 03 Dec 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1911-08826.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1912.12907, 2019).
@article{DBLP:journals/corr/abs-1912-12907,
  author       = {Tirumala, Sashank and
                  Sagi, Aditya and
                  Paigwar, Kartik and
                  Joglekar, Ashish and
                  Bhatnagar, Shalabh and
                  Ghosal, Ashitava and
                  Amrutur, Bharadwaj and
                  Kolathaya, Shishir},
  title        = {Gait Library Synthesis for Quadruped Robots via Augmented Random Search},
  journal      = {CoRR},
  volume       = {abs/1912.12907},
  year         = {2019},
  url          = {http://arxiv.org/abs/1912.12907},
  eprinttype   = {arXiv},
  eprint       = {1912.12907},
  timestamp    = {Sat, 04 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-12907.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, INFORMS J. Comput. 30(1), 2018.
@article{DBLP:journals/informs/ZhouB18,
  author       = {Zhou, Enlu and
                  Bhatnagar, Shalabh},
  title        = {Gradient-Based Adaptive Stochastic Search for Simulation Optimization
                  Over Continuous Space},
  journal      = {{INFORMS} J. Comput.},
  volume       = {30},
  number       = {1},
  pages        = {154--167},
  year         = {2018},
  url          = {https://doi.org/10.1287/ijoc.2017.0771},
  doi          = {10.1287/IJOC.2017.0771},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/informs/ZhouB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Mach. Learn. 107(6), 2018. "Markov" is brace-protected so
% sentence-casing styles keep the proper noun capitalised.
@article{DBLP:journals/ml/JosephB18,
  author       = {Joseph, Ajin George and
                  Bhatnagar, Shalabh},
  title        = {An incremental off-policy search in a model-free {Markov} decision process
                  using a single sample path},
  journal      = {Mach. Learn.},
  volume       = {107},
  number       = {6},
  pages        = {969--1011},
  year         = {2018},
  url          = {https://doi.org/10.1007/s10994-018-5697-1},
  doi          = {10.1007/S10994-018-5697-1},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ml/JosephB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Mach. Learn. 107(8-10), 2018.
@article{DBLP:journals/ml/JosephB18a,
  author       = {Joseph, Ajin George and
                  Bhatnagar, Shalabh},
  title        = {An online prediction algorithm for reinforcement learning with linear
                  function approximation using cross entropy method},
  journal      = {Mach. Learn.},
  volume       = {107},
  number       = {8-10},
  pages        = {1385--1429},
  year         = {2018},
  url          = {https://doi.org/10.1007/s10994-018-5727-z},
  doi          = {10.1007/S10994-018-5727-Z},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ml/JosephB18a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Math. Oper. Res. 43(1), 2018. "Markov" is brace-protected
% so sentence-casing styles keep the proper noun capitalised.
@article{DBLP:journals/mor/KarmakarB18,
  author       = {Karmakar, Prasenjit and
                  Bhatnagar, Shalabh},
  title        = {Two Time-Scale Stochastic Approximation with Controlled {Markov} Noise
                  and Off-Policy Temporal-Difference Learning},
  journal      = {Math. Oper. Res.},
  volume       = {43},
  number       = {1},
  pages        = {130--151},
  year         = {2018},
  url          = {https://doi.org/10.1287/moor.2017.0855},
  doi          = {10.1287/MOOR.2017.0855},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/mor/KarmakarB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, IEEE Trans. Autom. Control 63(4), 2018. "Markov" is
% brace-protected against sentence-casing; the stray period after the
% unabbreviated word "Control" in the journal name is removed.
@article{DBLP:journals/tac/Lakshminarayanan18,
  author       = {Lakshminarayanan, Chandrashekar and
                  Bhatnagar, Shalabh and
                  Szepesv{\'{a}}ri, Csaba},
  title        = {A Linearly Relaxed Approximate Linear Program for {Markov} Decision
                  Processes},
  journal      = {{IEEE} Trans. Autom. Control},
  volume       = {63},
  number       = {4},
  pages        = {1185--1191},
  year         = {2018},
  url          = {https://doi.org/10.1109/TAC.2017.2743163},
  doi          = {10.1109/TAC.2017.2743163},
  timestamp    = {Wed, 20 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tac/Lakshminarayanan18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, IEEE Trans. Autom. Control 63(5), 2018. The stray period
% after the unabbreviated word "Control" in the journal name is removed.
@article{DBLP:journals/tac/RamaswamyB18,
  author       = {Ramaswamy, Arunselvan and
                  Bhatnagar, Shalabh},
  title        = {Analysis of Gradient Descent Methods With Nondiminishing Bounded Errors},
  journal      = {{IEEE} Trans. Autom. Control},
  volume       = {63},
  number       = {5},
  pages        = {1465--1471},
  year         = {2018},
  url          = {https://doi.org/10.1109/TAC.2017.2744598},
  doi          = {10.1109/TAC.2017.2744598},
  timestamp    = {Wed, 20 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tac/RamaswamyB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Telecommun. Syst. 68(1), 2018. "Karmeshu" is a
% single-token name and is left unchanged.
@article{DBLP:journals/telsys/BhatnagarPK18,
  author       = {Bhatnagar, Shalabh and
                  Patel, Sanjeev and
                  Karmeshu},
  title        = {A stochastic approximation approach to active queue management},
  journal      = {Telecommun. Syst.},
  volume       = {68},
  number       = {1},
  pages        = {89--104},
  year         = {2018},
  url          = {https://doi.org/10.1007/s11235-017-0377-1},
  doi          = {10.1007/S11235-017-0377-1},
  timestamp    = {Thu, 13 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/telsys/BhatnagarPK18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, IEEE Wirel. Commun. Lett. 7(5), 2018.
% "Prabuchandran K. J." is kept in its exported token order.
@article{DBLP:journals/wcl/DiddigiJB18,
  author       = {Diddigi, Raghuram Bharadwaj and
                  Prabuchandran K. J. and
                  Bhatnagar, Shalabh},
  title        = {Novel Sensor Scheduling Scheme for Intruder Tracking in Energy Efficient
                  Sensor Networks},
  journal      = {{IEEE} Wirel. Commun. Lett.},
  volume       = {7},
  number       = {5},
  pages        = {712--715},
  year         = {2018},
  url          = {https://doi.org/10.1109/LWC.2018.2814576},
  doi          = {10.1109/LWC.2018.2814576},
  timestamp    = {Wed, 01 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/wcl/DiddigiJB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, CDC 2018. "Chandramouli K" and "Prabuchandran K. J."
% are kept in their exported token order.
@inproceedings{DBLP:conf/cdc/KJRB18,
  author       = {Chandramouli K and
                  Prabuchandran K. J. and
                  Danda, Sai Koti Reddy and
                  Bhatnagar, Shalabh},
  title        = {Generalized Deterministic Perturbations For Stochastic Gradient Search},
  booktitle    = {57th {IEEE} Conference on Decision and Control, {CDC} 2018, Miami,
                  FL, USA, December 17-19, 2018},
  pages        = {5734--5739},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/CDC.2018.8619736},
  doi          = {10.1109/CDC.2018.8619736},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cdc/KJRB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, SmartGridComm 2018.
@inproceedings{DBLP:conf/smartgridcomm/DiddigiRB18,
  author       = {Diddigi, Raghuram Bharadwaj and
                  Danda, Sai Koti Reddy and
                  Bhatnagar, Shalabh},
  title        = {A unified decision making framework for supply and demand management
                  in microgrid networks},
  booktitle    = {2018 {IEEE} International Conference on Communications, Control, and
                  Computing Technologies for Smart Grids, SmartGridComm 2018, Aalborg,
                  Denmark, October 29-31, 2018},
  pages        = {1--7},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/SmartGridComm.2018.8587514},
  doi          = {10.1109/SMARTGRIDCOMM.2018.8587514},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/smartgridcomm/DiddigiRB18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1801.10287, 2018). "Markov" is brace-protected so
% sentence-casing styles keep the proper noun capitalised.
@article{DBLP:journals/corr/abs-1801-10287,
  author       = {Joseph, Ajin George and
                  Bhatnagar, Shalabh},
  title        = {An Incremental Off-policy Search in a Model-free {Markov} Decision Process
                  Using a Single Sample Path},
  journal      = {CoRR},
  volume       = {abs/1801.10287},
  year         = {2018},
  url          = {http://arxiv.org/abs/1801.10287},
  eprinttype   = {arXiv},
  eprint       = {1801.10287},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1801-10287.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1801.10291, 2018).
@article{DBLP:journals/corr/abs-1801-10291,
  author       = {Joseph, Ajin George and
                  Bhatnagar, Shalabh},
  title        = {A Cross Entropy based Optimization Algorithm with Global Convergence
                  Guarantees},
  journal      = {CoRR},
  volume       = {abs/1801.10291},
  year         = {2018},
  url          = {http://arxiv.org/abs/1801.10291},
  eprinttype   = {arXiv},
  eprint       = {1801.10291},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1801-10291.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1806.06720, 2018).
@article{DBLP:journals/corr/abs-1806-06720,
  author       = {Joseph, Ajin George and
                  Bhatnagar, Shalabh},
  title        = {An Online Prediction Algorithm for Reinforcement Learning with Linear
                  Function Approximation using Cross Entropy Method},
  journal      = {CoRR},
  volume       = {abs/1806.06720},
  year         = {2018},
  url          = {http://arxiv.org/abs/1806.06720},
  eprinttype   = {arXiv},
  eprint       = {1806.06720},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1806-06720.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1808.02871, 2018). "Prashanth L. A." is kept in
% its exported token order.
@article{DBLP:journals/corr/abs-1808-02871,
  author       = {Prashanth L. A. and
                  Bhatnagar, Shalabh and
                  Bhavsar, Nirav and
                  Fu, Michael C. and
                  Marcus, Steven I.},
  title        = {Random directions stochastic approximation with deterministic perturbations},
  journal      = {CoRR},
  volume       = {abs/1808.02871},
  year         = {2018},
  url          = {http://arxiv.org/abs/1808.02871},
  eprinttype   = {arXiv},
  eprint       = {1808.02871},
  timestamp    = {Wed, 20 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1808-02871.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1810.03842, 2018).
@article{DBLP:journals/corr/abs-1810-03842,
  author       = {Singla, Abhik and
                  Bhattacharya, Shounak and
                  Dholakiya, Dhaivat and
                  Bhatnagar, Shalabh and
                  Ghosal, Ashitava and
                  Amrutur, Bharadwaj and
                  Kolathaya, Shishir},
  title        = {Realizing Learned Quadruped Locomotion Behaviors through Kinematic
                  Motion Primitives},
  journal      = {CoRR},
  volume       = {abs/1810.03842},
  year         = {2018},
  url          = {http://arxiv.org/abs/1810.03842},
  eprinttype   = {arXiv},
  eprint       = {1810.03842},
  timestamp    = {Tue, 30 Oct 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1810-03842.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1811.03307, 2018).
@article{DBLP:journals/corr/abs-1811-03307,
  author       = {Singla, Abhik and
                  Padakandla, Sindhu and
                  Bhatnagar, Shalabh},
  title        = {Memory-based Deep Reinforcement Learning for Obstacle Avoidance in
                  {UAV} with Limited Environment Knowledge},
  journal      = {CoRR},
  volume       = {abs/1811.03307},
  year         = {2018},
  url          = {http://arxiv.org/abs/1811.03307},
  eprinttype   = {arXiv},
  eprint       = {1811.03307},
  timestamp    = {Thu, 22 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-03307.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Automatica 79, 2017. The journal is a single-word title
% (see the DOI prefix j.automatica), so it is stored unabbreviated instead of
% the ambiguous "Autom.".
@article{DBLP:journals/automatica/Lakshminarayanan17,
  author       = {Lakshminarayanan, Chandrashekar and
                  Bhatnagar, Shalabh},
  title        = {A stability criterion for two timescale stochastic approximation schemes},
  journal      = {Automatica},
  volume       = {79},
  pages        = {108--114},
  year         = {2017},
  url          = {https://doi.org/10.1016/j.automatica.2016.12.014},
  doi          = {10.1016/J.AUTOMATICA.2016.12.014},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/automatica/Lakshminarayanan17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Comput. Optim. Appl. 66(3), 2017. "Newton" is
% brace-protected so sentence-casing styles keep the proper noun capitalised.
@article{DBLP:journals/coap/LakshmananB17,
  author       = {Lakshmanan, K. and
                  Bhatnagar, Shalabh},
  title        = {Quasi-{Newton} smoothed functional algorithms for unconstrained and
                  constrained simulation optimization},
  journal      = {Comput. Optim. Appl.},
  volume       = {66},
  number       = {3},
  pages        = {533--556},
  year         = {2017},
  url          = {https://doi.org/10.1007/s10589-016-9875-4},
  doi          = {10.1007/S10589-016-9875-4},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/coap/LakshmananB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Math. Oper. Res. 42(3), 2017. "Borkar-Meyn" is
% brace-protected so sentence-casing styles keep both surnames capitalised.
@article{DBLP:journals/mor/RamaswamyB17,
  author       = {Ramaswamy, Arunselvan and
                  Bhatnagar, Shalabh},
  title        = {A Generalization of the {Borkar-Meyn} Theorem for Stochastic Recursive
                  Inclusions},
  journal      = {Math. Oper. Res.},
  volume       = {42},
  number       = {3},
  pages        = {648--661},
  year         = {2017},
  url          = {https://doi.org/10.1287/moor.2016.0821},
  doi          = {10.1287/MOOR.2016.0821},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/mor/RamaswamyB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, IEEE Trans. Autom. Control 62(5), 2017. The stray period
% after the unabbreviated word "Control" in the journal name is removed.
% "Prashanth L. A." is kept in its exported token order.
@article{DBLP:journals/tac/ABFM17,
  author       = {Prashanth L. A. and
                  Bhatnagar, Shalabh and
                  Fu, Michael C. and
                  Marcus, Steven I.},
  title        = {Adaptive System Optimization Using Random Directions Stochastic Approximation},
  journal      = {{IEEE} Trans. Autom. Control},
  volume       = {62},
  number       = {5},
  pages        = {2223--2238},
  year         = {2017},
  url          = {https://doi.org/10.1109/TAC.2016.2600643},
  doi          = {10.1109/TAC.2016.2600643},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tac/ABFM17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Telecommun. Syst. 65(2), 2017. "Karmeshu" is a
% single-token name and is left unchanged.
@article{DBLP:journals/telsys/KarmeshuPB17,
  author       = {Karmeshu and
                  Patel, Sanjeev and
                  Bhatnagar, Shalabh},
  title        = {Adaptive mean queue size and its rate of change: queue management
                  with random dropping},
  journal      = {Telecommun. Syst.},
  volume       = {65},
  number       = {2},
  pages        = {281--295},
  year         = {2017},
  url          = {https://doi.org/10.1007/s11235-016-0229-4},
  doi          = {10.1007/S11235-016-0229-4},
  timestamp    = {Thu, 13 Aug 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/telsys/KarmeshuPB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, IEEE CLOUD 2017. "Hadoop" and "MapReduce" are
% brace-protected so sentence-casing styles keep their capitalisation.
@inproceedings{DBLP:conf/IEEEcloud/KumarPLPGB17,
  author       = {Kumar, Sandeep and
                  Padakandla, Sindhu and
                  Lakshminarayanan, Chandrashekar and
                  Parihar, Priyank and
                  Gopinath, K. and
                  Bhatnagar, Shalabh},
  editor       = {Fox, Geoffrey C.},
  title        = {Scalable Performance Tuning of {Hadoop} {MapReduce}: {A} Noisy Gradient
                  Approach},
  booktitle    = {2017 {IEEE} 10th International Conference on Cloud Computing (CLOUD),
                  Honolulu, HI, USA, June 25-30, 2017},
  pages        = {375--382},
  publisher    = {{IEEE} Computer Society},
  year         = {2017},
  url          = {https://doi.org/10.1109/CLOUD.2017.55},
  doi          = {10.1109/CLOUD.2017.55},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/IEEEcloud/KumarPLPGB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, IJCNN 2017. "Markov" is brace-protected so
% sentence-casing styles keep the proper noun capitalised.
@inproceedings{DBLP:conf/ijcnn/JosephB17,
  author       = {Joseph, Ajin George and
                  Bhatnagar, Shalabh},
  title        = {A model based search method for prediction in model-free {Markov} decision
                  process},
  booktitle    = {2017 International Joint Conference on Neural Networks, {IJCNN} 2017,
                  Anchorage, AK, USA, May 14-19, 2017},
  pages        = {170--177},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/IJCNN.2017.7965851},
  doi          = {10.1109/IJCNN.2017.7965851},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcnn/JosephB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, IJCNN 2017.
@inproceedings{DBLP:conf/ijcnn/JosephB17a,
  author       = {Joseph, Ajin George and
                  Bhatnagar, Shalabh},
  title        = {Bounds for off-policy prediction in reinforcement learning},
  booktitle    = {2017 International Joint Conference on Neural Networks, {IJCNN} 2017,
                  Anchorage, AK, USA, May 14-19, 2017},
  pages        = {3991--3997},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/IJCNN.2017.7966359},
  doi          = {10.1109/IJCNN.2017.7966359},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ijcnn/JosephB17a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Conference paper, PReMI 2017 (LNCS 10597). The DOI and its resolver URL are
% stored bare, without a backslash before the underscore, so that verbatim
% doi/url handling yields a working link.
% NOTE(review): assumes doi/url are consumed verbatim (biblatex or a
% url-aware style) - confirm against the toolchain in use.
@inproceedings{DBLP:conf/premi/JosephB17,
  author       = {Joseph, Ajin George and
                  Bhatnagar, Shalabh},
  editor       = {Shankar, B. Uma and
                  Ghosh, Kuntal and
                  Mandal, Deba Prasad and
                  Ray, Shubhra Sankar and
                  Zhang, David and
                  Pal, Sankar K.},
  title        = {An Incremental Fast Policy Search Using a Single Sample Path},
  booktitle    = {Pattern Recognition and Machine Intelligence - 7th International Conference,
                  PReMI 2017, Kolkata, India, December 5-8, 2017, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {10597},
  pages        = {3--10},
  publisher    = {Springer},
  year         = {2017},
  url          = {https://doi.org/10.1007/978-3-319-69900-4_1},
  doi          = {10.1007/978-3-319-69900-4_1},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/premi/JosephB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1701.07590, 2017).
@article{DBLP:journals/corr/YajiB17,
  author       = {Yaji, Vinayaka G. and
                  Bhatnagar, Shalabh},
  title        = {Analysis of stochastic approximation schemes with set-valued maps
                  in the absence of a stability guarantee and their stabilization},
  journal      = {CoRR},
  volume       = {abs/1701.07590},
  year         = {2017},
  url          = {http://arxiv.org/abs/1701.07590},
  eprinttype   = {arXiv},
  eprint       = {1701.07590},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/YajiB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1702.06250, 2017). "Chandramouli K" is kept in
% its exported token order.
@article{DBLP:journals/corr/KRB17,
  author       = {Chandramouli K and
                  Danda, Sai Koti Reddy and
                  Bhatnagar, Shalabh},
  title        = {Deterministic Perturbations For Simultaneous Perturbation Methods
                  Using Circulant Matrices},
  journal      = {CoRR},
  volume       = {abs/1702.06250},
  year         = {2017},
  url          = {http://arxiv.org/abs/1702.06250},
  eprinttype   = {arXiv},
  eprint       = {1702.06250},
  timestamp    = {Mon, 18 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/KRB17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1704.02544, 2017). "Markov" is brace-protected so
% sentence-casing styles keep the proper noun capitalised.
@article{DBLP:journals/corr/Lakshminarayanan17,
  author       = {Lakshminarayanan, Chandrashekar and
                  Bhatnagar, Shalabh and
                  Szepesv{\'{a}}ri, Csaba},
  title        = {A Linearly Relaxed Approximate Linear Program for {Markov} Decision
                  Processes},
  journal      = {CoRR},
  volume       = {abs/1704.02544},
  year         = {2017},
  url          = {http://arxiv.org/abs/1704.02544},
  eprinttype   = {arXiv},
  eprint       = {1704.02544},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/Lakshminarayanan17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1708.07732, 2017). The "Q" in the title is
% brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/corr/abs-1708-07732,
  author       = {Diddigi, Raghuram Bharadwaj and
                  Danda, Sai Koti Reddy and
                  Bhatnagar, Shalabh},
  title        = {Multi-Agent {Q}-Learning for Minimizing Demand-Supply Power Deficit
                  in Microgrids},
  journal      = {CoRR},
  volume       = {abs/1708.07732},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.07732},
  eprinttype   = {arXiv},
  eprint       = {1708.07732},
  timestamp    = {Mon, 18 Nov 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-07732.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1708.08113, 2017). "Prabuchandran K. J." is kept
% in its exported token order.
@article{DBLP:journals/corr/abs-1708-08113,
  author       = {Diddigi, Raghuram Bharadwaj and
                  Prabuchandran K. J. and
                  Bhatnagar, Shalabh},
  title        = {Novel Sensor Scheduling Scheme for Intruder Tracking in Energy Efficient
                  Sensor Networks},
  journal      = {CoRR},
  volume       = {abs/1708.08113},
  year         = {2017},
  url          = {http://arxiv.org/abs/1708.08113},
  eprinttype   = {arXiv},
  eprint       = {1708.08113},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1708-08113.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1709.04673, 2017).
@article{DBLP:journals/corr/abs-1709-04673,
  author       = {Ramaswamy, Arunselvan and
                  Bhatnagar, Shalabh},
  title        = {Conditions for Stability and Convergence of Set-Valued Stochastic
                  Approximations: Applications to Approximate Value and Fixed point
                  Iterations with Noise},
  journal      = {CoRR},
  volume       = {abs/1709.04673},
  year         = {2017},
  url          = {http://arxiv.org/abs/1709.04673},
  eprinttype   = {arXiv},
  eprint       = {1709.04673},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1709-04673.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1711.05078, 2017).
@article{DBLP:journals/corr/abs-1711-05078,
  author       = {Diddigi, Raghuram Bharadwaj and
                  Danda, Sai Koti Reddy and
                  Narayanam, Krishnasuri and
                  Bhatnagar, Shalabh},
  title        = {A unified decision making framework for supply and demand management
                  in microgrid networks},
  journal      = {CoRR},
  volume       = {abs/1711.05078},
  year         = {2017},
  url          = {http://arxiv.org/abs/1711.05078},
  eprinttype   = {arXiv},
  eprint       = {1711.05078},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-05078.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1712.04303, 2017).
@article{DBLP:journals/corr/abs-1712-04303,
  author       = {Anantpur, Jayvant and
                  Gulur, Nagendra Dwarakanath and
                  Kalyanakrishnan, Shivaram and
                  Bhatnagar, Shalabh and
                  Govindarajan, R.},
  title        = {{RLWS:} {A} Reinforcement Learning based {GPU} Warp Scheduler},
  journal      = {CoRR},
  volume       = {abs/1712.04303},
  year         = {2017},
  url          = {http://arxiv.org/abs/1712.04303},
  eprinttype   = {arXiv},
  eprint       = {1712.04303},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1712-04303.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Discret. Event Dyn. Syst. 26(3), 2016. The "Q" in the
% title is brace-protected so sentence-casing styles do not lowercase it.
@article{DBLP:journals/deds/BhatnagarL16,
  author       = {Bhatnagar, Shalabh and
                  Lakshmanan, K.},
  title        = {Multiscale {Q}-learning with linear function approximation},
  journal      = {Discret. Event Dyn. Syst.},
  volume       = {26},
  number       = {3},
  pages        = {477--509},
  year         = {2016},
  url          = {https://doi.org/10.1007/s10626-015-0216-z},
  doi          = {10.1007/S10626-015-0216-Z},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/deds/BhatnagarL16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article, Syst. Control Lett. 92, 2016. The stray period after the
% unabbreviated word "Control" in the journal name is removed.
% "Prashanth L. A." is kept in its exported token order.
@article{DBLP:journals/scl/APBC16,
  author       = {Prashanth L. A. and
                  Prasad, H. L. and
                  Bhatnagar, Shalabh and
                  Chandra, Prakash},
  title        = {A constrained optimization perspective on actor-critic algorithms
                  and application to network routing},
  journal      = {Syst. Control Lett.},
  volume       = {92},
  pages        = {46--51},
  year         = {2016},
  url          = {https://doi.org/10.1016/j.sysconle.2016.02.020},
  doi          = {10.1016/J.SYSCONLE.2016.02.020},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/scl/APBC16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/tomacs/JBB16,
  author    = {Prabuchandran K. J. and Shalabh Bhatnagar and Vivek S. Borkar},
  title     = {Actor-Critic Algorithms with Online Feature Adaptation},
  year      = {2016},
  journal   = {{ACM} Trans. Model. Comput. Simul.},
  volume    = {26},
  number    = {4},
  pages     = {24:1--24:26},
  doi       = {10.1145/2868723},
  url       = {https://doi.org/10.1145/2868723},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/tomacs/JBB16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

% Title: "Hessian" is braced so sentence-casing styles keep the capital.
@inproceedings{DBLP:conf/cdc/ReddyAB16,
  author       = {Sai Koti Reddy Danda and
                  Prashanth L. A. and
                  Shalabh Bhatnagar},
  title        = {Improved {Hessian} estimation for adaptive random directions stochastic
                  approximation},
  booktitle    = {55th {IEEE} Conference on Decision and Control, {CDC} 2016, Las Vegas,
                  NV, USA, December 12-14, 2016},
  pages        = {3682--3687},
  publisher    = {{IEEE}},
  year         = {2016},
  url          = {https://doi.org/10.1109/CDC.2016.7798823},
  doi          = {10.1109/CDC.2016.7798823},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cdc/ReddyAB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ecai/JosephB16,
  author    = {Ajin George Joseph and Shalabh Bhatnagar},
  editor    = {Gal A. Kaminka and Maria Fox and Paolo Bouquet and
               Eyke H{\"{u}}llermeier and Virginia Dignum and
               Frank Dignum and Frank van Harmelen},
  title     = {Revisiting the Cross Entropy Method with Applications in
               Stochastic Global Optimization and Reinforcement Learning},
  year      = {2016},
  booktitle = {{ECAI} 2016 - 22nd European Conference on Artificial
               Intelligence, 29 August-2 September 2016, The Hague, The
               Netherlands - Including Prestigious Applications of
               Artificial Intelligence {(PAIS} 2016)},
  series    = {Frontiers in Artificial Intelligence and Applications},
  volume    = {285},
  pages     = {1026--1034},
  publisher = {{IOS} Press},
  doi       = {10.3233/978-1-61499-672-9-1026},
  url       = {https://doi.org/10.3233/978-1-61499-672-9-1026},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ecai/JosephB16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/ecai/MaityLPB16,
  author    = {Raj Kumar Maity and Chandrashekar Lakshminarayanan and
               Sindhu Padakandla and Shalabh Bhatnagar},
  editor    = {Gal A. Kaminka and Maria Fox and Paolo Bouquet and
               Eyke H{\"{u}}llermeier and Virginia Dignum and
               Frank Dignum and Frank van Harmelen},
  title     = {Shaping Proto-Value Functions Using Rewards},
  year      = {2016},
  booktitle = {{ECAI} 2016 - 22nd European Conference on Artificial
               Intelligence, 29 August-2 September 2016, The Hague, The
               Netherlands - Including Prestigious Applications of
               Artificial Intelligence {(PAIS} 2016)},
  series    = {Frontiers in Artificial Intelligence and Applications},
  volume    = {285},
  pages     = {1690--1691},
  publisher = {{IOS} Press},
  doi       = {10.3233/978-1-61499-672-9-1690},
  url       = {https://doi.org/10.3233/978-1-61499-672-9-1690},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ecai/MaityLPB16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/ijcnn/NB16,
  author    = {Ranganath B. N. and Shalabh Bhatnagar},
  title     = {Scalable focussed entity resolution},
  year      = {2016},
  booktitle = {2016 International Joint Conference on Neural Networks,
               {IJCNN} 2016, Vancouver, BC, Canada, July 24-29, 2016},
  pages     = {3570--3577},
  publisher = {{IEEE}},
  doi       = {10.1109/IJCNN.2016.7727658},
  url       = {https://doi.org/10.1109/IJCNN.2016.7727658},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/ijcnn/NB16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/wsc/JosephB16,
  author    = {Ajin George Joseph and Shalabh Bhatnagar},
  title     = {A randomized algorithm for continuous optimization},
  year      = {2016},
  booktitle = {Winter Simulation Conference, {WSC} 2016, Washington, DC,
               USA, December 11-14, 2016},
  pages     = {907--918},
  publisher = {{IEEE}},
  doi       = {10.1109/WSC.2016.7822152},
  url       = {https://doi.org/10.1109/WSC.2016.7822152},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/wsc/JosephB16.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/KarmeshuPB16,
  author     = {Karmeshu and Sanjeev Patel and Shalabh Bhatnagar},
  title      = {Adaptive Mean Queue Size and Its Rate of Change: Queue
                Management with Random Dropping},
  year       = {2016},
  journal    = {CoRR},
  volume     = {abs/1602.02241},
  eprinttype = {arXiv},
  eprint     = {1602.02241},
  url        = {http://arxiv.org/abs/1602.02241},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/KarmeshuPB16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/RamaswamyB16,
  author     = {Arunselvan Ramaswamy and Shalabh Bhatnagar},
  title      = {Gradient-based learning algorithms with constant-error
                estimators: stability and convergence},
  year       = {2016},
  journal    = {CoRR},
  volume     = {abs/1604.00151},
  eprinttype = {arXiv},
  eprint     = {1604.00151},
  url        = {http://arxiv.org/abs/1604.00151},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/RamaswamyB16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% Title: removed the stray space in "off -policy".
@article{DBLP:journals/corr/KarmakarMB16,
  author       = {Prasenjit Karmakar and
                  Raj Kumar Maity and
                  Shalabh Bhatnagar},
  title        = {On a convergent off-policy temporal difference learning algorithm
                  in on-line learning environment},
  journal      = {CoRR},
  volume       = {abs/1605.06076},
  year         = {2016},
  url          = {http://arxiv.org/abs/1605.06076},
  eprinttype   = {arXiv},
  eprint       = {1605.06076},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/KarmakarMB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: "Markov" is braced so sentence-casing styles keep the capital.
@article{DBLP:journals/corr/YajiB16,
  author       = {Vinayaka Yaji and
                  Shalabh Bhatnagar},
  title        = {Stochastic Recursive Inclusions with Non-Additive Iterate-Dependent
                  {Markov} Noise},
  journal      = {CoRR},
  volume       = {abs/1607.04735},
  year         = {2016},
  url          = {http://arxiv.org/abs/1607.04735},
  eprinttype   = {arXiv},
  eprint       = {1607.04735},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/YajiB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/JosephB16,
  author     = {Ajin George Joseph and Shalabh Bhatnagar},
  title      = {A Cross Entropy based Stochastic Approximation Algorithm for
                Reinforcement Learning with Linear Function Approximation},
  year       = {2016},
  journal    = {CoRR},
  volume     = {abs/1609.09449},
  eprinttype = {arXiv},
  eprint     = {1609.09449},
  url        = {http://arxiv.org/abs/1609.09449},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/JosephB16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% Title: "Markov" is braced so sentence-casing styles keep the capital.
@article{DBLP:journals/corr/YajiB16a,
  author       = {Vinayaka Yaji and
                  Shalabh Bhatnagar},
  title        = {Stochastic Recursive Inclusions in two timescales with non-additive
                  iterate dependent {Markov} noise},
  journal      = {CoRR},
  volume       = {abs/1611.05961},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.05961},
  eprinttype   = {arXiv},
  eprint       = {1611.05961},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/YajiB16a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: product names "Hadoop" and "MapReduce" are braced so sentence-casing
% styles keep their capitalisation.
@article{DBLP:journals/corr/KumarPLPGB16,
  author       = {Sandeep Kumar and
                  Sindhu Padakandla and
                  Chandrashekar Lakshminarayanan and
                  Priyank Parihar and
                  K. Gopinath and
                  Shalabh Bhatnagar},
  title        = {Performance Tuning of {Hadoop} {MapReduce}: {A} Noisy Gradient Approach},
  journal      = {CoRR},
  volume       = {abs/1611.10052},
  year         = {2016},
  url          = {http://arxiv.org/abs/1611.10052},
  eprinttype   = {arXiv},
  eprint       = {1611.10052},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/KumarPLPGB16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/KarmakarB16,
  author     = {Prasenjit Karmakar and Shalabh Bhatnagar},
  title      = {A note on the function approximation error bound for
                risk-sensitive reinforcement learning},
  year       = {2016},
  journal    = {CoRR},
  volume     = {abs/1612.07562},
  eprinttype = {arXiv},
  eprint     = {1612.07562},
  url        = {http://arxiv.org/abs/1612.07562},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/KarmakarB16.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% Title: "Newton" is braced so sentence-casing styles keep the capital.
@article{DBLP:journals/jota/BhatnagarA15,
  author       = {Shalabh Bhatnagar and
                  Prashanth L. A.},
  title        = {Simultaneous Perturbation {Newton} Algorithms for Simulation Optimization},
  journal      = {J. Optim. Theory Appl.},
  volume       = {164},
  number       = {2},
  pages        = {621--643},
  year         = {2015},
  url          = {https://doi.org/10.1007/s10957-013-0507-1},
  doi          = {10.1007/S10957-013-0507-1},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jota/BhatnagarA15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/scl/YajiB15,
  author    = {Vinayaka Yaji and Shalabh Bhatnagar},
  title     = {Necessary and sufficient conditions for optimality in
               constrained general sum stochastic games},
  year      = {2015},
  journal   = {Syst. Control. Lett.},
  volume    = {85},
  pages     = {8--15},
  doi       = {10.1016/J.SYSCONLE.2015.08.003},
  url       = {https://doi.org/10.1016/j.sysconle.2015.08.003},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/scl/YajiB15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/simulation/APDBD15,
  author    = {Prashanth L. A. and H. L. Prasad and Nirmit Desai and
               Shalabh Bhatnagar and Gargi Dasgupta},
  title     = {Simultaneous perturbation methods for adaptive labor staffing
               in service systems},
  year      = {2015},
  journal   = {Simul.},
  volume    = {91},
  number    = {5},
  pages     = {432--455},
  doi       = {10.1177/0037549715581198},
  url       = {https://doi.org/10.1177/0037549715581198},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/simulation/APDBD15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/tcom/PadakandlaJB15,
  author    = {Sindhu Padakandla and Prabuchandran K. J. and
               Shalabh Bhatnagar},
  title     = {Energy Sharing for Multiple Sensor Nodes With Finite Buffers},
  year      = {2015},
  journal   = {{IEEE} Trans. Commun.},
  volume    = {63},
  number    = {5},
  pages     = {1811--1823},
  doi       = {10.1109/TCOMM.2015.2415777},
  url       = {https://doi.org/10.1109/TCOMM.2015.2415777},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/tcom/PadakandlaJB15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

% Title: "Markov" is braced so sentence-casing styles keep the capital.
@inproceedings{DBLP:conf/aaai/Lakshminarayanan15,
  author       = {Chandrashekar Lakshminarayanan and
                  Shalabh Bhatnagar},
  editor       = {Blai Bonet and
                  Sven Koenig},
  title        = {A Generalized Reduced Linear Program for {Markov} Decision Processes},
  booktitle    = {Proceedings of the Twenty-Ninth {AAAI} Conference on Artificial Intelligence,
                  January 25-30, 2015, Austin, Texas, {USA}},
  pages        = {2722--2728},
  publisher    = {{AAAI} Press},
  year         = {2015},
  url          = {https://doi.org/10.1609/aaai.v29i1.9620},
  doi          = {10.1609/AAAI.V29I1.9620},
  timestamp    = {Mon, 18 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/Lakshminarayanan15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: "Nash" is braced so sentence-casing styles keep the capital.
@inproceedings{DBLP:conf/atal/PrasadAB15,
  author       = {H. L. Prasad and
                  Prashanth L. A. and
                  Shalabh Bhatnagar},
  editor       = {Gerhard Weiss and
                  Pinar Yolum and
                  Rafael H. Bordini and
                  Edith Elkind},
  title        = {Two-Timescale Algorithms for Learning {Nash} Equilibria in General-Sum
                  Stochastic Games},
  booktitle    = {Proceedings of the 2015 International Conference on Autonomous Agents
                  and Multiagent Systems, {AAMAS} 2015, Istanbul, Turkey, May 4-8, 2015},
  pages        = {1371--1379},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {http://dl.acm.org/citation.cfm?id=2773328},
  timestamp    = {Tue, 08 Mar 2022 10:12:47 +0100},
  biburl       = {https://dblp.org/rec/conf/atal/PrasadAB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/comsnets/JNB15,
  author    = {Prabuchandran K. J. and Hemanth Kumar A. N and
               Shalabh Bhatnagar},
  title     = {Decentralized learning for traffic signal control},
  year      = {2015},
  booktitle = {7th International Conference on Communication Systems and
               Networks, {COMSNETS} 2015, Bangalore, India, January 6-10,
               2015},
  pages     = {1--6},
  publisher = {{IEEE}},
  doi       = {10.1109/COMSNETS.2015.7098712},
  url       = {https://doi.org/10.1109/COMSNETS.2015.7098712},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/comsnets/JNB15.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

% doi/url: stored raw, without the LaTeX underscore escape. Verbatim-aware
% styles (biblatex, url/hyperref) would otherwise emit the backslash literally
% and produce a broken DOI link.
@inproceedings{DBLP:conf/iconip/JosephB15,
  author       = {Ajin George Joseph and
                  Shalabh Bhatnagar},
  editor       = {Sabri Arik and
                  Tingwen Huang and
                  Weng Kin Lai and
                  Qingshan Liu},
  title        = {A Stochastic Approximation Algorithm for Quantile Estimation},
  booktitle    = {Neural Information Processing - 22nd International Conference, {ICONIP}
                  2015, Istanbul, Turkey, November 9-12, 2015, Proceedings, Part {II}},
  series       = {Lecture Notes in Computer Science},
  volume       = {9490},
  pages        = {311--319},
  publisher    = {Springer},
  year         = {2015},
  url          = {https://doi.org/10.1007/978-3-319-26535-3_36},
  doi          = {10.1007/978-3-319-26535-3_36},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iconip/JosephB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: the eponym "Borkar-Meyn" is braced so sentence-casing styles keep
% both capitals.
@article{DBLP:journals/corr/RamaswamyB15,
  author       = {Arunselvan Ramaswamy and
                  Shalabh Bhatnagar},
  title        = {A Generalization of the {Borkar-Meyn} Theorem for Stochastic Recursive
                  Inclusions},
  journal      = {CoRR},
  volume       = {abs/1502.01953},
  year         = {2015},
  url          = {http://arxiv.org/abs/1502.01953},
  eprinttype   = {arXiv},
  eprint       = {1502.01953},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/RamaswamyB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/RamaswamyB15a,
  author     = {Arunselvan Ramaswamy and Shalabh Bhatnagar},
  title      = {Stochastic recursive inclusions with two timescales},
  year       = {2015},
  journal    = {CoRR},
  volume     = {abs/1502.01956},
  eprinttype = {arXiv},
  eprint     = {1502.01956},
  url        = {http://arxiv.org/abs/1502.01956},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/RamaswamyB15a.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/AB15,
  author     = {Prashanth L. A. and Shalabh Bhatnagar},
  title      = {Adaptive system optimization using (simultaneous) random
                directions stochastic approximation},
  year       = {2015},
  journal    = {CoRR},
  volume     = {abs/1502.05577},
  eprinttype = {arXiv},
  eprint     = {1502.05577},
  url        = {http://arxiv.org/abs/1502.05577},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/AB15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/PadakandlaJB15,
  author     = {Sindhu Padakandla and Prabuchandran K. J. and
                Shalabh Bhatnagar},
  title      = {Energy Sharing for Multiple Sensor Nodes with Finite Buffers},
  year       = {2015},
  journal    = {CoRR},
  volume     = {abs/1503.04964},
  eprinttype = {arXiv},
  eprint     = {1503.04964},
  url        = {http://arxiv.org/abs/1503.04964},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/PadakandlaJB15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% Title: "Markov" is braced so sentence-casing styles keep the capital.
@article{DBLP:journals/corr/KarmakarB15,
  author       = {Prasenjit Karmakar and
                  Shalabh Bhatnagar},
  title        = {Two Timescale Stochastic Approximation with Controlled {Markov} noise},
  journal      = {CoRR},
  volume       = {abs/1503.09105},
  year         = {2015},
  url          = {http://arxiv.org/abs/1503.09105},
  eprinttype   = {arXiv},
  eprint       = {1503.09105},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/KarmakarB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: the opening quote is now a LaTeX backtick (a straight apostrophe
% typesets as a closing quote on both sides), and "Markov" is braced so
% sentence-casing styles keep the capital.
@article{DBLP:journals/corr/RamaswamyB15b,
  author       = {Arunselvan Ramaswamy and
                  Shalabh Bhatnagar},
  title        = {Stability of Stochastic Approximations with `Controlled {Markov}' Noise
                  and Temporal Difference Learning},
  journal      = {CoRR},
  volume       = {abs/1504.06043},
  year         = {2015},
  url          = {http://arxiv.org/abs/1504.06043},
  eprinttype   = {arXiv},
  eprint       = {1504.06043},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/RamaswamyB15b.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: "Nash" is braced so sentence-casing styles keep the capital.
@article{DBLP:journals/corr/YajiB15,
  author       = {Vinayaka Yaji and
                  Shalabh Bhatnagar},
  title        = {A bi-convex optimization problem to compute {Nash} equilibrium in n-player
                  games and an algorithm},
  journal      = {CoRR},
  volume       = {abs/1504.06828},
  year         = {2015},
  url          = {http://arxiv.org/abs/1504.06828},
  eprinttype   = {arXiv},
  eprint       = {1504.06828},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/YajiB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/PrasadB15,
  author     = {H. L. Prasad and Shalabh Bhatnagar},
  title      = {A Study of Gradient Descent Schemes for General-Sum
                Stochastic Games},
  year       = {2015},
  journal    = {CoRR},
  volume     = {abs/1507.00093},
  eprinttype = {arXiv},
  eprint     = {1507.00093},
  url        = {http://arxiv.org/abs/1507.00093},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/PrasadB15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

@article{DBLP:journals/corr/APBC15,
  author     = {Prashanth L. A. and H. L. Prasad and Shalabh Bhatnagar and
                Prakash Chandra},
  title      = {A constrained optimization perspective on actor critic
                algorithms and application to network routing},
  year       = {2015},
  journal    = {CoRR},
  volume     = {abs/1507.07984},
  eprinttype = {arXiv},
  eprint     = {1507.07984},
  url        = {http://arxiv.org/abs/1507.07984},
  timestamp  = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/APBC15.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org},
}

% Author: first author normalised to "Chandrashekar Lakshminarayanan", the
% spelling used in the other records of this file, so styles do not list one
% person under two surnames. NOTE(review): the record previously read
% "Chandrashekar Lakshmi Narayanan"; confirm against the preprint if the
% as-published spelling must be kept. The citation key is unchanged.
@article{DBLP:journals/corr/NarayananMB15,
  author       = {Chandrashekar Lakshminarayanan and
                  Raj Kumar Maity and
                  Shalabh Bhatnagar},
  title        = {Shaping Proto-Value Functions via Rewards},
  journal      = {CoRR},
  volume       = {abs/1511.08589},
  year         = {2015},
  url          = {http://arxiv.org/abs/1511.08589},
  eprinttype   = {arXiv},
  eprint       = {1511.08589},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/NarayananMB15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: "Newton" and "Gaussian" are braced so sentence-casing styles keep the
% capitals.
@article{DBLP:journals/automatica/GhoshdastidarDB14,
  author       = {Debarghya Ghoshdastidar and
                  Ambedkar Dukkipati and
                  Shalabh Bhatnagar},
  title        = {{Newton}-based stochastic optimization using q-{Gaussian} smoothed functional
                  algorithms},
  journal      = {Autom.},
  volume       = {50},
  number       = {10},
  pages        = {2606--2614},
  year         = {2014},
  url          = {https://doi.org/10.1016/j.automatica.2014.08.021},
  doi          = {10.1016/J.AUTOMATICA.2014.08.021},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/automatica/GhoshdastidarDB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/itor/ChakravartyPB14,
  author    = {Saswata Chakravarty and Sindhu Padakandla and
               Shalabh Bhatnagar},
  title     = {A simulation-based algorithm for optimal pricing policy under
               demand uncertainty},
  year      = {2014},
  journal   = {Int. Trans. Oper. Res.},
  volume    = {21},
  number    = {5},
  pages     = {737--760},
  doi       = {10.1111/ITOR.12064},
  url       = {https://doi.org/10.1111/itor.12064},
  timestamp = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/itor/ChakravartyPB14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

% Title: "Gaussian" is braced so sentence-casing styles keep the capital.
@article{DBLP:journals/tomacs/GhoshdastidarDB14,
  author       = {Debarghya Ghoshdastidar and
                  Ambedkar Dukkipati and
                  Shalabh Bhatnagar},
  title        = {Smoothed Functional Algorithms for Stochastic Optimization Using \emph{q}-{Gaussian}
                  Distributions},
  journal      = {{ACM} Trans. Model. Comput. Simul.},
  volume       = {24},
  number       = {3},
  pages        = {17:1--17:26},
  year         = {2014},
  url          = {https://doi.org/10.1145/2628434},
  doi          = {10.1145/2628434},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tomacs/GhoshdastidarDB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: "Q" is braced so sentence-casing styles do not print "q-learning".
@article{DBLP:journals/winet/ACB14,
  author       = {Prashanth L. A. and
                  Abhranil Chatterjee and
                  Shalabh Bhatnagar},
  title        = {Two timescale convergent {Q}-learning for sleep-scheduling in wireless
                  sensor networks},
  journal      = {Wirel. Networks},
  volume       = {20},
  number       = {8},
  pages        = {2589--2604},
  year         = {2014},
  url          = {https://doi.org/10.1007/s11276-014-0762-6},
  doi          = {10.1007/S11276-014-0762-6},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/winet/ACB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: "Markov" is braced so sentence-casing styles keep the capital.
@inproceedings{DBLP:conf/cdc/LakshminarayananB14,
  author       = {Chandrashekar Lakshminarayanan and
                  Shalabh Bhatnagar},
  title        = {Approximate Dynamic Programming with (min; +) linear function approximation
                  for {Markov} decision processes},
  booktitle    = {53rd {IEEE} Conference on Decision and Control, {CDC} 2014, Los Angeles,
                  CA, USA, December 15-17, 2014},
  pages        = {1588--1593},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/CDC.2014.7039626},
  doi          = {10.1109/CDC.2014.7039626},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cdc/LakshminarayananB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Title: "Grassmanian" is braced so sentence-casing styles keep the capital.
% The spelling is kept exactly as it appears in the record.
@inproceedings{DBLP:conf/cdc/JBB14,
  author       = {Prabuchandran K. J. and
                  Shalabh Bhatnagar and
                  Vivek S. Borkar},
  title        = {An actor critic algorithm based on {Grassmanian} search},
  booktitle    = {53rd {IEEE} Conference on Decision and Control, {CDC} 2014, Los Angeles,
                  CA, USA, December 15-17, 2014},
  pages        = {3597--3602},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/CDC.2014.7039948},
  doi          = {10.1109/CDC.2014.7039948},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cdc/JBB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/comsnets/ACB14,
  author    = {Prashanth L. A. and Abhranil Chatterjee and
               Shalabh Bhatnagar},
  title     = {Adaptive sleep-wake control using reinforcement learning in
               sensor networks},
  year      = {2014},
  booktitle = {Sixth International Conference on Communication Systems and
               Networks, {COMSNETS} 2014, Bangalore, India, January 6-10,
               2014},
  pages     = {1--8},
  publisher = {{IEEE}},
  doi       = {10.1109/COMSNETS.2014.6734874},
  url       = {https://doi.org/10.1109/COMSNETS.2014.6734874},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/comsnets/ACB14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

% booktitle: corrected the typo "Seconf" to "Second".
% Title: "Markov" is braced so sentence-casing styles keep the capital.
@inproceedings{DBLP:conf/hcomp/LakshminarayananDBB14,
  author       = {Chandrashekar Lakshminarayanan and
                  Ayush Dubey and
                  Shalabh Bhatnagar and
                  Chithralekha Balamurugan},
  editor       = {Jeffrey P. Bigham and
                  David C. Parkes},
  title        = {A {Markov} Decision Process Framework for Predictable Job Completion
                  Times on Crowdsourcing Platforms},
  booktitle    = {Proceedings of the Second {AAAI} Conference on Human Computation and
                  Crowdsourcing, {HCOMP} 2014, November 2-4, 2014, Pittsburgh, Pennsylvania,
                  {USA}},
  pages        = {34--35},
  publisher    = {{AAAI}},
  year         = {2014},
  url          = {https://doi.org/10.1609/hcomp.v2i1.13183},
  doi          = {10.1609/HCOMP.V2I1.13183},
  timestamp    = {Tue, 05 Sep 2023 11:10:11 +0200},
  biburl       = {https://dblp.org/rec/conf/hcomp/LakshminarayananDBB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/itsc/JNB14,
  author    = {Prabuchandran K. J. and Hemanth Kumar A. N and
               Shalabh Bhatnagar},
  title     = {Multi-agent reinforcement learning for traffic signal control},
  year      = {2014},
  booktitle = {17th International {IEEE} Conference on Intelligent
               Transportation Systems, {ITSC} 2014, Qingdao, China,
               October 8-11, 2014},
  pages     = {2529--2534},
  publisher = {{IEEE}},
  doi       = {10.1109/ITSC.2014.6958095},
  url       = {https://doi.org/10.1109/ITSC.2014.6958095},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/itsc/JNB14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

@inproceedings{DBLP:conf/nips/YaoSSMB14,
  author    = {Hengshuai Yao and Csaba Szepesv{\'{a}}ri and
               Richard S. Sutton and Joseph Modayil and Shalabh Bhatnagar},
  editor    = {Zoubin Ghahramani and Max Welling and Corinna Cortes and
               Neil D. Lawrence and Kilian Q. Weinberger},
  title     = {Universal Option Models},
  year      = {2014},
  booktitle = {Advances in Neural Information Processing Systems 27: Annual
               Conference on Neural Information Processing Systems 2014,
               December 8-13 2014, Montreal, Quebec, Canada},
  pages     = {990--998},
  url       = {https://proceedings.neurips.cc/paper/2014/hash/996a7fa078cc36c46d02f9af3bef918b-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl    = {https://dblp.org/rec/conf/nips/YaoSSMB14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

% Winter Simulation Conference 2014 paper: gradient-based stochastic search for simulation optimization.
@inproceedings{DBLP:conf/wsc/ZhouBC14,
  author = {Enlu Zhou and Shalabh Bhatnagar and Xi Chen},
  editor = {Stephen J. Buckley and John A. Miller},
  title = {Simulation optimization via gradient-based stochastic search},
  booktitle = {Proceedings of the 2014 Winter Simulation Conference, Savannah, GA, USA, December 7-10, 2014},
  pages = {3869--3879},
  publisher = {{IEEE/ACM}},
  year = {2014},
  url = {https://doi.org/10.1109/WSC.2014.7020213},
  doi = {10.1109/WSC.2014.7020213},
  timestamp = {Thu, 11 Apr 2024 20:25:47 +0200},
  biburl = {https://dblp.org/rec/conf/wsc/ZhouBC14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1401.2086): algorithms for Nash equilibria in general-sum stochastic games.
% {Nash} is braced so the proper noun keeps its capital under sentence-casing styles.
@article{DBLP:journals/corr/PrasadAB14,
  author       = {H. L. Prasad and
                  Prashanth L. A. and
                  Shalabh Bhatnagar},
  title        = {Algorithms for {Nash} Equilibria in General-Sum Stochastic Games},
  journal      = {CoRR},
  volume       = {abs/1401.2086},
  year         = {2014},
  url          = {http://arxiv.org/abs/1401.2086},
  eprinttype   = {arXiv},
  eprint       = {1401.2086},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/PrasadAB14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1403.4175): approximate dynamic programming via projection onto the (min, +) subsemimodule.
@article{DBLP:journals/corr/LakshminarayananB14,
  author = {Chandrashekar Lakshminarayanan and Shalabh Bhatnagar},
  title = {Approximate Dynamic Programming based on Projection onto the (min, +) subsemimodule},
  journal = {CoRR},
  volume = {abs/1403.4175},
  year = {2014},
  url = {http://arxiv.org/abs/1403.4175},
  eprinttype = {arXiv},
  eprint = {1403.4175},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/LakshminarayananB14.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1403.4179): approximate dynamic programming with (min,+) linear function approximation.
% The operator pair is written as braced inline math so it typesets as math rather than as
% literal dollar and backslash characters; {Markov} is braced to survive sentence-casing styles.
@article{DBLP:journals/corr/LakshminarayananB14a,
  author       = {Chandrashekar Lakshminarayanan and
                  Shalabh Bhatnagar},
  title        = {Approximate dynamic programming with {$(\min,+)$} linear function
                  approximation for {Markov} decision processes},
  journal      = {CoRR},
  volume       = {abs/1403.4179},
  year         = {2014},
  url          = {http://arxiv.org/abs/1403.4179},
  eprinttype   = {arXiv},
  eprint       = {1403.4179},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LakshminarayananB14a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1409.3536): a generalized reduced linear program for Markov decision processes.
% {Markov} is braced so the proper noun keeps its capital under sentence-casing styles.
@article{DBLP:journals/corr/LakshminarayananB14b,
  author       = {Chandrashekar Lakshminarayanan and
                  Shalabh Bhatnagar},
  title        = {A Generalized Reduced Linear Program for {Markov} Decision Processes},
  journal      = {CoRR},
  volume       = {abs/1409.3536},
  year         = {2014},
  url          = {http://arxiv.org/abs/1409.3536},
  eprinttype   = {arXiv},
  eprint       = {1409.3536},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/LakshminarayananB14b.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (IEEE J. Sel. Top. Signal Process. 7(5), 2013): feature search for online reinforcement learning.
% {Grassmanian} is braced (spelling kept as recorded) so it is not lowercased by sentence-casing styles.
@article{DBLP:journals/jstsp/BhatnagarBJ13,
  author       = {Shalabh Bhatnagar and
                  Vivek S. Borkar and
                  Prabuchandran K. J.},
  title        = {Feature Search in the {Grassmanian} in Online Reinforcement Learning},
  journal      = {{IEEE} J. Sel. Top. Signal Process.},
  volume       = {7},
  number       = {5},
  pages        = {746--758},
  year         = {2013},
  url          = {https://doi.org/10.1109/JSTSP.2013.2255022},
  doi          = {10.1109/JSTSP.2013.2255022},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jstsp/BhatnagarBJ13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (IEEE Wirel. Commun. Lett. 2(1), 2013): Q-learning based energy management for a single sensor node.
@article{DBLP:journals/wcl/JMB13,
  author = {Prabuchandran K. J. and Sunil Kumar Meena and Shalabh Bhatnagar},
  title = {Q-Learning Based Energy Management Policies for a Single Sensor Node with Finite Buffer},
  journal = {{IEEE} Wirel. Commun. Lett.},
  volume = {2},
  number = {1},
  pages = {82--85},
  year = {2013},
  url = {https://doi.org/10.1109/WCL.2012.112012.120754},
  doi = {10.1109/WCL.2012.112012.120754},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/wcl/JMB13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% AAMAS 2013 conference paper: mechanisms for hostile agents with capacity constraints. No DOI is recorded; the url is an ACM DL citation link.
@inproceedings{DBLP:conf/atal/AnanthapadmanabharaoPDB13,
  author = {Prashanth Lakshmanrao Ananthapadmanabharao and Horabailu Laxminarayana Prasad and Nirmit Desai and Shalabh Bhatnagar},
  editor = {Maria L. Gini and Onn Shehory and Takayuki Ito and Catholijn M. Jonker},
  title = {Mechanisms for hostile agents with capacity constraints},
  booktitle = {International conference on Autonomous Agents and Multi-Agent Systems, {AAMAS} '13, Saint Paul, MN, USA, May 6-10, 2013},
  pages = {659--666},
  publisher = {{IFAAMAS}},
  year = {2013},
  url = {http://dl.acm.org/citation.cfm?id=2485024},
  timestamp = {Thu, 09 Sep 2021 16:09:54 +0200},
  biburl = {https://dblp.org/rec/conf/atal/AnanthapadmanabharaoPDB13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1311.2296): Newton-based q-Gaussian smoothed functional algorithms.
% {Newton} and {q-Gaussian} are braced so their casing survives sentence-casing styles.
@article{DBLP:journals/corr/GhoshdastidarDB13,
  author       = {Debarghya Ghoshdastidar and
                  Ambedkar Dukkipati and
                  Shalabh Bhatnagar},
  title        = {{Newton} based Stochastic Optimization using {q-Gaussian} Smoothed Functional
                  Algorithms},
  journal      = {CoRR},
  volume       = {abs/1311.2296},
  year         = {2013},
  url          = {http://arxiv.org/abs/1311.2296},
  eprinttype   = {arXiv},
  eprint       = {1311.2296},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/GhoshdastidarDB13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1312.7292): reinforcement learning for sleep-wake scheduling in sensor networks.
@article{DBLP:journals/corr/AnanthapadmanabharaoCB13,
  author = {Prashanth Lakshmanrao Ananthapadmanabharao and Abhranil Chatterjee and Shalabh Bhatnagar},
  title = {Reinforcement Learning for Sleep-Wake Scheduling in Sensor Networks},
  journal = {CoRR},
  volume = {abs/1312.7292},
  year = {2013},
  url = {http://arxiv.org/abs/1312.7292},
  eprinttype = {arXiv},
  eprint = {1312.7292},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/AnanthapadmanabharaoCB13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1312.7430): simultaneous perturbation methods for adaptive labor staffing in service systems.
@article{DBLP:journals/corr/PrashanthPDBD13,
  author = {Prashanth L. A. and H. L. Prasad and Nirmit Desai and Shalabh Bhatnagar and Gargi Dasgupta},
  title = {Simultaneous Perturbation Methods for Adaptive Labor Staffing in Service Systems},
  journal = {CoRR},
  volume = {abs/1312.7430},
  year = {2013},
  url = {http://arxiv.org/abs/1312.7430},
  eprinttype = {arXiv},
  eprint = {1312.7430},
  timestamp = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/corr/PrashanthPDBD13.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (Autom. 48(11), 2012): verifiability conditions for Nash equilibria in general-sum stochastic games.
% {Nash} is braced so the proper noun keeps its capital under sentence-casing styles.
@article{DBLP:journals/automatica/PrasadB12,
  author       = {H. L. Prasad and
                  Shalabh Bhatnagar},
  title        = {General-sum stochastic games: Verifiability conditions for {Nash} equilibria},
  journal      = {Autom.},
  volume       = {48},
  number       = {11},
  pages        = {2923--2930},
  year         = {2012},
  url          = {https://doi.org/10.1016/j.automatica.2012.06.088},
  doi          = {10.1016/J.AUTOMATICA.2012.06.088},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/automatica/PrasadB12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (Comput. Networks 56(4), 2012): multi-layered congestion-based pricing schemes.
% {QoS} is braced so the acronym's mixed case survives sentence-casing styles.
@article{DBLP:journals/cn/VemuBH12,
  author       = {Koteswara Rao Vemu and
                  Shalabh Bhatnagar and
                  N. Hemachandra},
  title        = {Optimal multi-layered congestion based pricing schemes for enhanced
                  {QoS}},
  journal      = {Comput. Networks},
  volume       = {56},
  number       = {4},
  pages        = {1249--1262},
  year         = {2012},
  url          = {https://doi.org/10.1016/j.comnet.2011.12.004},
  doi          = {10.1016/J.COMNET.2011.12.004},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/cn/VemuBH12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (J. Optim. Theory Appl. 153(3), 2012): online actor-critic algorithm for constrained MDPs.
% {Markov} is braced so the proper noun keeps its capital under sentence-casing styles.
@article{DBLP:journals/jota/BhatnagarL12,
  author       = {Shalabh Bhatnagar and
                  K. Lakshmanan},
  title        = {An Online Actor-Critic Algorithm with Function Approximation for Constrained
                  {Markov} Decision Processes},
  journal      = {J. Optim. Theory Appl.},
  volume       = {153},
  number       = {3},
  pages        = {688--708},
  year         = {2012},
  url          = {https://doi.org/10.1007/s10957-012-9989-5},
  doi          = {10.1007/S10957-012-9989-5},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jota/BhatnagarL12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (IEEE Trans. Veh. Technol. 61(9), 2012): threshold tuning via stochastic optimization for graded signal control.
@article{DBLP:journals/tvt/PrashanthB12,
  author = {Prashanth L. A. and Shalabh Bhatnagar},
  title = {Threshold Tuning Using Stochastic Optimization for Graded Signal Control},
  journal = {{IEEE} Trans. Veh. Technol.},
  volume = {61},
  number = {9},
  pages = {3865--3880},
  year = {2012},
  url = {https://doi.org/10.1109/TVT.2012.2209904},
  doi = {10.1109/TVT.2012.2209904},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/tvt/PrashanthB12.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% Allerton 2012 conference paper: Q-learning with function approximation for constrained MDPs.
% {Q-learning} and {Markov} are braced so their capitals survive sentence-casing styles.
@inproceedings{DBLP:conf/allerton/LakshmananB12,
  author       = {K. Lakshmanan and
                  Shalabh Bhatnagar},
  title        = {A novel {Q-learning} algorithm with function approximation for constrained
                  {Markov} decision processes},
  booktitle    = {50th Annual Allerton Conference on Communication, Control, and Computing,
                  Allerton 2012, Allerton Park {\&} Retreat Center, Monticello,
                  IL, USA, October 1-5, 2012},
  pages        = {400--405},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/Allerton.2012.6483246},
  doi          = {10.1109/ALLERTON.2012.6483246},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/allerton/LakshmananB12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% ISIT 2012 conference paper: q-Gaussian based smoothed functional algorithms for stochastic optimization.
% {q-Gaussian} is braced so its lowercase q and capital G both survive style recasing.
@inproceedings{DBLP:conf/isit/GhoshdastidarDB12,
  author       = {Debarghya Ghoshdastidar and
                  Ambedkar Dukkipati and
                  Shalabh Bhatnagar},
  title        = {{q-Gaussian} based Smoothed Functional algorithms for stochastic optimization},
  booktitle    = {Proceedings of the 2012 {IEEE} International Symposium on Information
                  Theory, {ISIT} 2012, Cambridge, MA, USA, July 1-6, 2012},
  pages        = {1059--1063},
  publisher    = {{IEEE}},
  year         = {2012},
  url          = {https://doi.org/10.1109/ISIT.2012.6283013},
  doi          = {10.1109/ISIT.2012.6283013},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/isit/GhoshdastidarDB12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1202.5665): q-Gaussian based smoothed functional algorithm for stochastic optimization.
% {q-Gaussian} is braced so its lowercase q and capital G both survive style recasing.
@article{DBLP:journals/corr/abs-1202-5665,
  author       = {Debarghya Ghoshdastidar and
                  Ambedkar Dukkipati and
                  Shalabh Bhatnagar},
  title        = {{q-Gaussian} based Smoothed Functional Algorithm for Stochastic Optimization},
  journal      = {CoRR},
  volume       = {abs/1202.5665},
  year         = {2012},
  url          = {http://arxiv.org/abs/1202.5665},
  eprinttype   = {arXiv},
  eprint       = {1202.5665},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1202-5665.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% arXiv preprint (CoRR abs/1206.4832): smoothed functional algorithms using q-Gaussian distributions.
% {q-Gaussian} is braced so its lowercase q and capital G both survive style recasing.
@article{DBLP:journals/corr/abs-1206-4832,
  author       = {Debarghya Ghoshdastidar and
                  Ambedkar Dukkipati and
                  Shalabh Bhatnagar},
  title        = {Smoothed Functional Algorithms for Stochastic Optimization using {q-Gaussian}
                  Distributions},
  journal      = {CoRR},
  volume       = {abs/1206.4832},
  year         = {2012},
  url          = {http://arxiv.org/abs/1206.4832},
  eprinttype   = {arXiv},
  eprint       = {1206.4832},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1206-4832.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (Syst. Control. Lett. 60(7), 2011): the Borkar-Meyn theorem for asynchronous stochastic approximations.
% {Borkar-Meyn} is braced so both surnames keep their capitals under sentence-casing styles.
@article{DBLP:journals/scl/Bhatnagar11,
  author       = {Shalabh Bhatnagar},
  title        = {The {Borkar-Meyn} theorem for asynchronous stochastic approximations},
  journal      = {Syst. Control. Lett.},
  volume       = {60},
  number       = {7},
  pages        = {472--478},
  year         = {2011},
  url          = {https://doi.org/10.1016/j.sysconle.2011.04.002},
  doi          = {10.1016/J.SYSCONLE.2011.04.002},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/scl/Bhatnagar11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (IEEE Trans Autom. Sci. Eng. 8(4), 2011): stochastic algorithms for discrete parameter simulation optimization.
@article{DBLP:journals/tase/BhatnagarMH11,
  author = {Shalabh Bhatnagar and Vivek Kumar Mishra and N. Hemachandra},
  title = {Stochastic Algorithms for Discrete Parameter Simulation Optimization},
  journal = {{IEEE} Trans Autom. Sci. Eng.},
  volume = {8},
  number = {4},
  pages = {780--793},
  year = {2011},
  url = {https://doi.org/10.1109/TASE.2011.2159375},
  doi = {10.1109/TASE.2011.2159375},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/tase/BhatnagarMH11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (IEEE Trans. Commun. 59(6), 2011): an optimized SDE model for slotted Aloha.
% {Aloha} is braced, like the already-protected {SDE}, so the protocol name keeps its capital.
@article{DBLP:journals/tcom/KarmeshuBM11,
  author       = {Karmeshu and
                  Shalabh Bhatnagar and
                  Vivek Kumar Mishra},
  title        = {An Optimized {SDE} Model for Slotted {Aloha}},
  journal      = {{IEEE} Trans. Commun.},
  volume       = {59},
  number       = {6},
  pages        = {1502--1508},
  year         = {2011},
  url          = {https://doi.org/10.1109/TCOMM.2011.041111.090113},
  doi          = {10.1109/TCOMM.2011.041111.090113},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tcom/KarmeshuBM11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (IEEE Trans. Intell. Transp. Syst. 12(2), 2011): reinforcement learning with function approximation for traffic signal control.
@article{DBLP:journals/tits/PrashanthB11,
  author = {Prashanth L. A. and Shalabh Bhatnagar},
  title = {Reinforcement Learning With Function Approximation for Traffic Signal Control},
  journal = {{IEEE} Trans. Intell. Transp. Syst.},
  volume = {12},
  number = {2},
  pages = {412--421},
  year = {2011},
  url = {https://doi.org/10.1109/TITS.2010.2091408},
  doi = {10.1109/TITS.2010.2091408},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/tits/PrashanthB11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (ACM Trans. Model. Comput. Simul. 21(3), 2011): stochastic approximation for constrained simulation optimization.
% The pages value uses the article-number form 15:1--15:22.
@article{DBLP:journals/tomacs/BhatnagarHM11,
  author = {Shalabh Bhatnagar and N. Hemachandra and Vivek Kumar Mishra},
  title = {Stochastic approximation algorithms for constrained optimization via simulation},
  journal = {{ACM} Trans. Model. Comput. Simul.},
  volume = {21},
  number = {3},
  pages = {15:1--15:22},
  year = {2011},
  url = {https://doi.org/10.1145/1921598.1921599},
  doi = {10.1145/1921598.1921599},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/tomacs/BhatnagarHM11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% ICDCIT 2011 conference paper (LNCS 6536): smoothed functional and quasi-Newton routing algorithms.
% {Quasi-Newton} is braced so the proper noun keeps its capital under sentence-casing styles.
% The escaped underscore in url/doi is kept exactly as recorded.
@inproceedings{DBLP:conf/icdcit/LakshmananB11,
  author       = {K. Lakshmanan and
                  Shalabh Bhatnagar},
  editor       = {Raja Natarajan and
                  Adegboyega K. Ojo},
  title        = {Smoothed Functional and {Quasi-Newton} Algorithms for Routing in Multi-stage
                  Queueing Network with Constraints},
  booktitle    = {Distributed Computing and Internet Technology - 7th International
                  Conference, {ICDCIT} 2011, Bhubaneshwar, India, February 9-12, 2011.
                  Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {6536},
  pages        = {175--186},
  publisher    = {Springer},
  year         = {2011},
  url          = {https://doi.org/10.1007/978-3-642-19056-8\_12},
  doi          = {10.1007/978-3-642-19056-8\_12},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icdcit/LakshmananB11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% ICSOC 2011 conference paper (LNCS 7084): stochastic optimization for adaptive labor staffing in service systems.
% The escaped underscore in url/doi is kept exactly as recorded.
@inproceedings{DBLP:conf/icsoc/PrashanthPDBD11,
  author = {Prashanth L. A. and H. L. Prasad and Nirmit Desai and Shalabh Bhatnagar and Gargi Banerjee Dasgupta},
  editor = {Gerti Kappel and Zakaria Maamar and Hamid R. Motahari Nezhad},
  title = {Stochastic Optimization for Adaptive Labor Staffing in Service Systems},
  booktitle = {Service-Oriented Computing - 9th International Conference, {ICSOC} 2011, Paphos, Cyprus, December 5-8, 2011 Proceedings},
  series = {Lecture Notes in Computer Science},
  volume = {7084},
  pages = {487--494},
  publisher = {Springer},
  year = {2011},
  url = {https://doi.org/10.1007/978-3-642-25535-9\_33},
  doi = {10.1007/978-3-642-25535-9\_33},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icsoc/PrashanthPDBD11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% ITSC 2011 conference paper: average-cost reinforcement learning for adaptive traffic light control.
@inproceedings{DBLP:conf/itsc/AB11,
  author = {Prashanth L. A. and Shalabh Bhatnagar},
  title = {Reinforcement learning with average cost for adaptive control of traffic lights at intersections},
  booktitle = {14th International {IEEE} Conference on Intelligent Transportation Systems, {ITSC} 2011, Washington, DC, USA, October 5-7, 2011},
  pages = {1640--1645},
  publisher = {{IEEE}},
  year = {2011},
  url = {https://doi.org/10.1109/ITSC.2011.6082823},
  doi = {10.1109/ITSC.2011.6082823},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/itsc/AB11.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (Syst. Control. Lett. 59(12), 2010): actor-critic algorithm for discounted cost constrained MDPs.
% {Markov} is braced so the proper noun keeps its capital under sentence-casing styles.
@article{DBLP:journals/scl/Bhatnagar10,
  author       = {Shalabh Bhatnagar},
  title        = {An actor-critic algorithm with function approximation for discounted
                  cost constrained {Markov} decision processes},
  journal      = {Syst. Control. Lett.},
  volume       = {59},
  number       = {12},
  pages        = {760--766},
  year         = {2010},
  url          = {https://doi.org/10.1016/j.sysconle.2010.08.013},
  doi          = {10.1016/J.SYSCONLE.2010.08.013},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/scl/Bhatnagar10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (Simul. 86(4), 2010): optimized retransmission-probability policies for slotted Aloha.
% {Aloha} is braced so the protocol name keeps its capital under sentence-casing styles.
@article{DBLP:journals/simulation/ChakrabortyB10,
  author       = {Anshuk Chakraborty and
                  Shalabh Bhatnagar},
  title        = {Optimized Policies for the Retransmission Probabilities in Slotted
                  {Aloha}},
  journal      = {Simul.},
  volume       = {86},
  number       = {4},
  pages        = {247--261},
  year         = {2010},
  url          = {https://doi.org/10.1177/0037549709349324},
  doi          = {10.1177/0037549709349324},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/simulation/ChakrabortyB10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (Wirel. Networks 16(7), 2010): scheduling algorithm for bluetooth piconets and scatternets.
% NOTE(review): the title records "bluetooth" in lowercase; confirm against the publisher before recasing.
@article{DBLP:journals/winet/ReddyBRC10,
  author = {G. Ramana Reddy and Shalabh Bhatnagar and V. Rakesh and Vijay Prakash Chaturvedi},
  title = {An efficient algorithm for scheduling in bluetooth piconets and scatternets},
  journal = {Wirel. Networks},
  volume = {16},
  number = {7},
  pages = {1799--1816},
  year = {2010},
  url = {https://doi.org/10.1007/s11276-009-0229-3},
  doi = {10.1007/S11276-009-0229-3},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/winet/ReddyBRC10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% ICML 2010 conference paper: off-policy learning control with function approximation. No DOI is recorded; the url is a direct PDF link.
@inproceedings{DBLP:conf/icml/MaeiSBS10,
  author = {Hamid Reza Maei and Csaba Szepesv{\'{a}}ri and Shalabh Bhatnagar and Richard S. Sutton},
  editor = {Johannes F{\"{u}}rnkranz and Thorsten Joachims},
  title = {Toward Off-Policy Learning Control with Function Approximation},
  booktitle = {Proceedings of the 27th International Conference on Machine Learning (ICML-10), June 21-24, 2010, Haifa, Israel},
  pages = {719--726},
  publisher = {Omnipress},
  year = {2010},
  url = {https://icml.cc/Conferences/2010/papers/627.pdf},
  timestamp = {Wed, 03 Apr 2019 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icml/MaeiSBS10.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (Autom. 45(11), 2009): natural actor-critic algorithms.
@article{DBLP:journals/automatica/BhatnagarSGL09,
  author = {Shalabh Bhatnagar and Richard S. Sutton and Mohammad Ghavamzadeh and Mark Lee},
  title = {Natural actor-critic algorithms},
  journal = {Autom.},
  volume = {45},
  number = {11},
  pages = {2471--2482},
  year = {2009},
  url = {https://doi.org/10.1016/j.automatica.2009.07.008},
  doi = {10.1016/J.AUTOMATICA.2009.07.008},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/automatica/BhatnagarSGL09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (IEEE Commun. Lett. 13(10), 2009): convergence proof for the B-RED and P-RED algorithms.
@article{DBLP:journals/icl/BhatnagarP09,
  author = {Shalabh Bhatnagar and Rajesh Kumar Patro},
  title = {A proof of convergence of the {B-RED} and {P-RED} algorithms for random early detection},
  journal = {{IEEE} Commun. Lett.},
  volume = {13},
  number = {10},
  pages = {809--811},
  year = {2009},
  url = {https://doi.org/10.1109/LCOMM.2009.091276},
  doi = {10.1109/LCOMM.2009.091276},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/icl/BhatnagarP09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (Perform. Evaluation 66(2), 2009): probabilistic constrained nonlinear optimization of RED parameters.
@article{DBLP:journals/pe/PatroB09,
  author = {Rajesh Kumar Patro and Shalabh Bhatnagar},
  title = {A probabilistic constrained nonlinear optimization framework to optimize {RED} parameters},
  journal = {Perform. Evaluation},
  volume = {66},
  number = {2},
  pages = {81--104},
  year = {2009},
  url = {https://doi.org/10.1016/j.peva.2008.09.003},
  doi = {10.1016/J.PEVA.2008.09.003},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/journals/pe/PatroB09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (ACM Trans. Model. Comput. Simul. 19(2), 2009): parameter trajectory estimation in parameterized SDEs.
% {SDEs} is braced so the acronym is not lowercased by sentence-casing styles.
@article{DBLP:journals/tomacs/BhatnagarKM09,
  author       = {Shalabh Bhatnagar and
                  Karmeshu and
                  Vivek Kumar Mishra},
  title        = {Optimal parameter trajectory estimation in parameterized {SDEs}: An
                  algorithmic procedure},
  journal      = {{ACM} Trans. Model. Comput. Simul.},
  volume       = {19},
  number       = {2},
  pages        = {8:1--8:27},
  year         = {2009},
  url          = {https://doi.org/10.1145/1502787.1502791},
  doi          = {10.1145/1502787.1502791},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tomacs/BhatnagarKM09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% CDC 2009 conference paper: LMS-2, an algorithm positioned between LMS and RLS in cost and efficiency.
% The booktitle reads "combined with the 28th Chinese Control Conference".
@inproceedings{DBLP:conf/cdc/YaoBS09,
  author       = {Hengshuai Yao and
                  Shalabh Bhatnagar and
                  Csaba Szepesv{\'{a}}ri},
  title        = {{LMS-2:} Towards an algorithm that is as cheap as {LMS} and almost
                  as efficient as {RLS}},
  booktitle    = {Proceedings of the 48th {IEEE} Conference on Decision and Control,
                  {CDC} 2009, combined with the 28th Chinese Control Conference, December
                  16-18, 2009, Shanghai, China},
  pages        = {1181--1188},
  publisher    = {{IEEE}},
  year         = {2009},
  url          = {https://doi.org/10.1109/CDC.2009.5400370},
  doi          = {10.1109/CDC.2009.5400370},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cdc/YaoBS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% ICML 2009 conference paper (ACM ICPS vol. 382): fast gradient-descent methods for temporal-difference learning.
@inproceedings{DBLP:conf/icml/SuttonMPBSSW09,
  author = {Richard S. Sutton and Hamid Reza Maei and Doina Precup and Shalabh Bhatnagar and David Silver and Csaba Szepesv{\'{a}}ri and Eric Wiewiora},
  editor = {Andrea Pohoreckyj Danyluk and L{\'{e}}on Bottou and Michael L. Littman},
  title = {Fast gradient-descent methods for temporal-difference learning with linear function approximation},
  booktitle = {Proceedings of the 26th Annual International Conference on Machine Learning, {ICML} 2009, Montreal, Quebec, Canada, June 14-18, 2009},
  series = {{ACM} International Conference Proceeding Series},
  volume = {382},
  pages = {993--1000},
  publisher = {{ACM}},
  year = {2009},
  url = {https://doi.org/10.1145/1553374.1553501},
  doi = {10.1145/1553374.1553501},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl = {https://dblp.org/rec/conf/icml/SuttonMPBSSW09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% NeurIPS 2009 (NIPS 22) conference paper: convergent temporal-difference learning with smooth function approximation.
% No DOI is recorded; the url points to the proceedings site.
@inproceedings{DBLP:conf/nips/MaeiSBPSS09,
  author = {Hamid Reza Maei and Csaba Szepesv{\'{a}}ri and Shalabh Bhatnagar and Doina Precup and David Silver and Richard S. Sutton},
  editor = {Yoshua Bengio and Dale Schuurmans and John D. Lafferty and Christopher K. I. Williams and Aron Culotta},
  title = {Convergent Temporal-Difference Learning with Arbitrary Smooth Function Approximation},
  booktitle = {Advances in Neural Information Processing Systems 22: 23rd Annual Conference on Neural Information Processing Systems 2009. Proceedings of a meeting held 7-10 December 2009, Vancouver, British Columbia, Canada},
  pages = {1204--1212},
  publisher = {Curran Associates, Inc.},
  year = {2009},
  url = {https://proceedings.neurips.cc/paper/2009/hash/3a15c7d0bbe60300a39f76f8a5ba6896-Abstract.html},
  timestamp = {Mon, 16 May 2022 15:41:51 +0200},
  biburl = {https://dblp.org/rec/conf/nips/MaeiSBPSS09.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}

% NeurIPS 2009 (NIPS 22) conference paper: multi-step Dyna planning for policy evaluation and control.
% {Dyna} is braced so the architecture name keeps its capital under sentence-casing styles.
@inproceedings{DBLP:conf/nips/YaoSBDS09,
  author       = {Hengshuai Yao and
                  Richard S. Sutton and
                  Shalabh Bhatnagar and
                  Diao Dongcui and
                  Csaba Szepesv{\'{a}}ri},
  editor       = {Yoshua Bengio and
                  Dale Schuurmans and
                  John D. Lafferty and
                  Christopher K. I. Williams and
                  Aron Culotta},
  title        = {Multi-Step {Dyna} Planning for Policy Evaluation and Control},
  booktitle    = {Advances in Neural Information Processing Systems 22: 23rd Annual
                  Conference on Neural Information Processing Systems 2009. Proceedings
                  of a meeting held 7-10 December 2009, Vancouver, British Columbia,
                  Canada},
  pages        = {2187--2195},
  publisher    = {Curran Associates, Inc.},
  year         = {2009},
  url          = {https://proceedings.neurips.cc/paper/2009/hash/c52f1bd66cc19d05628bd8bf27af3ad6-Abstract.html},
  timestamp    = {Thu, 21 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/nips/YaoSBDS09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Encyclopedia chapter (IGI Global, 2009): pattern synthesis for nonparametric pattern recognition.
% The booktitle parenthetical is written as plain text, with no brace group splitting "(4 Volumes)".
@incollection{DBLP:reference/dataware/ViswanathMB09,
  author       = {P. Viswanath and
                  M. Narasimha Murty and
                  Shalabh Bhatnagar},
  editor       = {John Wang},
  title        = {Pattern Synthesis for Nonparametric Pattern Recognition},
  booktitle    = {Encyclopedia of Data Warehousing and Mining, Second Edition (4 Volumes)},
  pages        = {1511--1516},
  publisher    = {{IGI} Global},
  year         = {2009},
  url          = {http://www.igi-global.com/Bookstore/Chapter.aspx?TitleId=11020},
  timestamp    = {Wed, 12 Jul 2017 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/reference/dataware/ViswanathMB09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

% Journal article (Autom. 44(4), 2008): new algorithms of the Q-learning type.
% {Q-learning} is braced so the capital Q survives sentence-casing styles.
@article{DBLP:journals/automatica/BhatnagarB08,
  author       = {Shalabh Bhatnagar and
                  K. Mohan Babu},
  title        = {New algorithms of the {Q-learning} type},
  journal      = {Autom.},
  volume       = {44},
  number       = {4},
  pages        = {1111--1119},
  year         = {2008},
  url          = {https://doi.org/10.1016/j.automatica.2007.09.009},
  doi          = {10.1016/J.AUTOMATICA.2007.09.009},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/automatica/BhatnagarB08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/mms/VelusamyGBV08,
  author       = {Velusamy, Sudha and
                  Gopal, Lakshmi and
                  Bhatnagar, Shalabh and
                  Varadarajan, Sridhar},
  title        = {An efficient ad recommendation system for {TV} programs},
  journal      = {Multim. Syst.},
  volume       = {14},
  number       = {2},
  pages        = {73--87},
  year         = {2008},
  url          = {https://doi.org/10.1007/s00530-008-0117-1},
  doi          = {10.1007/S00530-008-0117-1},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/mms/VelusamyGBV08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/simulation/BhatnagarA08,
  author       = {Bhatnagar, Shalabh and
                  Abdulla, Mohammed Shahid},
  title        = {Simulation-Based Optimization Algorithms for Finite-Horizon {Markov}
                  Decision Processes},
  journal      = {Simul.},
  volume       = {84},
  number       = {12},
  pages        = {577--600},
  year         = {2008},
  url          = {https://doi.org/10.1177/0037549708098120},
  doi          = {10.1177/0037549708098120},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/simulation/BhatnagarA08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/mmsp/VelusamyBBS08,
  author       = {Velusamy, Sudha and
                  Bhatnagar, Shalabh and
                  Basavaraja, S. V. and
                  Sridhar, V.},
  title        = {{SPSA} based feature relevance estimation for video retrieval},
  booktitle    = {International Workshop on Multimedia Signal Processing, {MMSP} 2008,
                  October 8-10, 2008, Shangri-la Hotel, Cairns, Queensland, Australia},
  pages        = {598--603},
  publisher    = {{IEEE} Signal Processing Society},
  year         = {2008},
  url          = {https://doi.org/10.1109/MMSP.2008.4665147},
  doi          = {10.1109/MMSP.2008.4665147},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/mmsp/VelusamyBBS08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/netcoop/KolavaliB08,
  author       = {Kolavali, Sudha Rani and
                  Bhatnagar, Shalabh},
  editor       = {Altman, Eitan and
                  Chaintreau, Augustin},
  title        = {Ant Colony Optimization Algorithms for Shortest Path Problems},
  booktitle    = {Network Control and Optimization, Second Euro-NF Workshop, {NET-COOP}
                  2008, Paris, France, September 8-10, 2008. Revised Selected Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {5425},
  pages        = {37--44},
  publisher    = {Springer},
  year         = {2008},
  url          = {https://doi.org/10.1007/978-3-642-00393-6\_5},
  doi          = {10.1007/978-3-642-00393-6\_5},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/netcoop/KolavaliB08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/deds/AbdullaB07,
  author       = {Abdulla, Mohammed Shahid and
                  Bhatnagar, Shalabh},
  title        = {Reinforcement Learning Based Algorithms for Average Cost {Markov} Decision
                  Processes},
  journal      = {Discret. Event Dyn. Syst.},
  volume       = {17},
  number       = {1},
  pages        = {23--52},
  year         = {2007},
  url          = {https://doi.org/10.1007/s10626-006-0003-y},
  doi          = {10.1007/S10626-006-0003-Y},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/deds/AbdullaB07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/isci/DukkipatiBM07,
  author       = {Dukkipati, Ambedkar and
                  Bhatnagar, Shalabh and
                  Murty, M. Narasimha},
  title        = {{Gelfand-Yaglom-Perez} theorem for generalized relative entropy functionals},
  journal      = {Inf. Sci.},
  volume       = {177},
  number       = {24},
  pages        = {5707--5714},
  year         = {2007},
  url          = {https://doi.org/10.1016/j.ins.2007.07.017},
  doi          = {10.1016/J.INS.2007.07.017},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/isci/DukkipatiBM07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/tomacs/Bhatnagar07,
  author       = {Bhatnagar, Shalabh},
  title        = {Adaptive {Newton}-based multivariate smoothed functional algorithms
                  for simulation optimization},
  journal      = {{ACM} Trans. Model. Comput. Simul.},
  volume       = {18},
  number       = {1},
  pages        = {2:1--2:35},
  year         = {2007},
  url          = {https://doi.org/10.1145/1315575.1315577},
  doi          = {10.1145/1315575.1315577},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tomacs/Bhatnagar07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acc/AbdullaB07,
  author       = {Abdulla, Mohammed Shahid and
                  Bhatnagar, Shalabh},
  title        = {Parametrized Actor-Critic Algorithms for Finite-Horizon {MDPs}},
  booktitle    = {American Control Conference, {ACC} 2007, New York, NY, USA, 9-13 July,
                  2007},
  pages        = {534--539},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/ACC.2007.4282587},
  doi          = {10.1109/ACC.2007.4282587},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acc/AbdullaB07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/acc/AbdullaB07a,
  author       = {Abdulla, Mohammed Shahid and
                  Bhatnagar, Shalabh},
  title        = {Solving {MDPs} using Two-timescale Simulated Annealing with Multiplicative
                  Weights},
  booktitle    = {American Control Conference, {ACC} 2007, New York, NY, USA, 9-13 July,
                  2007},
  pages        = {2428--2433},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/ACC.2007.4282586},
  doi          = {10.1109/ACC.2007.4282586},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/acc/AbdullaB07a.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cdc/VemuBH07,
  author       = {Vemu, Koteswara Rao and
                  Bhatnagar, Shalabh and
                  Hemachandra, N.},
  title        = {Link route pricing for enhanced {QoS}},
  booktitle    = {46th {IEEE} Conference on Decision and Control, {CDC} 2007, New Orleans,
                  LA, USA, December 12-14, 2007},
  pages        = {1504--1509},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/CDC.2007.4434595},
  doi          = {10.1109/CDC.2007.4434595},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cdc/VemuBH07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cdc/MishraBH07,
  author       = {Mishra, Vivek Kumar and
                  Bhatnagar, Shalabh and
                  Hemachandra, N.},
  title        = {Discrete parameter simulation optimization algorithms with applications
                  to admission control with dependent service times},
  booktitle    = {46th {IEEE} Conference on Decision and Control, {CDC} 2007, New Orleans,
                  LA, USA, December 12-14, 2007},
  pages        = {2986--2991},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/CDC.2007.4434229},
  doi          = {10.1109/CDC.2007.4434229},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cdc/MishraBH07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cdc/AbdullaB07,
  author       = {Abdulla, Mohammed Shahid and
                  Bhatnagar, Shalabh},
  title        = {Network flow-control using asynchronous stochastic approximation},
  booktitle    = {46th {IEEE} Conference on Decision and Control, {CDC} 2007, New Orleans,
                  LA, USA, December 12-14, 2007},
  pages        = {5857--5862},
  publisher    = {{IEEE}},
  year         = {2007},
  url          = {https://doi.org/10.1109/CDC.2007.4434593},
  doi          = {10.1109/CDC.2007.4434593},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cdc/AbdullaB07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/euroitv/VelusamyGVB07,
  author       = {Velusamy, Sudha and
                  Gopal, Lakshmi and
                  Varadarajan, Sridhar and
                  Bhatnagar, Shalabh},
  editor       = {C{\'{e}}sar, Pablo and
                  Chorianopoulos, Konstantinos and
                  Jensen, Jens F.},
  title        = {Fuzzy Clustering Based Ad Recommendation for {TV} Programs},
  booktitle    = {Interactive {TV:} a Shared Experience, 5th European Conference, EuroITV
                  2007, Amsterdam, The Netherlands, May 24-25, 2007, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {4471},
  pages        = {175--184},
  publisher    = {Springer},
  year         = {2007},
  url          = {https://doi.org/10.1007/978-3-540-72559-6\_19},
  doi          = {10.1007/978-3-540-72559-6\_19},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/euroitv/VelusamyGVB07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icdcit/ChaturvediRB07,
  author       = {Chaturvedi, Vijay Prakash and
                  Rakesh, V. and
                  Bhatnagar, Shalabh},
  editor       = {Janowski, Tomasz and
                  Mohanty, Hrushikesha},
  title        = {An Efficient and Optimized {Bluetooth} Scheduling Algorithm for Piconets},
  booktitle    = {Distributed Computing and Internet Technology, 4th International Conference,
                  {ICDCIT} 2007, Bangalore, India, December 17-20, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {4882},
  pages        = {19--30},
  publisher    = {Springer},
  year         = {2007},
  url          = {https://doi.org/10.1007/978-3-540-77115-9\_2},
  doi          = {10.1007/978-3-540-77115-9\_2},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icdcit/ChaturvediRB07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icdcit/VemuBH07,
  author       = {Vemu, Koteswara Rao and
                  Bhatnagar, Shalabh and
                  Hemachandra, N.},
  editor       = {Janowski, Tomasz and
                  Mohanty, Hrushikesha},
  title        = {An Optimal Weighted-Average Congestion Based Pricing Scheme for Enhanced
                  {QoS}},
  booktitle    = {Distributed Computing and Internet Technology, 4th International Conference,
                  {ICDCIT} 2007, Bangalore, India, December 17-20, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {4882},
  pages        = {135--145},
  publisher    = {Springer},
  year         = {2007},
  url          = {https://doi.org/10.1007/978-3-540-77115-9\_14},
  doi          = {10.1007/978-3-540-77115-9\_14},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icdcit/VemuBH07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/nips/BhatnagarSGL07,
  author       = {Bhatnagar, Shalabh and
                  Sutton, Richard S. and
                  Ghavamzadeh, Mohammad and
                  Lee, Mark},
  editor       = {Platt, John C. and
                  Koller, Daphne and
                  Singer, Yoram and
                  Roweis, Sam T.},
  title        = {Incremental Natural Actor-Critic Algorithms},
  booktitle    = {Advances in Neural Information Processing Systems 20, Proceedings
                  of the Twenty-First Annual Conference on Neural Information Processing
                  Systems, Vancouver, British Columbia, Canada, December 3-6, 2007},
  pages        = {105--112},
  publisher    = {Curran Associates, Inc.},
  year         = {2007},
  url          = {https://proceedings.neurips.cc/paper/2007/hash/6883966fd8f918a4aa29be29d2c386fb-Abstract.html},
  timestamp    = {Mon, 16 May 2022 15:41:51 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/BhatnagarSGL07.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/automatica/BhatnagarP06,
  author       = {Bhatnagar, Shalabh and
                  Panigrahi, J. Ranjan},
  title        = {Actor-critic algorithms for hierarchical {Markov} decision processes},
  journal      = {Autom.},
  volume       = {42},
  number       = {4},
  pages        = {637--644},
  year         = {2006},
  url          = {https://doi.org/10.1016/j.automatica.2005.12.010},
  doi          = {10.1016/J.AUTOMATICA.2005.12.010},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/automatica/BhatnagarP06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/jmlr/BhatnagarBA06,
  author       = {Bhatnagar, Shalabh and
                  Borkar, Vivek S. and
                  Akarapu, Madhukar},
  title        = {A Simulation-Based Algorithm for Ergodic Control of {Markov} Chains
                  Conditioned on Rare Events},
  journal      = {J. Mach. Learn. Res.},
  volume       = {7},
  pages        = {1937--1962},
  year         = {2006},
  url          = {http://jmlr.org/papers/v7/bhatnagar06a.html},
  timestamp    = {Wed, 10 Jul 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/jmlr/BhatnagarBA06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/prl/ViswanathMB06,
  author       = {Viswanath, P. and
                  Murty, M. Narasimha and
                  Bhatnagar, Shalabh},
  title        = {Partition based pattern synthesis technique with efficient algorithms
                  for nearest neighbor classification},
  journal      = {Pattern Recognit. Lett.},
  volume       = {27},
  number       = {14},
  pages        = {1714--1724},
  year         = {2006},
  url          = {https://doi.org/10.1016/j.patrec.2006.04.015},
  doi          = {10.1016/J.PATREC.2006.04.015},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/prl/ViswanathMB06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/telsys/VaidyaB06,
  author       = {Vaidya, Rahul and
                  Bhatnagar, Shalabh},
  title        = {Robust optimization of Random Early Detection},
  journal      = {Telecommun. Syst.},
  volume       = {33},
  number       = {4},
  pages        = {291--316},
  year         = {2006},
  url          = {https://doi.org/10.1007/s11235-006-9020-2},
  doi          = {10.1007/S11235-006-9020-2},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/telsys/VaidyaB06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cdc/PatroB06,
  author       = {Patro, Rajesh Kumar and
                  Bhatnagar, Shalabh},
  title        = {A Four-Timescale Algorithm for Constrained Stochastic Optimization
                  of {RED}},
  booktitle    = {45th {IEEE} Conference on Decision and Control, {CDC} 2006, San Diego,
                  CA, USA, December 13-15, 2006},
  pages        = {1930--1935},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/CDC.2006.377655},
  doi          = {10.1109/CDC.2006.377655},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cdc/PatroB06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cdc/BhatnagarA06,
  author       = {Bhatnagar, Shalabh and
                  Abdulla, Mohammed Shahid},
  title        = {A Reinforcement Learning Based Algorithm for Finite Horizon {Markov}
                  Decision Processes},
  booktitle    = {45th {IEEE} Conference on Decision and Control, {CDC} 2006, San Diego,
                  CA, USA, December 13-15, 2006},
  pages        = {5519--5524},
  publisher    = {{IEEE}},
  year         = {2006},
  url          = {https://doi.org/10.1109/CDC.2006.377190},
  doi          = {10.1109/CDC.2006.377190},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cdc/BhatnagarA06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/wsc/AbdullaB06,
  author       = {Abdulla, Mohammed Shahid and
                  Bhatnagar, Shalabh},
  editor       = {Perrone, L. Felipe and
                  Lawson, Barry and
                  Liu, Jason and
                  Wieland, Frederick P.},
  title        = {{SPSA} algorithms with measurement reuse},
  booktitle    = {Proceedings of the Winter Simulation Conference {WSC} 2006, Monterey,
                  California, USA, December 3-6, 2006},
  pages        = {320--328},
  publisher    = {{IEEE} Computer Society},
  year         = {2006},
  url          = {https://doi.org/10.1109/WSC.2006.323089},
  doi          = {10.1109/WSC.2006.323089},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/wsc/AbdullaB06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-cs-0601080,
  author       = {Dukkipati, Ambedkar and
                  Murty, M. Narasimha and
                  Bhatnagar, Shalabh},
  title        = {On Measure Theoretic definitions of Generalized Information Measures
                  and Maximum Entropy Prescriptions},
  journal      = {CoRR},
  volume       = {abs/cs/0601080},
  year         = {2006},
  url          = {http://arxiv.org/abs/cs/0601080},
  eprinttype   = {arXiv},
  eprint       = {cs/0601080},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-cs-0601080.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/pr/ViswanathMB05,
  author       = {Viswanath, P. and
                  Murty, M. Narasimha and
                  Bhatnagar, Shalabh},
  title        = {Overlap pattern synthesis with an efficient nearest neighbor classifier},
  journal      = {Pattern Recognit.},
  volume       = {38},
  number       = {8},
  pages        = {1187--1195},
  year         = {2005},
  url          = {https://doi.org/10.1016/j.patcog.2004.10.007},
  doi          = {10.1016/J.PATCOG.2004.10.007},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pr/ViswanathMB05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/simulation/BhatnagarK05,
  author       = {Bhatnagar, Shalabh and
                  Kowshik, Hemant J.},
  title        = {A Discrete Parameter Stochastic Approximation Algorithm for Simulation
                  Optimization},
  journal      = {Simul.},
  volume       = {81},
  number       = {11},
  pages        = {757--772},
  year         = {2005},
  url          = {https://doi.org/10.1177/0037549705062294},
  doi          = {10.1177/0037549705062294},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/simulation/BhatnagarK05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/telsys/BhatnagarR05,
  author       = {Bhatnagar, Shalabh and
                  Reddy, I. Bala Bhaskar},
  title        = {Optimal Threshold Policies for Admission Control in Communication
                  Networks via Discrete Parameter Stochastic Approximation},
  journal      = {Telecommun. Syst.},
  volume       = {29},
  number       = {1},
  pages        = {9--31},
  year         = {2005},
  url          = {https://doi.org/10.1007/s11235-005-6629-5},
  doi          = {10.1007/S11235-005-6629-5},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/telsys/BhatnagarR05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/tomacs/Bhatnagar05,
  author       = {Bhatnagar, Shalabh},
  title        = {Adaptive multivariate three-timescale stochastic approximation algorithms
                  for simulation based optimization},
  journal      = {{ACM} Trans. Model. Comput. Simul.},
  volume       = {15},
  number       = {1},
  pages        = {74--107},
  year         = {2005},
  url          = {https://doi.org/10.1145/1044322.1044326},
  doi          = {10.1145/1044322.1044326},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tomacs/Bhatnagar05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cec/DukkipatiMB05,
  author       = {Dukkipati, Ambedkar and
                  Murty, M. Narasimha and
                  Bhatnagar, Shalabh},
  title        = {Information theoretic justification of {Boltzmann} selection and its
                  generalization to {Tsallis} case},
  booktitle    = {Proceedings of the {IEEE} Congress on Evolutionary Computation, {CEC}
                  2005, 2-4 September 2005, Edinburgh, {UK}},
  pages        = {1667--1674},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://doi.org/10.1109/CEC.2005.1554889},
  doi          = {10.1109/CEC.2005.1554889},
  timestamp    = {Thu, 16 Dec 2021 13:59:05 +0100},
  biburl       = {https://dblp.org/rec/conf/cec/DukkipatiMB05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/ifip12/AbdullaB05,
  author       = {Abdulla, Mohammed Shahid and
                  Bhatnagar, Shalabh},
  editor       = {Li, Daoliang and
                  Wang, Baoji},
  title        = {Solution of {MDPs} Using Simulation-Based Value Iteration},
  booktitle    = {Artificial Intelligence Applications and Innovations - {IFIP} {TC12}
                  {WG12.5} - Second {IFIP} Conference on Artificial Intelligence Applications
                  and Innovations (AIAI2005), September 7-9, 2005, Beijing, China},
  series       = {{IFIP}},
  volume       = {187},
  pages        = {765--775},
  publisher    = {Springer},
  year         = {2005},
  url          = {https://doi.org/10.1007/0-387-29295-0\_83},
  doi          = {10.1007/0-387-29295-0\_83},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/ifip12/AbdullaB05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/isit/DukkipatiMB05,
  author       = {Dukkipati, Ambedkar and
                  Musti, Narasimha Murty and
                  Bhatnagar, Shalabh},
  title        = {Properties of {Kullback-Leibler} cross-entropy minimization in nonextensive
                  framework},
  booktitle    = {Proceedings of the 2005 {IEEE} International Symposium on Information
                  Theory, {ISIT} 2005, Adelaide, South Australia, Australia, 4-9 September
                  2005},
  pages        = {2374--2378},
  publisher    = {{IEEE}},
  year         = {2005},
  url          = {https://doi.org/10.1109/ISIT.2005.1523773},
  doi          = {10.1109/ISIT.2005.1523773},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/isit/DukkipatiMB05.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/abs-cs-0511078,
  author       = {Dukkipati, Ambedkar and
                  Murty, M. Narasimha and
                  Bhatnagar, Shalabh},
  title        = {Uniqueness of Nonextensive entropy under {Renyi's} Recipe},
  journal      = {CoRR},
  volume       = {abs/cs/0511078},
  year         = {2005},
  url          = {http://arxiv.org/abs/cs/0511078},
  eprinttype   = {arXiv},
  eprint       = {cs/0511078},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-cs-0511078.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/inffus/ViswanathMB04,
  author       = {Viswanath, P. and
                  Murty, M. Narasimha and
                  Bhatnagar, Shalabh},
  title        = {Fusion of multiple approximate nearest neighbor classifiers for fast
                  and efficient classification},
  journal      = {Inf. Fusion},
  volume       = {5},
  number       = {4},
  pages        = {239--250},
  year         = {2004},
  url          = {https://doi.org/10.1016/j.inffus.2004.02.003},
  doi          = {10.1016/J.INFFUS.2004.02.003},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/inffus/ViswanathMB04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/tac/BhatnagarK04,
  author       = {Bhatnagar, Shalabh and
                  Kumar, Shishir},
  title        = {A simultaneous perturbation stochastic approximation-based actor-critic
                  algorithm for {Markov} decision processes},
  journal      = {{IEEE} Trans. Autom. Control.},
  volume       = {49},
  number       = {4},
  pages        = {592--598},
  year         = {2004},
  url          = {https://doi.org/10.1109/TAC.2004.825622},
  doi          = {10.1109/TAC.2004.825622},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tac/BhatnagarK04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cdc/PanigrahiB04,
  author       = {Panigrahi, Jnana Ranjan and
                  Bhatnagar, Shalabh},
  title        = {Hierarchical decision making in semiconductor fabs using multi-time
                  scale {Markov} decision processes},
  booktitle    = {43rd {IEEE} Conference on Decision and Control, {CDC} 2004, Nassau,
                  Bahamas, December 14-17, 2004},
  pages        = {4387--4392},
  publisher    = {{IEEE}},
  year         = {2004},
  url          = {https://doi.org/10.1109/CDC.2004.1429441},
  doi          = {10.1109/CDC.2004.1429441},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cdc/PanigrahiB04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cec/DukkipatiMB04,
  author       = {Dukkipati, Ambedkar and
                  Murty, M. Narasimha and
                  Bhatnagar, Shalabh},
  title        = {{Cauchy} annealing schedule: an annealing schedule for {Boltzmann} selection
                  scheme in evolutionary algorithms},
  booktitle    = {Proceedings of the {IEEE} Congress on Evolutionary Computation, {CEC}
                  2004, 19-23 June 2004, Portland, OR, {USA}},
  pages        = {55--62},
  publisher    = {{IEEE}},
  year         = {2004},
  url          = {https://doi.org/10.1109/CEC.2004.1330837},
  doi          = {10.1109/CEC.2004.1330837},
  timestamp    = {Thu, 16 Dec 2021 13:58:46 +0100},
  biburl       = {https://dblp.org/rec/conf/cec/DukkipatiMB04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/icpr/ViswanathMB04,
  author       = {Viswanath, P. and
                  Murty, M. Narasimha and
                  Bhatnagar, Shalabh},
  title        = {A Pattern Synthesis Technique with an Efficient Nearest Neighbor Classifier
                  for Binary Pattern Recognition},
  booktitle    = {17th International Conference on Pattern Recognition, {ICPR} 2004,
                  Cambridge, UK, August 23-26, 2004},
  pages        = {416--419},
  publisher    = {{IEEE} Computer Society},
  year         = {2004},
  url          = {https://doi.org/10.1109/ICPR.2004.1333791},
  doi          = {10.1109/ICPR.2004.1333791},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icpr/ViswanathMB04.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/cs-AI-0407037,
  author       = {Dukkipati, Ambedkar and
                  Murty, M. Narasimha and
                  Bhatnagar, Shalabh},
  title        = {Generalized Evolutionary Algorithm based on {Tsallis} Statistics},
  journal      = {CoRR},
  volume       = {cs.AI/0407037},
  year         = {2004},
  url          = {http://arxiv.org/abs/cs.AI/0407037},
  doi          = {10.48550/ARXIV.CS/0407037},
  eprinttype   = {arXiv},
  eprint       = {cs/0407037},
  timestamp    = {Wed, 10 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/cs-AI-0407037.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/corr/cs-AI-0408055,
  author       = {Dukkipati, Ambedkar and
                  Murty, M. Narasimha and
                  Bhatnagar, Shalabh},
  title        = {{Cauchy} Annealing Schedule: An Annealing Schedule for {Boltzmann} Selection
                  Scheme in Evolutionary Algorithms},
  journal      = {CoRR},
  volume       = {cs.AI/0408055},
  year         = {2004},
  url          = {http://arxiv.org/abs/cs.AI/0408055},
  eprinttype   = {arXiv},
  eprint       = {cs/0408055},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/cs-AI-0408055.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/simulation/BhatnagarB03,
  author       = {Bhatnagar, Shalabh and
                  Borkar, Vivek S.},
  title        = {Multiscale Chaotic {SPSA} and Smoothed Functional Algorithms for Simulation
                  Optimization},
  journal      = {Simul.},
  volume       = {79},
  number       = {10},
  pages        = {568--580},
  year         = {2003},
  url          = {https://doi.org/10.1177/0037549703039988},
  doi          = {10.1177/0037549703039988},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/simulation/BhatnagarB03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/tomacs/BhatnagarFMW03,
  author       = {Bhatnagar, Shalabh and
                  Fu, Michael C. and
                  Marcus, Steven I. and
                  Wang, I{-}Jeng},
  title        = {Two-timescale simultaneous perturbation stochastic approximation using
                  deterministic perturbation sequences},
  journal      = {{ACM} Trans. Model. Comput. Simul.},
  volume       = {13},
  number       = {2},
  pages        = {180--209},
  year         = {2003},
  url          = {https://doi.org/10.1145/858481.858486},
  doi          = {10.1145/858481.858486},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tomacs/BhatnagarFMW03.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@inproceedings{DBLP:conf/cec/DukkipatiMB03,
  author    = {Dukkipati, Ambedkar and Murty, M. Narasimha and Bhatnagar, Shalabh},
  title     = {Quotient evolutionary space: abstraction of evolutionary process w.r.t macroscopic properties},
  booktitle = {Proceedings of the {IEEE} Congress on Evolutionary Computation, {CEC} 2003, Canberra, Australia, December 8-12, 2003},
  publisher = {{IEEE}},
  year      = {2003},
  pages     = {846--853},
  doi       = {10.1109/CEC.2003.1299755},
  url       = {https://doi.org/10.1109/CEC.2003.1299755},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/cec/DukkipatiMB03.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

% The proper noun Markov is brace-protected in the title below so that
% bibliography styles applying sentence casing do not lowercase it.
@article{DBLP:journals/automatica/CaoRBFM02,
  author       = {Xi{-}Ren Cao and
                  Zhiyuan Ren and
                  Shalabh Bhatnagar and
                  Michael C. Fu and
                  Steven I. Marcus},
  title        = {A time aggregation approach to {Markov} decision processes},
  journal      = {Autom.},
  volume       = {38},
  number       = {6},
  pages        = {929--943},
  year         = {2002},
  url          = {https://doi.org/10.1016/S0005-1098(01)00282-5},
  doi          = {10.1016/S0005-1098(01)00282-5},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/automatica/CaoRBFM02.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

@article{DBLP:journals/ton/BhatnagarFMF01,
  author    = {Bhatnagar, Shalabh and Fu, Michael C. and Marcus, Steven I. and Fard, Pedram Jaefari},
  title     = {Optimal structured feedback policies for {ABR} flow control using two-timescale {SPSA}},
  journal   = {{IEEE/ACM} Trans. Netw.},
  year      = {2001},
  volume    = {9},
  number    = {4},
  pages     = {479--491},
  doi       = {10.1109/90.944345},
  url       = {https://doi.org/10.1109/90.944345},
  timestamp = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/ton/BhatnagarFMF01.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org},
}

% The proper noun Markov is brace-protected in the title below so that
% bibliography styles applying sentence casing do not lowercase it.
% The doi field uses the same lowercase spelling as the url field
% (DOI names are case-insensitive, so both resolve to the same record).
@article{DBLP:journals/mor/BhatnagarB95,
  author       = {Shalabh Bhatnagar and
                  Vivek S. Borkar},
  title        = {A Convex Analytic Framework for Ergodic Control of Semi-{Markov} Processes},
  journal      = {Math. Oper. Res.},
  volume       = {20},
  number       = {4},
  pages        = {923--936},
  year         = {1995},
  url          = {https://doi.org/10.1287/moor.20.4.923},
  doi          = {10.1287/moor.20.4.923},
  timestamp    = {Sat, 09 Apr 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/mor/BhatnagarB95.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}

a service of

manage site settings

To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt in for them to become active. All settings here will be stored as cookies in your web browser. For more information, see our F.A.Q.