E. Bartocci, L. Bortolussi, T. Brázdil, D. Milios, G. Sanguinetti
{"title":"Policy Learning for Time-Bounded Reachability in Continuous-Time Markov Decision Processes via Doubly-Stochastic Gradient Ascent","authors":"E. Bartocci, L. Bortolussi, T. Brázdil, D. Milios, G. Sanguinetti","doi":"10.1007/978-3-319-43425-4_17","DOIUrl":null,"url":null,"abstract":"","PeriodicalId":150495,"journal":{"name":"International Conference on Quantitative Evaluation of Systems","volume":"20 1","pages":"0"},"PeriodicalIF":0.0000,"publicationDate":"2016-05-31","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":"8","resultStr":null,"platform":"Semanticscholar","paperid":null,"PeriodicalName":"International Conference on Quantitative Evaluation of Systems","FirstCategoryId":"1085","ListUrlMain":"https://doi.org/10.1007/978-3-319-43425-4_17","RegionNum":0,"RegionCategory":null,"ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":null,"EPubDate":"","PubModel":"","JCR":"","JCRName":"","Score":null,"Total":0}