{"title":"Unified Inter and Intra Options Learning Using Policy Gradient Methods","authors":"K. Levy, N. Shimkin","doi":"10.1007/978-3-642-29946-9_17","DOIUrl":"https://doi.org/10.1007/978-3-642-29946-9_17","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"9 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2011-09-09","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"123675822","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
A. Fachantidis, Ioannis Partalas, Matthew E. Taylor, I. Vlahavas
{"title":"Transfer Learning via Multiple Inter-task Mappings","authors":"A. Fachantidis, Ioannis Partalas, Matthew E. Taylor, I. Vlahavas","doi":"10.1007/978-3-642-29946-9_23","DOIUrl":"https://doi.org/10.1007/978-3-642-29946-9_23","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"167 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2011-09-09","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"114884364","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Kyriakos C. Chatzidimitriou, Ioannis Partalas, P. Mitkas, I. Vlahavas
{"title":"Transferring Evolved Reservoir Features in Reinforcement Learning Tasks","authors":"Kyriakos C. Chatzidimitriou, Ioannis Partalas, P. Mitkas, I. Vlahavas","doi":"10.1007/978-3-642-29946-9_22","DOIUrl":"https://doi.org/10.1007/978-3-642-29946-9_22","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"6 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2011-09-09","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"123103780","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Automatic Construction of Temporally Extended Actions for MDPs Using Bisimulation Metrics","authors":"P. S. Castro, Doina Precup","doi":"10.1007/978-3-642-29946-9_16","DOIUrl":"https://doi.org/10.1007/978-3-642-29946-9_16","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"1 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2011-09-09","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"125513961","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Optimized Look-ahead Tree Search Policies","authors":"Francis Maes, L. Wehenkel, D. Ernst","doi":"10.1007/978-3-642-29946-9_20","DOIUrl":"https://doi.org/10.1007/978-3-642-29946-9_20","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"5 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2011-09-09","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"132022497","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Introduction of Fixed Mode States into Online Profit Sharing and Its Application to Waist Trajectory Generation of Biped Robot","authors":"Seiya Kuroda, K. Miyazaki, Hiroaki Kobayashi","doi":"10.1007/978-3-642-29946-9_29","DOIUrl":"https://doi.org/10.1007/978-3-642-29946-9_29","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"1 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2011-09-09","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"130271078","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
{"title":"Batch, Off-Policy and Model-Free Apprenticeship Learning","authors":"Edouard Klein, M. Geist, O. Pietquin","doi":"10.1007/978-3-642-29946-9_28","DOIUrl":"https://doi.org/10.1007/978-3-642-29946-9_28","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"20 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2011-09-09","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"128655519","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}