Pub Date : 2008-11-27DOI: 10.1007/978-3-540-89722-4_18
C. Rasmussen, M. Deisenroth
{"title":"Probabilistic Inference for Fast Learning in Control","authors":"C. Rasmussen, M. Deisenroth","doi":"10.1007/978-3-540-89722-4_18","DOIUrl":"https://doi.org/10.1007/978-3-540-89722-4_18","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"32 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2008-11-27","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"131397390","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2008-11-27DOI: 10.1007/978-3-540-89722-4_17
Jan Peters, J. Kober, D. Nguyen-Tuong
{"title":"Policy Learning - A Unified Perspective with Applications in Robotics","authors":"Jan Peters, J. Kober, D. Nguyen-Tuong","doi":"10.1007/978-3-540-89722-4_17","DOIUrl":"https://doi.org/10.1007/978-3-540-89722-4_17","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"1 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2008-11-27","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"116739157","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2008-11-27DOI: 10.1007/978-3-540-89722-4_7
T. Gabel, Martin A. Riedmiller
{"title":"Evaluation of Batch-Mode Reinforcement Learning Methods for Solving DEC-MDPs with Changing Action Sets","authors":"T. Gabel, Martin A. Riedmiller","doi":"10.1007/978-3-540-89722-4_7","DOIUrl":"https://doi.org/10.1007/978-3-540-89722-4_7","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"75 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2008-11-27","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"116393005","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2008-11-27DOI: 10.1007/978-3-540-89722-4_15
J. Martín-Guerrero, E. Soria-Olivas, M. Martínez-Sober, Antonio J. Serrano, J. R. M. Benedito, J. Gómez-Sanchís
{"title":"Use of Reinforcement Learning in Two Real Applications","authors":"J. Martín-Guerrero, E. Soria-Olivas, M. Martínez-Sober, Antonio J. Serrano, J. R. M. Benedito, J. Gómez-Sanchís","doi":"10.1007/978-3-540-89722-4_15","DOIUrl":"https://doi.org/10.1007/978-3-540-89722-4_15","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"216 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2008-11-27","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"132050934","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2008-11-27DOI: 10.1007/978-3-540-89722-4_19
Noel Welsh, J. Wyatt
{"title":"United We Stand: Population Based Methods for Solving Unknown POMDPs","authors":"Noel Welsh, J. Wyatt","doi":"10.1007/978-3-540-89722-4_19","DOIUrl":"https://doi.org/10.1007/978-3-540-89722-4_19","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"26 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2008-11-27","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"131123417","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2008-11-27DOI: 10.1007/978-3-540-89722-4_14
D. Loiacono, P. Lanzi
{"title":"Tile Coding Based on Hyperplane Tiles","authors":"D. Loiacono, P. Lanzi","doi":"10.1007/978-3-540-89722-4_14","DOIUrl":"https://doi.org/10.1007/978-3-540-89722-4_14","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"25 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2008-11-27","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"115342941","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2008-11-27DOI: 10.1007/978-3-540-89722-4_8
M. Geist, O. Pietquin, G. Fricout
{"title":"Bayesian Reward Filtering","authors":"M. Geist, O. Pietquin, G. Fricout","doi":"10.1007/978-3-540-89722-4_8","DOIUrl":"https://doi.org/10.1007/978-3-540-89722-4_8","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"28 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2008-11-27","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"124718583","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}
Pub Date : 2008-11-27DOI: 10.1007/978-3-540-89722-4_12
Jean-François Hren, R. Munos
{"title":"Optimistic Planning of Deterministic Systems","authors":"Jean-François Hren, R. Munos","doi":"10.1007/978-3-540-89722-4_12","DOIUrl":"https://doi.org/10.1007/978-3-540-89722-4_12","url":null,"abstract":"","PeriodicalId":432284,"journal":{"name":"European Workshop on Reinforcement Learning","volume":"36 1","pages":"0"},"PeriodicalIF":0.0,"publicationDate":"2008-11-27","publicationTypes":"Journal Article","fieldsOfStudy":null,"isOpenAccess":false,"openAccessPdf":"","citationCount":null,"resultStr":null,"platform":"Semanticscholar","paperid":"129862051","PeriodicalName":null,"FirstCategoryId":null,"ListUrlMain":null,"RegionNum":0,"RegionCategory":"","ArticlePicture":[],"TitleCN":null,"AbstractTextCN":null,"PMCID":"","EPubDate":null,"PubModel":null,"JCR":null,"JCRName":null,"Score":null,"Total":0}