BibTeX format
% Conference paper by Soh and Demiris (2011); DOI 10.1145/2001858.2002036.
% booktitle is required for @inproceedings and was missing from the export.
% NOTE(review): the booktitle below is inferred from the DOI prefix
% 10.1145/2001858 (GECCO '11 companion proceedings) -- confirm against the
% publisher's record before relying on it.
@inproceedings{Soh:2011:10.1145/2001858.2002036,
  author    = {Soh, H and Demiris, Y},
  title     = {Multi-reward policies for medical applications: Anthrax attacks and smart wheelchairs},
  booktitle = {Proceedings of the 13th Annual Conference Companion on Genetic and Evolutionary Computation ({GECCO} '11)},
  publisher = {ACM},
  pages     = {471--477},
  year      = {2011},
  doi       = {10.1145/2001858.2002036},
  url       = {https://doi.org/10.1145/2001858.2002036},
}
RIS format (EndNote, RefMan)
TY  - CPAPER
AB  - Medical decisions are often difficult; they involve uncertain information, multiple-objectives and debatable outcomes. In this work, we discuss the application of the multi-reward partially-observable Markov decision process (MR-POMDP) and NSGA2-LS, a hybridised multi-objective evolutionary solver, to two problems in the medical domain: anthrax response and smart-wheelchair control. For the first problem, we use a discrete model and analyse the trade-offs between the best solutions (in the form of finite-state controllers) found by our evolutionary algorithm. For the second, we contribute an extension of our method to the continuous space and optimising recurrent neural networks (RNNs) for use on medical robots such as smart wheelchairs. © 2011 ACM.
AU  - Soh,H
AU  - Demiris,Y
DO  - 10.1145/2001858.2002036
EP  - 477
PY  - 2011///
SP  - 471
TI  - Multi-reward policies for medical applications: Anthrax attacks and smart wheelchairs
UR  - http://dx.doi.org/10.1145/2001858.2002036
ER  -