@inproceedings{f341d75a4b07470e8d5774b11bc7f160,
title = "Temporal difference learning to detect unsafe system states",
abstract = "This paper proposes a general framework to detect unsafe states of a system whose basic realtime parameters are captured by multi-sensors. Our approach is to learn a danger level function which can be used to alert the users in advance of dangerous situations. The main challenge to this learning problem is the labelling issue, i.e., it is difficult to assign an objective danger level at each time step to the training data, except at the collapse points where a penalty can be assigned and at the successful ends where a certain reward can be assigned. In this paper, we treat the danger level as expected future reward (penalty is regarded as negative reward) and use temporal difference (TD) learning [2] to learn a function to approximate the expected future reward. The TD learning obtains the approximation by propagating the penalty/reward observable at collapse points or successful ends to the entire feature space following some constraints. Our approach is applied to, but not limited to, the application of monitoring of driving safety and the experimental results demonstrate the effectiveness of the approach.",
keywords = "Driving safety, Multi-sensor, Temporal difference learning, Unsafe system state",
author = "Huazhong Ning and Wei Xu and Yue Zhou and Yihong Gong and Thomas Huang",
year = "2008",
language = "英语",
isbn = "9781424421756",
series = "Proceedings - International Conference on Pattern Recognition",
booktitle = "2008 19th International Conference on Pattern Recognition, ICPR 2008",
note = "2008 19th International Conference on Pattern Recognition, ICPR 2008 ; Conference date: 08-12-2008 Through 11-12-2008",
}