@comment{Conference paper in the ICCST 2015 proceedings (see booktitle and doi).
NOTE(review): year/month/day give 2016-01-21, while the note field gives the
conference dates 21-09-2015 through 24-09-2015; presumably the former is the
online publication date of the proceedings - confirm before citing.}
@inproceedings{9576d857681f486b9d155011cc1430ff,
title = "Virtual machines of high availability using hardware-assisted failure detection",
abstract = "The virtualization technology has been widely used in today's cloud computing datacenters. With the virtualization technology, each physical machine in a datacenter can be logically divided into several virtual machines, on which different types of software services can host. However, many reasons may decrease the availability of the whole system. For example, a failed physical machine automatically fails all virtual machines on the physical machine, and consequently fails every software service on the virtual machines. It is difficult to detect failures efficiently in a general-purpose computer architecture because the hardware cannot provide enough information for fast failure detection. On the contrary, the ATCA (Advanced Telecommunications Computing Architecture) physical machines provide high hardware availability, and support IPMI (Intelligent Platform Management Interface) that can quickly detect the hardware status. In this paper, we developed a novel failure model and designed a symmetric fault-tolerant mechanism using ATCA physical machines and KVM to provide a solution for high system availability. The proposed fault-tolerant mechanism divides ATCA physical machines into pairs, such that each machine of a pair supports fault tolerance for each other. Once a failure is detected in the physical machine layer or the virtualization layer, the failed virtual machines are then recovered on the other physical machine. We have compared the proposed fault-tolerance mechanism with another prior VM-based fault-tolerance tool. The results show that the proposed mechanism significantly reduces the service downtime. That is, it provides better system availability for software services running on the virtual machines.",
keywords = "ATCA, Failover, Fault tolerance, High availability, Virtual machine",
author = "Wang, {Wei Jen} and Huang, {Hung Lin} and Chuang, {Shan Hao} and Chen, {Shao Jui} and Kao, {Chia Hung} and Liang, Deron",
note = "Publisher Copyright: {\textcopyright} 2015 IEEE.; 49th Annual IEEE International Carnahan Conference on Security Technology, ICCST 2015 ; Conference date: 21-09-2015 Through 24-09-2015",
year = "2016",
month = jan,
day = "21",
doi = "10.1109/CCST.2015.7389668",
language = "English",
series = "Proceedings - International Carnahan Conference on Security Technology",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
booktitle = "ICCST 2015 - The 49th Annual IEEE International Carnahan Conference on Security Technology",
}