@inproceedings{05e183d99bdb4cc995d8ae6497fd92e5,
title = "Learning from Metadata: A Fuzzy Token Matching Based Configuration File Discovery Approach",
abstract = "Discovery of configuration files is one of the prerequisite activities for a successful workload migration to the cloud. The complicated and super-sized file systems, the considerable variance of configuration files, and the multiple-presence of configuration items make configuration file discovery very difficult. Traditional approaches usually highly rely on experts to compose software specific scripts or rules to discover configuration files, which is very expensive and labor-intensive. In this paper, we propose a novel learning based approach named MetaConf to convert configuration file discovery to a supervised file classification task using the file metadata as learning features such that it can be conducted automatically, efficiently, and independently of domain expertise. We report our evaluation with extensive and real-world case studies, and the experimental results validate that our approach is effective and it outperforms our baseline method.",
keywords = "Cloud Migration, Configuration file discovery, Data imbalance, File metadata, Fuzzy string matching",
author = "Han Wang and Meng, {Fan Jing} and Xuejun Zhuo and Lin Yang and Li, {Chang Sheng} and Xu, {Jing Min}",
note = "Publisher Copyright: {\textcopyright} 2015 IEEE.; 8th IEEE International Conference on Cloud Computing, CLOUD 2015 ; Conference date: 27-06-2015 Through 02-07-2015",
year = "2015",
month = aug,
day = "19",
doi = "10.1109/CLOUD.2015.61",
language = "English",
series = "Proceedings - 2015 IEEE 8th International Conference on Cloud Computing, CLOUD 2015",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "405--412",
editor = "Calton Pu and Ajay Mohindra",
booktitle = "Proceedings - 2015 IEEE 8th International Conference on Cloud Computing, CLOUD 2015",
address = "United States",
}