% Work-in-progress paper in the RTSS 2017 proceedings (pages 351--353).
% Author names are stored uniformly in "Last, First" form.
% NOTE(review): month/day below (2 July) differ from the conference dates
%   recorded in the note field (05-10-2017 through 08-10-2017); verify which
%   publication date is intended.
% NOTE(review): address holds a country, not a city; confirm against the
%   publisher record before relying on it.
@inproceedings{14698aefa64e4dd68742e968d0ba4782,
  author    = {Han, Rui and Zhang, Fan and Chen, Lydia Y. and Zhan, Jianfeng},
  title     = {Work-in-Progress: Maximizing Model Accuracy in Real-time and Iterative Machine Learning},
  booktitle = {Proceedings - 2017 {IEEE} Real-Time Systems Symposium, {RTSS} 2017},
  series    = {Proceedings - Real-Time Systems Symposium},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2017},
  month     = jul,
  day       = {2},
  pages     = {351--353},
  doi       = {10.1109/RTSS.2017.00055},
  keywords  = {Accuracy-aware-processing, Machine-learning},
  language  = {English},
  note      = {Publisher Copyright: {\textcopyright} 2017 IEEE.; 38th IEEE Real-Time Systems Symposium, RTSS 2017 ; Conference date: 05-10-2017 Through 08-10-2017},
  abstract  = {As iterative machine learning (ML) (e.g. neural network based supervised learning and k-means clustering) becomes more ubiquitous in our daily life, it is becoming increasingly important to complete model training quickly to support real-time decision making, while still achieving high model accuracy (e.g. low prediction errors) that is critical for profits of ML tasks. Motivated by the observation that the small proportions of accuracy-critical input data can contribute to large parts of model accuracy in many iterative ML applications, this paper introduces a system middleware to maximize model accuracy by spending the limited time budget on the most accuracy-related input data. To achieve this, our approach employs a fast method to divide the input data into multiple parts of similar points and represents each part with an aggregated data point. Using these points, it quickly estimates the correlations between different parts and model accuracy, thus allowing ML tasks to process the most accuracy-related parts first. We incorporate our approach with two popular supervised and unsupervised ML algorithms on Spark and demonstrate its benefits in providing high model accuracy under short deadlines.},
}