% FSKD 2015 conference paper. The note gives the conference dates (15-17 Aug 2015);
% year/month/day give 13 Jan 2016, presumably the proceedings' publication date (confirm).
% Acronyms are brace-protected so sentence-casing styles keep their capitals.
% No series field: the exported value was a verbatim copy of booktitle.
@inproceedings{3398abbe73c84590b2b5fe67bb4d2cc2,
title = "Keyword search over probabilistic {XML} data",
abstract = "Despite the proliferation of work on XML keyword search, it remains open to support keyword search over uncertain XML data. In this paper, we study the problem of ELCA-based answers over uncertain XML data, which is to retrieve subtrees taking a probability of at least a threshold to be ELCA-based answers. To answer such query efficiently, we employ a filtering-and-verification strategy which is based on a proposed probabilistic inverted index, PrIndex. Based on PrIndex, we develop tight lower and upper bounds that can prune unqualified results very rapidly. After that, we propose an efficient algorithm (PrIndex-based algorithm) that combine probability threshold pruning and probability distribution of node from leaf to root to support keyword search over probabilistic XML data. Extensive experimental results demonstrate the effectiveness of the proposed algorithms.",
keywords = "keywords search, probabilistic XML data, probability threshold",
author = "Zhao, Yue and Wang, Guoren and Yuan, Ye and Wang, Junxia and Lin, Chungang and Yu, Ying",
note = "Publisher Copyright: {\textcopyright} 2015 IEEE.; 12th International Conference on Fuzzy Systems and Knowledge Discovery, FSKD 2015 ; Conference date: 15-08-2015 Through 17-08-2015",
year = "2016",
month = jan,
day = "13",
doi = "10.1109/FSKD.2015.7382118",
language = "English",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "1230--1235",
editor = "Tang, Zhuo and Du, Jiayi and Yin, Shu and Li, Renfa and He, Ligang",
booktitle = "2015 12th International Conference on Fuzzy Systems and Knowledge Discovery, {FSKD} 2015",
address = "United States",
}