% Conference paper from DASFAA 2003 describing PathGuide, a clustering-based
% indexing method for XML path expressions.
% The citation key is kept unchanged so existing citations still resolve.
% Case-sensitive words in the title are brace-protected as whole words so that
% sentence-casing styles do not lowercase them.
@inproceedings{c7b586ea445f4494ab85c2893ef72248,
  author    = {Cheng, Jiefeng and Yu, Ge and Wang, Guoren and Yu, J. X.},
  title     = {{PathGuide}: An efficient clustering based indexing method for {XML} path expressions},
  booktitle = {Proceedings - 8th International Conference on Database Systems for Advanced Applications, {DASFAA} 2003},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  year      = {2003},
  pages     = {257--264},
  doi       = {10.1109/DASFAA.2003.1192390},
  language  = {English},
  keywords  = {Clustering algorithms, Costs, Database languages, Delay, Indexing, Navigation, Proposals, Query processing, Tree data structures, XML},
  abstract  = {This paper focuses on the performance improvement for long-path XML query processing. It is motivated by the fact that the existing inverted index and join algorithms are efficient for short path XML queries, but are inefficient for long path XML queries since the response time of the existing approaches is exponential to the length of paths. We propose a clustering based indexing method, called PathGuide, in this paper, which enhances the XML inverted index with the clustering technique. The element nodes are clustered based on their path patterns and the summary for such path information is kept in a suffix tree as the index of these element nodes. In addition, new operations are proposed to fully utilize PathGuide. With the assistance of PathGuide, unlike the path expansion approach used in Lore, the set of a relative location path can be found via one-step index lookup. Compared to the existing structural join method, PathGuide significantly reduces both join overhead and disk I/O cost. The extensive experimental studies are conducted and our results show that PathGuide outperforms the structural joins at least four times in most cases.},
  note      = {Publisher Copyright: {\textcopyright} 2003 IEEE.; 8th International Conference on Database Systems for Advanced Applications, DASFAA 2003 ; Conference date: 26-03-2003 Through 28-03-2003},
}