@inproceedings{9c5ee977646f4db0beea2f876210a6b8,
title = "Context enhanced keyword extraction for sparse geo-entity relation from web texts",
abstract = "Geo-entity relation recognition from rich texts requires robust and effective solutions on keyword extraction. Compared with supervised learning methods, unsupervised learning methods attract more attention for their capability to capture the dynamic feature variation in text and to discover additional relation types. The frequency-based methods of keyword extraction have been widely studied. However, it is difficult to be applied into geo-entity keyword extraction directly because of the sparse distribution of geo-entity relations in texts. Besides, there are few studies on Chinese keyword extraction. This paper proposes a context enhanced keyword extraction method. Firstly the contexts for geo-entities are enhanced to reduce the sparseness of terms. Secondly two well-known frequency-based statistical methods (i.e., DF and Entropy) are used to build a large-scale corpus automatically from the enhanced contexts. Thirdly the lexical features and their weights are statistically determined based on the corpus to enhance the distinction of the terms. Finally, all terms in the enhanced contexts are measured with the lexical features, and the most important terms are selected as the keywords of geo-entity pairs. Experiments are conducted with mass real Chinese web texts. Compared with DF and Entropy, the presented method improves the precision by 41\% and 36\% respectively in discovering the keywords with sparse distribution and generates additional 60\% correct keywords for geo-entity relation recognition.",
keywords = "Context enhancement, Geo-entity relation, Geographical information retrieval, Keyword extraction, Text mining",
author = "Li Yu and Feng Lu and Xueying Zhang and Xiliang Liu",
note = "Publisher Copyright: {\textcopyright} Springer International Publishing Switzerland 2016.; 18th International Conference on Web Technologies and Applications, APWeb 2016 and Workshop on 2nd International Workshop on Web Data Mining and Applications, WDMA 2016 and 1st International Workshop on Graph Analytics and Query Processing, GAP 2016 and 1st International Workshop on Spatial-temporal Data Management and Analytics, SDMA 2016 ; Conference date: 23-09-2016 Through 25-09-2016",
year = "2016",
doi = "10.1007/978-3-319-45835-9\_22",
language = "English",
isbn = "9783319458342",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Verlag",
pages = "253--264",
editor = "Jia Zhu and Rong Zhang and Lijun Chang and Wenjie Zhang and Kuien Liu and Atsuyuki Morishima and Fu, \{Tom Z.J.\} and Xiaoyan Yang and Zhiwei Zhang",
booktitle = "Web Technologies and Applications - APWeb 2016 Workshops, WDMA, GAP, and SDMA, Proceedings",
address = "Germany",
}