@inproceedings{08ddaace3b0b43ea831826a9ddaa67a6,
title = "英语科技论文摘要语步结构语料库构建研究",
abstract = "Move structures are discourse units in research articles (RA) and is of great value in move analysis, essay writing, etc. Although there is abundant research on move structures in academic articles, there are still relatively few move annotation data resources. This research developed and constructed a specific corpus for annotating move structures in English RA abstracts. Currently, nearly 34,000 Move structures have been annotated, covering the fields of Natural Language Processing (NLP), Computer Vision (CV), Communication Engineering and Mechanical Engineering. We also presented annotation statistics and analysis. The first stage of corpus construction relies on manual annotation to form high-quality corpus data. In the second and main stage, an automatic recognition and annotation model based on BERT is adopted, which can improve the annotation speed and expand the annotation scale while ensuring the annotation quality. We conducted move structure recognition experiments based on the constructed corpus, and compared the performance of our model with large language models(LLM) including ChatGPT and Claude3. The experimental results show that the F1 scores of move structure recognition achieved by our model outperformed those of LLM, indicating the effectiveness of the proposed model. This corpus is currently publicly available and can provide necessary data resources for NLP related tasks such as scientific paper information extraction and English writing intelligent assistance, it is also beneficial to foreign language teaching and research such as English for Academic Purposes, it can effectively promote the digital transformation of foreign language education.",
keywords = "Abstract, Corpus, Move structure, Research article",
author = "Hongzheng Li and Ruojin Wang and Chong Feng and Fang Liu",
note = "Publisher Copyright: {\textcopyright} 2024 China National Conference on Computational Linguistics.; 23rd Chinese National Conference on Computational Linguistics, CCL 2024 ; Conference date: 24-07-2024 Through 28-07-2024",
year = "2024",
language = "繁体中文",
series = "CCL 2024 - 23rd Chinese National Conference on Computational Linguistics",
publisher = "Chinese National Conference on Computational Linguistic (CCL)",
pages = "841--852",
editor = "Maosong Sun and Jiye Liang and Xianpei Han and Zhiyuan Liu and Yulan He",
booktitle = "Main Conference",
}