% Conference paper "GeoCQA" in the NLPCC 2021 proceedings (pages 163--175).
% The citation key is left unchanged so existing \cite commands keep resolving.
% Maintenance notes:
%   - doi is stored bare (no LaTeX escapes); url/doi-aware styles typeset it verbatim.
%   - publisher has an extra brace pair so biblatex does not split the literal
%     list on the " and " inside the company name.
%   - language was the Chinese word for "English"; it is now the ASCII
%     identifier `english`.
%   - Braces inside title/booktitle protect acronyms and proper nouns from
%     sentence-casing styles.
@inproceedings{1aba072bb4dc415c830259c752b4c14f,
  author    = {Cui, Zhen and Wang, Bin and Ju, Jiangzhou},
  title     = {{GeoCQA}: A Large-Scale Geography-Domain {Chinese} Question Answering Dataset from Examination},
  editor    = {Wang, Lu and Feng, Yansong and Hong, Yu and He, Ruifang},
  booktitle = {Natural Language Processing and {Chinese} Computing - 10th {CCF} International Conference, {NLPCC} 2021, Proceedings},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  publisher = {{Springer Science and Business Media Deutschland GmbH}},
  year      = {2021},
  pages     = {163--175},
  doi       = {10.1007/978-3-030-88483-3_13},
  isbn      = {9783030884826},
  language  = {english},
  keywords  = {Geography-domain question answering, OpenQA task, Retriever-reader methods},
  abstract  = {We present GeoCQA, the largest multiple-choice Chinese Question answering dataset in the geographic domain, evaluating the high-level reading ability of logic reasoning and prior geographic domain knowledge integration of a question answering (QA) model. GeoCQA contains 58,940 questions from real-world scenarios and has been collected from the high school geography examination which aims to evaluate students{\textquoteright} mastery of the geographic concept and their ability to use geographic knowledge to solve problems. To investigate the challenges of GeoCQA to existing methods, we implement both rule-based and best neural methods and find that the current best method can achieve 71.90\% of test accuracy, while unskilled humans and skilled humans can reach 80\% and 96\% accuracy respectively, which shows that GeoCQA is challenging to the current methods and the performance still has space to improve. We will release GeoCQA and our baselines to bring more data sources to the community and hope that it can help to promote much stronger Chinese QA models in the future (https://github.com/db12138/GeoCQA ).},
  note      = {Publisher Copyright: {\textcopyright} 2021, Springer Nature Switzerland AG.; 10th CCF Conference on Natural Language Processing and Chinese Computing, NLPCC 2021 ; Conference date: 13-10-2021 Through 17-10-2021},
}