@inproceedings{gunes2012eager, abstract = {Key to named entity recognition, the manual gazetteering of entity lists is a costly, errorprone process that often yields results that are incomplete and suffer from sampling bias. Exploiting current sources of structured information, we propose a novel method for extending minimal seed lists into complete gazetteers. Like previous approaches, we value W IKIPEDIA as a huge, well-curated, and relatively unbiased source of entities. However, in contrast to previous work, we exploit not only its content, but also its structure, as exposed in DBPEDIA. We extend gazetteers through Wikipedia categories, carefully limiting the impact of noisy categorizations. The resulting gazetteers easily outperform previous approaches on named entity recognition. }, author = {Gunes, Omer and Schallhart, Christian and Furche, Tim and Lehmann, Jens and Ngomo, Axel-Cyrille Ngonga}, booktitle = {Proceedings of the 3rd Workshop on the People's Web Meets NLP: Collaboratively Constructed Semantic Resources and their Applications to NLP}, interhash = {20c47a41c89ff6c2a8f7bb524185b8ac}, intrahash = {3eac4c009268cd4f2c264dd24053f8a6}, month = jul, organization = {Association for Computational Linguistics}, pages = {29--33}, title = {EAGER: extending automatically gazetteers for entity recognition}, url = {http://acl.eldoc.ub.rug.nl/mirror/W/W12/W12-4005.pdf}, year = 2012 }