% Edited volume that contains the chapter entry below (piskorski2013information).
% Its title, series and primary ISBN are kept in step with that chapter's
% booktitle, series and isbn fields.
% The isbn-alt field is not a standard field and is ignored by styles; it only
% preserves the additional ISBNs that the export had packed into isbn.
@proceedings{thierrypoibeau2013multisource,
  editor    = {Poibeau, Thierry and Saggion, Horacio and Piskorski, Jakub and Yangarber, Roman},
  title     = {Multi-source, Multilingual Information Extraction and Summarization},
  series    = {Theory and Applications of Natural Language Processing},
  publisher = {Springer},
  address   = {Berlin; New York},
  year      = 2013,
  isbn      = {978-3-642-28568-4},
  isbn-alt  = {978-3-642-28569-1 3642285694 3642285686},
  url       = {http://link.springer.com/book/10.1007/978-3-642-28569-1},
  refid     = {808368416},
  interhash = {b1d51398d5660ed1e16f40d74cc815db},
  intrahash = {21816f2809a2b58397acce5ac9558d28},
  abstract  = {Information extraction (IE) and text summarization (TS) are powerful technologies for finding relevant pieces of information in text and presenting them to the user in condensed form. The ongoing information explosion makes IE and TS critical for successful functioning within the information society. These technologies face particular challenges due to the inherent multi-source nature of the information explosion. The technologies must now handle not isolated texts or individual narratives, but rather large-scale repositories and streams---in general, in multiple languages---containing a multiplicity of perspectives, opinions, or commentaries on particular topics, entities or events. There is thus a need to adapt existing techniques and develop new ones to deal with these challenges. This volume contains a selection of papers that present a variety of methodologies for content identification and extraction, as well as for content fusion and regeneration. The chapters cover various aspects of the challenges, depending on the nature of the information sought---names vs. events---and the nature of the sources---news streams vs. image captions vs. scientific research papers, etc. This volume aims to offer a broad and representative sample of studies from this very active research field.},
}

% Chapter in the edited volume above. The page range uses the double hyphen
% that BibTeX styles expect.
% NOTE(review): the exported abstract was cut off after its first sentence;
% only the complete sentence is kept. Restore the full text from the publisher
% if the abstract is needed.
@incollection{piskorski2013information,
  author    = {Piskorski, Jakub and Yangarber, Roman},
  title     = {Information Extraction: Past, Present and Future},
  booktitle = {Multi-source, Multilingual Information Extraction and Summarization},
  editor    = {Poibeau, Thierry and Saggion, Horacio and Piskorski, Jakub and Yangarber, Roman},
  series    = {Theory and Applications of Natural Language Processing},
  publisher = {Springer Berlin Heidelberg},
  year      = 2013,
  pages     = {23--49},
  isbn      = {978-3-642-28568-4},
  doi       = {10.1007/978-3-642-28569-1_2},
  url       = {http://dx.doi.org/10.1007/978-3-642-28569-1_2},
  language  = {English},
  interhash = {276145faeb3b45461f09f6ae5aabef5e},
  intrahash = {55c1de993e15515d35b68a512088d607},
  abstract  = {In this chapter we present a brief overview of Information Extraction, which is an area of natural language processing that deals with finding factual information in free text.},
}

% Textbook reference. The umlaut in the third author's surname is written as a
% braced LaTeX accent so the name sorts and labels correctly under classic
% BibTeX as well as Biber.
@book{manning2008,
  author    = {Manning, Christopher D. and Raghavan, Prabhakar and Sch{\"u}tze, Hinrich},
  title     = {Introduction to Information Retrieval},
  publisher = {Cambridge University Press},
  year      = 2008,
  interhash = {2e574e46b7668a7268e7f02b46f4d9bb},
  intrahash = {9f4ab13e07b48b9723113aa74224be65},
}