% Bibliography database, one entry per block and one field per line.
% Text outside of entries is ignored by BibTeX, so percent-prefixed lines serve as comments.
% Fields such as interhash, intrahash, ee, bibsource and eventdate are not known to the
% classic styles and are silently skipped by them.
% Accented letters in names use BibTeX special-character escapes so the file stays pure ASCII.

@inproceedings{conf/wsdm/KohlschutterFN10,
  author    = {Kohlsch{\"u}tter, Christian and Fankhauser, Peter and Nejdl, Wolfgang},
  booktitle = {Proc. of 3rd ACM International Conference on Web Search and Data Mining New York City, NY USA (WSDM 2010)},
  interhash = {25ea118166ef2f0d5597ca90fa702c9d},
  intrahash = {dbc8464d9a298afa49d607d65f2160e2},
  title     = {Boilerplate Detection using Shallow Text Features},
  year      = 2010
}

@inproceedings{conf/www/SinhaSSMEHW15,
  author    = {Sinha, Arnab and Shen, Zhihong and Song, Yang and Ma, Hao and Eide, Darrin and Hsu, Bo-June Paul and Wang, Kuansan},
  booktitle = {WWW (Companion Volume)},
  crossref  = {conf/www/2015c},
  doi       = {10.1145/2740908.2742839},
  editor    = {Gangemi, Aldo and Leonardi, Stefano and Panconesi, Alessandro},
  ee        = {http://doi.acm.org/10.1145/2740908.2742839},
  interhash = {6d71a6eb1d070023f6fb75a5f1019a21},
  intrahash = {e6066395c31b2f3de9fb836dbac5723a},
  isbn      = {978-1-4503-3473-0},
  pages     = {243--246},
  publisher = {ACM},
  title     = {An Overview of {Microsoft Academic Service} ({MAS}) and Applications},
  url       = {http://dblp.uni-trier.de/db/conf/www/www2015c.html#SinhaSSMEHW15},
  year      = 2015
}

@article{10.1371/journal.pone.0136763,
  abstract  = {The issue of sustainability is at the top of the political and societal agenda, being considered of extreme importance and urgency. Human individual action impacts the environment both locally (e.g., local air/water quality, noise disturbance) and globally (e.g., climate change, resource use). Urban environments represent a crucial example, with an increasing realization that the most effective way of producing a change is involving the citizens themselves in monitoring campaigns (a citizen science bottom-up approach). This is possible by developing novel technologies and IT infrastructures enabling large citizen participation. Here, in the wider framework of one of the first such projects, we show results from an international competition where citizens were involved in mobile air pollution monitoring using low cost sensing devices, combined with a web-based game to monitor perceived levels of pollution. Measures of shift in perceptions over the course of the campaign are provided, together with insights into participatory patterns emerging from this study. Interesting effects related to inertia and to direct involvement in measurement activities rather than indirect information exposure are also highlighted, indicating that direct involvement can enhance learning and environmental awareness. In the future, this could result in better adoption of policies towards decreasing pollution.},
  author    = {S{\^\i}rbu, Alina and Becker, Martin and Caminiti, Saverio and De Baets, Bernard and Elen, Bart and Francis, Louise and Gravino, Pietro and Hotho, Andreas and Ingarra, Stefano and Loreto, Vittorio and Molino, Andrea and Mueller, Juergen and Peters, Jan and Ricchiuti, Ferdinando and Saracino, Fabio and Servedio, Vito D. P. and Stumme, Gerd and Theunis, Jan and Tria, Francesca and Van den Bossche, Joris},
  doi       = {10.1371/journal.pone.0136763},
  interhash = {6abb09b5ac2137e557a84d7be10009b4},
  intrahash = {f35761dd0fbd9ad8af7c8099e0b6aac4},
  journal   = {PLoS ONE},
  month     = aug,
  number    = 8,
  pages     = {e0136763},
  publisher = {Public Library of Science},
  title     = {Participatory Patterns in an International Air Quality Monitoring Initiative},
  url       = {http://dx.doi.org/10.1371/journal.pone.0136763},
  volume    = 10,
  year      = 2015
}

@article{mnih2015humanlevel,
  author    = {Mnih, Volodymyr and Kavukcuoglu, Koray and Silver, David and Rusu, Andrei A. and Veness, Joel and Bellemare, Marc G. and Graves, Alex and Riedmiller, Martin and Fidjeland, Andreas K. and Ostrovski, Georg and Petersen, Stig and Beattie, Charles and Sadik, Amir and Antonoglou, Ioannis and King, Helen and Kumaran, Dharshan and Wierstra, Daan and Legg, Shane and Hassabis, Demis},
  doi       = {10.1038/nature14236},
  interhash = {eac59980357d99db87b341b61ef6645f},
  intrahash = {fb15f4471c81dc2b9edf2304cb2f7083},
  issn      = {0028-0836},
  journal   = {Nature},
  month     = feb,
  number    = 7540,
  pages     = {529--533},
  publisher = {Nature Publishing Group},
  title     = {Human-level control through deep reinforcement learning},
  url       = {http://dx.doi.org/10.1038/nature14236},
  volume    = 518,
  year      = 2015
}

@inproceedings{tran2015semantic,
  abstract  = {In this paper we study the problem of semantic annotation for a trending hashtag which is the crucial step towards analyzing user behavior in social media, yet has been largely unexplored. We tackle the problem via linking to entities from Wikipedia. We incorporate the social aspects of trending hashtags by identifying prominent entities for the annotation so as to maximize the information spreading in entity networks. We exploit temporal dynamics of entities in Wikipedia, namely Wikipedia edits and page views to improve the annotation quality. Our experiments show that we significantly outperform the established methods in tweet annotation.},
  author    = {Tran, Tuan and Tran, Nam-Khanh and Teka Hadgu, Asmelash and J{\"a}schke, Robert},
  booktitle = {Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing (EMNLP)},
  interhash = {4156275c801376fa64dfdb69a4ce60c4},
  intrahash = {9d4cd9070922e1eb43bcab1da4a9d840},
  month     = sep,
  publisher = {Association for Computational Linguistics},
  title     = {Semantic Annotation for Microblog Topics Using {Wikipedia} Temporal Information},
  year      = 2015
}

% NOTE(review): the journal value below looks like a book title followed by its series name
% (Springer Proceedings in Mathematics and Statistics); this record is probably a chapter in a
% collection rather than a journal article. Confirm before changing the entry type.
@article{kluegl2013exploiting,
  abstract  = {Conditional Random Fields (CRF) are popular methods for labeling unstructured or textual data. Like many machine learning approaches, these undirected graphical models assume the instances to be independently distributed. However, in real-world applications data is grouped in a natural way, e.g., by its creation context. The instances in each group often share additional structural consistencies. This paper proposes a domain-independent method for exploiting these consistencies by combining two CRFs in a stacked learning framework. We apply rule learning collectively on the predictions of an initial CRF for one context to acquire descriptions of its specific properties. Then, we utilize these descriptions as dynamic and high quality features in an additional (stacked) CRF. The presented approach is evaluated with a real-world dataset for the segmentation of references and achieves a significant reduction of the labeling error.},
  author    = {Kluegl, Peter and Toepfer, Martin and Lemmerich, Florian and Hotho, Andreas and Puppe, Frank},
  interhash = {9ef3f543e4cc9e2b0ef078595f92013b},
  intrahash = {fbaab25e96dd20d96ece9d7fefdc3b4f},
  journal   = {Mathematical Methodologies in Pattern Recognition and Machine Learning Springer Proceedings in Mathematics \& Statistics},
  pages     = {111--125},
  title     = {Exploiting Structural Consistencies with Stacked Conditional Random Fields},
  volume    = 30,
  year      = 2013
}

@misc{becker2014subjective,
  abstract     = {Sensor data is objective. But when measuring our environment, measured values are contrasted with our perception, which is always subjective. This makes interpreting sensor measurements difficult for a single person in her personal environment. In this context, the EveryAware projects directly connects the concepts of objective sensor data with subjective impressions and perceptions by providing a collective sensing platform with several client applications allowing to explicitly associate those two data types. The goal is to provide the user with personalized feedback, a characterization of the global as well as her personal environment, and enable her to position her perceptions in this global context. In this poster we summarize the collected data of two EveryAware applications, namely WideNoise for noise measurements and AirProbe for participatory air quality sensing. Basic insights are presented including user activity, learning processes and sensor data to perception correlations. These results provide an outlook on how this data can further be used to understand the connection between sensor data and perceptions.},
  author       = {Becker, Martin and Hotho, Andreas and Mueller, Juergen and Kibanov, Mark and Atzmueller, Martin and Stumme, Gerd},
  howpublished = {CSSWS 2014, Poster},
  interhash    = {615afda9869c5e0facc8bdb5534760aa},
  intrahash    = {33cf40cc46170f51767c46d2ec14a495},
  title        = {Subjective vs. Objective Data: Bridging the Gap},
  url          = {http://www.gesis.org/en/events/css-wintersymposium/poster-presentation/},
  year         = 2014
}

@inproceedings{vkistowski2015modeling,
  abstract  = {Today's system developers and operators face the challenge of creating software systems that make efficient use of dynamically allocated resources under highly variable and dynamic load profiles, while at the same time delivering reliable performance. Benchmarking of systems under these constraints is difficult, as state-of-the-art benchmarking frameworks provide only limited support for emulating such dynamic and highly variable load profiles for the creation of realistic workload scenarios. Industrial benchmarks typically confine themselves to workloads with constant or stepwise increasing loads. Alternatively, they support replaying of recorded load traces. Statistical load intensity descriptions also do not sufficiently capture concrete pattern load profile variations over time. To address these issues, we present the Descartes Load Intensity Model (DLIM). DLIM provides a modeling formalism for describing load intensity variations over time. A DLIM instance can be used as a compact representation of a recorded load intensity trace, providing a powerful tool for benchmarking and performance analysis. As manually obtaining DLIM instances can be time consuming, we present three different automated extraction methods, which also help to enable autonomous system analysis for self-adaptive systems. Model expressiveness is validated using the presented extraction methods. Extracted DLIM instances exhibit a median modeling error of 12.4\% on average over nine different real-world traces covering between two weeks and seven months. Additionally, extraction methods perform orders of magnitude faster than existing time series decomposition approaches.},
  author    = {von Kistowski, J{\'o}akim and Herbst, Nikolas and Zoller, Daniel and Kounev, Samuel and Hotho, Andreas},
  booktitle = {Proceedings of the 10th International Symposium on Software Engineering for Adaptive and Self-Managing Systems (SEAMS)},
  interhash = {9f0be929d7bcc057c778f6b44e73cf4c},
  intrahash = {f449d3cf35941636f96d72aaf620a275},
  title     = {Modeling and Extracting Load Intensity Profiles},
  year      = 2015
}

@inproceedings{zoller2015publication,
  abstract  = {Scholarly success is traditionally measured in terms of citations to publications. With the advent of publication management and digital libraries on the web, scholarly usage data has become a target of investigation and new impact metrics computed on such usage data have been proposed -- so called altmetrics. In scholarly social bookmarking systems, scientists collect and manage publication meta data and thus reveal their interest in these publications. In this work, we investigate connections between usage metrics and citations, and find posts, exports, and page views of publications to be correlated to citations.},
  author    = {Zoller, Daniel and Doerfel, Stephan and J{\"a}schke, Robert and Stumme, Gerd and Hotho, Andreas},
  booktitle = {Proceedings of the 2015 ACM Conference on Web Science},
  interhash = {3515b34cd19959cee5fafbf4467a75ed},
  intrahash = {548a7010ee2726f28e04e5c6e5fd6e2d},
  title     = {On Publication Usage in a Social Bookmarking System},
  year      = 2015
}

@incollection{singer2014folksonomies,
  author    = {Singer, Philipp and Niebler, Thomas and Hotho, Andreas and Strohmaier, Markus},
  booktitle = {Encyclopedia of Social Network Analysis and Mining},
  interhash = {3a55606e91328ca0191127b1fafe189e},
  intrahash = {84d9498b73de976d8d550c6761d4be0d},
  pages     = {542--547},
  publisher = {Springer},
  title     = {Folksonomies},
  year      = 2014
}

% The conference name was stored in the editor field; it belongs in booktitle.
@inproceedings{ring2015condist,
  author    = {Ring, Markus and Otto, Florian and Becker, Martin and Niebler, Thomas and Landes, Dieter and Hotho, Andreas},
  booktitle = {{ECML PKDD} 2015},
  interhash = {c062a57a17a0910d6c27ecd664502ac1},
  intrahash = {a2f9d649f2856677e4d886a3b517404d},
  title     = {{ConDist}: A Context-Driven Categorical Distance Measure},
  year      = 2015
}

% The conference dates were embedded in the address field; they now live in month and eventdate.
@inproceedings{dallmann2015media,
  address   = {Cyprus, Turkey},
  author    = {Dallmann, Alexander and Lemmerich, Florian and Zoller, Daniel and Hotho, Andreas},
  booktitle = {26th ACM Conference on Hypertext and Social Media},
  eventdate = {2015-09-01/2015-09-04},
  interhash = {6b2daa7830c5e504543dcdaefed46285},
  intrahash = {addfd0d84b4347392dc94a4bec400412},
  month     = sep,
  publisher = {ACM},
  title     = {Media Bias in {German} Online Newspapers},
  year      = 2015
}

@article{journals/expert/RehakPGSBC09,
  author    = {Reh{\'a}k, Martin and Pechoucek, Michal and Grill, Martin and Stiborek, Jan and Bartos, Karel and Celeda, Pavel},
  doi       = {10.1109/MIS.2009.42},
  ee        = {http://doi.ieeecomputersociety.org/10.1109/MIS.2009.42},
  interhash = {878f9ec500bf1b485f337afe0abe1801},
  intrahash = {502b8b47f7e3ee930f2d79bde0b29d76},
  journal   = {IEEE Intelligent Systems},
  number    = 3,
  pages     = {16--25},
  title     = {Adaptive Multiagent System for Network Traffic Monitoring},
  url       = {http://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.149.3921&rep=rep1&type=pdf},
  volume    = 24,
  year      = 2009
}

@article{journals/nle/ZeschG10,
  author    = {Zesch, Torsten and Gurevych, Iryna},
  doi       = {10.1017/S1351324909990167},
  ee        = {http://dx.doi.org/10.1017/S1351324909990167},
  interhash = {3300b5457187d0f6c551e63ecb27336c},
  intrahash = {76a512bbba5ba8ec5819d469d4611d81},
  journal   = {Natural Language Engineering},
  number    = 1,
  pages     = {25--59},
  title     = {Wisdom of crowds versus wisdom of linguists - measuring the semantic relatedness of words},
  url       = {http://dblp.uni-trier.de/db/journals/nle/nle16.html#ZeschG10},
  volume    = 16,
  year      = 2010
}

@inproceedings{DBLP:conf/dsaa/KrompassNT14,
  author    = {Krompass, Denis and Nickel, Maximilian and Tresp, Volker},
  bibsource = {dblp computer science bibliography, http://dblp.org},
  booktitle = {International Conference on Data Science and Advanced Analytics, {DSAA} 2014, Shanghai, China, October 30 - November 1, 2014},
  crossref  = {DBLP:conf/dsaa/2014},
  doi       = {10.1109/DSAA.2014.7058046},
  interhash = {0ca986606c22ca0b3780c9b9c25f31c7},
  intrahash = {c952ed96ece470e4fa5336eedf670d5b},
  isbn      = {978-1-4799-6991-3},
  pages     = {18--24},
  publisher = {{IEEE}},
  title     = {Large-scale factorization of type-constrained multi-relational data},
  url       = {http://dx.doi.org/10.1109/DSAA.2014.7058046},
  year      = 2014
}

% The month field held a free-text day range; month now uses the macro and the range is in eventdate.
@inproceedings{singer2015hyptrails,
  address      = {Firenze, Italy},
  author       = {Singer, Philipp and Helic, Denis and Hotho, Andreas and Strohmaier, Markus},
  booktitle    = {24th International World Wide Web Conference (WWW2015)},
  eventdate    = {2015-05-18/2015-05-22},
  interhash    = {d33e150aa37dcd618388960286f8a46a},
  intrahash    = {5d21e53dc91b35a4a6cb6b9ec858045d},
  month        = may,
  organization = {ACM},
  publisher    = {ACM},
  title        = {{HypTrails}: A {Bayesian} Approach for Comparing Hypotheses About Human Trails},
  url          = {http://www.www2015.it/documents/proceedings/proceedings/p1003.pdf},
  year         = 2015
}

@inproceedings{conf/icdm/DuBJ10,
  author    = {Du, Lan and Buntine, Wray Lindsay and Jin, Huidong},
  booktitle = {ICDM},
  crossref  = {conf/icdm/2010},
  doi       = {10.1109/ICDM.2010.51},
  editor    = {Webb, Geoffrey I. and Liu, Bing and Zhang, Chengqi and Gunopulos, Dimitrios and Wu, Xindong},
  ee        = {http://doi.ieeecomputersociety.org/10.1109/ICDM.2010.51},
  interhash = {dcde7dbdd419330aabb01d151e23c45c},
  intrahash = {5a639efaf1e8fea6b0f309333efd7bee},
  isbn      = {978-0-7695-4256-0},
  pages     = {148--157},
  publisher = {IEEE Computer Society},
  title     = {Sequential Latent {Dirichlet} Allocation: Discover Underlying Topic Structures within a Document},
  url       = {http://dblp.uni-trier.de/db/conf/icdm/icdm2010.html#DuBJ10},
  year      = 2010
}

@inproceedings{conf/conll/LevyG14,
  author    = {Levy, Omer and Goldberg, Yoav},
  booktitle = {CoNLL},
  crossref  = {conf/conll/2014},
  editor    = {Morante, Roser and Yih, Wen-tau},
  ee        = {http://aclweb.org/anthology/W/W14/W14-1618.pdf},
  interhash = {680dde1fd83a8dd0d6b2619a8266516e},
  intrahash = {23bb00b6abab97ed93e74f3b5b148630},
  isbn      = {978-1-941643-02-0},
  pages     = {171--180},
  publisher = {ACL},
  title     = {Linguistic Regularities in Sparse and Explicit Word Representations},
  url       = {http://dblp.uni-trier.de/db/conf/conll/conll2014.html#LevyG14},
  year      = 2014
}

% NOTE(review): pages and publisher below look like scraper residue (an article identifier and
% a garbled society name) rather than real values; volume and number are missing. Verify against
% the journal's own record before relying on this entry.
@article{grimmer2013text,
  author    = {Grimmer, Justin and Stewart, Brandon M.},
  interhash = {eb68e01ef4168a398d79f408042fe529},
  intrahash = {76001ebc726700bef81886d2e285b7cf},
  journal   = {Political Analysis},
  pages     = {mps028},
  publisher = {SPM-PMSAPSA},
  title     = {Text as data: The promise and pitfalls of automatic content analysis methods for political texts},
  year      = 2013
}

% The proceedings name was stored (word-order scrambled) in the editor field; it belongs in booktitle.
% The citation key is left as exported so existing citations keep resolving.
@inproceedings{noauthororeditor,
  author    = {Mirowski, Piotr and Ranzato, Marc'Aurelio and LeCun, Yann},
  booktitle = {Proceedings of the {NIPS} 2010 Workshop on Deep Learning},
  interhash = {b7ce347e904a4ca3263cf6cc1e2253bd},
  intrahash = {fc3e0e3af595f9a46df6bc9233df836f},
  title     = {Dynamic Auto-Encoders for Semantic Indexing},
  url       = {http://yann.lecun.com/exdb/publis/pdf/mirowski-nipsdl-10.pdf},
  year      = 2010
}