@inproceedings{hotho2006information, abstract = {Social bookmark tools are rapidly emerging on the Web. In such systems users are setting up lightweight conceptual structures called folksonomies. The reason for their immediate success is the fact that no specific skills are needed for participating. At the moment, however, the information retrieval support is limited. We present a formal model and a new search algorithm for folksonomies,called FolkRank, that exploits the structure of the folksonomy. The proposed algorithm is also applied to findcommunities within the folksonomy and is used to structure search results. All findings are demonstrated on a large scale dataset.}, address = {Heidelberg}, author = {Hotho, Andreas and Jäschke, Robert and Schmitz, Christoph and Stumme, Gerd}, booktitle = {The Semantic Web: Research and Applications}, editor = {Sure, York and Domingue, John}, file = {hotho2006information.pdf:hotho2006information.pdf:PDF}, groups = {public}, interhash = {10ec64d80b0ac085328a953bb494fb89}, intrahash = {3c301945817681d637ee43901c016939}, month = {June}, pages = {411-426}, pdf = {hotho2006information.pdf}, publisher = {Springer}, series = {Lecture Notes in Computer Science}, timestamp = {2010-11-11 15:34:51}, title = {Information Retrieval in Folksonomies: Search and Ranking}, username = {dbenz}, volume = 4011, year = 2006 } @article{springerlink:10.1007/s00778-010-0204-8, abstract = {Graph conductance queries, also known as personalized PageRank and related to random walks with restarts, were originally proposed to assign a hyperlink-based prestige score to Web pages. More general forms of such queries are also very useful for ranking in entity-relation (ER) graphs used to represent relational, XML and hypertext data. Evaluation of PageRank usually involves a global eigen computation. If the graph is even moderately large, interactive response times may not be possible. Recently, the need for interactive PageRank evaluation has increased. The graph may be fully known only when the query is submitted. Browsing actions of the user may change some inputs to the PageRank computation dynamically. In this paper, we describe a system that analyzes query workloads and the ER graph, invests in limited offline indexing, and exploits those indices to achieve essentially constant-time query processing, even as the graph size scales. Our techniques—data and query statistics collection, index selection and materialization, and query-time index exploitation—have parallels in the extensive relational query optimization literature, but is applied to supporting novel graph data repositories. We report on experiments with five temporal snapshots of the CiteSeer ER graph having 74–702 thousand entity nodes, 0.17–1.16 million word nodes, 0.29–3.26 million edges between entities, and 3.29–32.8 million edges between words and entities. We also used two million actual queries from CiteSeer’s logs. Queries run 3–4 orders of magnitude faster than whole-graph PageRank, the gap growing with graph size. Index size is smaller than a text index. Ranking accuracy is 94–98% with reference to whole-graph PageRank.}, address = {Berlin / Heidelberg}, affiliation = {IIT Bombay, Powai, Mumbai, Maharashtra India}, author = {Chakrabarti, Soumen and Pathak, Amit and Gupta, Manish}, doi = {10.1007/s00778-010-0204-8}, interhash = {96a2d92f703a13f77bae8f56372f3e1b}, intrahash = {dcc951cd461fe1c454db7a738429d421}, issn = {1066-8888}, journal = {The VLDB Journal}, keyword = {Computer Science}, pages = {1-26}, publisher = {Springer}, title = {Index design and query processing for graph conductance search}, url = {http://dx.doi.org/10.1007/s00778-010-0204-8}, year = 2010 } @inproceedings{hotho2006information, author = {Hotho, Andreas and J{\"a}schke, Robert and Schmitz, Christoph and Stumme, Gerd}, booktitle = {Proceedings of the 3rd European Semantic Web Conference}, interhash = {882bd942131c6c303bdc9c4732287ae9}, intrahash = {087d10ce5603cef6c6a8b443700368a2}, pages = {411-426}, publisher = {Springer}, series = {Lecture Notes in Computer Science}, title = {Information Retrieval in Folksonomies: Search and Ranking}, year = 2006 } @inproceedings{hotho2006information, abstract = {Social bookmark tools are rapidly emerging on the Web. In such systems users are setting up lightweight conceptual structures called folksonomies. The reason for their immediate success is the fact that no specific skills are needed for participating. At the moment, however, the information retrieval support is limited. We present a formal model and a new search algorithm for folksonomies, called FolkRank, that exploits the structure of the folksonomy. The proposed algorithm is also applied to find communities within the folksonomy and is used to structure search results. All findings are demonstrated on a large scale dataset.}, address = {Heidelberg}, author = {Hotho, Andreas and Jäschke, Robert and Schmitz, Christoph and Stumme, Gerd}, booktitle = {The Semantic Web: Research and Applications}, editor = {Sure, York and Domingue, John}, interhash = {10ec64d80b0ac085328a953bb494fb89}, intrahash = {3c301945817681d637ee43901c016939}, month = {June}, pages = {411-426}, publisher = {Springer}, series = {Lecture Notes in Computer Science}, title = {Information Retrieval in Folksonomies: Search and Ranking}, volume = 4011, year = 2006 }