% Conference paper on tag-based social interest discovery (17th International World Wide Web Conference, 2008).
@inproceedings{xin2008www,
  author    = {Li, Xin and Guo, Lei and Zhao, Yihong E.},
  title     = {Tag-based Social Interest Discovery},
  booktitle = {Proceedings of the 17th International World Wide Web Conference},
  pages     = {675--684},
  publisher = {ACM},
  year      = 2008,
  url       = {http://www2008.org/papers/pdf/p675-liA.pdf},
  abstract  = {The success and popularity of social network systems, such as del.icio.us, Facebook, MySpace, and YouTube, have generated many interesting and challenging problems to the research community. Among others, discovering social interests shared by groups of users is very important because it helps to connect people with common interests and encourages people to contribute and share more contents. The main challenge to solving this problem comes from the difficulty of detecting and representing the interest of the users. The existing approaches are all based on the online connections of users and so unable to identify the common interest of users who have no online connections. In this paper, we propose a novel social interest discovery approach based on user-generated tags. Our approach is motivated by the key observation that in a social network, human users tend to use descriptive tags to annotate the contents that they are interested in. Our analysis on a large amount of real-world traces reveals that in general, user-generated tags are consistent with the web content they are attached to, while more concise and closer to the understanding and judgments of human users about the content. Thus, patterns of frequent co-occurrences of user tags can be used to characterize and capture topics of user interests. We have developed an Internet Social Interest Discovery system, ISID, to discover the common user interests and cluster users and their saved URLs by different interest topics. Our evaluation shows that ISID can effectively cluster similar documents by interest topics and discover user communities with common interests no matter if they have any online connections.},
  interhash = {d7e6a5b8d215682b2a75add69c01de29},
  intrahash = {42b4c94cff05ccef031235d661a7a77a},
}

% Journal article on network properties of folksonomies (AI Communications 20(4), 2007).
@article{cattuto2007,
  author    = {Cattuto, C. and Schmitz, C. and Baldassarri, A. and Servedio, V. D. P. and Loreto, V. and Hotho, A. and Grahl, M. and Stumme, G.},
  title     = {Network Properties of Folksonomies},
  journal   = {AI Communications},
  volume    = 20,
  number    = 4,
  pages     = {245--262},
  year      = 2007,
  url       = {http://www.kde.cs.uni-kassel.de/hotho/pub/2007/aicomm_2007_folksonomy_clustering.pdf},
  interhash = {fc5f2df61d28bc99b7e15029da125588},
  intrahash = {d87e198a6d564ae8a8fe151e0a96fa0f},
  vgwort    = {67},
}

% arXiv preprint (cond-mat/0309488) on defining and identifying communities in networks; imported from CiteULike.
@misc{citeulike:341233,
  author               = {Radicchi, Filippo and Castellano, Claudio and Cecconi, Federico and Loreto, Vittorio and Parisi, Domenico},
  title                = {Defining and identifying communities in networks},
  year                 = 2004,
  month                = feb,
  eprint               = {cond-mat/0309488},
  archiveprefix        = {arXiv},
  url                  = {http://arxiv.org/abs/cond-mat/0309488},
  abstract             = {The investigation of community structures in networks is an important issue in many domains and disciplines. This problem is relevant for social tasks (objective analysis of relationships on the web), biological inquiries (functional studies in metabolic, cellular or protein networks) or technological problems (optimization of large infrastructures). Several types of algorithm exist for revealing the community structure in networks, but a general and quantitative definition of community is still lacking, leading to an intrinsic difficulty in the interpretation of the results of the algorithms without any additional non-topological information. In this paper we face this problem by introducing two quantitative definitions of community and by showing how they are implemented in practice in the existing algorithms. In this way the algorithms for the identification of the community structure become fully self-contained. Furthermore, we propose a new local algorithm to detect communities which outperforms the existing algorithms with respect to the computational cost, keeping the same level of reliability. The new algorithm is tested on artificial and real-world graphs. In particular we show the application of the new algorithm to a network of scientific collaborations, which, for its size, can not be attacked with the usual methods. This new class of local algorithms could open the way to applications to large-scale technological and biological applications.},
  comment              = {"In general algorithms define communities operationally as what the they finds. A dendrogram, i. e. a community structure, is always produced by the algorithms down to the level of single nodes, independently from the type of graph analyzed. This is due to the lack of explicit prescriptions to discriminate between networks that are actually endowed with a community structure and those that are not. As a consequence, in practical applications one needs additional, non topological, information on the nature of the network to understand which of the branches of the tree have a real significance. Without such information it is not clear at all whether the identification of a community is reliable or not." --- Domain: scientific collaborations Task: calculate a dendrogram (the community graph) Method: efficient GN (Girvan \& Newman) algorithm based on edge betweenness. Their algorithm allows to be fine-tuned between acting local or global. To be more efficient they replace the "edge betweenness" by "edge clustering coefficient" which is based on the number of triangles the edge is contained in VS the degree of the incident nodes. Motto: "Algorithm must include the quantitative community definition"},
  citeulike-article-id = {341233},
  priority             = {0},
  interhash            = {6ec9b00862909de405c08db1c9b43d63},
  intrahash            = {8634d935e0bf4d74a870d5c805612665},
}