% Conference paper (ICIS 2011) introducing the T-CLAP subpopulation
% extraction algorithm. The proceedings name is carried by booktitle only;
% no separate series field is given, so styles do not print the conference
% name twice. Conference dates in the note field are ISO 8601 (YYYY-MM-DD).
@inproceedings{564d54b65f884b7cb95aa9f9ffce8ab5,
  author    = {Zhang, Bin and Krackhardt, David and Krishnan, Ramayya and Doreian, Patrick},
  title     = {An effective and efficient subpopulation extraction method in large social networks},
  booktitle = {International Conference on Information Systems 2011, {ICIS} 2011},
  pages     = {477--493},
  year      = {2011},
  month     = dec,
  isbn      = {9781618394729},
  language  = {English (US)},
  keywords  = {Large scale data, Social network, Subpopulation extraction},
  abstract  = {With the help of information technologies, we have access to very large networks, even with billions of nodes. This large size has limited our ability to perform analysis and provide theoretical compelling explanation on the whole network. One solution is to extract connected subgraphs and analyze them as subpopulations. We propose a method for extracting such subpopulation archiving two desirable properties: 1) be effective, resulting in subpopulations with more ties within them than to the external network; and 2) be fast, so that it scales well to large networks. We develop a method called the ``Transitive Clustering and Pruning'' (T-CLAP) algorithm. We compare the speed and effectiveness of this algorithm to two other popularly community detection algorithms - Newman's and Clauset's algorithms. We find that T-CLAP is orders of magnitudes faster than Newman's algorithm; and is superior to Clauset's algorithm in terms of returning effective subpopulations that are useful.},
  note      = {32nd International Conference on Information Systems 2011, {ICIS} 2011; Conference date: 2011-12-04 through 2011-12-07},
}