<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article
  PUBLIC "-//NLM//DTD Journal Publishing DTD v3.0 20080202//EN" "http://dtd.nlm.nih.gov/publishing/3.0/journalpublishing3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="3.0" xml:lang="EN">
  <front>
    <journal-meta><journal-id journal-id-type="nlm-ta">PLoS ONE</journal-id><journal-id journal-id-type="publisher-id">plos</journal-id><journal-id journal-id-type="pmc">plosone</journal-id><!--===== Grouping journal title elements =====--><journal-title-group><journal-title>PLoS ONE</journal-title></journal-title-group><issn pub-type="epub">1932-6203</issn><publisher>
        <publisher-name>Public Library of Science</publisher-name>
        <publisher-loc>San Francisco, USA</publisher-loc>
      </publisher></journal-meta>
    <article-meta><article-id pub-id-type="publisher-id">PONE-D-10-06702</article-id><article-id pub-id-type="doi">10.1371/journal.pone.0016939</article-id><article-categories>
        <subj-group subj-group-type="heading">
          <subject>Research Article</subject>
        </subj-group>
        <subj-group subj-group-type="Discipline-v2">
          <subject>Mathematics</subject>
          <subj-group>
            <subject>Applied mathematics</subject>
            <subj-group>
              <subject>Complex systems</subject>
            </subj-group>
          </subj-group>
        </subj-group>
        <subj-group subj-group-type="Discipline-v2">
          <subject>Physics</subject>
          <subj-group>
            <subject>Interdisciplinary physics</subject>
          </subj-group>
        </subj-group>
        <subj-group subj-group-type="Discipline-v2">
          <subject>Social and behavioral sciences</subject>
          <subj-group>
            <subject>Sociology</subject>
            <subj-group>
              <subject>Computational sociology</subject>
              <subject>Social networks</subject>
            </subj-group>
          </subj-group>
        </subj-group>
        <subj-group subj-group-type="Discipline">
          <subject>Physics</subject>
          <subject>Mathematics</subject>
        </subj-group>
      </article-categories><title-group><article-title>Geographic Constraints on Social Network Groups</article-title><alt-title alt-title-type="running-head">Geographic Constraints on Social Network Groups</alt-title></title-group><contrib-group>
        <contrib contrib-type="author" equal-contrib="yes" xlink:type="simple">
          <name name-style="western">
            <surname>Onnela</surname>
            <given-names>Jukka-Pekka</given-names>
          </name>
          <xref ref-type="aff" rid="aff1">
            <sup>1</sup>
          </xref>
          <xref ref-type="corresp" rid="cor1">
            <sup>*</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" equal-contrib="yes" xlink:type="simple">
          <name name-style="western">
            <surname>Arbesman</surname>
            <given-names>Samuel</given-names>
          </name>
          <xref ref-type="aff" rid="aff1">
            <sup>1</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" xlink:type="simple">
          <name name-style="western">
            <surname>González</surname>
            <given-names>Marta C.</given-names>
          </name>
          <xref ref-type="aff" rid="aff2">
            <sup>2</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" xlink:type="simple">
          <name name-style="western">
            <surname>Barabási</surname>
            <given-names>Albert-László</given-names>
          </name>
          <xref ref-type="aff" rid="aff3">
            <sup>3</sup>
          </xref>
          <xref ref-type="aff" rid="aff4">
            <sup>4</sup>
          </xref>
          <xref ref-type="aff" rid="aff5">
            <sup>5</sup>
          </xref>
        </contrib>
        <contrib contrib-type="author" xlink:type="simple">
          <name name-style="western">
            <surname>Christakis</surname>
            <given-names>Nicholas A.</given-names>
          </name>
          <xref ref-type="aff" rid="aff1">
            <sup>1</sup>
          </xref>
          <xref ref-type="aff" rid="aff6">
            <sup>6</sup>
          </xref>
          <xref ref-type="aff" rid="aff7">
            <sup>7</sup>
          </xref>
        </contrib>
      </contrib-group><aff id="aff1"><label>1</label><addr-line>Department of Health Care Policy, Harvard Medical School, Boston, Massachusetts, United States of America</addr-line>       </aff><aff id="aff2"><label>2</label><addr-line>Department of Civil and Environmental Engineering and Engineering Systems, Massachusetts Institute of Technology, Cambridge, Massachusetts, United States of America</addr-line>       </aff><aff id="aff3"><label>3</label><addr-line>Department of Physics, Biology and Computer Science, Center for Complex Network Research, Northeastern University, Boston, Massachusetts, United States of America</addr-line>       </aff><aff id="aff4"><label>4</label><addr-line>Center for Cancer Systems Biology, Dana Farber Cancer Institute, Boston, Massachusetts, United States of America</addr-line>       </aff><aff id="aff5"><label>5</label><addr-line>Department of Medicine, Brigham and Women's Hospital, Harvard Medical School, Boston, Massachusetts, United States of America</addr-line>       </aff><aff id="aff6"><label>6</label><addr-line>Department of Medicine, Harvard Medical School, Boston, Massachusetts, United States of America</addr-line>       </aff><aff id="aff7"><label>7</label><addr-line>Department of Sociology, Harvard Faculty of Arts and Sciences, Cambridge, Massachusetts, United States of America</addr-line>       </aff><contrib-group>
        <contrib contrib-type="editor" xlink:type="simple">
          <name name-style="western">
            <surname>Perc</surname>
            <given-names>Matjaz</given-names>
          </name>
          <role>Editor</role>
          <xref ref-type="aff" rid="edit1"/>
        </contrib>
      </contrib-group><aff id="edit1">University of Maribor, Slovenia</aff><author-notes>
        <corresp id="cor1">* E-mail: <email xlink:type="simple">onnela@med.harvard.edu</email></corresp>
        <fn fn-type="con">
          <p>Conceived and designed the experiments: JPO SA NAC. Analyzed the data: JPO SA. Contributed reagents/materials/analysis tools: JPO SA MCG. Wrote the paper: JPO SA ALB NAC. Processed raw phone data: MCG.</p>
        </fn>
      <fn fn-type="conflict">
        <p>The authors have declared that no competing interests exist.</p>
      </fn></author-notes><pub-date pub-type="collection">
        <year>2011</year>
      </pub-date><pub-date pub-type="epub">
        <day>5</day>
        <month>4</month>
        <year>2011</year>
      </pub-date><volume>6</volume><issue>4</issue><elocation-id>e16939</elocation-id><history>
        <date date-type="received">
          <day>12</day>
          <month>12</month>
          <year>2010</year>
        </date>
        <date date-type="accepted">
          <day>6</day>
          <month>1</month>
          <year>2011</year>
        </date>
      </history><!--===== Grouping copyright info into permissions =====--><permissions><copyright-year>2011</copyright-year><copyright-holder>Onnela et al</copyright-holder><license><license-p>This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p></license></permissions><abstract>
        <p>Social groups are fundamental building blocks of human societies. While our social interactions have always been constrained by geography, it has been impossible, due to practical difficulties, to evaluate the nature of this restriction on social group structure. We construct a social network of individuals whose most frequent geographical locations are also known. We also classify the individuals into groups according to a community detection algorithm. We study the variation of geographical span for social groups of varying sizes, and explore the relationship between topological positions and geographic positions of their members. We find that small social groups are geographically very tight, but become much more clumped when the group size exceeds about 30 members. Also, we find no correlation between the topological positions and geographic positions of individuals within network communities. These results suggest that spreading processes face distinct structural and spatial constraints.</p>
      </abstract><funding-group><funding-statement>JPO, SA, and NAC are supported by the National Institute on Aging (grant P01 AG-031093); ALB and MCG by the Office of Naval Research (grant ONR N000141010968), the Network Science Collaborative Technology Alliance (grant ARL NS-CTA W911NF-09-2-0053), the Defense Threat Reduction Agency (grants DTRA BRBAA08-Per4-C-2-0033 and DTRA WMD BRBAA07-J-2-0035), the National Science Foundation (grant NSF BCS-0826958), and the James S. McDonnell Foundation (grant JSMF 220020084). The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</funding-statement></funding-group><counts>
        <page-count count="7"/>
      </counts></article-meta>
  </front>
  <body>
    <sec id="s1">
      <title>Introduction</title>
      <p>Social groups are common among animals and humans <xref ref-type="bibr" rid="pone.0016939-Newman1">[1]</xref>–<xref ref-type="bibr" rid="pone.0016939-Newman2">[5]</xref>. In humans, they reflect friendship, kinship, and work relationships, and can also be seen as social networks. From an evolutionary and historical perspective, the formation of such network groups – consisting of agglomerations of dyadic interactions – has been constrained by geography. In contrast, larger social units, enabled by modern technology and political organization, offer drastically different opportunities for social interactions and for group assembly over larger geographic ranges. This raises two sorts of questions. First, is the structure of “old-fashioned” groups similar to the large-scale groups possible in modern society? And second, what role does geography play in group formation?</p>
      <p>If we represent the social relationships among a population of people as a network, then groups can be seen as “communities” within the population that consist of sets of nodes that are relatively densely connected to each other but sparsely connected to other nodes in the network <xref ref-type="bibr" rid="pone.0016939-Porter1">[6]</xref>, <xref ref-type="bibr" rid="pone.0016939-Fortunato1">[7]</xref>. While social communities have been studied for a long time <xref ref-type="bibr" rid="pone.0016939-Freeman1">[8]</xref>, it has recently become feasible, with mobile phone data, to monitor the social interactions and geographic positions of millions of individuals <xref ref-type="bibr" rid="pone.0016939-Onnela1">[9]</xref>, <xref ref-type="bibr" rid="pone.0016939-Gonzlez1">[10]</xref>, and to apply algorithmic detection of communities on a large scale <xref ref-type="bibr" rid="pone.0016939-Porter1">[6]</xref>, <xref ref-type="bibr" rid="pone.0016939-Fortunato1">[7]</xref>. The structure of dyadic social interactions is known to depend on geography, for example, as shown by the decay of friendship probability with distance, based on voluntary self-reports of hometown and US state, in a blog community <xref ref-type="bibr" rid="pone.0016939-LibenNowell1">[11]</xref>, and the decrease in communication probability with distance based on the zip codes of cell phone billing addresses <xref ref-type="bibr" rid="pone.0016939-Lambiotte1">[12]</xref>. In addition, a previous study has shown that smaller communities are more homogeneous with respect to the billing postal codes of their members <xref ref-type="bibr" rid="pone.0016939-Palla1">[13]</xref>, while another presented evidence that this persists across a hierarchy of communities <xref ref-type="bibr" rid="pone.0016939-Ahn1">[14]</xref>. 
However, there are no prior large-scale studies of the way in which community structure depends on geography, where the actual communication locations are used and where geographical properties of communities themselves are examined (see <xref ref-type="fig" rid="pone-0016939-g001">Fig. 1</xref>).</p>
      <fig id="pone-0016939-g001" position="float">
        <object-id pub-id-type="doi">10.1371/journal.pone.0016939.g001</object-id>
        <label>Figure 1</label>
        <caption>
          <title>Visualization of a community in the mobile phone network.</title>
          <p>This juxtaposition of (<bold>A</bold>) the topological structure and (<bold>B</bold>) the geographical structure demonstrates the interplay of these two dimensions. The purple and orange nodes are geographically close, but topologically they lie at five degrees of separation. In contrast, the red and green nodes are connected to each other, and also share several neighbors, yet they are geographically separated by a large distance. Overlapping nodes in (B) have been moved slightly for visual clarity.</p>
        </caption>
        <graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0016939.g001" xlink:type="simple"/>
      </fig>
      <p>With respect to group formation, geography can be seen as a kind of constraint. That is, social connections not only face network constraints and opportunities (we tend to form ties with others who are the friends of our friends), but also, quite obviously, geographic constraints and opportunities. What is unclear, however, is the way in which such geographic constraints and opportunities affect and shape network communities above and beyond their effect on dyadic interactions.</p>
    </sec>
    <sec id="s2">
      <title>Results</title>
      <sec id="s2a">
        <title>Dyadic Interactions and Geography</title>
        <p>We create a network of social interactions by measuring ties between individuals based on mobile phone call and text messaging data from an unnamed European country. Based on the records of 72.4 million calls and 17.1 million text messages accumulated over a one-month period, the resulting network has 3.4 million nodes connected by 5.2 million weighted (non-binary) ties, resulting in an average degree <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e001" xlink:type="simple"/></inline-formula>. Each time a user initiated or received a call or a text message, the location of the tower routing the communication was recorded <xref ref-type="bibr" rid="pone.0016939-Gonzlez1">[10]</xref>. We exploited these records to assign each individual to the location where they conducted most of their cell phone communication, which for most individuals is likely to correspond to the location of their home or work. This resulted in one coordinate pair <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e002" xlink:type="simple"/></inline-formula> per user, which enabled us to define the geographic distance for any user pair as <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e003" xlink:type="simple"/></inline-formula>. We used this to compute the probability of a call-tie and the probability of a text-tie as a function of distance (<xref ref-type="fig" rid="pone-0016939-g002">Fig. 2</xref>).</p>
        <fig id="pone-0016939-g002" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0016939.g002</object-id>
          <label>Figure 2</label>
          <caption>
            <title>The probability of having a tie decreases as a function of distance.</title>
            <p>Two limiting cases, corresponding to exponents one and two, are shown as dashed lines. Note that if geography played no role, we would expect <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e004" xlink:type="simple"/></inline-formula> to be independent of distance <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e005" xlink:type="simple"/></inline-formula>, resulting in a horizontal line in this plot. Inset: Tie strength, in contrast to the communication probability, is nearly flat with distance, although there is a minor decreasing trend for voice-ties.</p>
          </caption>
          <graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0016939.g002" xlink:type="simple"/>
        </fig>
        <p>Although from the point of view of technology there is very little difference between placing a short-distance or long-distance communication (for either voice or text), we find that the probability of communication is strongly related to the distance between the individuals, and it decreases by approximately five orders of magnitude as distance increases from 1 km to 1,000 km. The behavior of voice-ties and text-ties is essentially identical. The average distance between two connected nodes is 42 km for voice ties and 51 km for text ties. The decay of the tie probability approximately follows a power-law of the form <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e006" xlink:type="simple"/></inline-formula>, before it falls due to reaching the physical boundaries of the system. We used the maximum-likelihood method <xref ref-type="bibr" rid="pone.0016939-Clauset1">[15]</xref> to estimate both the exponent <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e007" xlink:type="simple"/></inline-formula> and the lower bound <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e008" xlink:type="simple"/></inline-formula> from which the power-law holds, and obtained <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e009" xlink:type="simple"/></inline-formula> for voice ties and <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e010" xlink:type="simple"/></inline-formula> for text ties, with the lower bounds estimated at 7.1 km and 4.1 km, respectively. In estimating these parameters, we constrained our search to ties whose distance was less than 800 km to avoid boundary effects, still leaving us over 99% of the ties.</p>
        <p>We define tie strength <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e011" xlink:type="simple"/></inline-formula> as the number of interactions between nodes <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e012" xlink:type="simple"/></inline-formula> and <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e013" xlink:type="simple"/></inline-formula>, and it can be quantified either as the number of calls between the two nodes or, alternatively, as the number of text messages between them. Interestingly, while geography is so strongly associated with the existence of a tie, tie strength varies only weakly with distance and is similar for both text and voice (<xref ref-type="fig" rid="pone-0016939-g002">Fig. 2</xref> inset).</p>
      </sec>
      <sec id="s2b">
        <title>Community Interaction Structure and Geography</title>
        <p>It is clear that ties or dyads should be the building blocks of social groups or communities, but what constitutes a community and how it should be identified needs to be specified. We detect topological communities using the method of modularity maximization, which measures how well a given partition of a network compartmentalizes its communities <xref ref-type="bibr" rid="pone.0016939-Porter1">[6]</xref>, <xref ref-type="bibr" rid="pone.0016939-Fortunato1">[7]</xref>, <xref ref-type="bibr" rid="pone.0016939-Newman3">[16]</xref>, <xref ref-type="bibr" rid="pone.0016939-Girvan1">[17]</xref> (see <xref ref-type="sec" rid="s4">Methods</xref> for details). For this purpose, we combine voice-ties and text-ties into one network.</p>
        <p>Next, we examined how the topological centrality of nodes within communities is associated with their physical centrality. Given the community membership of each individual, we computed the geographical center <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e014" xlink:type="simple"/></inline-formula> of community <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e015" xlink:type="simple"/></inline-formula> using <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e016" xlink:type="simple"/></inline-formula> and <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e017" xlink:type="simple"/></inline-formula>, where <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e018" xlink:type="simple"/></inline-formula> is the number of members (nodes) in the community. We measured topological centrality using betweenness centrality, whereas physical centrality was measured as the distance from a node to the geographic center of its corresponding community. Given that both betweenness centrality and the physical span of communities increase as a function of community size, we normalized these quantities by considering their percentile values, instead of dealing with their absolute values. (Note that while betweenness centrality can be normalized to be independent of network size, there is no similar normalization available for the physical distances.) We included communities whose size varied between 10 and 1,000 nodes. While the community detection algorithm found communities that were significantly larger than this upper bound, we deemed them to be too large to be taken as social communities. Including communities smaller than 10 led to discretization effects when computing percentiles.</p>
        <p>In historically relevant social arrangements, one might expect the two measures of betweenness centrality and geographic distance from the community center to be strongly correlated, but here we found essentially no correlation between them (<xref ref-type="fig" rid="pone-0016939-g003">Fig. 3</xref>). Pearson's linear correlation coefficient between these two measures, both taken as percentiles, was −0.07 (we obtained 0.05 if communities smaller than 10 were also included). Therefore, there seems to be no relationship between topological centrality and physical centrality of nodes within communities in this network.</p>
        <fig id="pone-0016939-g003" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0016939.g003</object-id>
          <label>Figure 3</label>
          <caption>
            <title>Relationship between topological centrality and geographic centrality.</title>
            <p>42,123 nodes in communities varying in size from 10 to 1,000 are examined, and both quantities are measured in terms of percentiles. The number of observations (nodes) that lie within each bin is indicated by its color.</p>
          </caption>
          <graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0016939.g003" xlink:type="simple"/>
        </fig>
        <p>Next, we characterized the overall geographical shape of the communities by defining the <italic>geographical span</italic> for a given community <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e019" xlink:type="simple"/></inline-formula> as<disp-formula><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0016939.e020" xlink:type="simple"/><label>(1)</label></disp-formula></p>
        <p>where <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e021" xlink:type="simple"/></inline-formula> is measured in units of distance, and large values of <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e022" xlink:type="simple"/></inline-formula> indicate that the members of the community are geographically spread out. We found an upward trend that persisted with a leveling off until, surprisingly, a large bump occurred for communities in excess of 30 nodes (<xref ref-type="fig" rid="pone-0016939-g004">Fig. 4</xref>).</p>
        <fig id="pone-0016939-g004" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0016939.g004</object-id>
          <label>Figure 4</label>
          <caption>
            <title>Average observed geographic community span <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e023" xlink:type="simple"/></inline-formula> (red) and average geographic community null span <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e024" xlink:type="simple"/></inline-formula> (blue).</title>
            <p> The dyadic null span with decay, denoted by <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e025" xlink:type="simple"/></inline-formula>, incorporates the decay of the connection probability as a function of distance for various values of the scale parameter, shown as dashed lines. The solid black line is the dyadic null span without decay. Both are measured in kilometers. We observe large deviations from both null models, which can be quantified as the areas between the empirical curve and any of the null curves.</p>
          </caption>
          <graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0016939.g004" xlink:type="simple"/>
        </fig>
        <p>To put this result in context, we introduced two null models. In the <italic>community null model</italic>, instead of using the true geographical coordinates <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e026" xlink:type="simple"/></inline-formula> of community members, we draw the <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e027" xlink:type="simple"/></inline-formula> coordinate pairs uniformly at random from the underlying distribution of all coordinate pairs, keeping a given <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e028" xlink:type="simple"/></inline-formula>-coordinate coupled with the associated <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e029" xlink:type="simple"/></inline-formula>-coordinate, resulting in the quantity <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e030" xlink:type="simple"/></inline-formula>. If <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e031" xlink:type="simple"/></inline-formula>, this would suggest that the members of the community are randomly scattered in the country, i.e., regardless of being members of the same community, they are not geographically proximate. As shown in <xref ref-type="fig" rid="pone-0016939-g004">Fig. 4</xref>, the real community span is much smaller than the span of the null community. What is especially notable is the constraining role of geography for small communities. As community sizes increase, say, from five to ten individuals, the value of the null span increases dramatically from about 70 km to about 300 km, quantifying the expected growth in geographical span if the impact of geography could, somehow, be turned off. 
Instead, we observe relatively modest growth for the empirical span <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e032" xlink:type="simple"/></inline-formula>, which for communities of size ten reaches a value of just 50 km, and stays relatively unchanged until communities exceed 30 in size.</p>
        <p>The community null model does not incorporate our earlier finding that the connection probability decays with distance as <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e033" xlink:type="simple"/></inline-formula>. We next asked whether this decay, coupled with the concentration of populations in cities, might explain the observed bump. To account for this possibility, we introduce the <italic>dyadic null model</italic>. The algorithm starts by picking one location, uniformly at random, as the geographical center of the community. It then samples other locations, again uniformly at random, and computes the probability for there to be a tie between the center of the community and the current location, where the probability distribution is assumed to follow a power-law with exponent <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e034" xlink:type="simple"/></inline-formula>. To determine whether the current location is included in the community, the algorithm performs a Bernoulli trial with the given probability, and this continues until we have 50 members in the community. We compared the result of the dyadic null model without decay, achieved by accepting each trial location for inclusion, to the community null span. Apart from a slight horizontal shift, the two null models produce very similar outcomes. We then consider the dyadic null model with decay, varying the value of the scale parameter <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e035" xlink:type="simple"/></inline-formula>, running each simulation 1,000 times. Although the numerical values are not comparable between the dyadic null model and the community null model, the former demonstrates that inclusion of the decay of the connection probability with distance yields a smooth curve for the span. 
In particular, decay with distance cannot explain the observed bump.</p>
        <p>We also explored the spatial distribution of the nodes within a community. In general, the nodes of a given community need not be distributed spatially uniformly. To quantify this “clumpiness” of a community, we wanted to determine the number of spatial clusters making up the community. We used <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e036" xlink:type="simple"/></inline-formula>-means clustering <xref ref-type="bibr" rid="pone.0016939-Gan1">[18]</xref> which aims to partition the set of data points into <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e037" xlink:type="simple"/></inline-formula> clusters such that each point belongs to the cluster with the nearest mean. Since the number of clusters <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e038" xlink:type="simple"/></inline-formula> is given as input to the method, it can be seen as a model parameter, and it needs to be determined separately. At the extreme ends, one could assign every point to a single cluster, an approach likely to result in a large error measure, or one could assign every point to its own cluster, leading to zero error. We used the Akaike Information Criterion to determine the optimal value for <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e039" xlink:type="simple"/></inline-formula> <xref ref-type="bibr" rid="pone.0016939-Akaike1">[19]</xref>.</p>
        <p>We found that the number of spatial clusters increases linearly with community size, until communities of about size 20, when the behavior appears to change (<xref ref-type="fig" rid="pone-0016939-g005">Fig. 5</xref>). The increase in community span for communities larger than 20, without a comparable increase in the number of spatial clusters, suggests a threshold in structure and behavior based on community size. Based on linear fits to data, the addition of an extra community member causes, on average, a marginal increase of 0.67 spatial clusters in small (few members) communities, whereas in large (many members) communities, the addition of an extra community member causes, on average, a marginal increase of 0.29 spatial clusters. For example, an increase from 5 to 15 members increases the number of spatial clusters by 6.1, whereas an increase from 25 to 35 members results in an increase of 2.7 clusters. Communities therefore seem to grow initially by recruiting spatially more distant clusters, but less and less so as the communities get bigger.</p>
        <fig id="pone-0016939-g005" position="float">
          <object-id pub-id-type="doi">10.1371/journal.pone.0016939.g005</object-id>
          <label>Figure 5</label>
          <caption>
            <title>The average number of spatial clusters for empirical data, versus topological (network) community size.</title>
            <p>Clusters are detected using the <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e040" xlink:type="simple"/></inline-formula>-means algorithm with the Akaike Information Criterion. We fit two models to the data: a linear model <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e041" xlink:type="simple"/></inline-formula>, fit in two parts and shown in green, and a non-linear model <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e042" xlink:type="simple"/></inline-formula>, shown in red. We obtained the values <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e043" xlink:type="simple"/></inline-formula> for the first slope and <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e044" xlink:type="simple"/></inline-formula> for the second slope of the linear fits, and <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e045" xlink:type="simple"/></inline-formula> for the exponent of the non-linear model, implying approximately square-root behavior.</p>
          </caption>
          <graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0016939.g005" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec id="s3">
      <title>Discussion</title>
      <p>Our findings on the geographic decay of ties differ from those obtained for a network constructed from the customers of a Belgian mobile operator. Using zip codes provided for billing purposes to compute distances between individuals, Lambiotte <italic>et al.</italic> showed that the probability for two individuals to be connected decays as <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e046" xlink:type="simple"/></inline-formula>, which led them to suggest that the decay follows a so-called gravity model <xref ref-type="bibr" rid="pone.0016939-Lambiotte1">[12]</xref>. Our result, essentially showing that <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e047" xlink:type="simple"/></inline-formula>, differs for various possible reasons: we used the maximum-likelihood technique to estimate the value of the exponent <xref ref-type="bibr" rid="pone.0016939-Clauset1">[15]</xref>; our range of distances is larger (<inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e048" xlink:type="simple"/></inline-formula> km vs. <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e049" xlink:type="simple"/></inline-formula> km), allowing for more statistical power; we used the location of maximal phone use as opposed to the location of the billing address (which is often not reliable); and the population density in our target country is significantly lower than that of Belgium. Our result that tie strength does not vary with distance is complementary to the finding of Lambiotte <italic>et al.</italic>, who report that the average duration of phone calls increases with distance, reaching a plateau around 40 km. 
Therefore, while the number of calls made to long-distance friends is slightly smaller than the number made to short-distance friends, the average duration may be twice as long <xref ref-type="bibr" rid="pone.0016939-Lambiotte1">[12]</xref>.</p>
      <p>Communities appear to have particular properties in relationship to geography, properties that are distinct from the underlying interactions between pairs of individuals. Geography constrains group formation in important ways that nevertheless differ from the way it constrains dyadic interactions. On the one hand, comparison of topological and geographical centrality of nodes within communities demonstrated that the two are essentially uncorrelated. On the other hand, we find that the geographic shapes of social groups, measured in terms of geographic span and spatial clustering, vary in regular ways with the size of the group. For small communities, as their size increases, their expected geographic span increases smoothly at first, but then experiences a sudden bounce as the community size reaches about 30 members. To exemplify this behavior, an increase in community size from 10 to 20 members is associated with an increase in span by about 40%, whereas, in contrast, an increase from 30 to 40 members leads to an increase of about 100% in geographic span. This suggests that the tendency of human groups to remain geographically cohesive gradually gives in as the group size exceeds 30. Similarly, the number of clusters within a single topological group also increases with community size. Intriguingly, the number 30 is also close to the optimal group size for which cooperation in social dilemma situations, modeled, for example, by the public goods game, is maximized <xref ref-type="bibr" rid="pone.0016939-Szolnoki1">[20]</xref>, <xref ref-type="bibr" rid="pone.0016939-Skyrms1">[21]</xref>.</p>
      <p>Just as the structures of observed social interactions may be compared to randomized networks, the observed localities of individuals in communities may be compared to randomized locations. Indeed, if social ties could be formed without consideration for the underlying geography, we would expect the tie probability to be independent of distance, and the geographic span of groups to follow the proposed null models closely. However, we observe neither of the two. This demonstrates that network ties and network communities, in this context, do not behave as if they were in well mixed populations, suggesting that geography continues to maintain its power as a compartmentalizing factor. Thus, the assumption of perfect mixing of individuals, sometimes made in the study of infectious disease or technology diffusion in humans, does not then appear to hold either at the topological or at the geographic level.</p>
      <p>The extent to which a spreading process follows the assumptions of well-mixed populations often depends on a number of conditions, including the nature of the spreading process. For example, network models can better account for the spread of diseases that spread via the formation of a physical tie (such as STDs) than those that spread by simple proximity (like the common cold). This is illustrated in a mobile phone context by Wang <italic>et al.</italic> <xref ref-type="bibr" rid="pone.0016939-Wang1">[22]</xref>, who find that the nature of the spreading process, and its dependence on proximity, clearly affect the dynamics of the spreading. Similarly, localization of interacting proteins within the geography of the cell can explain certain disease associations <xref ref-type="bibr" rid="pone.0016939-Park1">[23]</xref>. In addition, other work has suggested that the diffusion-like movement of people alone can often explain how a pathogen spreads, such as the plague in medieval Europe <xref ref-type="bibr" rid="pone.0016939-Noble1">[24]</xref>. On the other hand, with the onset of air travel, pathogens are not constrained in the same way, as the epidemics of SARS and H1N1 documented <xref ref-type="bibr" rid="pone.0016939-Hufnagel1">[25]</xref>, <xref ref-type="bibr" rid="pone.0016939-Colizza1">[26]</xref>.</p>
      <p>Ideally, models of the flow of pathogens or information through human populations would account for the simultaneous roles of geographic and network constraints, and our work helps shed light on the intersecting relationship between the two. Future work will explore the complex interrelationship between network topology and geography and their joint importance in understanding how phenomena spread through populations.</p>
    </sec>
    <sec id="s4" sec-type="methods">
      <title>Methods</title>
      <p>All networks were constructed from four weeks of anonymized mobile phone call and text messaging data from an operator based in an unnamed European country. Only interactions that took place between customers of the operator were considered, and only individuals who made at least two calls were included as nodes. To filter out sporadic calls and texts that are unlikely to correspond to meaningful social interactions, we required there to be a minimal level of reciprocation for a tie to be included in the network; each person had to initiate at least one interaction, where the initial transaction could be either a call or a text, and this could be reciprocated by either a call or a text.</p>
      <p>We detected topological communities using the popular method of modularity maximization <xref ref-type="bibr" rid="pone.0016939-Porter1">[6]</xref>, <xref ref-type="bibr" rid="pone.0016939-Fortunato1">[7]</xref>, <xref ref-type="bibr" rid="pone.0016939-Newman3">[16]</xref>, <xref ref-type="bibr" rid="pone.0016939-Girvan1">[17]</xref> in the following manner. We first converted the original network consisting of directed voice calls and text messages into a symmetric unweighted network, effectively combining the two modes of interaction. We then proceeded to maximize modularity defined as <disp-formula><graphic mimetype="image" position="float" xlink:href="info:doi/10.1371/journal.pone.0016939.e050" xlink:type="simple"/><label>(2)</label></disp-formula></p>
      <p>where the adjacency matrix element <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e051" xlink:type="simple"/></inline-formula> denotes the presence (<inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e052" xlink:type="simple"/></inline-formula>) or absence (<inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e053" xlink:type="simple"/></inline-formula>) of a connection between nodes <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e054" xlink:type="simple"/></inline-formula> and <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e055" xlink:type="simple"/></inline-formula>, <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e056" xlink:type="simple"/></inline-formula> is the degree of node <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e057" xlink:type="simple"/></inline-formula>, <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e058" xlink:type="simple"/></inline-formula> the total weight of the edges in the network, <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e059" xlink:type="simple"/></inline-formula> the community assignment of node <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e060" xlink:type="simple"/></inline-formula>, and <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e061" xlink:type="simple"/></inline-formula> is the Kronecker delta function, which is unity if and only if <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e062" 
xlink:type="simple"/></inline-formula>, otherwise it is zero. Modularity measures the difference between the total fraction of edges that fall within groups versus the fraction one would expect by chance. A common null model, sometimes called the Newman-Girvan null model, is codified by the <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e063" xlink:type="simple"/></inline-formula> term, and it takes degree heterogeneity into account by preserving the expected degree distribution. High values of <inline-formula><inline-graphic mimetype="image" xlink:href="info:doi/10.1371/journal.pone.0016939.e064" xlink:type="simple"/></inline-formula> indicate network partitions in which more of the edges fall within groups than expected by chance. While maximizing modularity is known to be an NP-hard problem <xref ref-type="bibr" rid="pone.0016939-Brandes1">[27]</xref>, there are numerous computational heuristics available <xref ref-type="bibr" rid="pone.0016939-Porter1">[6]</xref>, <xref ref-type="bibr" rid="pone.0016939-Fortunato1">[7]</xref>. Since we are dealing with networks consisting of millions of nodes, we chose the Louvain method for its computational efficiency <xref ref-type="bibr" rid="pone.0016939-Blondel1">[28]</xref>.</p>
    </sec>
  </body>
  <back>
    <ack>
      <p>We acknowledge A. Zaslavsky for useful discussions about the Akaike Information Criterion.</p>
    </ack>
    <ref-list>
      <title>References</title>
      <ref id="pone.0016939-Newman1">
        <label>1</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Newman</surname><given-names>MEJ</given-names></name></person-group>             <year>2008</year>             <article-title>The physics of networks.</article-title>             <source>Physics Today</source>             <volume>61</volume>             <fpage>33</fpage>             <lpage>38</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Caldarelli1">
        <label>2</label>
        <element-citation publication-type="other" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Caldarelli</surname><given-names>G</given-names></name></person-group>             <year>2007</year>             <article-title>Scale-Free Networks: Complex Webs in Nature and Technology.</article-title>             <comment>Oxford University Press, 1st edition</comment>          </element-citation>
      </ref>
      <ref id="pone.0016939-Dorogovtsev1">
        <label>3</label>
        <element-citation publication-type="other" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Dorogovtsev</surname><given-names>SN</given-names></name><name name-style="western"><surname>Mendes</surname><given-names>JFF</given-names></name></person-group>             <year>2003</year>             <article-title>Evolution of Networks: From Biological Nets to the Internet and WWW.</article-title>             <comment>Oxford University Press, 1st edition</comment>          </element-citation>
      </ref>
      <ref id="pone.0016939-Albert1">
        <label>4</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Albert</surname><given-names>R</given-names></name><name name-style="western"><surname>Barabási</surname><given-names>AL</given-names></name></person-group>             <year>2002</year>             <article-title>Statistical mechanics of complex networks.</article-title>             <source>Rev Mod Phys</source>             <volume>74</volume>             <fpage>47</fpage>             <lpage>97</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Newman2">
        <label>5</label>
        <element-citation publication-type="other" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Newman</surname><given-names>MEJ</given-names></name><name name-style="western"><surname>Barabási</surname><given-names>AL</given-names></name><name name-style="western"><surname>Watts</surname><given-names>DJ</given-names></name></person-group>             <year>2006</year>             <article-title>The Structure and Dynamics of Networks.</article-title>             <comment>Princeton University Press, 1st edition</comment>          </element-citation>
      </ref>
      <ref id="pone.0016939-Porter1">
        <label>6</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Porter</surname><given-names>MA</given-names></name><name name-style="western"><surname>Onnela</surname><given-names>J-P</given-names></name><name name-style="western"><surname>Mucha</surname><given-names>PJ</given-names></name></person-group>             <year>2009</year>             <article-title>Communities in networks.</article-title>             <source>Notices of the American Mathematical Society</source>             <volume>56</volume>             <fpage>1082</fpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Fortunato1">
        <label>7</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Fortunato</surname><given-names>S</given-names></name></person-group>             <year>2010</year>             <article-title>Community detection in graphs.</article-title>             <source>Physics Reports</source>             <volume>486</volume>             <fpage>75</fpage>             <lpage>174</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Freeman1">
        <label>8</label>
        <element-citation publication-type="other" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Freeman</surname><given-names>LC</given-names></name></person-group>             <year>2004</year>             <article-title>The Development of Social Network Analysis: A Study in the Sociology of Science.</article-title>             <publisher-loc>Vancouver, Canada</publisher-loc>             <publisher-name>Empirical Press</publisher-name>          </element-citation>
      </ref>
      <ref id="pone.0016939-Onnela1">
        <label>9</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Onnela</surname><given-names>J-P</given-names></name><name name-style="western"><surname>Saramäki</surname><given-names>J</given-names></name><name name-style="western"><surname>Hyvönen</surname><given-names>J</given-names></name><name name-style="western"><surname>Szabó</surname><given-names>G</given-names></name><name name-style="western"><surname>Lazer</surname><given-names>D</given-names></name><etal/></person-group>             <year>2007</year>             <article-title>Structure and tie strengths in mobile communication networks.</article-title>             <source>P Natl Acad Sci USA</source>             <volume>104</volume>             <fpage>7332</fpage>             <lpage>7336</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Gonzlez1">
        <label>10</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>González</surname><given-names>MC</given-names></name><name name-style="western"><surname>Hidalgo</surname><given-names>CA</given-names></name><name name-style="western"><surname>Barabási</surname><given-names>AL</given-names></name></person-group>             <year>2008</year>             <article-title>Understanding individual human mobility patterns.</article-title>             <source>Nature</source>             <volume>453</volume>             <fpage>779</fpage>             <lpage>782</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-LibenNowell1">
        <label>11</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Liben-Nowell</surname><given-names>D</given-names></name></person-group>             <year>2005</year>             <article-title>Geographic routing in social networks.</article-title>             <source>P Natl Acad Sci USA</source>             <volume>102</volume>             <fpage>11623</fpage>             <lpage>11628</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Lambiotte1">
        <label>12</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Lambiotte</surname><given-names>R</given-names></name><etal/></person-group>             <year>2008</year>             <article-title>Geographical dispersal of mobile communication networks.</article-title>             <source>Physica A</source>             <volume>387</volume>             <fpage>5317</fpage>             <lpage>5325</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Palla1">
        <label>13</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Palla</surname><given-names>G</given-names></name><name name-style="western"><surname>Barabási</surname><given-names>AL</given-names></name><name name-style="western"><surname>Vicsek</surname><given-names>T</given-names></name></person-group>             <year>2007</year>             <article-title>Quantifying social group evolution.</article-title>             <source>Nature</source>             <volume>446</volume>             <fpage>664</fpage>             <lpage>667</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Ahn1">
        <label>14</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Ahn</surname><given-names>YY</given-names></name><name name-style="western"><surname>Bagrow</surname><given-names>JP</given-names></name><name name-style="western"><surname>Lehmann</surname><given-names>S</given-names></name></person-group>             <year>2010</year>             <article-title>Link communities reveal multiscale complexity in networks.</article-title>             <source>Nature</source>             <volume>466</volume>             <fpage>761</fpage>             <lpage>764</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Clauset1">
        <label>15</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Clauset</surname><given-names>A</given-names></name><name name-style="western"><surname>Shalizi</surname><given-names>CR</given-names></name><name name-style="western"><surname>Newman</surname><given-names>MEJ</given-names></name></person-group>             <year>2009</year>             <article-title>Power-law distributions in empirical data.</article-title>             <source>SIAM Review</source>             <volume>51</volume>             <fpage>661</fpage>             <lpage>703</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Newman3">
        <label>16</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Newman</surname><given-names>MEJ</given-names></name></person-group>             <year>2003</year>             <article-title>Mixing patterns in networks.</article-title>             <source>Phys Rev E</source>             <volume>67</volume>             <fpage>026126</fpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Girvan1">
        <label>17</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Girvan</surname><given-names>M</given-names></name><name name-style="western"><surname>Newman</surname><given-names>MEJ</given-names></name></person-group>             <year>2002</year>             <article-title>Community structure in social and biological networks.</article-title>             <source>P Natl Acad Sci USA</source>             <volume>99</volume>             <fpage>7821</fpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Gan1">
        <label>18</label>
        <element-citation publication-type="other" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Gan</surname><given-names>G</given-names></name><name name-style="western"><surname>Ma</surname><given-names>C</given-names></name><name name-style="western"><surname>Wu</surname><given-names>J</given-names></name></person-group>             <year>2007</year>             <article-title>Data Clustering: Theory, Algorithms, and Applications.</article-title>             <publisher-name>SIAM</publisher-name>          </element-citation>
      </ref>
      <ref id="pone.0016939-Akaike1">
        <label>19</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Akaike</surname><given-names>H</given-names></name></person-group>             <year>1974</year>             <article-title>A new look at the statistical model identification.</article-title>             <source>IEEE Transactions on Automatic Control</source>             <volume>19</volume>             <fpage>716</fpage>             <lpage>723</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Szolnoki1">
        <label>20</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Szolnoki</surname><given-names>A</given-names></name><name name-style="western"><surname>Perc</surname><given-names>M</given-names></name></person-group>             <year>2010</year>             <article-title>Impact of critical mass on the evolution of cooperation in spatial public goods games.</article-title>             <source>Phys Rev E</source>             <volume>81</volume>             <fpage>057101</fpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Skyrms1">
        <label>21</label>
        <element-citation publication-type="other" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Skyrms</surname><given-names>B</given-names></name></person-group>             <year>2004</year>             <article-title>The stag hunt and the evolution of social structure.</article-title>             <publisher-name>Cambridge University Press</publisher-name>          </element-citation>
      </ref>
      <ref id="pone.0016939-Wang1">
        <label>22</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>P</given-names></name><name name-style="western"><surname>González</surname><given-names>MC</given-names></name><name name-style="western"><surname>Hidalgo</surname><given-names>CA</given-names></name><name name-style="western"><surname>Barabási</surname><given-names>AL</given-names></name></person-group>             <year>2009</year>             <article-title>Understanding the spreading patterns of mobile phone viruses.</article-title>             <source>Science</source>             <volume>324</volume>             <fpage>1071</fpage>             <lpage>1076</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Park1">
        <label>23</label>
        <element-citation publication-type="other" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Park</surname><given-names>S</given-names></name></person-group>             <article-title>The importance of protein subcellular localization for disease profiling</article-title>          </element-citation>
      </ref>
      <ref id="pone.0016939-Noble1">
        <label>24</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Noble</surname><given-names>JV</given-names></name></person-group>             <year>1974</year>             <article-title>Geographic and temporal development of plagues.</article-title>             <source>Nature</source>             <volume>250</volume>             <fpage>726</fpage>             <lpage>729</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Hufnagel1">
        <label>25</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Hufnagel</surname><given-names>L</given-names></name><name name-style="western"><surname>Brockmann</surname><given-names>D</given-names></name><name name-style="western"><surname>Geisel</surname><given-names>T</given-names></name></person-group>             <year>2004</year>             <article-title>Forecast and control of epidemics in a globalized world.</article-title>             <source>P Natl Acad Sci USA</source>             <volume>101</volume>          </element-citation>
      </ref>
      <ref id="pone.0016939-Colizza1">
        <label>26</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Colizza</surname><given-names>V</given-names></name><name name-style="western"><surname>Barrat</surname><given-names>A</given-names></name><name name-style="western"><surname>Barthelemy</surname><given-names>M</given-names></name><name name-style="western"><surname>Valleron</surname><given-names>AJ</given-names></name><name name-style="western"><surname>Vespignani</surname><given-names>A</given-names></name></person-group>             <year>2007</year>             <article-title>Modeling the worldwide spread of pandemic influenza: baseline case and containment interventions.</article-title>             <source>PLoS Med</source>             <volume>4</volume>             <fpage>e13</fpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Brandes1">
        <label>27</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Brandes</surname><given-names>U</given-names></name></person-group>             <year>2008</year>             <article-title>On modularity clustering.</article-title>             <source>IEEE Transactions on Knowledge and Data Engineering</source>             <volume>20</volume>             <fpage>172</fpage>             <lpage>188</lpage>          </element-citation>
      </ref>
      <ref id="pone.0016939-Blondel1">
        <label>28</label>
        <element-citation publication-type="journal" xlink:type="simple">             <person-group person-group-type="author"><name name-style="western"><surname>Blondel</surname><given-names>VD</given-names></name><name name-style="western"><surname>Guillaume</surname><given-names>JL</given-names></name><name name-style="western"><surname>Lambiotte</surname><given-names>R</given-names></name><name name-style="western"><surname>Lefebvre</surname><given-names>E</given-names></name></person-group>             <year>2008</year>             <article-title>Fast unfolding of communities in large networks.</article-title>             <source>Journal of Statistical Mechanics: Theory and Experiment</source>             <fpage>P10008</fpage>           </element-citation>
      </ref>
    </ref-list>
    
  </back>
</article>