gonum.org/v1/gonum@v0.14.0/graph/community/louvain.tex

gonum.org/v1/gonum@v0.14.0/graph/community/louvain.tex (about)

     1  % Copyright ©2015 The Gonum Authors. All rights reserved.
     2  % Use of this source code is governed by a BSD-style
     3  % license that can be found in the LICENSE file.
     4  
     5  \documentclass{article}
     6  
     7  \usepackage{amsmath,amsfonts}
     8  \usepackage[margin=4cm]{geometry}
     9  
    10  \title{Louvain algorithm for undirected and directed graphs}
    11  \author{The {\tt Gonum} Authors}
    12  
    13  \begin{document}
    14  
    15  \maketitle
    16  
    17  The algorithm attempts to find communities (highly connected sub-graphs),
    18  and it does this by minimising the modularity function
    19  \begin{equation}
    20  	Q(c) = \frac{1}{2m}\sum_i\sum_j\left[ A_{ij} - \gamma \frac{k_ik_j}{2m} \right] \delta_{ij}(c),
    21  \end{equation}
    22  where $c$ is a partition of nodes into subsets or communities,
    23  $A_{ij}$ is the edge weight between nodes $i$ and $j$, 
    24  $\gamma$ is a tuning parameter,
    25  \begin{equation}
    26  m = \frac{1}{2}\sum_i\sum_jA_{ij},
    27  \end{equation}
    28  \begin{equation}
    29  k_i = \sum_j{A_{ij}},
    30  \end{equation}
    31  and 
    32  \begin{equation}
    33  	\delta_{ij}(c) = \left \{ \begin{array}{ll}
    34  	1 & \text{if} \quad  c(i) = c(j) \\
    35  	0 & \text{otherwise} \end{array} \right ..
    36  \end{equation}
    37  Here $c(i)$ denotes the community to which node $i$ belongs 
    38  in the partitioning $c$.
    39  
    40  The algorithm finds a hierarchical community structure by iterating 
    41  between two phases:
    42  \begin{enumerate}
    43  	\item Find a set of communities that minimise $Q$.
    44  	\item Construct a new graph, whose nodes are the communities 
    45  	found in the preceding phase one step.
    46  \end{enumerate}
    47  Each iteration of these two phases is called a `pass'.
    48  In this way, the algorithm obtains a nested community structure, 
    49  where at each level $Q$ is minimised for the relevant graph.
    50  We consider this process in more detail, in particular looking 
    51  at phase one first in the first pass, when each node is a single
    52  node, and then how this generalises to later passes when each node 
    53  is a community.
    54  
    55  \section{Undirected Graphs}
    56  
    57  \subsection{Initial Pass}
    58  \label{sec:initialPass}
    59  
    60  The initial pass is simple as the initial pass uses the original graph, 
    61  and in all following passes graphs constructed in the previous pass's 
    62  phase two are used.
    63  Here we will consider this initial simple formulation for phase one, and
    64  in Section~\ref{sec:laterPasses} we consider how this generalises for 
    65  passes two and onwards. 
    66  Phase one works by initially allocating each node to a separate community,
    67  and then iterating through each node $a$ and checking if moving it into 
    68  a different community $\beta$ will reduce $Q$.
    69  If there are possible moves that will reduce $Q$, $a$ is moved into the 
    70  the community which will generate the largest reduction in $Q$. 
    71  This process is continued until there are no moves left to reduce $Q$ 
    72  further, meaning a local minimum for $Q$ has been achieved. 
    73  Then the algorithm moves to phase two (constructing a new graph where
    74  each node in the new graph is a community in the old graph). 
    75  
    76  Note that we assume the original graph to be simple and undirected.
    77  First, we introduce some notation that will be useful:
    78  Let $c(i)$ denote the community to which node $i$ belongs, 
    79  and let $\alpha$ be the community that the node $a$ mentioned above
    80  belongs to, i.e., $\alpha = c_a$.
    81  Then we define
    82  \newcommand{\Stot}[1]{\Sigma_{\text{tot}}^{#1}}
    83  \begin{equation}
    84  	\Stot{\alpha} = \sum_{i \in \alpha}\sum_{j}A_{ij} = \sum_{i \in \alpha}k_i,
    85  \end{equation}
    86  \newcommand{\kin}[2]{k_{#1}^{#2}}
    87  \begin{equation}
    88  	\kin{i}{\alpha} = \sum_{j \in \alpha}A_{ij},
    89  \end{equation}
    90  and
    91  \newcommand{\Sin}[1]{\Sigma_{\text{in}}^{#1}}
    92  \begin{equation}
    93  	\Sin{\alpha} = \sum_{i \in \alpha}\sum_{j \in \alpha}A_{ij} = \sum_{i \in \alpha}\kin{i}{\alpha}.
    94  \end{equation}
    95  
    96  We are interested in how $Q$ will change if we move a node $a$ from its 
    97  current community $\alpha$, to a new community $\beta$.
    98  This will have two effects, it will remove the terms from $Q$ 
    99  related to $a$ in $\alpha$, which we will call $Q^-$ and it will add terms 
   100  related to $a$ in $\beta$, which we will call $Q^+$. 
   101  The total change in $Q$ caused by the movement of $a$ from $\alpha$ to $\beta$ is 
   102  \begin{equation}
   103  	\Delta Q = Q^{+} - Q^{-},
   104  \end{equation}
   105  where
   106  \begin{align*}
   107  Q^- &= \frac{1}{2m}\left[ \left( A_{aa} - \gamma \frac{k_a^2}{2m} \right) 
   108  + 2\sum_{i \in \alpha, \, i \neq a} \left( A_{ia} - \gamma \frac{k_ik_a}{2m} \right) \right] \\
   109  	&= \frac{1}{2m}\left[ \left( A_{aa} - \gamma \frac{k_a^2}{2m} \right) 
   110  + 2 \left( \kin{a}{\alpha} -A_{aa}\right) - \gamma \frac{2k_a}{2m}\sum_{i \in \alpha, \, i \neq a} k_i \right] \\
   111  	&= \frac{1}{2m}\left[ \left( A_{aa} - \gamma \frac{k_a^2}{2m} \right) 
   112  + 2 \left( \kin{a}{\alpha} -A_{aa}\right) - \gamma \frac{2k_a}{2m}\left( \Stot{\alpha} - k_a \right)  \right], \\
   113  \end{align*}
   114  and
   115  \begin{align*}
   116  Q^+ &= \frac{1}{2m}\left[ \left( A_{aa} - \gamma \frac{k_a^2}{2m} \right) 
   117  + 2\sum_{i \in \beta} \left( A_{ia} - \gamma \frac{k_ik_a}{2m} \right) \right] \\
   118  		&= \frac{1}{2m}\left[ \left( A_{aa} - \gamma \frac{k_a^2}{2m} \right) 
   119  + 2\kin{a}{\beta} - \gamma \frac{2k_a}{2m}\sum_{i \in \beta} k_i \right] \\
   120  		&= \frac{1}{2m}\left[ \left( A_{aa} - \gamma \frac{k_a^2}{2m} \right) 
   121  + 2\kin{a}{\beta} - \gamma \frac{2k_a\Stot{\beta}}{2m} \right]. \\
   122  \end{align*}
   123  The first term in both these expressions ($Q^-$ and $Q^+$) is the same, and so cancels:
   124  \begin{equation}
   125  \Delta Q = \frac{1}{2m}\left[ \left( 2\kin{a}{\beta} - \gamma \frac{2k_a\Stot{\beta}}{2m} \right) 
   126  		- \left( 2 \left( \kin{a}{\alpha} -A_{aa}\right) - \gamma \frac{2k_a}{2m}\left( \Stot{\alpha} - k_a \right) \right) \right]. 
   127  \end{equation}
   128   
   129  \subsection{Later Passes}
   130  \label{sec:laterPasses}
   131  
   132  In phase two a `meta-graph' is constructed where nodes correspond to 
   133  the communities found in the preceding phase one step, and edge weight
   134  between two such communities (nodes, in the meta-graph)
   135  $\alpha$ and $\beta$ are defined to be
   136  \begin{equation}
   137  	A_{\alpha \beta}^* = \sum_{i \in \alpha}\sum_{j \in \beta}A_{ij}.
   138  	\label{eqn:Aij*}
   139  \end{equation} 
   140  Note that $i$ and $j$ refer to nodes in the original graph, not nodes 
   141  in the previous graph, and so holds any meta-graph, not just the first.
   142  Also note that this definition of $A^*_{\alpha \beta}$ allows for 
   143  $A^*_{\alpha \alpha}$ to be non-zero as
   144  \begin{equation}
   145  A_{\alpha \alpha}^* = \sum_{i \in \alpha}\sum_{j \in \alpha}A_{ij} = \Sin{\alpha}.
   146  \end{equation} 
   147  
   148  In this newly constructed graph, $\alpha$ and $\beta$ are nodes, but 
   149  also refer to communities (sets of nodes) in the original graph, and I 
   150  use these two interpretations interchangeably.
   151  This should be the only ambiguous bit of notation in this document, I hope.
   152  
   153  The results of Section~\ref{sec:initialPass} generalise to these meta-graphs,
   154  and the generalised results mirror those of Section~\ref{sec:initialPass} closely
   155  -- I distinguish the new results from those of Section~\ref{sec:initialPass} by a 
   156  superscript $*$.
   157  I use $i$ and $j$ to denote nodes of the original graph as in Section~\ref{sec:initialPass}, 
   158  and use $z$ and $w$ to denote nodes of the meta-graph (communities of the original).
   159  I use analogous notation to Section~\ref{sec:initialPass}, $c^*(z)$, to 
   160  denote the community to which node $z$ of the meta-graph belongs, 
   161  and let $\mathfrak{a}$ be the community that the node $\alpha$ belongs to 
   162  ($c^*(\alpha) = \mathfrak{a}$), i.e.
   163  \begin{equation}
   164  	\mathfrak{a} = \{z | c^*(z) = c^*(\alpha) \}.
   165  \end{equation}
   166  
   167  Given this notation, we can observe that
   168  \begin{equation}
   169  m^* = \frac{1}{2}\sum_{z}\sum_{w}{A_{zw}^*} = \frac{1}{2}\sum_{z}\sum_{w}{\sum_{i \in z}\sum_{j \in w}A_{ij}} = \frac{1}{2}\sum_i\sum_jA_{ij} = m,
   170  \end{equation}
   171  \begin{equation}
   172  k_{z}^* = \sum_{w}{A_{zw}^*} =  \sum_{w}{\sum_{i \in z}\sum_{j \in w}A_{ij}} = \sum_{i \in z}\sum_{j}A_{ij} = \Stot{z},
   173  \end{equation}
   174  \begin{equation}
   175  	\Stot{\mathfrak{a} *} = \sum_{z \in \mathfrak{a}}\sum_{w}A_{zw}^* = \sum_{z \in \mathfrak{a}}k_z^* = \sum_{z \in \mathfrak{a}}\Stot{z},
   176  \end{equation}
   177  \begin{equation}
   178  	\kin{z}{\mathfrak{a} *} = \sum_{w \in \mathfrak{a}}{A_{zw}^*} = \sum_{w \in \mathfrak{a}}{\sum_{i \in z}\sum_{j \in w}A_{ij}},
   179  \end{equation}
   180  and
   181  \begin{equation}
   182  \Sin{\mathfrak{a} *} = \sum_{z \in \mathfrak{a}}\sum_{w \in \mathfrak{a}}A_{zw}^* = \sum_{z \in \mathfrak{a}}\kin{z}{\mathfrak{a} *} = \sum_{z \in \mathfrak{a}}\sum_{w \in \mathfrak{a}}{\sum_{i \in z}\sum_{j \in w}A_{ij}}.
   183  	%\label{eqn:Sin}
   184  \end{equation}
   185  
   186  If we let $\mathfrak{b}$ denote the community to which we are considering moving $\alpha$,
   187  then the expression for $\Delta Q$ from Section~\ref{sec:initialPass} trivially generalises to
   188  \begin{equation}
   189  \Delta Q = \frac{1}{2m}\left[ \left( 2 \kin{\alpha}{\mathfrak{b} *} - \gamma \frac{2k_{\alpha}^*\Stot{\mathfrak{b} *}}{2m} \right) 
   190  		- \left( 2\left( \kin{\alpha}{\mathfrak{a} *} - A_{\alpha \alpha}^* \right) - \gamma \frac{2k_{\alpha}^*}{2m} \left( \Stot{\mathfrak{a} *} - k_{\alpha}^* \right ) \right) \right] \\
   191  \end{equation}
   192  
   193  \section{Directed Graphs}
   194  \label{sec:directedGraphs}
   195  
   196  It is of interest to consider how this generalises to directed graphs.
   197  If we are to treat incoming and outgoing nodes equally, there are several
   198  thoughts on how to extend the algorithm to directed graphs, of which we 
   199  will explore three: 
   200  \begin{itemize}
   201  	\item Construct an undirected graph first, and then use the undirected case.
   202  	\item Generalise the expressions from the undirected case to the directed case, 
   203  	we will consider two different suggestions for such generalisations. 
   204  \end{itemize}
   205  We will show that one of the two `generalisation of expressions' approaches is 
   206  equivalent to constructing an undirected graph, and the other is not.
   207  
   208  \subsection{Construction of an undirected graph}
   209  A simple approach to generalising to directed graphs is to construct 
   210  an undirected graph with edge weights
   211  \begin{equation}
   212  A_{ij} = B_{ij} + B_{ji},
   213  \label{eqn:undirectedAB}
   214  \end{equation}
   215  and simply use the undirected algorithm.
   216  Another suggestion is to average the directed edges to make
   217  an undirected graph, i.e. to use a directed graph with edge weights
   218  \begin{equation}
   219  A_{ij} = \frac{B_{ij} + B_{ji}}{2}.
   220  \end{equation}
   221  This raises an important question: does scaling all edge weights across 
   222  the entire graph by a constant affect the results of the algorithm?
   223  Hopefully not, but worth checking.
   224  We can follow this through the results for the undirected graph by 
   225  substituting $A_{ij}^{(1)} = pA_{ij}$, $p \in \mathbb{R}$, and 
   226  distinguishing the new expressions by a superscript ${(1)}$. These
   227  new expressions are:
   228  \begin{equation}
   229  m^{(1)} = \frac{1}{2}\sum_i\sum_jpA_{ij}  = p\frac{1}{2}\sum_i\sum_j A_{ij} = pm ,
   230  \end{equation}
   231  \begin{equation}
   232  k_i^{(1)} = \sum_j{pA_{ij}} = p\sum_j{A_{ij}} = pk_i,
   233  \end{equation}
   234  and so
   235  \begin{align*}
   236  	Q^{(1)}(c) &= \frac{1}{2pm}\sum_i\sum_j\left[ pA_{ij} - \gamma \frac{pk_ipk_j}{2pm} \right] \delta_{ij}(c) \\
   237  	&= \frac{1}{2m}\sum_i\sum_j\left[ A_{ij} - \gamma \frac{k_ik_j}{2m} \right] \delta_{ij}(c) \\
   238  	&= Q(c)
   239  \end{align*}
   240  Note that as we have shown $Q^{(1)} = Q$ there is no need to go into the remainder of the terms 
   241  involved in the algorithm, as they all derive from $Q$.
   242  
   243  \subsection{First generalisation of expressions approach}
   244  
   245  One suggested extension to directed graphs is to modify the expressions 
   246  involved by adding the `from' case and the `to' case for each term. 
   247  If we let $B_{ij}$ be the edge weight between nodes $i$ and $j$ in 
   248  the directed graph, and distinguishing these extended expressions by 
   249  a superscript $(2)$, the extended expressions become:
   250  \begin{equation}
   251  m^{(2)} = \frac{1}{2}\left ( \sum_i\sum_jB_{ij} + \sum_i\sum_jB_{ji}\right)  = \frac{1}{2}\sum_i\sum_j \left( B_{ij} + B_{ji} \right) ,
   252  \end{equation}
   253  \begin{equation}
   254  k_i^{(2)} = \sum_jB_{ij} + \sum_jB_{ji} = \sum_j{\left( B_{ij} + B_{ji} \right)},
   255  \end{equation}
   256  and similarly
   257  \begin{equation}
   258  	Q^{(2)}(c) = \frac{1}{2m}\sum_i\sum_j\left[ \left( B_{ij} + B_{ji} \right) - \gamma \frac{k_i^{(2)}k_j^{(2)}}{2m} \right] \delta_{ij}(c).
   259  \end{equation}
   260  
   261  Note how this is equivalent to the construction of an undirected graph as 
   262  per Equation~(\ref{eqn:undirectedAB}). Similarly to above, 
   263  there is no need to go into the remainder of the terms 
   264  involved in the algorithm, as they all derive from $Q$.
   265  
   266  
   267  \subsection{Second generalisation of expressions approach}
   268  
   269  Another approach to generalising the expressions to the 
   270  directed case, that still treats incoming and outgoing edges 
   271  as equally important, is to propose an alternative modularity 
   272  expression:
   273  \newcommand{\dkin}[1]{k_{#1}^{\text{in}}}
   274  \newcommand{\dkout}[1]{k_{#1}^{\text{out}}}
   275  \begin{equation}
   276  Q^{(3)}(c) = \frac{1}{2m}\sum_i\sum_j\left[ 2B_{ij} - 2\gamma \frac{\dkin{i}\dkout{j}}{2m} \right] \delta_{ij}(c), \\
   277  \end{equation}
   278  where 
   279  \begin{equation}
   280  \dkout{i} = \sum_j{B_{ij}} 
   281  \quad \quad \text{and} \quad \quad
   282  \dkin{i} = \sum_j{B_{ji}},
   283  \end{equation}
   284  so $k_i^{(2)} = \dkin{i} + \dkout{i}$.
   285  Note I leave the factor of two in the expression for $Q^{(3)}$ so that it 
   286  remains as comparable to that for $Q^{(2)}$ as possible.
   287  There is no need for alternative $m$, as it will still be the same as above.
   288  $Q^{(3)}$ will differ from $Q^{(2)}$ in two ways.
   289  Firstly, as $k_i^{(2)} = \dkin{i} + \dkout{i}$, 
   290  \begin{align*}
   291  \sum_i\sum_j k_i^{(2)} k_j^{(2)} \delta_{ij}(c)  &= \sum_i\sum_j  (\dkin{i} + \dkout{i}) (\dkin{j} + \dkout{j}) \delta_{ij}(c) \\
   292   &= \sum_i\sum_j \left[ (\dkin{i}\dkin{j} + \dkout{i}\dkout{j}) + (\dkin{i}\dkout{j} + \dkin{j}\dkout{i}) \right] \delta_{ij}(c). \\
   293   &= \sum_i\sum_j \left[ (\dkin{i}\dkin{j} + \dkout{i}\dkout{j}) + 2\dkin{i}\dkout{j} \right] \delta_{ij}(c), \\
   294  \end{align*}
   295  and similarly,
   296  \begin{equation}
   297  \sum_i\sum_j  \left( B_{ij} + B_{ji} \right) \delta_{ij}(c) = 2\sum_i\sum_j B_{ij} \delta_{ij}(c).
   298  \end{equation}
   299  From these two expressions, we can see that 
   300  \begin{equation}
   301  Q^{(3)} - Q^{(2)} = \frac{1}{2m}\sum_i\sum_j \gamma \frac{\dkin{i}\dkin{j} + \dkout{i}\dkout{j}}{2m} \delta_{ij}(c).
   302  \end{equation}
   303  
   304  
   305  \section{Directed Graphs in more detail}
   306  \label{sec:directedGraphsDetail}
   307  
   308  In Section \ref{sec:directedGraphs} we essentially showed three 
   309  things:
   310  \begin{itemize}
   311  	\item How an undirected graph could be constructed from a directed
   312  	graph, thereby allowing the undirected algorithm to be used for 
   313  	directed graphs.
   314  	\item How scaling all edge weights by a non-zero constant would not 
   315  	affect the modularity function.
   316  	\item An alternative approach to extending the algorithm to 
   317  	directed graphs that is not equivalent to first reducing it 
   318  	to an undirected graph.
   319  \end{itemize}
   320  It is this third point that we will explore here.
   321  Analogously to Sections \ref{sec:initialPass} and \ref{sec:laterPasses} we will 
   322  break this up into the initial pass and the later passes.
   323  
   324  \subsection{Initial pass}
   325  \label{sec:initialPassDirected}
   326  
   327  Continuing with the notation of Section \ref{sec:initialPass}, in which 
   328  $c(i)$ denotes the community to which node $i$ belongs, 
   329  and $\alpha = c(a)$, we define
   330  \newcommand{\dinStot}[1]{\Sigma_{\text{tot}}^{\text{in}(#1)}}
   331  \newcommand{\doutStot}[1]{\Sigma_{\text{tot}}^{\text{out}(#1)}}
   332  \begin{equation}
   333  	\doutStot{\alpha} = \sum_{i \in \alpha}\sum_{j}B_{ij} = \sum_{i \in \alpha}\dkout{i}
   334  	\quad \quad \text{and} \quad \quad
   335  	\dinStot{\alpha} = \sum_{i \in \alpha}\sum_{j}B_{ji} = \sum_{i \in \alpha}\dkin{i},
   336  \end{equation}
   337  \newcommand{\dinkin}[2]{k_{#1}^{\text{in}(#2)}}
   338  \newcommand{\doutkin}[2]{k_{#1}^{\text{out}(#2)}}
   339  \begin{equation}
   340  	\doutkin{i}{\alpha} = \sum_{j \in \alpha}B_{ij}
   341  	\quad \quad \text{and} \quad \quad
   342  	\dinkin{i}{\alpha} = \sum_{j \in \alpha}B_{ji},
   343  \end{equation}
   344  and we will entertain one more ambiguous notation choice:
   345  %\newcommand{\Sin}[1]{\Sigma_{\text{in}}^{#1}}
   346  \begin{equation}
   347  	\Sin{\alpha} = \sum_{i \in \alpha}\sum_{j \in \alpha}B_{ij} = \sum_{i \in \alpha}\doutkin{i}{\alpha} = \sum_{i \in \alpha}\dinkin{i}{\alpha}.
   348  \end{equation}
   349  
   350  Analogously to Section \ref{sec:initialPass}, we are interested in how 
   351  $Q^{(3)}$ will change if we move a node $a$ from its 
   352  current community $\alpha$, to a new community $\beta$, 
   353  and analogously this will have two effects -- it will remove the terms 
   354  from $Q^{(3)}$ related to $a$ in $\alpha$, which we will call $Q^{-(3)}$ 
   355  and it will add terms related to $a$ in $\beta$, which we will call $Q^{+(3)}$. 
   356  The total change in $Q^{(3)}$ caused by the movement of $a$ from $\alpha$ to $\beta$ is 
   357  \begin{equation}
   358  	\Delta Q^{(3)} = Q^{+(3)} - Q^{-(3)},
   359  \end{equation}
   360  where
   361  \begin{align*}
   362  Q^{-(3)} &= \frac{1}{2m}\left[ \left( 2B_{aa} - 2\gamma \frac{\dkin{a}\dkout{a}}{2m} \right) 
   363  + \sum_{i \in \alpha, \, i \neq a} \left( 2B_{ia} + 2B_{ai} - 2\gamma \frac{\dkin{i}\dkout{a}}{2m} - 2\gamma \frac{\dkin{a}\dkout{i}}{2m} \right) \right] \\
   364  				 &= \frac{1}{2m}\left[ \left( 2B_{aa} - 2\gamma \frac{\dkin{a}\dkout{a}}{2m} \right) 
   365  + 2(\dinkin{a}{\alpha} - B_{aa}) + 2(\doutkin{a}{\alpha} - B_{aa}) \hdots \right . \\
   366   & \quad \quad \quad \quad \quad \quad \left .
   367  - \frac{2\gamma\dkout{a}}{2m} (\dinStot{\alpha} - \dkin{a}) - \frac{2\gamma\dkin{a}}{2m} (\doutStot{\alpha} - \dkout{a}) \right] \\
   368  \end{align*}
   369  and
   370  \begin{align*}
   371  Q^{+(3)} &= \frac{1}{2m}\left[ \left( 2B_{aa} - 2\gamma \frac{\dkin{a}\dkout{a}}{2m} \right) 
   372  + \sum_{i \in \beta} \left( 2B_{ia} + 2B_{ai} - 2\gamma \frac{\dkin{i}\dkout{a}}{2m} - 2\gamma \frac{\dkin{a}\dkout{i}}{2m} \right) \right] \\
   373  				 &= \frac{1}{2m}\left[ \left( 2B_{aa} - 2\gamma \frac{\dkin{a}\dkout{a}}{2m} \right) 
   374  + 2\dinkin{a}{\beta} + 2\doutkin{a}{\beta} - \frac{2\gamma\dkout{a}}{2m} \dinStot{\beta}  - \frac{2\gamma\dkin{a}}{2m} \doutStot{\beta} \right] \\
   375  \end{align*}
   376  Similarly to Section \ref{sec:initialPass}, the first term in both these expressions is the same, and so cancels, leaving:
   377  \begin{align*}
   378  \Delta Q^{(3)} &= \frac{2}{2m}\left[ 
   379  \left( \dinkin{a}{\beta} + \doutkin{a}{\beta} - \frac{\gamma\dkout{a}}{2m} \dinStot{\beta}  - \frac{\gamma\dkin{a}}{2m} \doutStot{\beta} \right) \right. \\
   380  & \hspace{-1cm}
   381  - \left. \left( (\dinkin{a}{\alpha} - B_{aa}) + (\doutkin{a}{\alpha} - B_{aa}) - \frac{\gamma\dkout{a}}{2m} (\dinStot{\alpha} - \dkin{a}) - \frac{\gamma\dkin{a}}{2m} (\doutStot{\alpha} - \dkout{a})  \right) \right] \\
   382   &= \frac{2}{2m}\left[ (\dinkin{a}{\beta}-\dinkin{a}{\alpha}) + (\doutkin{a}{\beta}-\doutkin{a}{\alpha}) + 2B_{aa} \right. \\
   383  & \hspace{-1cm} \left.
   384  - \frac{\gamma\dkout{a}}{2m} (\dinStot{\beta}-\dinStot{\alpha}) - \frac{\gamma\dkin{a}}{2m} (\doutStot{\beta} - \doutStot{\alpha}) - \frac{2\gamma\dkin{a}\dkout{a}}{2m} \right]
   385  \end{align*}
   386  
   387  
   388  
   389  \subsection{Later passes}
   390  \label{sec:laterPassesDirected}
   391  
   392  In phase two a `meta-graph' is constructed where nodes correspond to 
   393  the communities found in the preceding phase one step, and edge weight
   394  between two such communities (nodes, in the meta-graph)
   395  $\alpha$ and $\beta$ are defined to be
   396  \begin{equation}
   397  	B_{\alpha \beta}^* = \sum_{i \in \alpha}\sum_{j \in \beta}B_{ij}.
   398  	\label{eqn:Bij*}
   399  \end{equation} 
   400  Note that $i$ and $j$ refer to nodes in the original graph, not nodes 
   401  in the previous graph, and so holds any meta-graph, not just the first.
   402  Also note that this definition of $B^*_{\alpha \beta}$ allows for 
   403  $B^*_{\alpha \alpha}$ to be non-zero, in fact
   404  \begin{equation}
   405  B_{\alpha \alpha}^* = \sum_{i \in \alpha}\sum_{j \in \alpha}B_{ij} = \Sin{\alpha}.
   406  \end{equation} 
   407  
   408  In this newly constructed graph, $\alpha$ and $\beta$ are nodes, but 
   409  also refer to communities (sets of nodes) in the original graph, and I 
   410  use these two interpretations interchangeably, completely analogously to 
   411  Section \ref{sec:laterPasses}.
   412  
   413  The results of Section~\ref{sec:initialPassDirected} generalise to these meta-graphs,
   414  and the generalised results mirror those of Section~\ref{sec:initialPassDirected} closely
   415  -- I distinguish the new results from those of Section~\ref{sec:initialPassDirected} by a 
   416  superscript $*$.
   417  I use $i$ and $j$ to denote nodes of the original graph as in Sections~\ref{sec:initialPass}
   418  and \ref{sec:initialPassDirected}, 
   419  and use $z$ and $w$ to denote nodes of the meta-graph (communities of the original).
   420  I use analogous notation to Section~\ref{sec:initialPass}, $c^*(z)$, to 
   421  denote the community to which node $z$ of the meta-graph belongs, 
   422  and let $\mathfrak{a}$ be the community that the node $\alpha$ belongs to, 
   423  i.e., $\mathfrak{a} = c^*(\alpha) $.
   424  
   425  Given this notation, we get all the same results as in \ref{sec:laterPasses}, but 
   426  each split into two cases `out' and `in', separating by direction, essentially, so
   427  \newcommand{\dkinStar}[1]{k_{#1}^{\text{in} *}}
   428  \newcommand{\dkoutStar}[1]{k_{#1}^{\text{out} *}}
   429  \begin{equation}
   430  \dkoutStar{z} = \sum_w{B_{zw}^*} = \sum_w\sum_{i \in z}\sum_{j \in w}B_{ij} = \sum_{i \in z}\sum_jB_{ij} = \doutStot{z},
   431  \end{equation}
   432  \begin{equation}
   433  \dkinStar{z}  = \sum_w{B_{wz}^*} = \sum_w\sum_{i \in z}\sum_{j \in w}B_{ji} = \sum_{i \in z}\sum_jB_{ji} = \dinStot{z},
   434  \end{equation}
   435  \newcommand{\dinStotStar}[1]{\Sigma_{\text{tot}}^{\text{in}(#1) *}}
   436  \newcommand{\doutStotStar}[1]{\Sigma_{\text{tot}}^{\text{out}(#1) *}}
   437  \begin{equation}
   438  	\doutStotStar{\mathfrak{a}} = \sum_{z \in \mathfrak{a}}\sum_{w}B_{zw}^* = \sum_{z \in \mathfrak{a}}\dkoutStar{z} = \sum_{z \in \mathfrak{a}}\doutStot{z},
   439  \end{equation}
   440  \begin{equation}
   441  	\dinStotStar{\mathfrak{a}}  = \sum_{z \in \mathfrak{a}}\sum_{w}B_{wz}^* = \sum_{z \in \mathfrak{a}}\dkinStar{z}  = \sum_{z \in \mathfrak{a}}\dinStot{z},
   442  \end{equation}
   443  \newcommand{\dinkinStar}[2]{k_{#1}^{\text{in}(#2) *}}
   444  \newcommand{\doutkinStar}[2]{k_{#1}^{\text{out}(#2) *}}
   445  \begin{equation}
   446  	\doutkinStar{z}{\mathfrak{a}} = \sum_{w \in \mathfrak{a}}{B_{zw}^*} = \sum_{w \in \mathfrak{a}}{\sum_{i \in z}\sum_{j \in w}B_{ij}},
   447  \end{equation}
   448  \begin{equation}
   449  	\dinkinStar{z}{\mathfrak{a}}  = \sum_{w \in \mathfrak{a}}{B_{wz}^*} = \sum_{w \in \mathfrak{a}}{\sum_{i \in z}\sum_{j \in w}B_{ji}},
   450  \end{equation}
   451  and
   452  \begin{equation}
   453  \Sin{\mathfrak{a} *} = \sum_{z \in \mathfrak{a}}\sum_{w \in \mathfrak{a}}A_{zw}^* = \sum_{z \in \mathfrak{a}}\kin{z}{\mathfrak{a} *} = \sum_{z \in \mathfrak{a}}\sum_{w \in \mathfrak{a}}{\sum_{i \in z}\sum_{j \in w}A_{ij}}.
   454  	%\label{eqn:Sin}
   455  \end{equation}
   456  
   457  If we let $\mathfrak{b}$ denote the community to which we are considering moving $\alpha$,
   458  then the expression for $\Delta Q$ from Section~\ref{sec:initialPassDirected} simply generalises as
   459  \begin{align*}
   460  \Delta Q^{(3)} &= \frac{2}{2m}\left[ (\dinkinStar{\alpha}{\mathfrak{b}}-\dinkinStar{\alpha}{\mathfrak{a}}) + (\doutkinStar{\alpha}{\mathfrak{b}}-\doutkinStar{\alpha}{\mathfrak{a}}) + 2B_{\alpha\alpha}^* \right. \\
   461  & \hspace{-1cm} \left.
   462  - \frac{\gamma\dkoutStar{\alpha}}{2m} (\dinStotStar{\mathfrak{b}}-\dinStotStar{\mathfrak{a}}) - \frac{\gamma\dkinStar{\alpha}}{2m} (\doutStotStar{\mathfrak{b}} - \doutStotStar{\mathfrak{a}}) - \frac{2\gamma\dkinStar{\alpha}\dkoutStar{\alpha}}{2m} \right]
   463  \end{align*}
   464  
   465  
   466  \end{document}