diff options
author | KatolaZ <katolaz@freaknet.org> | 2017-09-27 15:06:31 +0100 |
---|---|---|
committer | KatolaZ <katolaz@freaknet.org> | 2017-09-27 15:06:31 +0100 |
commit | 3aee2fd43e3059a699af2b63c6f2395e5a55e515 (patch) | |
tree | 58c95505a0906ed9cfa694f9dbd319403fd8f01d /src/betweenness/betweenness.c |
First commit on github -- NetBunch 1.0
Diffstat (limited to 'src/betweenness/betweenness.c')
-rw-r--r-- | src/betweenness/betweenness.c | 316 |
1 files changed, 316 insertions, 0 deletions
diff --git a/src/betweenness/betweenness.c b/src/betweenness/betweenness.c new file mode 100644 index 0000000..5e37747 --- /dev/null +++ b/src/betweenness/betweenness.c @@ -0,0 +1,316 @@ +/** + * This program is free software: you can redistribute it and/or + * modify it under the terms of the GNU General Public License as + * published by the Free Software Foundation, either version 3 of the + * License, or (at your option) any later version. + * + * This program is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * General Public License for more details. + * + * You should have received a copy of the GNU General Public License + * along with this program. If not, see + * <http://www.gnu.org/licenses/>. + * + * (c) Vincenzo Nicosia 2009-2017 -- <v.nicosia@qmul.ac.uk> + * + * This file is part of NetBunch, a package for complex network + * analysis and modelling. For more information please visit: + * + * http://www.complex-networks.net/ + * + * If you use this software, please add a reference to + * + * V. Latora, V. Nicosia, G. Russo + * "Complex Networks: Principles, Methods and Applications" + * Cambridge University Press (2017) + * ISBN: 9781107103184 + * + *********************************************************************** + * + * This program computes the betweenness of all the nodes of a graph, + * using Brandes' algorithm, and counting all the shortest paths + * originating from a set of nodes (potentially the whole set of + * vertices). + * + * References: + * U. Brandes. "A Faster Algorithm for Betweenness + * Centrality". J. Math. Sociol. 25 (2001), 163-177. + * + */ + + +#include <stdio.h> +#include <stdlib.h> +#include <string.h> + +#include <time.h> + +#include "utils.h" + + +void usage(char *argv[]){ + printf("********************************************************************\n" + "** **\n" + "** -*- betweenness -*- **\n" + "** **\n" + "** Compute the betweenness of all the nodes and edges of a **\n" + "** network due to the shortest paths originating from a set **\n" + "** of initial nodes. The set can be either a sequence of **\n" + "** nodes (if the second argument is 'SEQ') or a random sample **\n" + "** from the set of all the nodes (if it is 'RND'). **\n" + "** **\n" + "** The input file is an edge-list (use '-' to read from STDIN). **\n" + "** **\n" + "** With 'SEQ': **\n" + "** If <node_start> is not specified, computes the betweenness **\n" + "** using shortest paths from *all* the nodes (WARNING: This can **\n" + "** be slow for large graphs!). If <node_end> is not specified, **\n" + "** use shortest paths from all the nodes between <node_start> **\n" + "** and the node with the largest label. **\n" + "** **\n" + "** With 'RND': **\n" + "** Compute the betweenness based on the shortest paths from **\n" + "** <num> nodes sampled uniformly at random. **\n" + "** **\n" + "** When called with just <graph_in>, use all the nodes. **\n" + "** **\n" + "** The betweenness of all the nodes is printed on standard **\n" + "** output (STDOUT), while the edge betweenness is printed on **\n" + "** standard error (STDERR) **\n" + "** **\n" + "********************************************************************\n" + "\n\n" + " This is Free Software - You can use and distribute it under \n" + " the terms of the GNU General Public License, version 3 or later\n\n" + " (c) Vincenzo Nicosia 2009-2017 (v.nicosia@qmul.ac.uk)\n\n"); + printf("Usage: %s <graph_in> [SEQ <node_start> [<node_end>]]\n" , argv[0]); + printf("Usage: %s <graph_in> [RND <num>]\n" , argv[0]); + +} + +/* + * Add a node the a list of predecessors + */ + +void add_predecessor(unsigned int **pred, unsigned int k){ + + (*pred)[0] += 1; + *pred = realloc(*pred, ((*pred)[0] + 1) * sizeof(unsigned int)); + (*pred)[ (*pred)[0] ] = k; +} + + + +/* + * + * Compute node and edge betweenness, based on shortest paths + * originating on the "num" nodes specified in "nlist". "edge_bet" + * should be an appropriately allocated (and initialised to zero!!!!) + * vector of length equal to J_slap, and will contain the values of + * edge betweenness. + * + */ +double* compute_bet_dependency(unsigned int N, unsigned int *J_slap, unsigned int *r_slap, + unsigned int *nlist, unsigned int num, double *edge_bet){ + + int i, j, k, w, idx, cur_node, m; + unsigned int *marked, **preds, *dist, *nj; + double *delta, *cB, val; + unsigned int d; + unsigned int n, nd, ndp; + unsigned int edge_pos; + + dist = malloc(N * sizeof(unsigned int)); + marked = malloc(N * sizeof(unsigned int)); + preds = malloc(N * sizeof(unsigned int *)); + + nj = malloc(N * sizeof(unsigned int)); + delta = malloc(N * sizeof(double)); + cB = malloc(N * sizeof(double)); + + for (i=0; i<N; i++){ + cB[i] = 0; + preds[i] = NULL; + } + + for (m=0; m<num; m++){ + /* We start from the m-th node in nlist*/ + j = nlist[m]; + + for(i=0; i<N; i ++){ + dist[i] = N; + if (! preds[i]){ + preds[i] = malloc(sizeof(unsigned int)); + } + preds[i][0] = 0; /* The list of predecessors is now empty! */ + + nj[i] = 0; + delta[i]= 0; + } + dist[j] = 0; + nj[j] = 1; + marked[0] = j; + d = 0; + n = 0; + nd = 1; + ndp = 0; + while (d<N && nd > 0){ + for(i = n; i< n+nd; i ++){ + cur_node = marked[i]; + for (k=r_slap[cur_node]; k<r_slap[cur_node +1] ; k++){ + w = J_slap[k]; + if ( dist[w] == d+1){ + add_predecessor((unsigned int **)(preds + w), cur_node); + nj[w] += nj[cur_node]; + } + if ( dist[w] == N){ + dist[w] = d+1; + marked[n + nd + ndp] = w; + add_predecessor(preds + w, cur_node); + ndp +=1; + nj[w] += nj[cur_node]; + } + } + } + n = n + nd; + nd = ndp; + ndp = 0; + d += 1; + } + for (k= n-1; k>=1; k--){ + w = marked[k]; + for (idx=1; idx <= preds[w][0]; idx ++ ){ + i = preds[w][idx]; + val = 1.0 * nj[i] / nj[w] * (1 + delta[w]); + delta[i] += val; + /* Now we should update the betweenness of the edge (i,w) in + the appropriate position of the vector edge_bet*/ + find_neigh_in_Jslap(J_slap, r_slap, N, i, w, &edge_pos); + edge_bet[edge_pos] += val; + find_neigh_in_Jslap(J_slap, r_slap, N, w, i, &edge_pos); + edge_bet[edge_pos] += val; + } + cB[w] += delta[w]; + } + } + free(dist); + free(marked); + for (i=0; i<N; i++){ + free(preds[i]); + } + free(preds); + free(nj); + free(delta); + return cB; +} + + + +/* + * print of STDOUT the betweenness of each node + */ +void dump_cB(double *cB, unsigned int N){ + + unsigned int i; + for (i=0; i<N; i++){ + printf("%g\n", cB[i]); + } +} + +/* + * print on STDERR the betweenness of each edge + */ + +void dump_edge_bet(unsigned int *J_slap, unsigned int *r_slap, unsigned int N, + double *v, FILE *fout){ + + unsigned int i, j; + + for(i=0; i<N; i++){ + for (j=r_slap[i]; j<r_slap[i+1]; j++) + fprintf(fout, "%d %d %g\n", i, J_slap[j], v[j]); + } +} + + + +int main(int argc, char *argv[]){ + + unsigned int *J_slap=NULL, *r_slap=NULL; + unsigned int K, N, i; + unsigned int n_start, n_end; + unsigned int *nlist=NULL; + unsigned int num; + double *edge_bet = NULL; + double *cB; + FILE *filein; + + + if(argc < 2){ + usage(argv); + exit(1); + } + + srand(time(NULL)); + + if (!strcmp(argv[1], "-")){ + /* take the input from STDIN */ + filein = stdin; + } + else { + filein = openfile_or_exit(argv[1], "r", 2); + } + + read_slap(filein, &K, &N, &J_slap, &r_slap); + + nlist = malloc(N * sizeof(unsigned int)); + + for(i=0; i<N; i++){ + nlist[i] = i; + } + + n_start = 0; + n_end = N-1; + num = N; + + + if (argc > 3){ + if(!my_strcasecmp(argv[2], "SEQ")){ + n_start = atoi(argv[3]); + if (n_start > N-1) + n_start = 0; + if (argc > 4){ + n_end = atoi(argv[4]); + } + else{ + n_end = N-1; + } + num = n_end - n_start + 1; + } + else if (!my_strcasecmp(argv[2], "RND")){ + num = atoi(argv[3]); + n_start = 0; + n_end = num-1; + if (num > N || num < 1) + num = N; + shuffle_vector(nlist, N); + } + } + + sort_neighbours(J_slap, r_slap, N); + edge_bet = malloc(K * sizeof(double)); + memset(edge_bet, 0, K * sizeof(double)); + cB = compute_bet_dependency(N, J_slap, r_slap, nlist+n_start, num, edge_bet); + + dump_cB(cB, N); + dump_edge_bet(J_slap, r_slap, N, edge_bet, stderr); + + free(cB); + free(J_slap); + free(r_slap); + free(edge_bet); + free(nlist); + +} |