git.meshlink.io Git - meshlink/commitdiff
Merge branch 'partition_healing' into everbase
author Guus Sliepen <guus@sliepen.org>
Tue, 29 Jul 2014 15:02:47 +0000 (17:02 +0200)
committer Guus Sliepen <guus@sliepen.org>
Tue, 29 Jul 2014 15:02:47 +0000 (17:02 +0200)
src/net.c

index 5f50531b9ff4fada055e90b255ecf9b9f03ea351..d8f7d642e4ac0307d1ef6f84c9156cf70d46f75d 100644 (file)
--- a/src/net.c
+++ b/src/net.c
@@ -119,6 +119,74 @@ static void timeout_handler(event_loop_t *loop, void *data) {
        timeout_set(&mesh->loop, data, &(struct timeval){mesh->pingtimeout, rand() % 100000});
 }
 
+/// Utility function to establish at most one outgoing connection based on a condition check
+/** The function iterates over all nodes, skipping those that do not pass the
+ *  condition check, and stops at the first node that passes it. For that node an
+ *  outgoing connection is set up, unless mesh->outgoings already has an entry with its name.
+ *  The condition check function is passed, in this order,
+ *  a pointer to the running node index i (starts at 0), a pointer to the random
+ *  number r (rand() % rand_modulo), and the node pointer n. This function should return true
+ *  if a connection attempt to the node should be made.
+ *
+ *  @param mesh        A pointer to the mesh structure
+ *  @param rand_modulo Divisor for the random index r = rand() % rand_modulo; must not be 0
+ *  @param cond_check  A function pointer. This function should return true
+ *                     if a connection attempt to the node should be made
+ */
+static void cond_add_connection(meshlink_handle_t *mesh, int rand_modulo, bool (*cond_check)(int*, int*, node_t*)) {
+       int r = rand() % rand_modulo;
+       int i = 0;
+
+       for splay_each(node_t, n, mesh->nodes) {
+               /* skip nodes that do not pass the condition check (it receives &i and &r and may modify them) */
+               if(!(*cond_check)(&i, &r, n))
+                       continue;
+
+               /* check if mesh->outgoings already holds an entry with this node's name */
+               bool found = false;
+               for list_each(outgoing_t, outgoing, mesh->outgoings) {
+                       if(!strcmp(outgoing->name, n->name)) {
+                               found = true;
+                               break;
+                       }
+               }
+
+               if(!found) {
+                       //TODO: if the node is blacklisted the connection will not happen, but
+                       //the user will read this debug message "Autoconnecting to %s" that is misleading
+                       logger(DEBUG_CONNECTIONS, LOG_INFO, "Autoconnecting to %s", n->name);
+                       outgoing_t *outgoing = xzalloc(sizeof *outgoing);
+                       outgoing->name = xstrdup(n->name);
+                       list_insert_tail(mesh->outgoings, outgoing);
+                       setup_outgoing_connection(mesh, outgoing);
+               }
+               break; /* only the first node that passes the check is handled per call */
+       }
+}
+
+static bool found_random_node(int *i, int *r, node_t *n) { /* condition check for cond_add_connection(): accept the node at index *r */
+       if((*i)++ != *r) /* post-increment: *i advances on every call, whether or not it matched */
+               return false;
+
+       if(n->connection) /* the selected node already has a connection: reject it */
+               return false;
+       
+       return true;
+}
+
+static bool found_random_unreachable_node(int *i, int *r, node_t *n) { /* condition check for cond_add_connection(): accept the unreachable node at index *r */
+       if(n->status.reachable) /* reachable nodes are rejected before *i is touched */
+               return false;
+       
+       if((*i)++ != *r) /* so *i counts unreachable nodes only; it advances whether or not it matched */
+               return false;
+
+       if(n->connection) /* the selected node already has a connection: reject it */
+               return false;
+
+       return true;
+}
+
 static void periodic_handler(event_loop_t *loop, void *data) {
        meshlink_handle_t *mesh = loop->data;
 
@@ -152,43 +220,29 @@ static void periodic_handler(event_loop_t *loop, void *data) {
                                nc++;
                }
 
+               /* Count number of unreachable nodes */
+               int num_unreachable = 0;
+               for splay_each(node_t, n, mesh->nodes) {
+                       if(!n->status.reachable)
+                               num_unreachable++;
+               }
+
                if(nc < autoconnect) {
                        /* Not enough active connections, try to add one.
                           Choose a random node, if we don't have a connection to it,
                           and we are not already trying to make one, create an
                           outgoing connection to this node.
                        */
-                       int r = rand() % mesh->nodes->count;
-                       int i = 0;
-
-                       for splay_each(node_t, n, mesh->nodes) {
-                               if(i++ != r)
-                                       continue;
-
-                               if(n->connection)
-                                       break;
-
-                               bool found = false;
-
-                               for list_each(outgoing_t, outgoing, mesh->outgoings) {
-                                       if(!strcmp(outgoing->name, n->name)) {
-                                               found = true;
-                                               break;
-                                       }
-                               }
-
-                               if(!found) {
-                                       //TODO: if the node is blacklisted the connection will not happen, but
-                                       //the user will read this debug message "Autoconnecting to %s" that is misleading
-                                       logger(DEBUG_CONNECTIONS, LOG_INFO, "Autoconnecting to %s", n->name);
-                                       outgoing_t *outgoing = xzalloc(sizeof *outgoing);
-                                       outgoing->name = xstrdup(n->name);
-                                       list_insert_tail(mesh->outgoings, outgoing);
-                                       setup_outgoing_connection(mesh, outgoing);
-                               }
-                               break;
-                       }
-               } else if(nc > autoconnect) {
+                       cond_add_connection(mesh, mesh->nodes->count, &found_random_node);
+               } else if(num_unreachable > 0) {
+                       /* Min number of connections established. Now try
+                          to connect to some unreachable nodes to attempt
+                          to heal possible partitions.
+                       */
+                       cond_add_connection(mesh, num_unreachable, &found_random_unreachable_node);
+               }
+               
+               if(nc > autoconnect) {
                        /* Too many active connections, try to remove one.
                           Choose a random outgoing connection to a node
                           that has at least one other connection.
@@ -217,8 +271,16 @@ static void periodic_handler(event_loop_t *loop, void *data) {
                if(nc >= autoconnect) {
                        /* If we have enough active connections,
                           remove any pending outgoing connections.
+                          Do not remove pending connections to unreachable
+                          nodes.
                        */
+                       node_t *o_node = NULL;
                        for list_each(outgoing_t, o, mesh->outgoings) {
+                               o_node = lookup_node(mesh, o->name);
+                               /* o_node is NULL if it is not part of the graph yet */
+                               if(!o_node || !o_node->status.reachable)
+                                       continue;
+
                                bool found = false;
                                for list_each(connection_t, c, mesh->connections) {
                                        if(c->outgoing == o) {
@@ -228,6 +290,10 @@ static void periodic_handler(event_loop_t *loop, void *data) {
                                }
                                if(!found) {
                                        logger(DEBUG_CONNECTIONS, LOG_INFO, "Cancelled outgoing connection to %s", o->name);
+                                       /* The node variable is leaked in from using the list_each macro.
+                                          The o variable could be used, but using node directly
+                                          is more efficient.
+                                       */
                                        list_delete_node(mesh->outgoings, node);
                                }
                        }