Commit 9385706f authored by Julien Muchembled

Fix identification issues, including a race condition causing id conflicts

The added test describes how the new id timestamps fix the race condition.
These timestamps could be any unique opaque values, and the protocol is
extended to exchange them along with node ids.

Internally, nodes also reuse timestamps as a marker to identify the first
NotifyNodeInformation packet from the master: since this packet is a complete
list of the nodes in the cluster, any other node still known to the node
manager has definitely left the cluster and is removed.

The secondary masters didn't receive updates about master nodes.
It is also useless to send them information about non-master nodes.
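
For illustration, here is a minimal, self-contained sketch of the check this commit introduces, using simplified stand-ins for the real Node and NodeManager classes (the lookup logic is condensed from the diff below; everything else is hypothetical):

from time import time

class Node(object):
    id_timestamp = None   # opaque marker assigned at identification

class NodeManager(object):
    def __init__(self):
        self._uuid_dict = {}

    def getByUUID(self, uuid, *id_timestamp):
        # Same trick as in the diff: with the optional extra argument,
        # the node is only returned if its id_timestamp matches.
        node = self._uuid_dict.get(uuid)
        if not id_timestamp or node and (node.id_timestamp,) == id_timestamp:
            return node

nm = NodeManager()
node = nm._uuid_dict[1] = Node()
node.id_timestamp = t1 = time()   # the master stamps the node when identified
# The connection breaks and the master reassigns id=1 with a fresh stamp:
node.id_timestamp = t2 = t1 + 1
assert nm.getByUUID(1, t1) is None   # late request with the old stamp: rejected
assert nm.getByUUID(1, t2) is node   # current holder of the id: accepted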
parent d048a52d
......@@ -105,13 +105,9 @@ class Application(BaseApplication):
"""
self.cluster_state = None
# search, find, connect and identify to the primary master
bootstrap = BootstrapManager(self, self.name, NodeTypes.ADMIN,
self.uuid, self.server)
data = bootstrap.getPrimaryConnection()
(node, conn, uuid, num_partitions, num_replicas) = data
self.master_node = node
self.master_conn = conn
self.uuid = uuid
bootstrap = BootstrapManager(self, NodeTypes.ADMIN, self.server)
self.master_node, self.master_conn, num_partitions, num_replicas = \
bootstrap.getPrimaryConnection()
if self.pt is None:
self.pt = PartitionTable(num_partitions, num_replicas)
......
......@@ -120,8 +120,6 @@ class MasterEventHandler(EventHandler):
def notifyClusterInformation(self, conn, cluster_state):
self.app.cluster_state = cluster_state
def notifyNodeInformation(self, conn, node_list):
self.app.nm.update(node_list)
class MasterRequestEventHandler(EventHandler):
""" This class handle all answer from primary master node"""
......
......@@ -240,10 +240,10 @@ class Application(ThreadedApplication):
self.notifications_handler,
node=self.trying_master_node,
dispatcher=self.dispatcher)
p = Packets.RequestIdentification(
NodeTypes.CLIENT, self.uuid, None, self.name, None)
try:
ask(conn, Packets.RequestIdentification(
NodeTypes.CLIENT, self.uuid, None, self.name),
handler=handler)
ask(conn, p, handler=handler)
except ConnectionClosed:
continue
# If we reached the primary master node, mark as connected
......
......@@ -87,6 +87,7 @@ class PrimaryNotificationsHandler(MTEventHandler):
raise ProtocolError('No UUID supplied')
app.uuid = your_uuid
logging.info('Got an UUID: %s', dump(app.uuid))
app.id_timestamp = None
# Always create partition table
app.pt = PartitionTable(num_partitions, num_replicas)
......@@ -179,13 +180,14 @@ class PrimaryNotificationsHandler(MTEventHandler):
self.app.pt.update(ptid, cell_list, self.app.nm)
def notifyNodeInformation(self, conn, node_list):
nm = self.app.nm
nm.update(node_list)
super(PrimaryNotificationsHandler, self).notifyNodeInformation(
conn, node_list)
# XXX: 'update' automatically closes DOWN nodes. Do we really want
# to do the same thing for nodes in other non-running states ?
for node_type, addr, uuid, state in node_list:
if state != NodeStates.RUNNING:
node = nm.getByUUID(uuid)
getByUUID = self.app.nm.getByUUID
for node in node_list:
if node[3] != NodeStates.RUNNING:
node = getByUUID(node[2])
if node and node.isConnected():
node.getConnection().close()
......
......@@ -57,7 +57,7 @@ class ConnectionPool(object):
conn = MTClientConnection(app, app.storage_event_handler, node,
dispatcher=app.dispatcher)
p = Packets.RequestIdentification(NodeTypes.CLIENT,
app.uuid, None, app.name)
app.uuid, None, app.name, app.id_timestamp)
try:
app._ask(conn, p, handler=app.storage_bootstrap_handler)
except ConnectionClosed:
......
......@@ -26,7 +26,7 @@ class BootstrapManager(EventHandler):
"""
accepted = False
def __init__(self, app, name, node_type, uuid=None, server=None):
def __init__(self, app, node_type, server=None):
"""
Manage the bootstrap stage of a non-master node: it looks up the
primary master node, connects to it, then returns when the master node
......@@ -35,12 +35,12 @@ class BootstrapManager(EventHandler):
self.primary = None
self.server = server
self.node_type = node_type
self.uuid = uuid
self.name = name
self.num_replicas = None
self.num_partitions = None
self.current = None
uuid = property(lambda self: self.app.uuid)
def announcePrimary(self, conn):
# We found the primary master early enough to be notified of election
# end. Lucky. Anyway, we must carry on with identification request, so
......@@ -55,7 +55,7 @@ class BootstrapManager(EventHandler):
EventHandler.connectionCompleted(self, conn)
self.current.setRunning()
conn.ask(Packets.RequestIdentification(self.node_type, self.uuid,
self.server, self.name))
self.server, self.app.name, None))
def connectionFailed(self, conn):
"""
......@@ -106,8 +106,9 @@ class BootstrapManager(EventHandler):
self.num_replicas = num_replicas
if self.uuid != your_uuid:
# got an uuid from the primary master
self.uuid = your_uuid
self.app.uuid = your_uuid
logging.info('Got a new UUID: %s', uuid_str(self.uuid))
self.app.id_timestamp = None
self.accepted = True
def getPrimaryConnection(self):
......@@ -141,8 +142,4 @@ class BootstrapManager(EventHandler):
continue
# still processing
poll(1)
return (self.current, conn, self.uuid, self.num_partitions,
self.num_replicas)
return self.current, conn, self.num_partitions, self.num_replicas
......@@ -165,6 +165,10 @@ class EventHandler(object):
return
conn.close()
def notifyNodeInformation(self, conn, node_list):
app = self.app
app.nm.update(app, node_list)
def ping(self, conn):
conn.answer(Packets.Pong())
......
......@@ -27,6 +27,7 @@ class Node(object):
_connection = None
_identified = False
id_timestamp = None
def __init__(self, manager, address=None, uuid=None,
state=NodeStates.UNKNOWN):
......@@ -172,7 +173,8 @@ class Node(object):
def asTuple(self):
""" Returned tuple is intended to be used in protocol encoders """
return (self.getType(), self._address, self._uuid, self._state)
return (self.getType(), self._address, self._uuid, self._state,
self.id_timestamp)
def __gt__(self, node):
# sort per UUID if defined
......@@ -348,9 +350,11 @@ class NodeManager(object):
""" Return the node that match with a given address """
return self._address_dict.get(address, None)
def getByUUID(self, uuid):
def getByUUID(self, uuid, *id_timestamp):
""" Return the node that match with a given UUID """
return self._uuid_dict.get(uuid, None)
node = self._uuid_dict.get(uuid)
if not id_timestamp or node and (node.id_timestamp,) == id_timestamp:
return node
def _createNode(self, klass, address=None, uuid=None, **kw):
by_address = self.getByAddress(address)
......@@ -386,8 +390,9 @@ class NodeManager(object):
def createFromNodeType(self, node_type, **kw):
return self._createNode(NODE_TYPE_MAPPING[node_type], **kw)
def update(self, node_list):
for node_type, addr, uuid, state in node_list:
def update(self, app, node_list):
node_set = self._node_set.copy() if app.id_timestamp is None else None
for node_type, addr, uuid, state, id_timestamp in node_list:
# This should be done here (although klass might not be used in this
# iteration), as it raises if type is not valid.
klass = NODE_TYPE_MAPPING[node_type]
......@@ -397,11 +402,11 @@ class NodeManager(object):
node_by_addr = self.getByAddress(addr)
node = node_by_uuid or node_by_addr
log_args = node_type, uuid_str(uuid), addr, state
log_args = node_type, uuid_str(uuid), addr, state, id_timestamp
if node is None:
if state == NodeStates.DOWN:
logging.debug('NOT creating node %s %s %s %s', *log_args)
else:
logging.debug('NOT creating node %s %s %s %s %s', *log_args)
continue
node = self._createNode(klass, address=addr, uuid=uuid,
state=state)
logging.debug('creating node %r', node)
......@@ -414,7 +419,7 @@ class NodeManager(object):
'node_by_addr (%r)' % (node_by_uuid, node_by_addr)
if state == NodeStates.DOWN:
logging.debug('dropping node %r (%r), found with %s '
'%s %s %s', node, node.isConnected(), *log_args)
'%s %s %s %s', node, node.isConnected(), *log_args)
if node.isConnected():
# Cut this connection, node removed by handler.
# It's important for a storage to disconnect nodes that
......@@ -424,12 +429,20 @@ class NodeManager(object):
# partition table upon disconnection.
node.getConnection().close()
self.remove(node)
else:
logging.debug('updating node %r to %s %s %s %s',
continue
logging.debug('updating node %r to %s %s %s %s %s',
node, *log_args)
node.setUUID(uuid)
node.setAddress(addr)
node.setState(state)
node.id_timestamp = id_timestamp
if app.uuid == uuid:
app.id_timestamp = id_timestamp
if node_set:
# For the first notification, we receive a full list of nodes from
# the master. Remove all unknown nodes from a previous connection.
for node in node_set - self._node_set:
self.remove(node)
self.log()
def log(self):
......
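
A behavioral sketch of the first-notification pruning above, with deliberately simplified bookkeeping (the real update() manages Node objects and several indexes, not bare ids):

class App(object):
    uuid = 1
    id_timestamp = None

class NodeManager(object):
    def __init__(self):
        self._node_set = set()

    def update(self, app, node_list):
        # app.id_timestamp is still None right after (re)connecting, and
        # the first notification is a complete list of cluster nodes.
        first = app.id_timestamp is None
        announced = set()
        for node_type, addr, uuid, state, id_timestamp in node_list:
            self._node_set.add(uuid)
            announced.add(uuid)
            if app.uuid == uuid:
                app.id_timestamp = id_timestamp
        if first:
            # A complete list implies that any node it does not mention
            # has definitely left the cluster.
            self._node_set &= announced

app = App()
nm = NodeManager()
nm._node_set = {1, 2, 3}          # leftovers from a previous connection
nm.update(app, [('CLIENT', None, 1, 'RUNNING', 42.0)])
assert nm._node_set == {1}        # stale nodes 2 and 3 were pruned
assert app.id_timestamp == 42.0   # the node also learned its own stamp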
......@@ -595,6 +595,13 @@ class PTID(PItem):
# same definition, for now
POID = PTID
class PFloat(PStructItemOrNone):
"""
A float number (8-byte length)
"""
_fmt = '!d'
_None = '\xff' * 8
# common definitions
PFEmpty = PStruct('no_content')
......@@ -608,6 +615,7 @@ PFNodeList = PList('node_list',
PAddress('address'),
PUUID('uuid'),
PFNodeState,
PFloat('id_timestamp'),
),
)
......@@ -689,6 +697,7 @@ class RequestIdentification(Packet):
PUUID('uuid'),
PAddress('address'),
PString('name'),
PFloat('id_timestamp'),
)
_answer = PStruct('accept_identification',
......
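
The wire format of the new field, assuming PStructItemOrNone's usual convention of a reserved bit pattern standing in for None (a sketch of the encoding, not the actual serializer classes):

from struct import pack, unpack

NONE = '\xff' * 8   # the _None sentinel above; it decodes as a NaN
                    # pattern, which a real timestamp never produces

def encode(value):
    return NONE if value is None else pack('!d', value)

def decode(data):
    return None if data == NONE else unpack('!d', data)[0]

assert decode(encode(None)) is None
assert decode(encode(1.5)) == 1.5
assert len(encode(0.0)) == 8   # fixed 8-byte field, like other PStructItems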
......@@ -43,6 +43,8 @@ class ThreadContainer(threading.local):
class ThreadedApplication(BaseApplication):
"""The client node application."""
uuid = None
def __init__(self, master_nodes, name, **kw):
super(ThreadedApplication, self).__init__(**kw)
self.poll_thread = threading.Thread(target=self.run, name=name)
......@@ -56,8 +58,6 @@ class ThreadedApplication(BaseApplication):
for address in master_nodes:
self.nm.createMaster(address=address)
# no self-assigned UUID, primary master will supply us one
self.uuid = None
# Internal attribute distinct between thread
self._thread_container = ThreadContainer()
app_set.add(self) # to register self.on_log
......
......@@ -15,6 +15,7 @@
# along with this program. If not, see <http://www.gnu.org/licenses/>.
import sys, weakref
from collections import defaultdict
from time import time
from neo.lib import logging
......@@ -44,7 +45,6 @@ class Application(BaseApplication):
last_transaction = ZERO_TID
backup_tid = None
backup_app = None
uuid = None
truncate_tid = None
def __init__(self, config):
......@@ -79,9 +79,7 @@ class Application(BaseApplication):
self.primary_master_node = None
self.cluster_state = None
uuid = config.getUUID()
if uuid:
self.uuid = uuid
self.uuid = config.getUUID()
# election related data
self.unconnected_master_node_set = set()
......@@ -227,19 +225,20 @@ class Application(BaseApplication):
Broadcast changes for a set of nodes
Send only one packet per connection to reduce bandwidth
"""
node_dict = {}
node_dict = defaultdict(list)
# group modified nodes by destination node type
for node in node_list:
node_info = node.asTuple()
def assign_for_notification(node_type):
# helper function
node_dict.setdefault(node_type, []).append(node_info)
if node.isMaster() or node.isStorage():
# client get notifications for master and storage only
assign_for_notification(NodeTypes.CLIENT)
if node.isMaster() or node.isStorage() or node.isClient():
assign_for_notification(NodeTypes.STORAGE)
assign_for_notification(NodeTypes.ADMIN)
if node.isAdmin():
continue
node_dict[NodeTypes.ADMIN].append(node_info)
node_dict[NodeTypes.STORAGE].append(node_info)
if node.isClient():
continue
node_dict[NodeTypes.CLIENT].append(node_info)
if node.isStorage():
continue
node_dict[NodeTypes.MASTER].append(node_info)
# send at most one non-empty notification packet per node
for node in self.nm.getIdentifiedList():
......@@ -498,7 +497,7 @@ class Application(BaseApplication):
conn.setHandler(handler)
conn.notify(Packets.NotifyNodeInformation(((
node.getType(), node.getAddress(), node.getUUID(),
NodeStates.TEMPORARILY_DOWN),)))
NodeStates.TEMPORARILY_DOWN, None),)))
conn.abort()
elif conn.pending():
conn.abort()
......
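
The rewritten broadcast loop encodes an audience matrix through early continues. A standalone restatement of who is notified about what (node types stubbed as strings for brevity; not the actual API):

from collections import defaultdict

def audiences(node_type):
    # mirrors the cascade above: each `continue` cuts off the
    # remaining, more restricted audiences
    node_dict = defaultdict(list)
    if node_type != 'ADMIN':
        node_dict['ADMIN'].append(node_type)
        node_dict['STORAGE'].append(node_type)
        if node_type != 'CLIENT':
            node_dict['CLIENT'].append(node_type)
            if node_type != 'STORAGE':
                node_dict['MASTER'].append(node_type)
    return sorted(node_dict)

assert audiences('MASTER') == ['ADMIN', 'CLIENT', 'MASTER', 'STORAGE']
assert audiences('STORAGE') == ['ADMIN', 'CLIENT', 'STORAGE']
assert audiences('CLIENT') == ['ADMIN', 'STORAGE']
assert audiences('ADMIN') == []   # nobody needs to hear about admins

In particular, masters now only hear about other masters, which matches the second fix in the commit message.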
......@@ -65,6 +65,7 @@ There is no UUID conflict between the 2 clusters:
class BackupApplication(object):
pt = None
uuid = None
def __init__(self, app, name, master_addresses):
self.app = weakref.proxy(app)
......@@ -92,7 +93,7 @@ class BackupApplication(object):
pt = app.pt
while True:
app.changeClusterState(ClusterStates.STARTING_BACKUP)
bootstrap = BootstrapManager(self, self.name, NodeTypes.CLIENT)
bootstrap = BootstrapManager(self, NodeTypes.CLIENT)
# {offset -> node}
self.primary_partition_dict = {}
# [[tid]]
......@@ -105,7 +106,7 @@ class BackupApplication(object):
else:
break
poll(1)
node, conn, uuid, num_partitions, num_replicas = \
node, conn, num_partitions, num_replicas = \
bootstrap.getPrimaryConnection()
try:
app.changeClusterState(ClusterStates.BACKINGUP)
......
......@@ -30,7 +30,7 @@ class MasterHandler(EventHandler):
elif new:
self._notifyNodeInformation(conn)
def requestIdentification(self, conn, node_type, uuid, address, name):
def requestIdentification(self, conn, node_type, uuid, address, name, _):
self.checkClusterName(name)
app = self.app
node = app.nm.getByUUID(uuid)
......
......@@ -31,9 +31,6 @@ class BackupHandler(EventHandler):
def notifyPartitionChanges(self, conn, ptid, cell_list):
self.app.pt.update(ptid, cell_list, self.app.nm)
def notifyNodeInformation(self, conn, node_list):
self.app.nm.update(node_list)
def answerLastTransaction(self, conn, tid):
app = self.app
if tid != ZERO_TID:
......
......@@ -32,9 +32,8 @@ class ClientServiceHandler(MasterHandler):
app.nm.remove(node)
def _notifyNodeInformation(self, conn):
# send information about masters and storages only
nm = self.app.nm
node_list = []
node_list = [nm.getByUUID(conn.getUUID()).asTuple()] # for id_timestamp
node_list.extend(n.asTuple() for n in nm.getMasterList())
node_list.extend(n.asTuple() for n in nm.getStorageList())
conn.notify(Packets.NotifyNodeInformation(node_list))
......
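
The client's own tuple is sent first so that NodeManager.update hits its app.uuid == uuid branch and the freshly identified client learns the stamp the master assigned to it, which it then echoes when identifying to storages. A minimal illustration with stubbed values:

class App(object):
    uuid = 1
    id_timestamp = None

app = App()
# (node_type, address, uuid, state, id_timestamp) tuples, values stubbed
node_list = [('CLIENT', None, 1, 'RUNNING', 42.0)]   # the client itself, first
for node_type, addr, uuid, state, id_timestamp in node_list:
    if app.uuid == uuid:          # same branch as in NodeManager.update
        app.id_timestamp = id_timestamp
assert app.id_timestamp == 42.0   # now usable in RequestIdentification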
......@@ -56,6 +56,11 @@ class BaseElectionHandler(EventHandler):
class ClientElectionHandler(BaseElectionHandler):
def notifyNodeInformation(self, conn, node_list):
# XXX: For the moment, do nothing because
# we'll close this connection and reconnect.
pass
def connectionFailed(self, conn):
addr = conn.getAddress()
node = self.app.nm.getByAddress(addr)
......@@ -71,6 +76,7 @@ class ClientElectionHandler(BaseElectionHandler):
app.uuid,
app.server,
app.name,
None,
))
super(ClientElectionHandler, self).connectionCompleted(conn)
......
......@@ -14,6 +14,7 @@
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
from time import time
from neo.lib import logging
from neo.lib.protocol import ClusterStates, NodeStates, NodeTypes, \
NotReadyError, ProtocolError, uuid_str
......@@ -91,6 +92,7 @@ class IdentificationHandler(MasterHandler):
uuid=uuid, address=address)
else:
node.setUUID(uuid)
node.id_timestamp = time()
node.setState(state)
node.setConnection(conn)
conn.setHandler(handler)
......
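
As the commit message says, the stamps only need to be unique opaque values: receivers compare them for equality, never for order, so time() on the master is merely a convenient source. A hedged sketch of an equivalent counter-based variant:

from itertools import count

class Node(object):
    id_timestamp = None

_next_stamp = count(1).next   # Python 2 spelling of next(counter)

def identify(node):
    # the wire field is a double, which holds small integers exactly
    node.id_timestamp = _next_stamp()   # instead of time.time()

n = Node()
identify(n)
first = n.id_timestamp
identify(n)                   # every (re)identification gets a fresh stamp
assert n.id_timestamp != first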
......@@ -36,6 +36,10 @@ class SecondaryMasterHandler(MasterHandler):
def reelectPrimary(self, conn):
raise ElectionFailure, 'reelection requested'
def _notifyNodeInformation(self, conn):
node_list = [n.asTuple() for n in self.app.nm.getMasterList()]
conn.notify(Packets.NotifyNodeInformation(node_list))
class PrimaryHandler(EventHandler):
""" Handler used by secondaries to handle primary master"""
......@@ -58,6 +62,7 @@ class PrimaryHandler(EventHandler):
app.uuid,
app.server,
app.name,
None,
))
super(PrimaryHandler, self).connectionCompleted(conn)
......@@ -68,27 +73,11 @@ class PrimaryHandler(EventHandler):
self.app.cluster_state = state
def notifyNodeInformation(self, conn, node_list):
app = self.app
for node_type, addr, uuid, state in node_list:
if node_type != NodeTypes.MASTER:
# No interest.
continue
if uuid == app.uuid and state == NodeStates.UNKNOWN:
super(PrimaryHandler, self).notifyNodeInformation(conn, node_list)
for node_type, _, uuid, state, _ in node_list:
assert node_type == NodeTypes.MASTER, node_type
if uuid == self.app.uuid and state == NodeStates.UNKNOWN:
sys.exit()
# Register new master nodes.
if app.server == addr:
# This is self.
continue
else:
n = app.nm.getByAddress(addr)
# master node must be known
assert n is not None
if uuid is not None:
# If I don't know the UUID yet, believe what the peer
# told me at the moment.
if n.getUUID() is None:
n.setUUID(uuid)
def _acceptIdentification(self, node, uuid, num_partitions,
num_replicas, your_uuid, primary, known_master_list):
......@@ -101,4 +90,5 @@ class PrimaryHandler(EventHandler):
logging.info('My UUID: ' + uuid_str(your_uuid))
node.setUUID(uuid)
app.id_timestamp = None
......@@ -146,15 +146,14 @@ class Log(object):
def notifyNodeInformation(self, node_list):
node_list.sort(key=lambda x: x[2])
node_list = [(self.uuid_str(uuid), str(node_type),
'%s:%u' % address if address else '?', state)
for node_type, address, uuid, state in node_list]
node_list = [(self.uuid_str(x[2]), str(x[0]),
'%s:%u' % x[1] if x[1] else '?', str(x[3]))
+ ((repr(x[4]),) if len(x) > 4 else ()) # BBB
for x in node_list]
if node_list:
t = ' ! %%%us | %%%us | %%%us | %%s' % (
max(len(x[0]) for x in node_list),
max(len(x[1]) for x in node_list),
max(len(x[2]) for x in node_list))
return map(t.__mod__, node_list)
t = ''.join(' %%%us |' % max(len(x[i]) for x in node_list)
for i in xrange(len(node_list[0]) - 1))
return map((' !' + t + ' %s').__mod__, node_list)
return ()
......
......@@ -219,14 +219,11 @@ class Application(BaseApplication):
conn.close()
# search, find, connect and identify to the primary master
bootstrap = BootstrapManager(self, self.name,
NodeTypes.STORAGE, self.uuid, self.server)
data = bootstrap.getPrimaryConnection()
(node, conn, uuid, num_partitions, num_replicas) = data
self.master_node = node
self.master_conn = conn
bootstrap = BootstrapManager(self, NodeTypes.STORAGE, self.server)
self.master_node, self.master_conn, num_partitions, num_replicas = \
bootstrap.getPrimaryConnection()
uuid = self.uuid
logging.info('I am %s', uuid_str(uuid))
self.uuid = uuid
self.dm.setUUID(uuid)
# Reload a partition table from the database. This is necessary
......
......@@ -50,8 +50,8 @@ class Checker(object):
conn.asClient()
else:
conn = ClientConnection(app, StorageOperationHandler(app), node)
conn.ask(Packets.RequestIdentification(
NodeTypes.STORAGE, uuid, app.server, name))
conn.ask(Packets.RequestIdentification(NodeTypes.STORAGE,
uuid, app.server, name, app.id_timestamp))
self.conn_dict[conn] = node.isIdentified()
conn_set = set(self.conn_dict)
conn_set.discard(None)
......
......@@ -38,8 +38,8 @@ class BaseMasterHandler(EventHandler):
def notifyNodeInformation(self, conn, node_list):
"""Store information on nodes, only if this is sent by a primary
master node."""
self.app.nm.update(node_list)
for node_type, addr, uuid, state in node_list:
super(BaseMasterHandler, self).notifyNodeInformation(conn, node_list)
for node_type, _, uuid, state, _ in node_list:
if uuid == self.app.uuid:
# This is me, do what the master tell me
logging.info("I was told I'm %s", state)
......
......@@ -27,7 +27,8 @@ class IdentificationHandler(EventHandler):
def connectionLost(self, conn, new_state):
logging.warning('A connection was lost during identification')
def requestIdentification(self, conn, node_type, uuid, address, name):
def requestIdentification(self, conn, node_type, uuid, address, name,
id_timestamp):
self.checkClusterName(name)
app = self.app
# reject any incoming connections if not ready
......@@ -41,7 +42,7 @@ class IdentificationHandler(EventHandler):
else:
if uuid == app.uuid:
raise ProtocolError("uuid conflict or loopback connection")
node = app.nm.getByUUID(uuid)
node = app.nm.getByUUID(uuid, id_timestamp)
if node is None:
# Never create a node automatically, or we could get id
# conflicts. We must only rely on the notifications from the
......@@ -56,12 +57,7 @@ class IdentificationHandler(EventHandler):
handler = ClientReadOnlyOperationHandler
else:
handler = ClientOperationHandler
if node.isConnected(): # XXX
# This can happen if we haven't processed yet a notification
# from the master, telling us the existing node is not
# running anymore. If we accept the new client, we won't
# know what to do with this late notification.
raise NotReadyError('uuid conflict: retry later')
assert not node.isConnected(), node
assert node.isRunning(), node
elif node_type == NodeTypes.STORAGE:
handler = StorageOperationHandler
......
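
This is why the old 'uuid conflict: retry later' workaround can become assertions: the timestamp-qualified lookup already filters out a stale requester. A condensed, runnable restatement (the rejection raised when the lookup fails lies outside the shown context, so it is stubbed here):

class NotReadyError(Exception):
    pass   # stand-in for neo.lib.protocol.NotReadyError

class Node(object):
    def __init__(self, id_timestamp):
        self.id_timestamp = id_timestamp

class NodeManagerStub(object):
    def __init__(self, nodes):
        self._uuid_dict = nodes
    def getByUUID(self, uuid, *id_timestamp):   # as in the diff
        node = self._uuid_dict.get(uuid)
        if not id_timestamp or node and (node.id_timestamp,) == id_timestamp:
            return node

def requestIdentification(nm, uuid, id_timestamp):
    node = nm.getByUUID(uuid, id_timestamp)   # None if the stamp is stale
    if node is None:
        raise NotReadyError('retry later')
    return node

nm = NodeManagerStub({1: Node(2.0)})   # master said: id=1 up since t=2.0
try:
    requestIdentification(nm, 1, 1.0)  # late request from before the break
    raise AssertionError('should have been rejected')
except NotReadyError:
    pass
assert requestIdentification(nm, 1, 2.0) is not None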
......@@ -258,7 +258,8 @@ class Replicator(object):
conn = ClientConnection(app, StorageOperationHandler(app), node)
try:
conn.ask(Packets.RequestIdentification(NodeTypes.STORAGE,
None if name else app.uuid, app.server, name or app.name))
None if name else app.uuid, app.server, name or app.name,
app.id_timestamp))
except ConnectionClosed:
if previous_node is self.current_node:
return
......
......@@ -119,7 +119,7 @@ class NEOProcess(object):
except ImportError:
raise NotFound, '%s not found' % (command)
self.command = command
self.arg_dict = {'--' + k: v for k, v in arg_dict.iteritems()}
self.arg_dict = arg_dict
self.with_uuid = True
self.setUUID(uuid)
......@@ -131,11 +131,11 @@ class NEOProcess(object):
args = []
self.with_uuid = with_uuid
for arg, param in self.arg_dict.iteritems():
if with_uuid is False and arg == '--uuid':
continue
args.append(arg)
args.append('--' + arg)
if param is not None:
args.append(str(param))
if with_uuid:
args += '--uuid', str(self.uuid)
self.pid = os.fork()
if self.pid == 0:
# Child
......@@ -213,7 +213,6 @@ class NEOProcess(object):
Note: for this change to take effect, the node must be restarted.
"""
self.uuid = uuid
self.arg_dict['--uuid'] = str(uuid)
def isAlive(self):
try:
......@@ -297,7 +296,6 @@ class NEOCluster(object):
def _newProcess(self, node_type, logfile=None, port=None, **kw):
self.uuid_dict[node_type] = uuid = 1 + self.uuid_dict.get(node_type, 0)
uuid += UUID_NAMESPACES[node_type] << 24
kw['uuid'] = uuid
kw['cluster'] = self.cluster_name
kw['masters'] = self.master_nodes
if logfile:
......@@ -483,13 +481,9 @@ class NEOCluster(object):
return self.__getNodeList(NodeTypes.CLIENT, state)
def __getNodeState(self, node_type, uuid):
node_list = self.__getNodeList(node_type)
for node_type, address, node_uuid, state in node_list:
if node_uuid == uuid:
break
else:
state = None
return state
for node in self.__getNodeList(node_type):
if node[2] == uuid:
return node[3]
def getMasterNodeState(self, uuid):
return self.__getNodeState(NodeTypes.MASTER, uuid)
......
......@@ -231,7 +231,7 @@ class MasterServerElectionTests(MasterClientElectionTestBase):
def test_requestIdentification1(self):
""" A non-master node request identification """
node, conn = self.identifyToMasterNode()
args = (node.getUUID(), node.getAddress(), self.app.name)
args = node.getUUID(), node.getAddress(), self.app.name, None
self.assertRaises(protocol.NotReadyError,
self.election.requestIdentification,
conn, NodeTypes.CLIENT, *args)
......@@ -240,7 +240,7 @@ class MasterServerElectionTests(MasterClientElectionTestBase):
""" A broken master node request identification """
node, conn = self.identifyToMasterNode()
node.setBroken()
args = (node.getUUID(), node.getAddress(), self.app.name)
args = node.getUUID(), node.getAddress(), self.app.name, None
self.assertRaises(protocol.BrokenNodeDisallowedError,
self.election.requestIdentification,
conn, NodeTypes.MASTER, *args)
......@@ -248,7 +248,7 @@ class MasterServerElectionTests(MasterClientElectionTestBase):
def test_requestIdentification4(self):
""" No conflict """
node, conn = self.identifyToMasterNode()
args = (node.getUUID(), node.getAddress(), self.app.name)
args = node.getUUID(), node.getAddress(), self.app.name, None
self.election.requestIdentification(conn,
NodeTypes.MASTER, *args)
self.checkUUIDSet(conn, node.getUUID())
......@@ -280,11 +280,12 @@ class MasterServerElectionTests(MasterClientElectionTestBase):
conn = self.__getClient()
self.checkNotReadyErrorRaised(
self.election.requestIdentification,
conn=conn,
node_type=NodeTypes.CLIENT,
uuid=conn.getUUID(),
address=conn.getAddress(),
name=self.app.name
conn,
NodeTypes.CLIENT,
conn.getUUID(),
conn.getAddress(),
self.app.name,
None,
)
def _requestIdentification(self):
......@@ -297,6 +298,7 @@ class MasterServerElectionTests(MasterClientElectionTestBase):
peer_uuid,
address,
self.app.name,
None,
)
node_type, uuid, partitions, replicas, _peer_uuid, primary, \
master_list = self.checkAcceptIdentification(conn, decode=True)
......
......@@ -50,6 +50,7 @@ class StorageIdentificationHandlerTests(NeoUnitTestBase):
self.getClientUUID(),
None,
self.app.name,
None,
)
self.app.ready = True
self.assertRaises(
......@@ -60,6 +61,7 @@ class StorageIdentificationHandlerTests(NeoUnitTestBase):
self.getStorageUUID(),
None,
self.app.name,
None,
)
def test_requestIdentification3(self):
......@@ -75,6 +77,7 @@ class StorageIdentificationHandlerTests(NeoUnitTestBase):
uuid,
None,
self.app.name,
None,
)
def test_requestIdentification2(self):
......@@ -87,7 +90,7 @@ class StorageIdentificationHandlerTests(NeoUnitTestBase):
'getAddress': master,
})
self.identification.requestIdentification(conn, NodeTypes.CLIENT, uuid,
None, self.app.name)
None, self.app.name, None)
self.assertTrue(node.isRunning())
self.assertTrue(node.isConnected())
self.assertEqual(node.getUUID(), uuid)
......
......@@ -28,7 +28,7 @@ class BootstrapManagerTests(NeoUnitTestBase):
# create an application object
config = self.getStorageConfiguration()
self.app = Application(config)
self.bootstrap = BootstrapManager(self.app, 'main', NodeTypes.STORAGE)
self.bootstrap = BootstrapManager(self.app, NodeTypes.STORAGE)
# define some variable to simulate client and storage node
self.master_port = 10010
self.storage_port = 10020
......
......@@ -183,15 +183,15 @@ class NodeManagerTests(NeoUnitTestBase):
old_uuid = self.storage.getUUID()
new_uuid = self.getStorageUUID()
node_list = (
(NodeTypes.CLIENT, None, self.client.getUUID(), NodeStates.DOWN),
(NodeTypes.MASTER, new_address, self.master.getUUID(), NodeStates.RUNNING),
(NodeTypes.CLIENT, None, self.client.getUUID(), NodeStates.DOWN, None),
(NodeTypes.MASTER, new_address, self.master.getUUID(), NodeStates.RUNNING, None),
(NodeTypes.STORAGE, self.storage.getAddress(), new_uuid,
NodeStates.RUNNING),
NodeStates.RUNNING, None),
(NodeTypes.ADMIN, self.admin.getAddress(), self.admin.getUUID(),
NodeStates.UNKNOWN),
NodeStates.UNKNOWN, None),
)
# update manager content
manager.update(node_list)
manager.update(Mock(), node_list)
# - the client gets down
self.checkClients([])
# - master change it's address
......
......@@ -27,14 +27,14 @@ from ZODB import DB, POSException
from ZODB.DB import TransactionalUndo
from neo.storage.transactions import TransactionManager, \
DelayedError, ConflictError
from neo.lib.connection import MTClientConnection
from neo.lib.connection import ServerConnection, MTClientConnection
from neo.lib.exception import DatabaseFailure, StoppedOperation
from neo.lib.protocol import CellStates, ClusterStates, NodeStates, Packets, \
ZERO_TID
ZERO_OID, ZERO_TID
from .. import expectedFailure, Patch
from . import LockLock, NEOCluster, NEOThreadedTest
from neo.lib.util import add64, makeChecksum, p64, u64
from neo.client.exception import NEOStorageError
from neo.client.exception import NEOPrimaryMasterLost, NEOStorageError
from neo.client.pool import CELL_CONNECTED, CELL_GOOD
from neo.master.handlers.client import ClientServiceHandler
from neo.storage.handlers.client import ClientOperationHandler
......@@ -1347,6 +1347,58 @@ class Test(NEOThreadedTest):
finally:
cluster.stop()
def testIdTimestamp(self):
"""
Given a master M, a storage S, and 2 clients Ca and Cb.
While Ca(id=1) is being identified by S:
1. connection between Ca and M breaks
2. M -> S: C1 down
3. Cb connect to M: id=1
4. M -> S: C1 up
5. S processes RequestIdentification from Ca with id=1
At 5, S must reject Ca, otherwise Cb can't connect to S. This is where
id timestamps come into play: with C1 up since t2, S rejects Ca due to
a request with t1 < t2.
To avoid issues with clocks that are out of sync, the client learns its
connection timestamp from the master's notification about itself.
"""
s2c = []
def __init__(orig, self, *args, **kw):
orig(self, *args, **kw)
self.readable = bool
s2c.append(self)
ll()
def connectToStorage(client):
next(client.cp.iterateForObject(0))
cluster = NEOCluster()
try:
cluster.start()
Ca = cluster.client
Ca.pt # only connect to the master
# In a separate thread, connect to the storage but suspend the
# processing of the RequestIdentification packet, until the
# storage is notified about the existence of the other client.
with LockLock() as ll, Patch(ServerConnection, __init__=__init__):
t = self.newThread(connectToStorage, Ca)
ll()
s2c, = s2c
m2c, = cluster.master.getConnectionList(cluster.client)
m2c.close()
Cb = cluster.newClient()
try:
Cb.pt # only connect to the master
del s2c.readable
self.assertRaises(NEOPrimaryMasterLost, t.join)
self.assertTrue(s2c.isClosed())
connectToStorage(Cb)
finally:
Cb.close()
finally:
cluster.stop()
if __name__ == "__main__":
unittest.main()
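
A side note on the test machinery above: patching ServerConnection.__init__ to set self.readable = bool freezes processing of the incoming RequestIdentification until del s2c.readable restores the class method. The mechanism is plain attribute shadowing, sketched here with a hypothetical Conn class (in the real code, readable is what the poll loop calls to process input):

class Conn(object):
    def readable(self):
        return 'processed input'   # normally handles incoming data

c = Conn()
c.readable = bool                  # instance attribute shadows the method;
assert c.readable() is False       # bool() is falsy and does nothing
del c.readable                     # remove the shadow...
assert c.readable() == 'processed input'   # ...and processing resumes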