From: Brian Warner Date: Wed, 10 Jan 2007 02:40:36 +0000 (-0700) Subject: test_system.py: exercise queen.Roster._lost_node too X-Git-Tag: tahoe_v0.1.0-0-UNSTABLE~379 X-Git-Url: https://git.rkrishnan.org/(%5B%5E?a=commitdiff_plain;h=ceda35089238ffafc610a327d809d14a62b40595;p=tahoe-lafs%2Ftahoe-lafs.git test_system.py: exercise queen.Roster._lost_node too --- diff --git a/src/allmydata/queen.py b/src/allmydata/queen.py index 011d57b5..8e6885b2 100644 --- a/src/allmydata/queen.py +++ b/src/allmydata/queen.py @@ -4,12 +4,18 @@ from foolscap import Referenceable from foolscap.eventual import eventually from twisted.application import service from twisted.python import log +from twisted.internet.error import ConnectionLost, ConnectionDone from allmydata.util import idlib from zope.interface import implements from allmydata.interfaces import RIQueenRoster from allmydata import node from allmydata.filetable import GlobalVirtualDrive + +def sendOnly(call, methname, *args, **kwargs): + d = call(methname, *args, **kwargs) + d.addErrback(lambda f: f.trap((ConnectionLost, ConnectionDone))) + class Roster(service.MultiService, Referenceable): implements(RIQueenRoster) @@ -51,7 +57,11 @@ class Roster(service.MultiService, Referenceable): def _announce_lost_peer(self, lost_nodeid): for targetnode in self.connections.values(): - targetnode.callRemote("lost_peers", lost_peers=[lost_nodeid]) + # use sendOnly, because if they go away then we assume it's + # because they crashed and they've lost all their peer + # connections anyways. + sendOnly(targetnode.callRemote, "lost_peers", + lost_peers=[lost_nodeid]) diff --git a/src/allmydata/test/test_system.py b/src/allmydata/test/test_system.py index 165e42d8..6c43460c 100644 --- a/src/allmydata/test/test_system.py +++ b/src/allmydata/test/test_system.py @@ -10,15 +10,25 @@ from allmydata.util import idlib from twisted.web.client import getPage class SystemTest(unittest.TestCase): + # it takes a little while for a disconnected loopback TCP connection to + # be noticed by the other side. This is not directly visible to us, so we + # have to wait for time to pass rather than just waiting on a deferred. + # This is unfortunate, both because it arbitrarily slows down the test + # process, and because it is hard to predict what the minimum time + # necessary would be (on a slow or heavily loaded system, 100ms might not + # be enough). + DISCONNECT_DELAY = 0.1 + def setUp(self): self.sparent = service.MultiService() self.sparent.startService() def tearDown(self): + log.msg("shutting down SystemTest services") d = self.sparent.stopService() d.addCallback(lambda res: flushEventualQueue()) def _done(res): d1 = defer.Deferred() - reactor.callLater(0.1, d1.callback, None) + reactor.callLater(self.DISCONNECT_DELAY, d1.callback, None) return d1 d.addCallback(_done) return d @@ -55,6 +65,21 @@ class SystemTest(unittest.TestCase): d.addCallback(_connected) return d + def add_extra_node(self, client_num): + # this node is *not* parented to our self.sparent, so we can shut it + # down separately from the rest, to exercise the connection-lost code + basedir = "client%d" % client_num + if not os.path.isdir(basedir): + os.mkdir(basedir) + c = client.Client(basedir=basedir) + self.clients.append(c) + c.set_queen_pburl(self.queen_pburl) + self.numclients += 1 + c.startService() + d = self.wait_for_connections() + d.addCallback(lambda res: c) + return d + def wait_for_connections(self, ignored=None): for c in self.clients: if len(c.connections) != self.numclients - 1: @@ -66,10 +91,19 @@ class SystemTest(unittest.TestCase): def test_connections(self): d = self.set_up_nodes() - def _check(res): + d.addCallback(lambda res: self.add_extra_node(5)) + def _check(extra_node): for c in self.clients: - self.failUnlessEqual(len(c.connections), 4) + self.failUnlessEqual(len(c.connections), 5) + return extra_node d.addCallback(_check) + def _shutdown_extra_node(extra_node): + d1 = extra_node.stopService() + d2 = defer.Deferred() + reactor.callLater(self.DISCONNECT_DELAY, d2.callback, None) + d1.addCallback(lambda res: d2) + return d1 + d.addCallback(_shutdown_extra_node) return d test_connections.timeout = 20