Merge lp:~hazmat/txzookeeper/distributed-queue into lp:txzookeeper

Proposed by Kapil Thangavelu
Status: Merged
Merged at revision: 24
Proposed branch: lp:~hazmat/txzookeeper/distributed-queue
Merge into: lp:txzookeeper
Diff against target: 989 lines (+901/-13)
7 files modified
txzookeeper/lock.py (+12/-7)
txzookeeper/queue.py (+451/-0)
txzookeeper/tests/__init__.py (+0/-4)
txzookeeper/tests/test_client.py (+27/-0)
txzookeeper/tests/test_lock.py (+17/-0)
txzookeeper/tests/test_queue.py (+392/-0)
txzookeeper/todo.txt (+2/-2)
To merge this branch: bzr merge lp:~hazmat/txzookeeper/distributed-queue
Reviewer: Gustavo Niemeyer (status: Approve)
Review via email: mp+25712@code.launchpad.net

Description of the change

Distributed multi-producer / multi-consumer queue implementation.

Revision history for this message
Gustavo Niemeyer (niemeyer) wrote :

[1]

+ self.path = path
+ self.client = client
+ self.persistent = persistent

I tend to prefer keeping things private, unless they are actually required by external clients, or would be obviously important to know about. This way it's easy to tell what's the "trusted" API clients are supposed to rely on, and also makes it more comfortable when changing the interface (anything private can be removed/renamed/replaced).

How do you feel about this in general?

[2]

+ self, path, client, acl=[ZOO_OPEN_ACL_UNSAFE], persistent=False):

Also a pretty general point which I'm making mostly to synchronize our thinking, rather than as a *required* change here:

I tend to prefer using the style of acl=None in the initialization of default parameters, and then process it internally in the constructor (if acl is None, acl = ... or similar).

While the result is obviously the same here, the main distinction is that it enables code using the function or class to say "I don't have anything special in this parameter.. just do your default.", which gets pretty tricky when the default value is in the keyword argument constructor itself.
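The default-argument style described above can be sketched as follows; the DEFAULT_ACL stand-in and the trimmed constructor are illustrative, not the actual txzookeeper code:

```python
# Minimal sketch of the acl=None pattern under discussion. DEFAULT_ACL is a
# stand-in for ZOO_OPEN_ACL_UNSAFE; the constructor is trimmed to the parts
# relevant to default-argument handling.
DEFAULT_ACL = [{"perms": 0x1f, "scheme": "world", "id": "anyone"}]


class Queue(object):

    def __init__(self, path, client, acl=None, persistent=False):
        self._path = path
        self._client = client
        self._persistent = persistent
        # Resolve the default inside the body: callers can explicitly pass
        # acl=None to mean "just use your default", and no mutable list
        # object is ever shared between instances.
        if acl is None:
            acl = list(DEFAULT_ACL)
        self._acl = acl
```

With a mutable default such as acl=[ZOO_OPEN_ACL_UNSAFE], every instance constructed without an explicit acl would share the same list object, so a mutation through one instance would leak into all the others.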

[3]

+ return self._get(wait=True)
+
+ get_wait = get

Do we need all these alternatives? Part of the beauty of Twisted is that we don't really have to care about what "waiting" means.

I suggest we have a single interface for getting, and it will always return a deferred which will fire once an item is available, no matter what. This will also simplify a bit the logic elsewhere (in _refill, _get_item, etc).
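The single-interface idea in [3] (get() always hands back something that fires once an item is available, whether or not one was queued at call time) can be sketched without ZooKeeper or Twisted; Pending is a toy stand-in for a Deferred and TinyQueue for the distributed queue:

```python
class Pending(object):
    """Toy stand-in for a Deferred: holds a result or pending callbacks."""

    def __init__(self):
        self.result = None
        self.callbacks = []

    def add_callback(self, fn):
        # Fire immediately if a (non-None, for this sketch) result exists,
        # otherwise remember the callback for later.
        if self.result is not None:
            fn(self.result)
        else:
            self.callbacks.append(fn)

    def fire(self, value):
        self.result = value
        for fn in self.callbacks:
            fn(value)


class TinyQueue(object):
    """In-memory queue whose get() always returns a Pending."""

    def __init__(self):
        self.items = []
        self.waiters = []

    def get(self):
        p = Pending()
        if self.items:
            p.fire(self.items.pop(0))  # item ready: fire right away
        else:
            self.waiters.append(p)     # no item: fire on a later put
        return p

    def put(self, item):
        if self.waiters:
            self.waiters.pop(0).fire(item)
        else:
            self.items.append(item)
```

A consumer never has to choose between a blocking and a non-blocking call; it registers a callback and the queue fires it immediately or later, whichever applies.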

[4]

+ d = self.client.create(
+ "/".join((self.path, self.prefix)), item, self._acl, flags)
+ return d

Nice. It feels pretty cool to be able to wait on a put this way.

[5]

+ d = self.client.exists(self.path)
+
+ def on_success(stat):
+ return stat["numChildren"]

Oh, interesting trick! I would imagine that getting the full list would be required, but this is of course a lot better.

[6]

+ Fetch the node data in the queue directory for the given node name. If
+ wait is
(...)
+ # tests. Instead we process our entire our node cache before
+ # proceeding.

Couple of comment details: "is ..." and "our entire our".

[7]

+ Refetch the queue children, setting a watch as needed, and invalidating
+ any previous children entries queue.

It would be nice to have a higher level description of what the algorithm is actually doing. E.g. what is the children entries queue about, what happens when it's empty, or when two different consumers have a partially overlapping queue, how are items consumed, etc.

[8]

In on_queue_items_changed():

+ self._cached_entries = []
+ d = self._refill(wait=wait)

Why is the cache being reset right after we're told changes have happened? Shouldn't this happen once we actually get the new list of children?

[9]

+ d = self._refill(wait=wait)
(...)
+ d = self.client.get_children(
+ self.path, on_queue_items_changed)

It'd be good to have more descriptive names for these variables, since one of th...


25. By Kapil Thangavelu

address some review comments (6, 8, 10)

26. By Kapil Thangavelu

remove method alias get_wait for get, review #3

27. By Kapil Thangavelu

use private variables for internals, introduce read only properties for accessors to public attributes, per review comment #1

28. By Kapil Thangavelu

remove acl mutable default arg, force queue prefix to private

Revision history for this message
Kapil Thangavelu (hazmat) wrote :

On Fri, 28 May 2010 16:30:42 -0400, Gustavo Niemeyer
<email address hidden> wrote:

> [1]
>
> + self.path = path
> + self.client = client
> + self.persistent = persistent
>
> I tend to prefer keeping things private, unless they are actually
> required by external clients, or would be obviously important to know
> about. This way it's easy to tell what's the "trusted" API clients are
> supposed to rely on, and also makes it more comfortable when changing
> the interface (anything private can be removed/renamed/replaced).
>
> How do you feel about this in general?

In general i'm fine with it. i have mixed feelings about how private is
spelled in some cases; i've dealt with libraries that take private (double
underscore style) to levels that made clean reuse or debugging difficult. In
this particular case, i'm fine with client being private (single underscore),
and path and persistent being read-only properties, and have made those
changes. In general it's okay as long as it's not a double underscore and
there isn't a legitimate reason for its use by consumers; if there is, i'd
tend to prefer at least read-only property access if direct attribute access
would be dangerous.
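The arrangement described here (private attributes behind read-only property accessors) looks roughly like this trimmed sketch, not the actual class:

```python
class Queue(object):

    def __init__(self, path, client, persistent=False):
        # Internals are private; the trusted API surface is the
        # read-only properties below.
        self._path = path
        self._client = client
        self._persistent = persistent

    @property
    def path(self):
        """Path to the queue (read-only)."""
        return self._path

    @property
    def persistent(self):
        """True if queue items are persistent (read-only)."""
        return self._persistent
```

Assigning to q.path raises AttributeError, which gives exactly the "read-only property access if direct attribute access would be dangerous" behavior.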

>
>
> [2]
>
> + self, path, client, acl=[ZOO_OPEN_ACL_UNSAFE],
> persistent=False):
>
> Also a pretty general point which I'm making mostly to synchronize our
> thinking, rather than as a *required* change here:
>
> I tend to prefer using the style of acl=None in the initialization of
> default parameters, and then process it internally in the constructor
> (if acl is None, acl = ... or similar).
>
> While the result is obviously the same here, the main distinction is
> that it enables code using the function or class to say "I don't have
> anything special in this parameter.. just do your default.", which gets
> pretty tricky when the default value is in the keyword argument
> constructor itself.
>

i'm fine with that; to me it's a minor tradeoff against quick reading of the
function signature, but then again there's a whole class of bugs around
mutable default args. changed.

>
> [3]
>
> + return self._get(wait=True)
> +
> + get_wait = get
>
> Do we need all these alternatives? Part of the beauty of Twisted is
> that we don't really have to care about what "waiting" means.

right, originally i was trying to match the signature provided by the stdlib
queue implementation. i think this alias is an artifact of when i changed the
default behavior of get (it used to raise an Empty error). it's removed now.

>
> I suggest we have a single interface for getting, and it will always
> return a deferred which will fire once an item is available, no matter
> what. This will also simplify a bit the logic elsewhere (in _refill,
> _get_item, etc).
>

hmmm.. i like having the option of both apis and the symmetry with the
Queue.Queue api. alternatively perhaps a timeout option on the get api would
also suffice (also in the Queue.Queue api). the logic simplification from the
method removal is pretty minor, maybe four lines of code total in the methods
mentioned.

>
>
> [6]
>
> + Fetch the node data in the queue...


29. By Kapil Thangavelu

remove get_nowait api

30. By Kapil Thangavelu

use trap for no node error handler, remove unused import queue.empty

31. By Kapil Thangavelu

remove old get_nowait tests.

Revision history for this message
Kapil Thangavelu (hazmat) wrote :

[3] I went ahead and removed the get_nowait api as per our discussion. in the future the use case can be addressed with a timeout.

[9] no more scope name conflict on deferreds.

32. By Kapil Thangavelu

refactor distributed queue implementation

Revision history for this message
Kapil Thangavelu (hazmat) wrote :

i refactored the implementation; it no longer uses any cached values, and is more efficient about establishing watches on the queue.

Revision history for this message
Gustavo Niemeyer (niemeyer) wrote :

Cool, nice improvements indeed!

I'm going to restart the review again, since it's a brand new implementation. I'll start the sequence on 12 just to avoid conflicts.

[12]

+ def __init__(self, deferred, watcher):
+ self.deferred = deferred
+ self.watcher = watcher
+ self.processing = False
+ self.refetch = False

I'm having a slightly hard time reading the code because of the generality of the names here. E.g. "refetch" what? "watcher" for what? "processing" what? Why is "processing" only turned on inside _get_item?

[13]

+ def on_queue_items_changed(*args):
+ """Event watcher on queue node child events."""
+ if request.complete or not self._client.connected:
+ return
+
+ if request.processing:
+ request.refetch = True
+ else:
+ self._get(request)

I think I might be missing some detail about the implementation, perhaps due to [12].

Let's say that things happen in the following order:

1) User calls get()
2) get() calls _get()
3) _get() hooks _get_item on the result, and the watcher above on changes
4) Result is returned, and _get_item() is queued for being called
5) watcher from (2) fires, and calls _get() again
6) Repeat (3)
7) Repeat (4)

In other words, it looks like _get_item might end up being queued multiple times even before it started running the first time.

[14]

I find it a bit suspect that we're killing the item from the queue even before the user had a chance to know about its existence. This will make the queue somewhat prone to items being eaten by crashes.

[15]

+ # Refetching deferred until we process all the children from
+ # from a get children call.
+ if request.refetch:
+ request.processing = False
+ return self._get(request)

Again, going back to [12], I find the nomenclature a bit non-obvious to follow. Why is it not "processing" anymore on a refetch? Looks like there's a very tight relationship with the get children watcher in this logic, even though that's not being made explicit by names nor comments.

Also, I believe there's an issue here. Let's say things happen in this order:

1) children is [], refetch is False, request.processing is True
2) on_no_node_error is called on a NoNodeException
3) Due to the state, the exception is swallowed and nothing really changes
4) on_queue_items_changed is called
5) Given the state, refetch is made True
6) and... nothing else ever happens?

I think making names more explicit might help avoiding issues like these, since it'll be easier to reason about the logic there and know out of gut feeling when things aren't happening the way they should.

review: Needs Fixing
33. By Kapil Thangavelu

request.processing should be false anytime there are no children, not just on refetch.

Revision history for this message
Kapil Thangavelu (hazmat) wrote :

On Tue, 08 Jun 2010 10:28:24 -0400, Gustavo Niemeyer
<email address hidden> wrote:

> Review: Needs Fixing
> Cool, nice improvements indeed!
>
> I'm going to restart the review again, since it's a brand new
> implementation. I'll start the sequence on 12 just to avoid conflicts.
>
> [12]
>
> + def __init__(self, deferred, watcher):
> + self.deferred = deferred
> + self.watcher = watcher
> + self.processing = False
> + self.refetch = False
>
> I'm having a slightly hard time reading the code because of the
> generality of the names here. E.g. "refetch" what? "watcher" for what?
> "processing" what? Why is "processing" only turned on inside _get_item?
>

Thanks for the review. Noted on names, i'll update them. fwiw, refetch ->
refetch_children, watcher -> child_watcher, processing -> processing_children

re processing inside of _get_item, i've moved it to _get

> [13]
>
> + def on_queue_items_changed(*args):
> + """Event watcher on queue node child events."""
> + if request.complete or not self._client.connected:
> + return
> +
> + if request.processing:
> + request.refetch = True
> + else:
> + self._get(request)
>
> I think I might be missing some detail about the implementation, perhaps
> due to [12].
>
> Let's say that things happen in the following order:
>
> 1) User calls get()
> 2) get() calls _get()
> 3) _get() hooks _get_item on the result, and the watcher above on changes
> 4) Result is returned, and _get_item() is queued for being called
> 5) watcher from (2) fires, and calls _get() again
> 6) Repeat (3)
> 7) Repeat (4)
>
> In other words, it looks like _get_item might end up being queued
> multiple times even before it started running the first time.

indeed, it's possible. i've updated the code to set processing = True in
_get before the client call.
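The resulting handshake (mark the request as processing before the asynchronous children fetch is issued, so a watch firing in the gap only schedules a refetch instead of starting a second concurrent fetch) can be simulated without ZooKeeper; FlagDemo and its method names are illustrative:

```python
class GetRequest(object):

    def __init__(self):
        self.processing_children = False
        self.refetch_children = False


class FlagDemo(object):
    """Toy model of the watch/processing handshake, no ZooKeeper."""

    def __init__(self):
        self.request = GetRequest()
        self.fetch_count = 0

    def _get(self):
        # The flag goes up *before* the (asynchronous) children fetch is
        # issued, closing the window in which a watch could start a second
        # concurrent fetch.
        self.request.processing_children = True
        self.fetch_count += 1

    def on_queue_items_changed(self):
        if self.request.processing_children:
            # Mid-processing: just note that a refetch is owed.
            self.request.refetch_children = True
        else:
            # Idle, parked on the watch: restart the get immediately.
            self._get()

    def finish_processing(self):
        self.request.processing_children = False
        if self.request.refetch_children:
            self.request.refetch_children = False
            self._get()
```

A watch that fires mid-processing raises the refetch flag exactly once; the pending refetch is then issued when the current batch of children has been consumed.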

> [14]
>
> I find a bit suspect that we're killing the item from the queue even
> before the user had a chance to know about its existence. This will
> make the queue somewhat prone to items being eaten by crashes.

As it is right now, the queue semantics enforce isolation and minimal
communication with the zookeeper server. I noted the requirement regarding
error handling for queue consumers in the module docstring. If we want
reliable message delivery/processing and want the queue to enforce that
semantic for us, then we'll likely need some aggregate/composite node
structures, cooperative semantics, or data introspection/modification on
queue item nodes, all of which will incur additional communication overhead
to enforce that semantic. I think those are effectively different data
structures; a queue isn't necessarily a message queue.

> [15]
>
>
> + # Refetching deferred until we process all the children from
> + # from a get children call.
> + if request.refetch:
> + request.processing = False
> + return self._get(request)
>
> Again, going back to [12], I find the nomenclature a bit non-obvious to
> follow. Why is it not "processing" anymore on a refetch? Looks like...


34. By Kapil Thangavelu

set request processing in _get, such that watches that fire before callbacks are processed correctly.

35. By Kapil Thangavelu

reliable queue implementation

36. By Kapil Thangavelu

serialized queue impl

37. By Kapil Thangavelu

refactor tests to abstract queue class, reset refetch flag when refetching children.

38. By Kapil Thangavelu

additional tests for serialized and reliable queues.

39. By Kapil Thangavelu

add test to validate that unexpected errors propagate to the get deferred.

Revision history for this message
Kapil Thangavelu (hazmat) wrote :

[12] I added some doc strings to the get request which document all the variables; if this is insufficient for clarity let me know, and i'll do a round of variable renames.

[14] Per our discussion on reliable processing/consumption of queue items, i've added the reliable queue and serialized queue implementations. A new serialized queue implementation utilizing a lock is something i'll address in a future branch (added bug:592266); the implementation as is suffers from a lot of pointless contention among consumers waking up from watches without any work they can proceed with, but nonetheless it's functional.

40. By Kapil Thangavelu

additional doc string on persistent v. transient reliable queues

41. By Kapil Thangavelu

rename GetRequest variables for clarity.

42. By Kapil Thangavelu

document each branch of the conditional within the queue child watch.

Revision history for this message
Gustavo Niemeyer (niemeyer) wrote :

Thanks Kapil. Queue looks great. Some items about the new stuff:

[15]

+ and processed in the order they where placed in the queue. (TODO) An
+ implementation with less contention between consumers might instead utilize
+ a reliable queue with a lock.

Even without the lock, a better implementation would wait for the removal of the specific -processing file which is holding further action back, rather than any change in the queue. E.g. if the item itself is removed, but not the -processing control file, it will fire off, and fail again. Also (and most importantly), any new items added to the queue will also fire the watch and cause the consumer to refetch the full child list only to find out that it's still being processed by someone else, and it can do nothing about the new item appended at the back of the queue.

[16]

+class SerializedQueueTests(QueueTests):
+
+ queue_factory = SerializedQueue

Don't we need something here? :-)

[17]

Queue should probably use QueueItems too (without delete). That said, since it's just a reference implementation and we'll likely need the reliable version, feel free to ignore this.

[18]

It feels like there's potential for more reuse in the _get_item implementation, but I don't think we should wait this for merging. It's just a good refactoring for a boring moment.

review: Needs Fixing
Revision history for this message
Gustavo Niemeyer (niemeyer) wrote :

Oh, I forgot to mention one thing:

[19]

For rich documentation of parameters, return values, etc, we've been using the epydoc format:

    http://epydoc.sourceforge.net/manual-fields.html

43. By Kapil Thangavelu

doc string cleanup

44. By Kapil Thangavelu

merge trunk

45. By Kapil Thangavelu

if lock acquisition fails, then all instance state associated with the attempt should be cleared, so subsequent acquire attempts can proceed.

46. By Kapil Thangavelu

serialized lock impl aggregating a reliable queue and distributed lock.

47. By Kapil Thangavelu

make queue prefix public, utilize reliable queue tests for serialized queue.

48. By Kapil Thangavelu

extra epydoc docstrings

Revision history for this message
Kapil Thangavelu (hazmat) wrote :

On Fri, 11 Jun 2010 10:57:30 -0400, Gustavo Niemeyer
<email address hidden> wrote:

> Review: Needs Fixing
> Thanks Kapil. Queue looks great. Some items about the new stuff:
>
> [15]
>
> + and processed in the order they where placed in the queue. (TODO) An
> + implementation with less contention between consumers might instead
> utilize
> + a reliable queue with a lock.
>
> Even without the lock, a better implementation would wait for the
> removal of the specific -processing file which is holding further action
> back, rather than any change in the queue. E.g. if the item itself is
> removed, but not the -processing control file, it will fire off, and
> fail again. Also (and most importantly), any new items added to the
> queue will also fire the watch and cause the consumer to refetch the
> full child list only to find out that it's still being processed by
> someone else, and it can do nothing about the new item appended at the
> back of the queue.

That would definitely be a better implementation than what was there
previously wrt contention. However it would effectively be reimplementing
parts of the lock logic (i.e. checking the exists return value on the
processing node is equivalent to checking exists on the previous lock
candidate node). I went ahead and reimplemented the serialized queue using a
subclass of reliable queue that utilizes an exclusive lock to serialize
access.

>
> [16]
>
> +class SerializedQueueTests(QueueTests):
> +
> + queue_factory = SerializedQueue
>
> Don't we need something here? :-)

yeah.. i'm not sure what, offhand. The default implementations of all the
queues are ordered. Perhaps multiple clients, one of which gets an item and
then sleeps or closes.

>
> [17]
>
> Queue should probably use QueueItems too (without delete). That said,
> since it's just a reference implementation and we'll likely need the
> reliable version, feel free to ignore this.
>

cool, i'm just going to leave it as is. I tried to be clear in the doc
string that it's mostly meant as an example implementation of the common
zookeeper recipe.

> [18]
>
> It feels like there's potential for more reuse in the _get_item
> implementation, but I don't think we should wait this for merging. It's
> just a good refactoring for a boring moment.
>

definitely, the closures are convenient, but make things a bit more
difficult for clean reuse. i took a stab at this yesterday, but shelved it
for now. Effectively we'd stuff the extra args for the callbacks and errbacks
instead of relying on the closure.

49. By Kapil Thangavelu

module docstring

50. By Kapil Thangavelu

serialized queue behavior test

Revision history for this message
Gustavo Niemeyer (niemeyer) wrote :

The design of SerializedQueue looks pretty nice. Thank you!

A few additional (last?) comments below:

[20]

In SerializedQueue:

            if name.endswith(suffix):
                children[:] = []

Putting some debugging information in, I see that this logic is actually used, but I'm a bit confused regarding when it's necessary. The tests which reach this logic also make me a bit worried: test_staged_multiproducer_multiconsumer, which theoretically should never see items being processed, due to the lock.

[21]

Something that occurred to me while I was reading the code is that the line:

            request.processing_children = False

May still not get executed on certain exits from the logic in the item processing. Should we guarantee that it will necessarily be reset on any exit, so that we never get an unusable object (with an inconsistent state)?

With these details addressed, +1!

review: Approve
Revision history for this message
Kapil Thangavelu (hazmat) wrote :

> The design of SerializedQueue looks pretty nice. Thank you!
>
> A few additional (last?) comments below:
>
> [20]
>
> In SerializedQueue:
>
> if name.endswith(suffix):
> children[:] = []
>
> Putting some debugging information, I see that this logic is actually used,
> but I'm a bit confused regarding when it's necessary. The tests which reach
> this logic also make me a bit worried:
> test_staged_multiproducer_multiconsumer, which theoretically should be a case
> which should never see items being processed due to the lock.

the lock is only held when fetching an item, i.e. the lock guards access to the queue items. However the consumer might still be processing the item, and until it finishes, the processing node isn't released. it might be a better semantic (less contention) for serialization if the lock were held for the duration of the item processing. i'll make that change.

>
> [21]
>
> Something that occurred to me while I was reading the code is that the line:
>
> request.processing_children = False
>
> May still not get executed on certain exits from the logic in the item
> processing. Should we guarantee that it will necessarily be reset on any
> exit, so that we never get an unusable object (with an inconsistent state)?
>

is there a scenario where this would be the case? afaics all the failure mode exits are covered by error handlers that will set this flag to false.
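Gustavo's [21] asks for a reset-on-any-exit guarantee. In synchronous code that invariant maps onto try/finally (the Deferred-chain analogue would be addBoth); this is only a sketch of the invariant, and it deliberately does not capture the case where a consumer is parked on a watch with no callback pending, which is where the two approaches diverge:

```python
class Request(object):

    def __init__(self):
        self.processing_children = False


def with_processing_flag(request, work):
    """Run `work` with the flag raised, resetting it on any exit.

    try/finally guarantees the reset on both success and failure, the
    synchronous analogue of Deferred.addBoth.
    """
    request.processing_children = True
    try:
        return work()
    finally:
        request.processing_children = False
```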

51. By Kapil Thangavelu

serializable queue consumer holds lock till item is processed.

52. By Kapil Thangavelu

fix a race condition in reliable queue: if two consumers had fetched an item, and one of the consumers finished processing it before the other created a reservation, the slow consumer would return an item that was deleted. Now the cycle switches from get->reserve->return to exists->reserve->get->return.
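The race described in this revision can be replayed with an in-memory stand-in for the znode store; the paths, the "-processing" marker convention, and race_demo are illustrative, not the real ReliableQueue API:

```python
class FakeStore(object):
    """Toy in-memory stand-in for znodes: path -> data."""

    def __init__(self):
        self.nodes = {}

    def exists(self, path):
        return path in self.nodes

    def get(self, path):
        return self.nodes[path]

    def create(self, path, data=""):
        if path in self.nodes:
            raise KeyError(path)  # stand-in for NodeExistsException
        self.nodes[path] = data

    def delete(self, path):
        del self.nodes[path]


def race_demo():
    store = FakeStore()
    store.create("/q/e1", "payload")
    # Slow consumer, old cycle (get -> reserve -> return): reads the data.
    stale = store.get("/q/e1")
    # Fast consumer wins the race: reserves, processes, then deletes both
    # the item and its reservation marker.
    store.create("/q/e1-processing")
    store.delete("/q/e1")
    store.delete("/q/e1-processing")
    # Slow consumer's reservation now succeeds, and the payload of an
    # already-deleted item is handed to the caller.
    store.create("/q/e1-processing")
    old_result = stale
    # New cycle (exists -> reserve -> get -> return): the slow consumer
    # checks existence first and simply skips the vanished item.
    new_result = store.get("/q/e1") if store.exists("/q/e1") else None
    return old_result, new_result
```

The old ordering reads the item body before the reservation exists, so a fully processed item can still be returned; leading with the existence check makes the stale return impossible to reach.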

Revision history for this message
Kapil Thangavelu (hazmat) wrote :

On Thu, 08 Jul 2010 12:27:42 -0400, Kapil Thangavelu
<email address hidden> wrote:

>> The design of SerializedQueue looks pretty nice. Thank you!
>>
>> A few additional (last?) comments below:
>>
>> [20]
>>
>> In SerializedQueue:
>>
>> if name.endswith(suffix):
>> children[:] = []
>>
>> Putting some debugging information, I see that this logic is actually
>> used,
>> but I'm a bit confused regarding when it's necessary. The tests which
>> reach
>> this logic also make me a bit worried:
>> test_staged_multiproducer_multiconsumer, which theoretically should be
>> a case
>> which should never see items being processed due to the lock.
>
> the lock is only held when fetching an item. ie. the lock guards access
> to the queue items. However the consumer might still be processing the
> item, and until it does the processing node isn't released. it might be
> a better semantic (less contention) for serialization if the lock was
> held for the duration of the item processing. i'll make that change.
>

This is implemented now; the serialized queue works much more smoothly with
less contention.
I've removed the children[:] filtering logic that was in use previously.

>
>> [21]
>>
>> Something that occurred to me while I was reading the code is that the
>> line:
>>
>> request.processing_children = False
>>
>> May still not get executed on certain exits from the logic in the item
>> processing. Should we guarantee that it will necessarily be reset on
>> any
>> exit, so that we never get an unusable object (with an inconsistent
>> state)?
>>
>
> is there a scenario where this would be the case? afaics all the failure
> mode exists are covered by error handlers that will set this flag to
> false.
>
after our discussion on irc, i took a look at putting the
request.processing_children reset into an errback/callback handler, but it's
not clear that the same semantic would be achieved. One of the scenarios is
that a consumer is waiting on a producer to put items in the queue;
request.processing_children should be false here, but no callbacks would
have fired. i.e. a consumer attempts to fetch an item from a queue, there
are some items in the queue, and the consumer is processing children but
competing with other consumers; if the queue empties before an item is
fetched, the consumer should wait on the watch with processing_children =
False, and with a callback/errback on the get the flag wouldn't be set
appropriately.

cheers,

Kapil

53. By Kapil Thangavelu

propagate unexpected errors when retrieving a node

54. By Kapil Thangavelu

refactor serialized queue to avoid extraneous existence checks and processing nodes.

Preview Diff

=== modified file 'txzookeeper/lock.py'
--- txzookeeper/lock.py 2010-06-10 15:44:40 +0000
+++ txzookeeper/lock.py 2010-07-09 19:52:57 +0000
@@ -51,17 +51,22 @@
             "/".join((self.path, self.prefix)),
             flags=zookeeper.EPHEMERAL|zookeeper.SEQUENCE)
 
-        def on_candidate_create(path):
-            self._candidate_path = path
-            return self._acquire()
-
-        d.addCallback(on_candidate_create)
-
+        d.addCallback(self._on_candidate_create)
+        d.addErrback(self._on_no_queue_error)
         return d
 
-    def _acquire(self):
+    def _on_candidate_create(self, path):
+        self._candidate_path = path
+        return self._acquire()
+
+    def _on_no_queue_error(self, failure):
+        self._candidate_path = None
+        return failure
+
+    def _acquire(self, *args):
         d = self._client.get_children(self.path)
         d.addCallback(self._check_candidate_nodes)
+        d.addErrback(self._on_no_queue_error)
         return d
 
     def _check_candidate_nodes(self, children):
=== added file 'txzookeeper/queue.py'
--- txzookeeper/queue.py 1970-01-01 00:00:00 +0000
+++ txzookeeper/queue.py 2010-07-09 19:52:57 +0000
@@ -0,0 +1,451 @@
1"""
2Several distributed multiprocess queue implementations.
3
4The C{Queue} implementation follows closely the apache zookeeper recipe, it
5provides no guarantees beyond isolation and concurrency of retrieval of items.
6
7The C{ReliableQueue} implementation, provides isolation, and concurrency, as
8well guarantees that if a consumer dies before processing an item, that item is
9made available to another consumer.
10
11The C{SerializedQueue} implementation provides for strict in order processing
12of items within a queue.
13"""
14
15import zookeeper
16
17from twisted.internet.defer import Deferred, fail
18from twisted.python.failure import Failure
19from txzookeeper.lock import Lock
20from txzookeeper.client import ZOO_OPEN_ACL_UNSAFE
21
22
23class Queue(object):
24 """
25 Implementation is based off the apache zookeeper Queue recipe.
26
27 There are some things to keep in mind when using this queue implementation.
28 Its primarily to enforce isolation and concurrent access, however it does
29 not provide for reliable consumption. An error condition in a queue
30 consumer must requeue the item, else its lost, as its removed from
31 zookeeper on retrieval in this implementation. This implementation more
32 closely mirrors the behavior and api of the pythonstandard library Queue,
33 or multiprocessing.Queue ableit with the caveat of only strings for queue
34 items.
35 """
36
37 prefix = "entry-"
38
39 def __init__(self, path, client, acl=None, persistent=False):
40 """
41 @param client: A connected C{ZookeeperClient} instance.
42 @param path: The path to the queue inthe zookeeper hierarchy.
43 @param acl: An acl to be used for queue items.
44 @param persistent: Boolean flag which denotes if items in the queue are
45 persistent.
46 """
47 self._path = path
48 self._client = client
49 self._persistent = persistent
50 if acl is None:
51 acl = [ZOO_OPEN_ACL_UNSAFE]
52 self._acl = acl
53
54 @property
55 def path(self):
56 """Path to the queue."""
57 return self._path
58
59 @property
60 def persistent(self):
61 """If the queue is persistent returns True."""
62 return self._persistent
63
64 def get(self):
65 """
66 Get and remove an item from the queue. If no item is available
67 at the moment, a deferred is return that will fire when an item
68 is available.
69 """
70
71 def on_queue_items_changed(*args):
72 """Event watcher on queue node child events."""
73 if request.complete or not self._client.connected:
74 return # pragma: no cover
75
76 if request.processing_children:
77 # If deferred stack is currently processing a set of children
78 # defer refetching the children till its done.
79 request.refetch_children = True
80 else:
81 # Else the item get request is just waiting for a watch,
82 # restart the get.
83 self._get(request)
84
85 request = GetRequest(Deferred(), on_queue_items_changed)
86 self._get(request)
87 return request.deferred
88
89 def put(self, item):
90 """
91 Put an item into the queue.
92
93 @param item: String data to be put on the queue.
94 """
95 if not isinstance(item, str):
96 return fail(ValueError("queue items must be strings"))
97
98 flags = zookeeper.SEQUENCE
99 if not self._persistent:
100 flags = flags|zookeeper.EPHEMERAL
101
102 d = self._client.create(
103 "/".join((self._path, self.prefix)), item, self._acl, flags)
104 return d
105
106 def qsize(self):
107 """
108 Return the approximate size of the queue. This value is always
109 effectively a snapshot. Returns a deferred returning an integer.
110 """
111 d = self._client.exists(self._path)
112
113 def on_success(stat):
114 return stat["numChildren"]
115
116 d.addCallback(on_success)
117 return d
118
119 def _get(self, request):
120 request.processing_children = True
121 d = self._client.get_children(self._path, request.child_watcher)
122 d.addCallback(self._get_item, request)
123 return d
124
125 def _get_item(self, children, request):
126
127 def fetch_node(name):
128 path = "/".join((self._path, name))
129 d = self._client.get(path)
130 d.addCallback(on_get_node_success)
131 d.addErrback(on_no_node)
132 return d
133
134 def on_get_node_success((data, stat)):
135 d = self._client.delete("/".join((self._path, name)))
136 d.addCallback(on_delete_node_success, data)
137 d.addErrback(on_no_node)
138 return d
139
140 def on_delete_node_success(result_code, data):
141 request.processing_children = False
142 request.callback(data)
143
144 def on_no_node(failure=None):
145 if failure and not failure.check(zookeeper.NoNodeException):
146 request.errback(failure)
147 return
148 if children:
149 name = children.pop(0)
150 return fetch_node(name)
151
152 # Refetching is deferred until we process all the children
153 # from a get children call.
154 request.processing_children = False
155 if request.refetch_children:
156 request.refetch_children = False
157 return self._get(request)
158
159 if not children:
160 return on_no_node()
161
162 children.sort()
163 name = children.pop(0)
164 return fetch_node(name)
165
166
167class GetRequest(object):
168 """
169 An encapsulation of a consumer request to fetch an item from the queue.
170
171 @refetch_children - boolean field, when true signals that children should
172 be refetched after processing the current set of children.
173
174 @child_watcher - The queue child/item watcher.
175
176 @processing_children - Boolean flag, set to true when the last known
177 children of the queue are being processed. If a watch fires while the
178 children are being processed it sets the refetch_children flag to true
179 instead of getting the children immediately.
180
181 @deferred - The deferred representing retrieving an item from the queue.
182 """
183
184 def __init__(self, deferred, watcher):
185 self.deferred = deferred
186 self.child_watcher = watcher
187 self.processing_children = False
188 self.refetch_children = False
189
190 @property
191 def complete(self):
192 return self.deferred.called
193
194 def callback(self, data):
195 self.deferred.callback(data)
196
197 def errback(self, error):
198 self.deferred.errback(error)
199
200
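The interplay of @processing_children and @refetch_children above is the crux of the watch handling: a child watch that fires while a batch of children is still being worked through must only flag that a refetch is needed, not trigger a concurrent one. A minimal stand-in (plain Python, no Twisted or ZooKeeper; the class and method names here are illustrative, not part of txzookeeper) sketches that coalescing:

```python
class WatchCoalescer(object):
    """Illustrative stand-in for GetRequest's flag handling."""

    def __init__(self):
        self.processing_children = False
        self.refetch_children = False
        self.refetch_count = 0  # stands in for calls to Queue._get

    def start_processing(self):
        self.processing_children = True

    def on_child_watch(self):
        # A watch firing mid-processing only records that the children
        # changed; the refetch happens after the current batch is done.
        if self.processing_children:
            self.refetch_children = True
        else:
            self.refetch()

    def finish_processing(self):
        self.processing_children = False
        if self.refetch_children:
            self.refetch_children = False
            self.refetch()

    def refetch(self):
        self.refetch_count += 1


coalescer = WatchCoalescer()
coalescer.start_processing()
coalescer.on_child_watch()  # fires while busy: only sets the flag
coalescer.on_child_watch()  # a second watch coalesces into the same flag
coalescer.finish_processing()
print(coalescer.refetch_count)  # both watches collapse into one refetch
```

However many watches fire during one pass over the children, at most one extra child fetch is issued afterwards.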
201class QueueItem(object):
202 """
203 An encapsulation of a work item put into a queue. The work item data is
204 accessible via the data attribute. When the item has been processed by
205 the consumer, the delete method can be invoked to remove the item
206 permanently from the queue.
207
208 An optional processed callback may be passed to the constructor that
209 will be invoked after the node has been processed.
210 """
211
212 def __init__(self, path, data, client, processed_callback=None):
213 self._path = path
214 self._data = data
215 self._client = client
216 self._processed_callback = processed_callback
217
218 @property
219 def data(self):
220 return self._data
221
222 @property
223 def path(self):
224 return self._path
225
226 def delete(self):
227 """
228 Delete the item node and the item processing node in the queue.
229 Typically invoked by a queue consumer to signal successful processing
230 of the queue item.
231 """
232 d = self._client.delete(self.path)
233
234 if self._processed_callback:
235 d.addCallback(self._processed_callback, self.path)
236 return d
237
238
239class ReliableQueue(Queue):
240 """
241 A distributed queue. It varies from a C{Queue} in that it ensures any
242 item consumed from the queue is explicitly ack'd by the consumer.
243 If the consumer dies after retrieving an item before ack'ing the item.
244 The item will be made available to another consumer. To encapsulate the
245 acking behavior the queue item data is returned in a C{QueueItem} instance,
246 with a delete method that will remove it from the queue after processing.
247
248 Reliable queues may be persistent or transient. If the queue is durable,
249 than any item added to the queue must be processed in order to be removed.
250 If the queue is transient, then any jobs placed in the queue by a client
251 are removed when the client is closed, regardless of whether the job
252 has been processed or not.
253 """
254
255 def _item_processed_callback(self, result_code, item_path):
256 return self._client.delete(item_path+"-processing")
257
258 def _filter_children(self, children, suffix="-processing"):
259 """
260 Filter any children currently being processed, modified in place.
261 """
262 children.sort()
263 for name in list(children):
264 # remove any processing nodes and their associated queue item.
265 if name.endswith(suffix):
266 children.remove(name)
267 item_name = name[:-len(suffix)]
268 if item_name in children:
269 children.remove(item_name)
270
271 def _get_item(self, children, request):
272
273 def check_node(name):
274 """Check the node still exists."""
275 path = "/".join((self._path, name))
276 d = self._client.exists(path)
277 d.addCallback(on_node_exists, path)
278 d.addErrback(on_reservation_failed)
279 return d
280
281 def on_node_exists(stat, path):
282 """Reserve the node for consumer processing."""
283 d = self._client.create(path+"-processing",
284 flags=zookeeper.EPHEMERAL)
285 d.addCallback(on_reservation_success, path)
286 d.addErrback(on_reservation_failed)
287 return d
288
289 def on_reservation_success(processing_path, path):
290 """Fetch the node data to return"""
291 d = self._client.get(path)
292 d.addCallback(on_get_node_success, path)
293 d.addErrback(on_get_node_failed, path)
294 return d
295
296 def on_get_node_failed(failure, path):
297 """If we can't fetch the node, delete the processing node."""
298 d = self._client.delete(path+"-processing")
299
# propagate unexpected errors appropriately
301 if not failure.check(zookeeper.NoNodeException):
302 d.addCallback(lambda x: request.errback(failure))
303 else:
304 d.addCallback(on_reservation_failed)
305 return d
306
307 def on_get_node_success((data, stat), path):
308 """If we got the node, we're done."""
309 request.processing_children = False
310 request.callback(
311 QueueItem(
312 path, data, self._client, self._item_processed_callback))
313
314 def on_reservation_failed(failure=None):
315 """If we can't get the node or reserve, continue processing
316 the children."""
317 if failure and not failure.check(
318 zookeeper.NodeExistsException, zookeeper.NoNodeException):
319 request.processing_children = True
320 request.errback(failure)
321 return
322
323 if children:
324 name = children.pop(0)
325 return check_node(name)
326
327 # If a watch fired while processing children, process it
328 # after the children list is exhausted.
329 request.processing_children = False
330 if request.refetch_children:
331 request.refetch_children = False
332 return self._get(request)
333
334 self._filter_children(children)
335
336 if not children:
337 return on_reservation_failed()
338
339 name = children.pop(0)
340 return check_node(name)
341
342
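The reservation scheme above hinges on _filter_children: an item with a live `-processing` sibling node is invisible to other consumers. Stripped of the ZooKeeper plumbing, the filtering itself is pure list manipulation; a standalone sketch of the same logic (the function name mirrors the method above, but this is not the txzookeeper code path):

```python
def filter_children(children, suffix="-processing"):
    """Drop reservation nodes and the items they reserve, in place."""
    children.sort()
    for name in list(children):
        if name.endswith(suffix):
            # Remove the reservation marker itself...
            children.remove(name)
            item_name = name[:-len(suffix)]
            # ...and the queue item it reserves, if still listed.
            if item_name in children:
                children.remove(item_name)


children = ["entry-0002", "entry-0001", "entry-0001-processing"]
filter_children(children)
print(children)  # entry-0001 is reserved by another consumer
```

Because the `-processing` node is ephemeral, a consumer crash deletes the marker, and on the next child fetch the reserved item passes the filter again and becomes consumable.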
343class SerializedQueue(Queue):
344 """
345 A serialized queue ensures that, even with multiple consumers, items
346 are retrieved and processed in the order they were placed in the queue.
347
348 This implementation aggregates a reliable queue, with a lock to provide
349 for serialized consumer access. The lock is released only when a queue item
350 has been processed.
351 """
352
353 def __init__(self, path, client, acl=None, persistent=False):
354 super(SerializedQueue, self).__init__(path, client, acl, persistent)
355 self._lock = Lock("%s/%s"%(self.path, "_lock"), client)
356
357 def _item_processed_callback(self, result_code, item_path):
358 return self._lock.release()
359
360 def _filter_children(self, children, suffix="-processing"):
361 """
362 Filter the lock from consideration as an item to be processed.
363 """
364 children.sort()
365 for name in list(children):
366 if name.startswith('_'):
367 children.remove(name)
368
369 def _on_lock_directory_does_not_exist(self, failure):
370 """
371 If the lock directory does not exist, go ahead and create it and
372 attempt to acquire the lock.
373 """
374 failure.trap(zookeeper.NoNodeException)
375 d = self._client.create(self._lock.path)
376 d.addBoth(self._on_lock_created_or_exists)
377 return d
378
379 def _on_lock_created_or_exists(self, failure):
380 """
381 The lock node creation will either result in success or node exists
382 error, if a concurrent client created the node first. In either case
383 we proceed with attempting to acquire the lock.
384 """
385 if isinstance(failure, Failure):
386 failure.trap(zookeeper.NodeExistsException)
387 d = self._lock.acquire()
388 return d
389
390 def _on_lock_acquired(self, lock):
391 """
392 After the exclusive queue lock is acquired, we proceed with an attempt
393 to fetch an item from the queue.
394 """
395 d = super(SerializedQueue, self).get()
396 return d
397
398 def get(self):
399 """
400 Get and remove an item from the queue. If no item is available
401 at the moment, a deferred is returned that will fire when an item
402 is available.
403 """
404 d = self._lock.acquire()
405
406 d.addErrback(self._on_lock_directory_does_not_exist)
407 d.addCallback(self._on_lock_acquired)
408 return d
409
410 def _get_item(self, children, request):
411
412 def fetch_node(name):
413 path = "/".join((self._path, name))
414 d = self._client.get(path)
415 d.addCallback(on_node_retrieved, path)
416 d.addErrback(on_reservation_failed)
417 return d
418
419 def on_node_retrieved((data, stat), path):
420 request.processing_children = False
421 request.callback(
422 QueueItem(
423 path, data, self._client, self._item_processed_callback))
424
425 def on_reservation_failed(failure=None):
426 """If we can't get the node or reserve, continue processing
427 the children."""
428 if failure and not failure.check(
429 zookeeper.NodeExistsException, zookeeper.NoNodeException):
430 request.processing_children = True
431 request.errback(failure)
432 return
433
434 if children:
435 name = children.pop(0)
436 return fetch_node(name)
437
438 # If a watch fired while processing children, process it
439 # after the children list is exhausted.
440 request.processing_children = False
441 if request.refetch_children:
442 request.refetch_children = False
443 return self._get(request)
444
445 self._filter_children(children)
446
447 if not children:
448 return on_reservation_failed()
449
450 name = children.pop(0)
451 return fetch_node(name)
452
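Reviewer point [2] above, about acl=[ZOO_OPEN_ACL_UNSAFE] as a default argument, is already followed by SerializedQueue.__init__, which takes acl=None and lets the base class resolve it. A sketch of that convention in isolation (the ACL constant here is a hand-rolled stand-in for the one exported by the zookeeper bindings, and QueueSketch is illustrative, not the real Queue):

```python
# Stand-in for the constant exported by the zookeeper bindings.
ZOO_OPEN_ACL_UNSAFE = {"perms": 0x1f, "scheme": "world", "id": "anyone"}


class QueueSketch(object):
    """Illustrative constructor only; not the txzookeeper Queue."""

    def __init__(self, path, client, acl=None, persistent=False):
        # Resolving the default inside the body lets callers pass
        # acl=None to mean "use the default", which a mutable default
        # of acl=[ZOO_OPEN_ACL_UNSAFE] in the signature would not allow.
        if acl is None:
            acl = [ZOO_OPEN_ACL_UNSAFE]
        self._path = path
        self._client = client
        self._acl = acl
        self._persistent = persistent


queue = QueueSketch("/moon", client=None)
print(queue._acl == [ZOO_OPEN_ACL_UNSAFE])
```

This also sidesteps the classic mutable-default pitfall: a list literal in the signature would be shared across every instance that relied on the default.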
=== modified file 'txzookeeper/tests/__init__.py'
--- txzookeeper/tests/__init__.py 2010-06-10 15:46:02 +0000
+++ txzookeeper/tests/__init__.py 2010-07-09 19:52:57 +0000
@@ -4,10 +4,6 @@
4 from twisted.trial.unittest import TestCase
5 from mocker import MockerTestCase
6
7 #from txzookeeper.client import Wrapper
8
9 #zookeeper = Wrapper(zookeeper)
10
11 class ZookeeperTestCase(TestCase, MockerTestCase):
12
13     def setUp(self):
14
=== modified file 'txzookeeper/tests/test_client.py'
--- txzookeeper/tests/test_client.py 2010-06-01 14:26:45 +0000
+++ txzookeeper/tests/test_client.py 2010-07-09 19:52:57 +0000
@@ -342,6 +342,33 @@
342 d.addCallback(verify_exists)
343 return d
344
345 def test_exists_with_watcher_and_close(self):
346 """
347 Closing a connection with a watch outstanding behaves correctly.
348 """
349 d = self.client.connect()
350 zookeeper.set_debug_level(zookeeper.LOG_LEVEL_DEBUG)
351
352 def node_watcher(event_type, state, path):
353 client = getattr(self, "client", None)
354 if client is not None and client.connected:
355 self.fail("Client should be disconnected")
356
357 def create_node(client):
358 return client.create("/syracuse")
359
360 def check_exists(path):
361 # shouldn't fire till unit test cleanup
362 return self.client.exists(path, node_watcher)
363
364 def verify_exists(result):
365 self.assertTrue(result)
366
367 d.addCallback(create_node)
368 d.addCallback(check_exists)
369 d.addCallback(verify_exists)
370 return d
371
372 def test_exists_with_nonexistant_watcher(self):
373 """
374 The exists method can also be used to set an optional watcher on a
375
=== modified file 'txzookeeper/tests/test_lock.py'
--- txzookeeper/tests/test_lock.py 2010-06-10 15:44:40 +0000
+++ txzookeeper/tests/test_lock.py 2010-07-09 19:52:57 +0000
@@ -1,4 +1,5 @@
1
2 from zookeeper import NoNodeException
3 from mocker import ANY
4 from twisted.internet.defer import (
5     inlineCallbacks, returnValue, Deferred, succeed)
@@ -81,6 +82,22 @@
82 yield self.failUnlessFailure(lock.acquire(), LockError)
83
84 @inlineCallbacks
85 def test_acquire_after_error(self):
86 """
87 Any instance state associated with a failed acquire should be cleared
88 on error, allowing subsequent attempts to succeed.
89 """
90 client = yield self.open_client()
91 path = "/lock-test-acquire-after-error"
92 lock = Lock(path, client)
93 d = lock.acquire()
94 self.failUnlessFailure(d, NoNodeException)
95 yield d
96 yield client.create(path)
97 yield lock.acquire()
98 self.assertEqual(lock.acquired, True)
99
100 @inlineCallbacks
101 def test_error_on_acquire_acquiring(self):
102 """
103 Attempting to acquire the lock while an attempt is already in progress,
104
=== added file 'txzookeeper/tests/test_queue.py'
--- txzookeeper/tests/test_queue.py 1970-01-01 00:00:00 +0000
+++ txzookeeper/tests/test_queue.py 2010-07-09 19:52:57 +0000
@@ -0,0 +1,392 @@
1
2from zookeeper import NoNodeException
3from twisted.internet.defer import (
4 inlineCallbacks, returnValue, DeferredList, Deferred, succeed, fail)
5
6from txzookeeper import ZookeeperClient
7from txzookeeper.client import NotConnectedException
8from txzookeeper.queue import Queue, ReliableQueue, SerializedQueue, QueueItem
9from txzookeeper.tests import ZookeeperTestCase, utils
10
11from mocker import ANY
12
13
14class QueueTests(ZookeeperTestCase):
15
16 queue_factory = Queue
17
18 def setUp(self):
19 super(QueueTests, self).setUp()
20 self.clients = []
21
22 def tearDown(self):
23 cleanup = False
24
25 for client in self.clients:
26 if not cleanup and client.connected:
27 utils.deleteTree(handle=client.handle)
28 cleanup = True
29 if client.connected:
30 client.close()
31 super(QueueTests, self).tearDown()
32
33 def compare_data(self, data, item):
34 if isinstance(item, QueueItem):
35 self.assertEqual(data, item.data)
36 else:
37 self.assertEqual(data, item)
38
39 def consume_item(self, item):
40 if isinstance(item, QueueItem):
41 return item.delete(), item.data
42 return None, item
43
44 @inlineCallbacks
45 def open_client(self, credentials=None):
46 """
47 Open a zookeeper client, optionally authenticating with the
48 credentials if given.
49 """
50 client = ZookeeperClient("127.0.0.1:2181")
51 self.clients.append(client)
52 yield client.connect()
53 if credentials:
54 d = client.add_auth("digest", credentials)
55 # hack to keep auth fast
56 yield client.exists("/")
57 yield d
58 returnValue(client)
59
60 def test_path_property(self):
61 """
62 The queue has a property that can be used to introspect its
63 path in a read-only manner.
64 """
65 q = self.queue_factory("/moon", None)
66 self.assertEqual(q.path, "/moon")
67
68 def test_persistent_property(self):
69 """
70 The queue has a property that can be used to introspect
71 whether or not the queue entries are persistent.
72 """
73 q = self.queue_factory("/moon", None, persistent=True)
74 self.assertEqual(q.persistent, True)
75
76 @inlineCallbacks
77 def test_put_item(self):
78 """
79 An item can be put on the queue, and is stored in a node in
80 the queue's directory.
81 """
82 client = yield self.open_client()
83 path = yield client.create("/queue-test")
84 queue = self.queue_factory(path, client)
85 item = "transform image bluemarble.jpg"
86 yield queue.put(item)
87 children = yield client.get_children(path)
88 self.assertEqual(len(children), 1)
89 data, stat = yield client.get("/".join((path, children[0])))
90 self.compare_data(data, item)
91
92 @inlineCallbacks
93 def test_qsize(self):
94 """
95 The client implements a method which returns an unreliable
96 approximation of the number of items in the queue (mirroring the api
97 of Queue.Queue); it's unreliable only in that the value represents
98 a snapshot of the queue size at the time it was requested,
99 not its current value.
100 """
101 client = yield self.open_client()
102 path = yield client.create("/test-qsize")
103 queue = self.queue_factory(path, client)
104
105 yield queue.put("abc")
106 size = yield queue.qsize()
107 self.assertEqual(size, 1)
108
109 yield queue.put("bcd")
110 size = yield queue.qsize()
111 self.assertEqual(size, 2)
112
113 yield queue.get()
114 size = yield queue.qsize()
115 self.assertEqual(size, 1)
116
117 @inlineCallbacks
118 def test_invalid_put_item(self):
119 """
120 The queue only accepts string items.
121 """
122 client = yield self.open_client()
123 queue = self.queue_factory("/unused", client)
124 yield self.failUnlessFailure(queue.put(123), ValueError)
125
126 @inlineCallbacks
127 def test_get_with_invalid_queue(self):
128 """
129 If the queue hasn't been created, an unknown node exception is raised
130 on get.
131 """
132 client = yield self.open_client()
133 queue = self.queue_factory("/unused", client)
134 yield self.failUnlessFailure(queue.put("abc"), NoNodeException)
135
136 @inlineCallbacks
137 def test_put_with_invalid_queue(self):
138 """
139 If the queue hasn't been created, an unknown node exception is raised
140 on put.
141 """
142 client = yield self.open_client()
143 queue = self.queue_factory("/unused", client)
144 yield self.failUnlessFailure(queue.put("abc"), NoNodeException)
145
146 @inlineCallbacks
147 def test_unexpected_error_during_item_retrieval(self):
148 """
149 If an unexpected error occurs when reserving an item, the error is
150 passed up to the get deferred's errback method.
151 """
152 test_client = yield self.open_client()
153 path = yield test_client.create("/reliable-queue-test")
154
155 # setup the test scenario
156 mock_client = self.mocker.patch(test_client)
157 mock_client.get_children(path, ANY)
158 self.mocker.result(succeed(["entry-000000"]))
159
160 item_path = "%s/%s"%(path, "entry-000000")
161 mock_client.get(item_path)
162 self.mocker.result(fail(SyntaxError("x")))
163 self.mocker.replay()
164
165 # odd behavior, this should return a failure, as above, but it returns
166 # None
167 d = self.queue_factory(path, mock_client).get()
168 assert d
169 self.failUnlessFailure(d, SyntaxError)
170 yield d
171
172 @inlineCallbacks
173 def test_get_and_put(self):
174 """
175 Get can also be used on empty queues and returns a deferred that fires
176 whenever an item has been retrieved from the queue.
177 """
178 client = yield self.open_client()
179 path = yield client.create("/queue-wait-test")
180 data = "zebra moon"
181 queue = self.queue_factory(path, client)
182 d = queue.get()
183
184 @inlineCallbacks
185 def push_item():
186 queue = self.queue_factory(path, client)
187 yield queue.put(data)
188
189 from twisted.internet import reactor
190 reactor.callLater(0.1, push_item)
191
192 item = yield d
193 self.compare_data(data, item)
194
195 @inlineCallbacks
196 def test_interleaved_multiple_consumers_wait(self):
197 """
198 Multiple consumers and a producer adding and removing items on the
199 queue concurrently.
200 """
201 test_client = yield self.open_client()
202 path = yield test_client.create("/multi-consumer-wait-test")
203 results = []
204
205 @inlineCallbacks
206 def producer(item_count):
207 from twisted.internet import reactor
208 client = yield self.open_client()
209 queue = self.queue_factory(path, client)
210
211 items = []
212 producer_done = Deferred()
213
214 def iteration(i):
215 if len(items) == (item_count-1):
216 return producer_done.callback(None)
217 items.append(i)
218 queue.put(str(i))
219
220 for i in range(item_count):
221 reactor.callLater(i*0.05, iteration, i)
222 yield producer_done
223 returnValue(items)
224
225 @inlineCallbacks
226 def consumer(item_count):
227 client = yield self.open_client()
228 queue = self.queue_factory(path, client)
229 for i in range(item_count):
230 try:
231 data = yield queue.get()
232 d, data = self.consume_item(data)
233 if d:
234 yield d
235 except NotConnectedException:
236 # when the test closes, we need to catch this
237 # as one of the producers will likely hang.
238 returnValue(len(results))
239 results.append((client.handle, data))
240
241 returnValue(len(results))
242
243 yield DeferredList(
244 [DeferredList([consumer(3), consumer(2)], fireOnOneCallback=1),
245 producer(6)])
246 # As soon as the producer and either consumer are complete, the test
247 # is done. Thus the only assertion we can make is that the result is
248 # at least the size of the smallest consumer.
249 self.assertTrue(len(results) >= 2)
250
251 @inlineCallbacks
252 def test_staged_multiproducer_multiconsumer(self):
253 """
254 A real world scenario test: a set of producers filling a queue with
255 items, and then a set of concurrent consumers pulling from the queue
256 till it's empty. The consumers use a non blocking get (the deferred
257 raises an exception on empty).
258 """
259 test_client = yield self.open_client()
260 path = yield test_client.create("/multi-prod-cons")
261
262 consume_results = []
263 produce_results = []
264
265 @inlineCallbacks
266 def producer(start, offset):
267 client = yield self.open_client()
268 q = self.queue_factory(path, client)
269 for i in range(start, start+offset):
270 yield q.put(str(i))
271 produce_results.append(str(i))
272
273 @inlineCallbacks
274 def consumer(max):
275 client = yield self.open_client()
276 q = self.queue_factory(path, client)
277 attempts = range(max)
278 for el in attempts:
279 value = yield q.get()
280 d, value = self.consume_item(value)
281 if d:
282 yield d
283 consume_results.append(value)
284 returnValue(True)
285
286 # two producers 20 items total
287 yield DeferredList(
288 [producer(0, 10), producer(10, 10)])
289
290 children = yield test_client.get_children(path)
291 self.assertEqual(len(children), 20)
292
293 yield DeferredList(
294 [consumer(8), consumer(8), consumer(4)])
295
296 err = set(produce_results)-set(consume_results)
297 self.assertFalse(err)
298
299 self.assertEqual(len(consume_results), len(produce_results))
300
301
302class ReliableQueueTests(QueueTests):
303
304 queue_factory = ReliableQueue
305
306 @inlineCallbacks
307 def test_unprocessed_item_reappears(self):
308 """
309 If a queue consumer exits before processing an item, then
310 the item will become visible to other queue consumers.
311 """
312 test_client = yield self.open_client()
313 path = yield test_client.create("/reliable-queue-test")
314
315 data = "rabbit stew"
316 queue = self.queue_factory(path, test_client)
317 yield queue.put(data)
318
319 test_client2 = yield self.open_client()
320 queue2 = self.queue_factory(path, test_client2)
321 item = yield queue2.get()
322 self.compare_data(data, item)
323
324 d = queue.get()
325 yield test_client2.close()
326
327 item = yield d
328 self.compare_data(data, item)
329
330 @inlineCallbacks
331 def test_processed_item_removed(self):
332 """
333 If a client processes an item, then that item is removed from the queue
334 permanently.
335 """
336 test_client = yield self.open_client()
337 path = yield test_client.create("/reliable-queue-test")
338
339 data = "rabbit stew"
340 queue = self.queue_factory(path, test_client)
341 yield queue.put(data)
342 item = yield queue.get()
343 self.compare_data(data, item)
344 yield item.delete()
345 yield test_client.close()
346
347 test_client2 = yield self.open_client()
348 children = yield test_client2.get_children(path)
349 children = [c for c in children if c.startswith(queue.prefix)]
350 self.assertFalse(bool(children))
351
352
353class SerializedQueueTests(ReliableQueueTests):
354
355 queue_factory = SerializedQueue
356
357 @inlineCallbacks
358 def test_serialized_behavior(self):
359 """
360 The serialized queue behavior is such that even with multiple
361 consumers, items are processed in order.
362 """
363 test_client = yield self.open_client()
364 path = yield test_client.create("/serialized-queue-test")
365
366 queue = self.queue_factory(path, test_client, persistent=True)
367
368 yield queue.put("a")
369 yield queue.put("b")
370
371 test_client2 = yield self.open_client()
372 queue2 = self.queue_factory(path, test_client2, persistent=True)
373
374 d = queue2.get()
375
376 def on_get_item_sleep_and_close(item):
377 """Close the connection after we have the item."""
378 from twisted.internet import reactor
379 reactor.callLater(0.1, test_client2.close)
380 return item
381
382 d.addCallback(on_get_item_sleep_and_close)
383
384 # fetch the item from queue2
385 item1 = yield d
386 # fetch the item from queue1, this will not get "b", because client2 is
387 # still processing "a". When client2 closes its connection, client1
388 # will get item "a"
389 item2 = yield queue.get()
390
391 self.compare_data("a", item2)
392 self.assertEqual(item1.data, item2.data)
393
=== modified file 'txzookeeper/todo.txt'
--- txzookeeper/todo.txt 2010-05-08 12:14:56 +0000
+++ txzookeeper/todo.txt 2010-07-09 19:52:57 +0000
@@ -2,10 +2,10 @@
2 bugs to file upstream
3
4  - you can set acl on a non-existent node.
5  - memory leak every api invocation. [really? need some measurements here]
6
7  observed while trying xtest_get_children_with_watcher
8
9  - async get children with watcher seems broken. [772 - fixed upstream]
10  - segfault if close during completion.
11  - getting a watch notification when closing a connection, segfaults.
