Merge lp:~lifeless/bzr/bug-514090 into lp:bzr/2.1

Proposed by Robert Collins
Status: Merged
Merged at revision: not available
Proposed branch: lp:~lifeless/bzr/bug-514090
Merge into: lp:bzr/2.1
Diff against target: 173 lines (+59/-20)
3 files modified
NEWS (+18/-0)
bzrlib/chk_map.py (+35/-14)
bzrlib/tests/test_chk_map.py (+6/-6)
To merge this branch: bzr merge lp:~lifeless/bzr/bug-514090
Reviewer: Martin Pool
Review status: Approve
Review via email: mp+18263@code.launchpad.net
Robert Collins (lifeless) wrote:

Yo. Thread race fixness FTW.

Martin Pool (mbp) wrote:

Makes sense as an emergency fix.

It would be nice to hang this off a specific object scope to be safer, or to rely on the app serializing access to a Repository.
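
For illustration, "hanging this off a specific object scope" might look roughly like the following sketch (hypothetical; RepositoryPageCache is an invented name, not part of this patch):

    from bzrlib import lru_cache

    _PAGE_CACHE_SIZE = 4*1024*1024

    class RepositoryPageCache(object):
        """Hypothetical page cache owned by one Repository-like object.

        Tying the cache to an object rather than to module-level state
        means its lifetime and visibility follow the owning object, so
        two threads only share a cache if they share the object.
        """

        def __init__(self, max_size=_PAGE_CACHE_SIZE):
            # We cache raw bytes, so len(value) sizes entries accurately.
            self._page_cache = lru_cache.LRUSizeCache(max_size)

        def __getitem__(self, key):
            return self._page_cache[key]  # KeyError on a miss

        def add(self, key, bytes):
            self._page_cache.add(key, bytes)

        def clear(self):
            self._page_cache.clear()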

review: Approve
Martin Packman (gz) wrote:

A small note: there's a long-standing bug in both mod_python and mod_wsgi where threading.local() objects only last for a single request:
<http://code.google.com/p/modwsgi/issues/detail?id=120>

I presume, however, that this doesn't affect Launchpad; at worst it would just make the cache useless.
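
The failure mode there should be quiet rather than crashy: a thread whose threading.local state was discarded just looks uninitialized, so the patch's _get_cache() would rebuild an empty cache on the next request. A simplified sketch of that behaviour (a plain dict stands in for the real LRUSizeCache):

    import threading

    _thread_caches = threading.local()

    def _get_cache():
        # In a brand-new thread, or one whose local state mod_wsgi threw
        # away between requests, the attribute is missing, so we silently
        # start over with an empty cache: still correct, just no reuse.
        cache = getattr(_thread_caches, 'page_cache', None)
        if cache is None:
            cache = {}
            _thread_caches.page_cache = cache
        return cache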

Robert Collins (lifeless) wrote:

We run with paste.deploy. Do you know if this affects that?

mod_wsgi being affected may cause this to hurt smart-server-over-http
users, but OTOH the cache shouldn't be very important between requests
anyway, as we try very hard to do all the heavy lifting in a single
smart verb.

Thanks a lot for mentioning this!

-Rob
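
For context, the race being fixed can be sketched with a hypothetical driver like this (illustrative only, not from the bzr test suite): several threads share the old module-level LRUSizeCache with no locking, so concurrent lookups and evictions can corrupt the LRU bookkeeping and surface as the KeyError described in the NEWS entry below.

    import threading
    from bzrlib import lru_cache

    # One small shared cache and no locks: the pre-patch situation.
    shared_cache = lru_cache.LRUSizeCache(10*1024)

    def worker():
        for i in range(100000):
            key = ('sha1:page-%d' % (i % 256),)
            try:
                shared_cache[key]
            except KeyError:
                # Another thread may be evicting entries right now; with
                # enough threads the unsynchronized LRU state can go bad
                # and raise KeyError from inside bzrlib.lru_cache.
                shared_cache[key] = 'x' * 64

    threads = [threading.Thread(target=worker) for _ in range(8)]
    for t in threads:
        t.start()
    for t in threads:
        t.join()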

Preview Diff

=== modified file 'NEWS'
--- NEWS 2010-01-29 09:13:30 +0000
+++ NEWS 2010-01-29 15:23:14 +0000
@@ -5,6 +5,24 @@
 .. contents:: List of Releases
    :depth: 1
 
+bzr 2.1.0 (not released yet)
+############################
+
+:Codename:
+:2.1.0:
+
+Bug Fixes
+*********
+
+* Using the ``bzrlib.chk_map`` module from within multiple threads at the
+  same time was broken due to race conditions with a module level page
+  cache. This shows up as a KeyError in the ``bzrlib.lru_cache`` code with
+  ``bzrlib.chk_map`` in the backtrace, and can be triggered without using
+  the same high level objects such as ``bzrlib.repository.Repository``
+  from different threads. chk_map now uses a thread local cache which may
+  increase memory pressure on processes using threads.
+  (Robert Collins, John Arbash Meinel, #514090)
+
 bzr 2.1.0rc2
 ############
 
 
=== modified file 'bzrlib/chk_map.py'
--- bzrlib/chk_map.py 2009-11-02 17:27:52 +0000
+++ bzrlib/chk_map.py 2010-01-29 15:23:14 +0000
@@ -38,6 +38,7 @@
 """
 
 import heapq
+import threading
 
 from bzrlib import lazy_import
 lazy_import.lazy_import(globals(), """
@@ -59,11 +60,31 @@
 # If each line is 50 bytes, and you have 255 internal pages, with 255-way fan
 # out, it takes 3.1MB to cache the layer.
 _PAGE_CACHE_SIZE = 4*1024*1024
-# We are caching bytes so len(value) is perfectly accurate
-_page_cache = lru_cache.LRUSizeCache(_PAGE_CACHE_SIZE)
+# Per thread caches for 2 reasons:
+# - in the server we may be serving very different content, so we get less
+#   cache thrashing.
+# - we avoid locking on every cache lookup.
+_thread_caches = threading.local()
+# The page cache.
+_thread_caches.page_cache = None
+
+def _get_cache():
+    """Get the per-thread page cache.
+
+    We need a function to do this because in a new thread the _thread_caches
+    threading.local object does not have the cache initialized yet.
+    """
+    page_cache = getattr(_thread_caches, 'page_cache', None)
+    if page_cache is None:
+        # We are caching bytes so len(value) is perfectly accurate
+        page_cache = lru_cache.LRUSizeCache(_PAGE_CACHE_SIZE)
+        _thread_caches.page_cache = page_cache
+    return page_cache
+
 
 def clear_cache():
-    _page_cache.clear()
+    _get_cache().clear()
+
 
 # If a ChildNode falls below this many bytes, we check for a remap
 _INTERESTING_NEW_SIZE = 50
@@ -161,11 +182,11 @@
 
     def _read_bytes(self, key):
         try:
-            return _page_cache[key]
+            return _get_cache()[key]
         except KeyError:
             stream = self._store.get_record_stream([key], 'unordered', True)
             bytes = stream.next().get_bytes_as('fulltext')
-            _page_cache[key] = bytes
+            _get_cache()[key] = bytes
             return bytes
 
     def _dump_tree(self, include_keys=False):
@@ -901,7 +922,7 @@
         bytes = ''.join(lines)
         if len(bytes) != self._current_size():
             raise AssertionError('Invalid _current_size')
-        _page_cache.add(self._key, bytes)
+        _get_cache().add(self._key, bytes)
         return [self._key]
 
     def refs(self):
@@ -1143,7 +1164,7 @@
         found_keys = set()
         for key in keys:
             try:
-                bytes = _page_cache[key]
+                bytes = _get_cache()[key]
             except KeyError:
                 continue
             else:
@@ -1174,7 +1195,7 @@
                 prefix, node_key_filter = keys[record.key]
                 node_and_filters.append((node, node_key_filter))
                 self._items[prefix] = node
-                _page_cache.add(record.key, bytes)
+                _get_cache().add(record.key, bytes)
             for info in node_and_filters:
                 yield info
 
@@ -1300,7 +1321,7 @@
             lines.append(serialised[prefix_len:])
         sha1, _, _ = store.add_lines((None,), (), lines)
         self._key = StaticTuple("sha1:" + sha1,).intern()
-        _page_cache.add(self._key, ''.join(lines))
+        _get_cache().add(self._key, ''.join(lines))
         yield self._key
 
     def _search_key(self, key):
@@ -1489,11 +1510,11 @@
         self._state = None
 
     def _read_nodes_from_store(self, keys):
-        # We chose not to use _page_cache, because we think in terms of records
-        # to be yielded. Also, we expect to touch each page only 1 time during
-        # this code. (We may want to evaluate saving the raw bytes into the
-        # page cache, which would allow a working tree update after the fetch
-        # to not have to read the bytes again.)
+        # We chose not to use _get_cache(), because we think in
+        # terms of records to be yielded. Also, we expect to touch each page
+        # only 1 time during this code. (We may want to evaluate saving the
+        # raw bytes into the page cache, which would allow a working tree
+        # update after the fetch to not have to read the bytes again.)
         as_st = StaticTuple.from_sequence
         stream = self._store.get_record_stream(keys, 'unordered', True)
         for record in stream:
 
=== modified file 'bzrlib/tests/test_chk_map.py'
--- bzrlib/tests/test_chk_map.py 2009-10-21 20:53:21 +0000
+++ bzrlib/tests/test_chk_map.py 2010-01-29 15:23:14 +0000
@@ -905,7 +905,7 @@
         # Unmapping the new node will check the existing nodes to see if they
         # would fit.
         # Clear the page cache so we ensure we have to read all the children
-        chk_map._page_cache.clear()
+        chk_map.clear_cache()
         chkmap.unmap(('aad',))
         self.assertIsInstance(chkmap._root_node._items['aaa'], LeafNode)
         self.assertIsInstance(chkmap._root_node._items['aab'], LeafNode)
@@ -945,12 +945,12 @@
         # Now clear the page cache, and only include 2 of the children in the
         # cache
         aab_key = chkmap._root_node._items['aab']
-        aab_bytes = chk_map._page_cache[aab_key]
+        aab_bytes = chk_map._get_cache()[aab_key]
         aac_key = chkmap._root_node._items['aac']
-        aac_bytes = chk_map._page_cache[aac_key]
-        chk_map._page_cache.clear()
-        chk_map._page_cache[aab_key] = aab_bytes
-        chk_map._page_cache[aac_key] = aac_bytes
+        aac_bytes = chk_map._get_cache()[aac_key]
+        chk_map.clear_cache()
+        chk_map._get_cache()[aab_key] = aab_bytes
+        chk_map._get_cache()[aac_key] = aac_bytes
 
         # Unmapping the new node will check the nodes from the page cache
         # first, and not have to read in 'aaa'
