Merge lp:~jameinel/bzr/1.16-commit-fulltext into lp:~bzr/bzr/trunk-old

Proposed by John A Meinel
Status: Superseded
Proposed branch: lp:~jameinel/bzr/1.16-commit-fulltext
Merge into: lp:~bzr/bzr/trunk-old
Diff against target: 485 lines
To merge this branch: bzr merge lp:~jameinel/bzr/1.16-commit-fulltext
Reviewer: bzr-core (review pending)
Review via email: mp+6988@code.launchpad.net

This proposal has been superseded by a proposal from 2009-06-04.

John A Meinel (jameinel) wrote :

This branch adds a new api, VersionedFiles.add_text(). If people really want, I could change it to VF.add_chunks(), but add_text() fits what I needed, and was expedient.

The main effect is to change 'bzr commit' to use file.read() rather than file.readlines(), and then to pass that on to VF.add_text() rather than VF.add_lines().

It also removes some of the code paths that were repeatedly copying the in-memory structures. It doesn't completely remove the need for a list of lines during Knit commit, but it *does* remove it during --dev6 commit.
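
Concretely, the commit-side change looks like this (a condensed sketch of the CommitBuilder hunk in the diff at the end of this page):

    file_obj, stat_value = tree.get_file_with_stat(ie.file_id, path)
    try:
        text = file_obj.read()       # was: lines = file_obj.readlines()
    finally:
        file_obj.close()
    ie.text_sha1, ie.text_size = self._add_text_to_weave(
        ie.file_id, text, heads, nostore_sha)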

To test this, I created a 90MB file, which consists mostly of 20-byte strings with no final newline. I then did:

    rm -rf .bzr; bzr init --format=X; bzr add; time bzr commit -Dmemory -m "bigfile"

For --pack-0.92:
  pre:  469,748 kB, 5.554s
  post: 360,836 kB, 4.789s

For --development6-rich-root:
  pre:  589,732 kB, 7.785s
  post: 348,796 kB, 5.803s

So it is both faster and smaller, though I still need to explore why --dev6 isn't more memory friendly. It seems to be because of the DeltaIndex structures that are part of GroupCompress blocks. It might be worthwhile to avoid creating those on the first insert into a new group. (For the 90MB file, it seems to allocate 97MB for the 'loose' index, and then packs that into a 134MB index that has empty slots.)

Robert Collins (lifeless) wrote :

On Tue, 2009-06-02 at 20:50 +0000, John A Meinel wrote:
> John A Meinel has proposed merging lp:~jameinel/bzr/1.16-commit-fulltext into lp:bzr.
>
> Requested reviews:
> bzr-core (bzr-core)
>
> This branch adds a new api, VersionedFiles.add_text(). If people really want, I could change it to VF.add_chunks(), but add_text() fits what I needed, and was expedient.

Is it at all possible to use insert_record_stream?

I'd really like to shrink the VF surface area, not increase it.

-Rob

John A Meinel (jameinel) wrote :

Robert Collins wrote:
> On Tue, 2009-06-02 at 20:50 +0000, John A Meinel wrote:
>> John A Meinel has proposed merging lp:~jameinel/bzr/1.16-commit-fulltext into lp:bzr.
>>
>> Requested reviews:
>> bzr-core (bzr-core)
>>
>> This branch adds a new api, VersionedFiles.add_text(). If people really want, I could change it to VF.add_chunks(), but add_text() fits what I needed, and was expedient.
>
> Is it at all possible to use insert_record_stream?
>
> I'd really like to shrink the VF surface area, not increase it.
>
> -Rob
>

Not trivially.

1) It is an incompatible api change to insert_record_stream

2) It requires setting up a FulltextContentFactory and passing in a
stream of 1 entry just to add a text, which isn't particularly nice
(see the sketch after this list).

3) It requires adding lots of parameters like 'nostore_sha', and
'random_id', etc, onto insert_record_stream

4) It requires rewriting the internals of
KnitVersionedFiles.insert_record_stream to *not* thunk back to
self.add_lines(chunks_to_lines(record.get_bytes_as('chunked')))

5) nostore_sha especially doesn't fit with the theology of
insert_record_stream. It is really only applicable to a single text, and
insert_record_stream is really designed around many texts. Wedging new
parameters onto a function where it doesn't really fit doesn't seem
*better*.

6) As for VF surface area, there is at least a default implementation
that simply thunks over to .add_lines() for those that don't strictly
care about memory performance. (And thus works fine for Weaves, etc.)
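
As a concrete sketch, the new GroupCompressVersionedFiles.add_text() in
the diff below is itself just a thin wrapper over the *private*
record-stream insertion:

    length = len(text)
    record = FulltextContentFactory(key, parents, None, text)
    sha1 = list(self._insert_record_stream([record], random_id=random_id,
                                           nostore_sha=nostore_sha))[0]
    return sha1, length, None

So the question is really whether that wrapping belongs behind a public
method or at every call site.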

In theory we could try to layer it so that we had an 'ongoing' stream,
and 'yield' texts to be inserted as we find them. But that really
doesn't fit 'nostore_sha' since that also needs to be passed in, and
needs to raise an exception which breaks the stream.
Also, I thought we *wanted* commit for groupcompress to not have to do
deltas, and if we stream the texts in, we would spend a modest amount of
time getting poor compression between text files. (Note that we were
already spending that time to compute the delta index, but I have a
patch which fixes that.)

I can understand wanting to shrink the api. If you really push on it,
I'm willing to deprecate .add_lines() and write a .add_chunks() that is
meant to replace it. (since you can .add_chunks(lines) and
.add_chunks([text])) However, chunks fits slightly worse for knits,
since the Content code and annotation and deltas need lines anyway, and
Groupcompress wants fulltexts...
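
For what it's worth, a default add_chunks() could thunk to add_lines()
the same way the fallback add_text() in this patch does. A hypothetical
sketch, not code from this diff:

    def add_chunks(self, key, parents, chunks, **kwargs):
        # 'chunks' may be a list of lines or a one-element list holding
        # the full text; join and re-split so add_lines() sees real lines.
        return self.add_lines(key, parents,
                              osutils.split_lines(''.join(chunks)), **kwargs)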

So if you push hard, I'll try to find the time to do it. But this was
*much* easier.

John
=:->

Robert Collins (lifeless) wrote :

On Wed, 2009-06-03 at 03:00 +0000, John A Meinel wrote:
>
> Not trivially.
>
> 1) It is an incompatible api change to insert_record_stream

Yes. Doing this before 2.0 would be better than doing it later.

> 2) It requires setting up a FulltextContentFactory and passing in a
> stream of 1 entry just to add a text, which isn't particularly nice.

record_iter_changes would pass a generator into
texts.insert_record_stream.

e.g.:

    text_details = self.repository.texts.insert_record_stream(
        self._ric_texts, ...)
    for details in text_details:
        [...]

> 3) It requires adding lots of parameters like 'nostore_sha', and
> 'random_id', etc, onto insert_record_stream

or onto the factory. I'm not sure offhand where is best.

> 4) It requires rewriting the internals of
> KnitVersionedFiles.insert_record_stream to *not* thunk back to
> self.add_lines(chunks_to_lines(record.get_bytes_as('chunked')))

This is fairly straightforward: move add_lines to call
self.insert_record_stream appropriately - I did that for GCVF and it
worked well.

> 5) nostore_sha especially doesn't fit with the theology of
> insert_record_stream. It is really only applicable to a single text,
> and
> insert_record_stream is really designed around many texts. Wedging new
> parameters onto a function where it doesn't really fit doesn't seem
> *better*.

Agreed; so perhaps an attribute on the factory.
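
Purely as an illustration (not code from this patch), something like:

    record = FulltextContentFactory(key, parents, None, text)
    record.nostore_sha = nostore_sha  # hypothetical attribute the
                                      # inserting VF would check
    list(vf.insert_record_stream([record]))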

> 6) As for VF surface area, there is at least a default implementation
> that simply thunks over to .add_lines() for those that don't strictly
> care about memory performance. (And thus works fine for Weaves, etc.)

Well, I want to delete add_lines as it is.

> In theory we could try to layer it so that we had an 'ongoing' stream,
> and 'yield' texts to be inserted as we find them. But that really
> doesn't fit 'nostore_sha' since that also needs to be passed in, and
> needs to raise an exception which breaks the stream.

I'd yield data per record.

> Also, I thought we *wanted* commit for groupcompress to not have to do
> deltas, and if we stream the texts in, we would spend a modest amount
> of
> time getting poor compression between text files. (Note that we were
> already spending that time to compute the delta index, but I have a
> patch which fixes that.)

It would be good to measure it, actually... first commit, after all,
suffers hugely because every page in the CHKMap is add_text'd separately.

> I can understand wanting to shrink the api. If you really push on it,
> I'm willing to deprecate .add_lines() and write a .add_chunks() that
> is
> meant to replace it. (since you can .add_chunks(lines) and
> .add_chunks([text])) However, chunks fits slightly worse for knits,
> since the Content code and annotation and deltas need lines anyway,
> and
> Groupcompress wants fulltexts...
>
> So if you push hard, I'll try to find the time to do it. But this was
> *much* easier.

I think we're at the point of maturity in bzr that it makes sense to
spend a small amount of time saying 'what's the cleanest way to do X',
and then talk about how to get there.

At the moment, expanding VF's API doesn't seem desirable, or the best
way to be tackling the problem. I think there should be precisely one
way to add texts to a VF, and that should be as small and fast as we can
make it.

-Rob

John A Meinel (jameinel) wrote :

...

> I think we're at the point of maturity in bzr that it makes sense to
> spend a small amount of time saying 'what's the cleanest way to do X',
> and then talk about how to get there.
>
> At the moment, expanding VF's API doesn't seem desirable, or the best
> way to be tackling the problem. I think there should be precisely one
> way to add texts to a VF, and that should be as small and fast as we can
> make it.
>
> -Rob
>

We're also blocking on a fairly significant win *today* because of a
potential desire to rewrite a lot of code to make something slightly
cleaner. (Which is something that has been a misfeature of the bzr
project for a *long* time.)

I'm not saying we shouldn't do this, I'm just pointing out the issue.

*For now* I don't feel like rewriting the entire insert_record_stream
stack just to get this in. So I'll leave this pending for now. (More
important is to actually get GC stacking working over bzr+ssh, etc.)

I'm also not sure that getting rid of the "add_this_text_to_the_repo" is
really a net win. Having to write code like:
    vf.get_record_stream([one_key], 'unordered',
        True).next().get_bytes_as('fulltext')

just to get a single text out is ugly. Not to mention prone to raising
bad exceptions like "AbsentContentFactory has no attribute
.get_bytes_as()", rather than something sane like "NoSuchRevision".
Having to do the same thing during *insert* is just as ugly.

I know you wanted to push people towards multi requests, and I
understand why. I'm not sure that completely removing the convenience
functions is a complete solution, though.

John
=:->

Robert Collins (lifeless) wrote :

On Wed, 2009-06-03 at 13:36 +0000, John A Meinel wrote:

Meta: I'm really confused vis-a-vis reviews and blocking. All I've done
here is *ask* your opinion on reusing insert_record_stream and provided
answers to some of the technical issues you see with that. I haven't set
a review status of veto or resubmit - and I don't think I've signalled
in any way that I would. So I don't know why you're feeling blocked.

> > I think we're at the point of maturity in bzr that it makes sense to
> > spend a small amount of time saying 'what's the cleanest way to do X',
> > and then talk about how to get there.
> >
> > At the moment, expanding VF's API doesn't seem desirable, or the best
> > way to be tackling the problem. I think there should be precisely one
> > way to add texts to a VF, and that should be as small and fast as we can
> > make it.
> >
> > -Rob
> >
>
> We're also blocking on a fairly significant win *today* because of a
> potential desire to rewrite a lot of code to make something slightly
> cleaner. (Which is something that has been a misfeature of the bzr
> project for a *long* time.)

I think we often ask the question - and that's important. Sometimes the
answer is 'yes we should fix the deep issue' and sometimes it's 'let's do
it with the least possible changes'. Some things do get stuck, and that's
a shame - I've had that happen to concepts I've proposed, and seen it
happen to other people's ideas.

> I'm not saying we shouldn't do this, I'm just pointing out the issue.
>
> *For now* I don't feel like rewriting the entire insert_record_stream
> stack just to get this in. So I'll leave this pending for now. (More
> important is to actually get GC stacking working over bzr+ssh, etc.)

I think it would be a good idea to make the new method private then,
because of the open question hanging over it.

> I'm also not sure that getting rid of the "add_this_text_to_the_repo" is
> really a net win. Having to write code like:
> vf.get_record_stream([one_key], 'unordered',
> True).next().get_bytes_as('fulltext')
>
> just to get a single text out is ugly. Not to mention prone to raising
> bad exceptions like "AbsentContentFactory has no attribute
> .get_bytes_as()", rather than something sane like "NoSuchRevision".
> Having to do the same thing during *insert* is just as ugly.

And yet, single read/single write methods are terrible for networking,
and commit over the network is something we currently support - but
can't make even vaguely fast until commit no longer uses add_text_*. With
respect to exceptions, we actually do want different exceptions at
different places, so I think it has on balance cleaned some stuff up, in
fact.

> I know you wanted to push people towards multi requests, and I
> understand why. I'm not sure that completely removing the convenience
> functions is a complete solution, though.

I'd like us to get to the point where the core code doesn't do network
hostile things. Beyond that - well, I'm ok if plugins and library users
want to shoot themselves in the foot.

-Rob

Ian Clatworthy (ian-clatworthy) wrote :

Robert Collins wrote:
> On Wed, 2009-06-03 at 13:36 +0000, John A Meinel wrote:
>
>
>> We're also blocking on a fairly significant win *today* because of a
>> potential desire to rewrite a lot of code to make something slightly
>> cleaner. (Which is something that has been a misfeature of the bzr
>> project for a *long* time.)
>>

I agree this is a problem that we need to sort out. I occasionally put
and leave useful code in plugins simply because it can take weeks of
effort/debate to get APIs extended in bzrlib. If it only takes a few
hours to write the methods in the first place, it's more productive for
me to just leave the code out of the core and cut-and-paste it when I
need it again.

> I think we often ask the question - and that's important. Sometimes the
> answer is 'yes we should fix the deep issue' and sometimes it's 'let's do
> it with the least possible changes'. Some things do get stuck, and that's
> a shame - I've had that happen to concepts I've proposed, and seen it
> happen to other people's ideas.
>
>

I agree it's really important to ask the questions. That's the whole
point of reviews.

>> *For now* I don't feel like rewriting the entire insert_record_stream
>> stack just to get this in. So I'll leave this pending for now. (More
>> important is to actually get GC stacking working over bzr+ssh, etc.)
>>
>
> I think it would be a good idea to make the new method private then,
> because of the open question hanging over it.
>
>

That sounds like a reasonable compromise. The other way to look at the
problem though is this:

  "Is this new API a step forward with medium-to-long term value?"

> I'd like us to get to the point where the core code doesn't do network
> hostile things. Beyond that - well, I'm ok if plugins and library users
> want to shoot themselves in the foot.
>

Right. But there are genuine use cases for having easy-to-use,
appropriate-locally-only APIs, e.g. import tools. I see no problems with
having such APIs *provided* the docstrings point the reader to more
network-friendly alternatives.

FWIW, if John's proposed API is faster than the current commonly-used
one, then it sounds like a one-or-two line change to fast-import for me
to take advantage of it. I appreciate that you want fast-import moving
towards using CommitBuilder instead of its own CommitImporter class but
that's a much bigger change (and it's some time away).

Ian C.

Robert Collins (lifeless) wrote :

On Thu, 2009-06-04 at 04:09 +0000, Ian Clatworthy wrote:
> Robert Collins wrote:
> > On Wed, 2009-06-03 at 13:36 +0000, John A Meinel wrote:
> >
> >
> >> We're also blocking on a fairly significant win *today* because of a
> >> potential desire to rewrite a lot of code to make something slightly
> >> cleaner. (Which is something that has been a misfeature of the bzr
> >> project for a *long* time.)
> >>
>
> I agree this is a problem that we need to sort out. I occasionally put
> and leave useful code in plugins simply because it can take weeks of
> effort/debate to get APIs extended in bzrlib. If it only takes a few
> hours to write the methods in the first place, it's more productive for
> me to just leave the code out of the core and cut-and-paste it when I
> need it again.

We don't have a good place for experiments 'in core'. And one possible
answer is that we don't need one - that's what we have plugins for. For
instance, I note that your revno cache got rewritten to be significantly
different as you learnt more about the problem. I think this is healthy,
as long as you don't get blocked.

> >> *For now* I don't feel like rewriting the entire insert_record_stream
> >> stack just to get this in. So I'll leave this pending for now. (More
> >> important is to actually get GC stacking working over bzr+ssh, etc.)
> >>
> >
> > I think it would be a good idea to make the new method private then,
> > because of the open question hanging over it.
> >
> >
>
> That sounds like a reasonable compromise. The other way to look at the
> problem though is this:
>
> "Is this new API a step forward with medium-to-long term value?"

I think that's what the design aspect of the review seeks to answer; but
it's often hard to tell.

> > I'd like us to get to the point where the core code doesn't do network
> > hostile things. Beyond that - well, I'm ok if plugins and library users
> > want to shoot themselves in the foot.
> >
>
> Right. But there are genuine use cases for having easy-to-use,
> appropriate-locally-only APIs, e.g. import tools. I see no problems with
> having such APIs *provided* the docstrings point the reader to more
> network-friendly alternatives.

In this particular case I'd like to have them as adapters, such as a
module-level versionedfile.add_text():

    def add_text(versioned_files, bytes, ...):
        for details in versioned_files.insert_record_stream(
                [FulltextContentFactory(bytes, ...)]):
            return details

or whatever. That would separate them cleanly from the core API, prevent
them varying per implementation (easing testing) and make them not the
default way of working.

> FWIW, if John's proposed API is faster than the current commonly-used
> one, then it sounds like a one-or-two line change to fast-import for me
> to take advantage of it. I appreciate that you want fast-import moving
> towards using CommitBuilder instead of its own CommitImporter class but
> that's a much bigger change (and it's some time away).

I think it would be fine to use a private method in fast-import:
fast-import is trying for maximum speed, and you are keeping a close eye
on it.

-Rob

Preview Diff

=== modified file 'bzrlib/groupcompress.py'
--- bzrlib/groupcompress.py 2009-05-29 10:25:37 +0000
+++ bzrlib/groupcompress.py 2009-06-04 20:35:40 +0000
@@ -992,6 +992,26 @@
             nostore_sha=nostore_sha))[0]
         return sha1, length, None
 
+    def add_text(self, key, parents, text, parent_texts=None,
+                 nostore_sha=None, random_id=False,
+                 check_content=True):
+        """See VersionedFiles.add_text()."""
+        self._index._check_write_ok()
+        self._check_add(key, None, random_id, check_content=False)
+        if text.__class__ is not str:
+            raise errors.BzrBadParameterUnicode("text")
+        if parents is None:
+            # The caller might pass None if there is no graph data, but kndx
+            # indexes can't directly store that, so we give them
+            # an empty tuple instead.
+            parents = ()
+        # double handling for now. Make it work until then.
+        length = len(text)
+        record = FulltextContentFactory(key, parents, None, text)
+        sha1 = list(self._insert_record_stream([record], random_id=random_id,
+            nostore_sha=nostore_sha))[0]
+        return sha1, length, None
+
     def add_fallback_versioned_files(self, a_versioned_files):
         """Add a source of texts for texts not present in this knit.
 
@@ -1597,7 +1617,7 @@
                if refs:
                    for ref in refs:
                        if ref:
-                            raise KnitCorrupt(self,
+                            raise errors.KnitCorrupt(self,
                                "attempt to add node with parents "
                                "in parentless index.")
                    refs = ()
 
=== modified file 'bzrlib/knit.py'
--- bzrlib/knit.py 2009-05-29 10:25:37 +0000
+++ bzrlib/knit.py 2009-06-04 20:35:40 +0000
@@ -909,18 +909,37 @@
             # indexes can't directly store that, so we give them
             # an empty tuple instead.
             parents = ()
+        line_bytes = ''.join(lines)
         return self._add(key, lines, parents,
-            parent_texts, left_matching_blocks, nostore_sha, random_id)
+            parent_texts, left_matching_blocks, nostore_sha, random_id,
+            line_bytes=line_bytes)
+
+    def add_text(self, key, parents, text, parent_texts=None,
+                 nostore_sha=None, random_id=False,
+                 check_content=True):
+        """See VersionedFiles.add_text()."""
+        self._index._check_write_ok()
+        self._check_add(key, None, random_id, check_content=False)
+        if text.__class__ is not str:
+            raise errors.BzrBadParameterUnicode("text")
+        if parents is None:
+            # The caller might pass None if there is no graph data, but kndx
+            # indexes can't directly store that, so we give them
+            # an empty tuple instead.
+            parents = ()
+        return self._add(key, None, parents,
+            parent_texts, None, nostore_sha, random_id,
+            line_bytes=text)
 
     def _add(self, key, lines, parents, parent_texts,
-        left_matching_blocks, nostore_sha, random_id):
+        left_matching_blocks, nostore_sha, random_id,
+        line_bytes):
         """Add a set of lines on top of version specified by parents.
 
         Any versions not present will be converted into ghosts.
         """
         # first thing, if the content is something we don't need to store, find
         # that out.
-        line_bytes = ''.join(lines)
         digest = sha_string(line_bytes)
         if nostore_sha == digest:
             raise errors.ExistingContent
@@ -947,13 +966,22 @@
 
         text_length = len(line_bytes)
         options = []
-        if lines:
-            if lines[-1][-1] != '\n':
-                # copy the contents of lines.
+        no_eol = False
+        # Note: line_bytes is not modified to add a newline, that is tracked
+        # via the no_eol flag. 'lines' *is* modified, because that is the
+        # general values needed by the Content code.
+        if line_bytes and line_bytes[-1] != '\n':
+            options.append('no-eol')
+            no_eol = True
+            # Copy the existing list, or create a new one
+            if lines is None:
+                lines = osutils.split_lines(line_bytes)
+            else:
                 lines = lines[:]
-                options.append('no-eol')
+                # Replace the last line with one that ends in a final newline
                 lines[-1] = lines[-1] + '\n'
-            line_bytes += '\n'
+        if lines is None:
+            lines = osutils.split_lines(line_bytes)
 
         for element in key[:-1]:
             if type(element) != str:
@@ -965,7 +993,7 @@
         # Knit hunks are still last-element only
         version_id = key[-1]
         content = self._factory.make(lines, version_id)
-        if 'no-eol' in options:
+        if no_eol:
             # Hint to the content object that its text() call should strip the
             # EOL.
             content._should_strip_eol = True
@@ -986,8 +1014,11 @@
         if self._factory.__class__ is KnitPlainFactory:
             # Use the already joined bytes saving iteration time in
             # _record_to_data.
+            dense_lines = [line_bytes]
+            if no_eol:
+                dense_lines.append('\n')
             size, bytes = self._record_to_data(key, digest,
-                lines, [line_bytes])
+                lines, dense_lines)
         else:
             # get mixed annotation + content and feed it into the
             # serialiser.
@@ -1920,21 +1951,16 @@
         function spends less time resizing the final string.
         :return: (len, a StringIO instance with the raw data ready to read.)
         """
-        # Note: using a string copy here increases memory pressure with e.g.
-        # ISO's, but it is about 3 seconds faster on a 1.2Ghz intel machine
-        # when doing the initial commit of a mozilla tree. RBC 20070921
-        bytes = ''.join(chain(
-            ["version %s %d %s\n" % (key[-1],
-                                     len(lines),
-                                     digest)],
-            dense_lines or lines,
-            ["end %s\n" % key[-1]]))
-        if type(bytes) != str:
-            raise AssertionError(
-                'data must be plain bytes was %s' % type(bytes))
+        chunks = ["version %s %d %s\n" % (key[-1], len(lines), digest)]
+        chunks.extend(dense_lines or lines)
+        chunks.append("end %s\n" % key[-1])
+        for chunk in chunks:
+            if type(chunk) != str:
+                raise AssertionError(
+                    'data must be plain bytes was %s' % type(chunk))
         if lines and lines[-1][-1] != '\n':
             raise ValueError('corrupt lines value %r' % lines)
-        compressed_bytes = tuned_gzip.bytes_to_gzip(bytes)
+        compressed_bytes = tuned_gzip.chunks_to_gzip(chunks)
         return len(compressed_bytes), compressed_bytes
 
     def _split_header(self, line):
 
=== modified file 'bzrlib/repository.py'
--- bzrlib/repository.py 2009-06-03 21:31:43 +0000
+++ bzrlib/repository.py 2009-06-04 20:35:40 +0000
@@ -494,12 +494,12 @@
             ie.executable = content_summary[2]
             file_obj, stat_value = tree.get_file_with_stat(ie.file_id, path)
             try:
-                lines = file_obj.readlines()
+                text = file_obj.read()
             finally:
                 file_obj.close()
             try:
                 ie.text_sha1, ie.text_size = self._add_text_to_weave(
-                    ie.file_id, lines, heads, nostore_sha)
+                    ie.file_id, text, heads, nostore_sha)
                 # Let the caller know we generated a stat fingerprint.
                 fingerprint = (ie.text_sha1, stat_value)
             except errors.ExistingContent:
@@ -517,8 +517,7 @@
                 # carry over:
                 ie.revision = parent_entry.revision
                 return self._get_delta(ie, basis_inv, path), False, None
-            lines = []
-            self._add_text_to_weave(ie.file_id, lines, heads, None)
+            self._add_text_to_weave(ie.file_id, '', heads, None)
         elif kind == 'symlink':
             current_link_target = content_summary[3]
             if not store:
@@ -532,8 +531,7 @@
                 ie.symlink_target = parent_entry.symlink_target
                 return self._get_delta(ie, basis_inv, path), False, None
             ie.symlink_target = current_link_target
-            lines = []
-            self._add_text_to_weave(ie.file_id, lines, heads, None)
+            self._add_text_to_weave(ie.file_id, '', heads, None)
         elif kind == 'tree-reference':
             if not store:
                 if content_summary[3] != parent_entry.reference_revision:
@@ -544,8 +542,7 @@
                 ie.revision = parent_entry.revision
                 return self._get_delta(ie, basis_inv, path), False, None
             ie.reference_revision = content_summary[3]
-            lines = []
-            self._add_text_to_weave(ie.file_id, lines, heads, None)
+            self._add_text_to_weave(ie.file_id, '', heads, None)
         else:
             raise NotImplementedError('unknown kind')
         ie.revision = self._new_revision_id
@@ -745,7 +742,7 @@
                         entry.executable = True
                     else:
                         entry.executable = False
-                    if (carry_over_possible and 
+                    if (carry_over_possible and
                         parent_entry.executable == entry.executable):
                             # Check the file length, content hash after reading
                             # the file.
@@ -754,12 +751,12 @@
                         nostore_sha = None
                     file_obj, stat_value = tree.get_file_with_stat(file_id, change[1][1])
                     try:
-                        lines = file_obj.readlines()
+                        text = file_obj.read()
                     finally:
                         file_obj.close()
                     try:
                         entry.text_sha1, entry.text_size = self._add_text_to_weave(
-                            file_id, lines, heads, nostore_sha)
+                            file_id, text, heads, nostore_sha)
                         yield file_id, change[1][1], (entry.text_sha1, stat_value)
                     except errors.ExistingContent:
                         # No content change against a carry_over parent
@@ -774,7 +771,7 @@
                         parent_entry.symlink_target == entry.symlink_target):
                         carried_over = True
                     else:
-                        self._add_text_to_weave(change[0], [], heads, None)
+                        self._add_text_to_weave(change[0], '', heads, None)
                 elif kind == 'directory':
                     if carry_over_possible:
                         carried_over = True
@@ -782,7 +779,7 @@
                         # Nothing to set on the entry.
                         # XXX: split into the Root and nonRoot versions.
                         if change[1][1] != '' or self.repository.supports_rich_root():
-                            self._add_text_to_weave(change[0], [], heads, None)
+                            self._add_text_to_weave(change[0], '', heads, None)
                 elif kind == 'tree-reference':
                     if not self.repository._format.supports_tree_reference:
                         # This isn't quite sane as an error, but we shouldn't
@@ -797,7 +794,7 @@
                         parent_entry.reference_revision == reference_revision):
                         carried_over = True
                     else:
-                        self._add_text_to_weave(change[0], [], heads, None)
+                        self._add_text_to_weave(change[0], '', heads, None)
                 else:
                     raise AssertionError('unknown kind %r' % kind)
                 if not carried_over:
@@ -818,15 +815,15 @@
             self._require_root_change(tree)
         self.basis_delta_revision = basis_revision_id
 
-    def _add_text_to_weave(self, file_id, new_lines, parents, nostore_sha):
+    def _add_text_to_weave(self, file_id, new_text, parents, nostore_sha):
         # Note: as we read the content directly from the tree, we know its not
         # been turned into unicode or badly split - but a broken tree
         # implementation could give us bad output from readlines() so this is
         # not a guarantee of safety. What would be better is always checking
         # the content during test suite execution. RBC 20070912
         parent_keys = tuple((file_id, parent) for parent in parents)
-        return self.repository.texts.add_lines(
-            (file_id, self._new_revision_id), parent_keys, new_lines,
+        return self.repository.texts.add_text(
+            (file_id, self._new_revision_id), parent_keys, new_text,
             nostore_sha=nostore_sha, random_id=self.random_revid,
             check_content=False)[0:2]
 
 
=== modified file 'bzrlib/tests/test_tuned_gzip.py'
--- bzrlib/tests/test_tuned_gzip.py 2009-03-23 14:59:43 +0000
+++ bzrlib/tests/test_tuned_gzip.py 2009-06-04 20:35:40 +0000
@@ -85,3 +85,28 @@
         self.assertEqual('', stream.read())
         # and it should be new member time in the stream.
         self.failUnless(myfile._new_member)
+
+
+class TestToGzip(TestCase):
+
+    def assertToGzip(self, chunks):
+        bytes = ''.join(chunks)
+        gzfromchunks = tuned_gzip.chunks_to_gzip(chunks)
+        gzfrombytes = tuned_gzip.bytes_to_gzip(bytes)
+        self.assertEqual(gzfrombytes, gzfromchunks)
+        decoded = tuned_gzip.GzipFile(fileobj=StringIO(gzfromchunks)).read()
+        self.assertEqual(bytes, decoded)
+
+    def test_single_chunk(self):
+        self.assertToGzip(['a modest chunk\nwith some various\nbits\n'])
+
+    def test_simple_text(self):
+        self.assertToGzip(['some\n', 'strings\n', 'to\n', 'process\n'])
+
+    def test_large_chunks(self):
+        self.assertToGzip(['a large string\n'*1024])
+        self.assertToGzip(['a large string\n']*1024)
+
+    def test_enormous_chunks(self):
+        self.assertToGzip(['a large string\n'*1024*256])
+        self.assertToGzip(['a large string\n']*1024*256)
 
=== modified file 'bzrlib/tests/test_versionedfile.py'
--- bzrlib/tests/test_versionedfile.py 2009-05-01 18:09:24 +0000
+++ bzrlib/tests/test_versionedfile.py 2009-06-04 20:35:40 +0000
@@ -1471,6 +1471,58 @@
         self.addCleanup(lambda:self.cleanup(files))
         return files
 
+    def test_add_lines(self):
+        f = self.get_versionedfiles()
+        if self.key_length == 1:
+            key0 = ('r0',)
+            key1 = ('r1',)
+            key2 = ('r2',)
+            keyf = ('foo',)
+        else:
+            key0 = ('fid', 'r0')
+            key1 = ('fid', 'r1')
+            key2 = ('fid', 'r2')
+            keyf = ('fid', 'foo')
+        f.add_lines(key0, [], ['a\n', 'b\n'])
+        if self.graph:
+            f.add_lines(key1, [key0], ['b\n', 'c\n'])
+        else:
+            f.add_lines(key1, [], ['b\n', 'c\n'])
+        keys = f.keys()
+        self.assertTrue(key0 in keys)
+        self.assertTrue(key1 in keys)
+        records = []
+        for record in f.get_record_stream([key0, key1], 'unordered', True):
+            records.append((record.key, record.get_bytes_as('fulltext')))
+        records.sort()
+        self.assertEqual([(key0, 'a\nb\n'), (key1, 'b\nc\n')], records)
+
+    def test_add_text(self):
+        f = self.get_versionedfiles()
+        if self.key_length == 1:
+            key0 = ('r0',)
+            key1 = ('r1',)
+            key2 = ('r2',)
+            keyf = ('foo',)
+        else:
+            key0 = ('fid', 'r0')
+            key1 = ('fid', 'r1')
+            key2 = ('fid', 'r2')
+            keyf = ('fid', 'foo')
+        f.add_text(key0, [], 'a\nb\n')
+        if self.graph:
+            f.add_text(key1, [key0], 'b\nc\n')
+        else:
+            f.add_text(key1, [], 'b\nc\n')
+        keys = f.keys()
+        self.assertTrue(key0 in keys)
+        self.assertTrue(key1 in keys)
+        records = []
+        for record in f.get_record_stream([key0, key1], 'unordered', True):
+            records.append((record.key, record.get_bytes_as('fulltext')))
+        records.sort()
+        self.assertEqual([(key0, 'a\nb\n'), (key1, 'b\nc\n')], records)
+
     def test_annotate(self):
         files = self.get_versionedfiles()
         self.get_diamond_files(files)
@@ -1520,7 +1572,7 @@
             trailing_eol=trailing_eol, nograph=not self.graph,
             left_only=left_only, nokeys=nokeys)
 
-    def test_add_lines_nostoresha(self):
+    def _add_content_nostoresha(self, add_lines):
         """When nostore_sha is supplied using old content raises."""
         vf = self.get_versionedfiles()
         empty_text = ('a', [])
@@ -1528,7 +1580,12 @@
         sample_text_no_nl = ('c', ["foo\n", "bar"])
         shas = []
         for version, lines in (empty_text, sample_text_nl, sample_text_no_nl):
-            sha, _, _ = vf.add_lines(self.get_simple_key(version), [], lines)
+            if add_lines:
+                sha, _, _ = vf.add_lines(self.get_simple_key(version), [],
+                                         lines)
+            else:
+                sha, _, _ = vf.add_text(self.get_simple_key(version), [],
+                                        ''.join(lines))
             shas.append(sha)
         # we now have a copy of all the lines in the vf.
         for sha, (version, lines) in zip(
@@ -1537,10 +1594,19 @@
             self.assertRaises(errors.ExistingContent,
                 vf.add_lines, new_key, [], lines,
                 nostore_sha=sha)
+            self.assertRaises(errors.ExistingContent,
+                vf.add_text, new_key, [], ''.join(lines),
+                nostore_sha=sha)
         # and no new version should have been added.
         record = vf.get_record_stream([new_key], 'unordered', True).next()
         self.assertEqual('absent', record.storage_kind)
 
+    def test_add_lines_nostoresha(self):
+        self._add_content_nostoresha(add_lines=True)
+
+    def test_add_text_nostoresha(self):
+        self._add_content_nostoresha(add_lines=False)
+
     def test_add_lines_return(self):
         files = self.get_versionedfiles()
         # save code by using the stock data insertion helper.
 
=== modified file 'bzrlib/tuned_gzip.py'
--- bzrlib/tuned_gzip.py 2009-03-23 14:59:43 +0000
+++ bzrlib/tuned_gzip.py 2009-06-04 20:35:40 +0000
@@ -52,6 +52,18 @@
                   width=-zlib.MAX_WBITS, mem=zlib.DEF_MEM_LEVEL,
                   crc32=zlib.crc32):
     """Create a gzip file containing bytes and return its content."""
+    return chunks_to_gzip([bytes])
+
+
+def chunks_to_gzip(chunks, factory=zlib.compressobj,
+                   level=zlib.Z_DEFAULT_COMPRESSION, method=zlib.DEFLATED,
+                   width=-zlib.MAX_WBITS, mem=zlib.DEF_MEM_LEVEL,
+                   crc32=zlib.crc32):
+    """Create a gzip file containing chunks and return its content.
+
+    :param chunks: An iterable of strings. Each string can have arbitrary
+        layout.
+    """
     result = [
         '\037\213' # self.fileobj.write('\037\213') # magic header
         '\010' # self.fileobj.write('\010') # compression method
@@ -69,11 +81,17 @@
     # using a compressobj avoids a small header and trailer that the compress()
     # utility function adds.
     compress = factory(level, method, width, mem, 0)
-    result.append(compress.compress(bytes))
+    crc = 0
+    total_len = 0
+    for chunk in chunks:
+        crc = crc32(chunk, crc)
+        total_len += len(chunk)
+        zbytes = compress.compress(chunk)
+        if zbytes:
+            result.append(zbytes)
     result.append(compress.flush())
-    result.append(struct.pack("<L", LOWU32(crc32(bytes))))
     # size may exceed 2GB, or even 4GB
-    result.append(struct.pack("<L", LOWU32(len(bytes))))
+    result.append(struct.pack("<LL", LOWU32(crc), LOWU32(total_len)))
     return ''.join(result)
 
 
 
=== modified file 'bzrlib/versionedfile.py'
--- bzrlib/versionedfile.py 2009-04-29 17:02:36 +0000
+++ bzrlib/versionedfile.py 2009-06-04 20:35:40 +0000
@@ -829,6 +829,14 @@
829 """829 """
830 raise NotImplementedError(self.add_lines)830 raise NotImplementedError(self.add_lines)
831831
832 def add_text(self, key, parents, text, parent_texts=None,
833 nostore_sha=None, random_id=False, check_content=True):
834 return self.add_lines(key, parents, osutils.split_lines(text),
835 parent_texts=parent_texts,
836 nostore_sha=nostore_sha,
837 random_id=random_id,
838 check_content=check_content)
839
832 def add_mpdiffs(self, records):840 def add_mpdiffs(self, records):
833 """Add mpdiffs to this VersionedFile.841 """Add mpdiffs to this VersionedFile.
834842