1
=== modified file 'bin/apport-unpack'
2
--- bin/apport-unpack	2012-05-04 06:54:56 +0000
3
+++ bin/apport-unpack	2015-02-02 14:38:34 +0000
4
@@ -49,18 +49,27 @@
5
49
except OSError as e:
49
except OSError as e:
6
50
    fatal(str(e))
50
    fatal(str(e))
7
51
51
8
52
bin_keys = []
9
52
pr = problem_report.ProblemReport()
53
pr = problem_report.ProblemReport()
10
53
if report == '-':
54
if report == '-':
12
54
    pr.load(sys.stdin)
55
    pr.load(sys.stdin, binary=False)
13
55
else:
56
else:
14
56
    try:
57
    try:
15
57
        with open(report, 'rb') as f:
58
        with open(report, 'rb') as f:
17
58
            pr.load(f)
59
            pr.load(f, binary=False)
18
59
    except IOError as e:
60
    except IOError as e:
19
60
        fatal(str(e))
61
        fatal(str(e))
20
61
for k in pr:
62
for k in pr:
21
63
    if pr[k] == '':
22
64
        bin_keys.append(k)
23
65
        continue
24
62
    with open(os.path.join(dir, k), 'wb') as f:
66
    with open(os.path.join(dir, k), 'wb') as f:
25
63
        if type(pr[k]) == t_str:
67
        if type(pr[k]) == t_str:
26
64
            f.write(pr[k].encode('UTF-8'))
68
            f.write(pr[k].encode('UTF-8'))
27
65
        else:
69
        else:
28
66
            f.write(pr[k])
70
            f.write(pr[k])
29
71
try:
30
72
    with open(report, 'rb') as f:
31
73
        pr.extract_keys(f, bin_keys, dir)
32
74
except IOError as e:
33
75
    fatal(str(e))
34
67
76
35
=== modified file 'problem_report.py'
36
--- problem_report.py	2013-09-19 14:26:33 +0000
37
+++ problem_report.py	2015-02-02 14:38:34 +0000
38
@@ -188,6 +188,72 @@
39
188
188
40
189
        self.old_keys = set(self.data.keys())
189
        self.old_keys = set(self.data.keys())
41
190
190
42
191
    def extract_keys(self, file, bin_keys, dir):
        '''Extract binary elements of a report directly into files.

        Binary elements can be very big (e. g. kernel crash dumps) and
        saturate the RAM, so they are decoded and decompressed line by
        line and written to dir/<key> without loading the report
        beforehand.

        file is an iterable of report lines as bytes (it is passed to
        _assert_bin_mode() first). bin_keys is a key name or a list of
        key names; dir is the directory the output files are created in.

        Raise KeyError if a requested key is not in the report,
        ValueError if a requested key is not a base64 encoded field, and
        IOError if an output file cannot be created.
        '''
        self._assert_bin_mode(file)
        if not isinstance(bin_keys, list):
            bin_keys = [bin_keys]
        # requested key -> seen in the report?
        has_key = dict((wanted, False) for wanted in bin_keys)
        # requested key found in the report -> is it a base64 field?
        b64_block = {}

        # A single explicit iterator is shared by the scanning loop and
        # the extraction loop, so reaching the end of the file in either
        # of them terminates the whole method.
        lines = iter(file)
        line = next(lines, None)
        while line is not None:
            is_b64 = False
            if not line.startswith(b' '):
                # "Key: value" line; continuation lines of fields we are
                # not extracting are simply skipped
                (key, value) = line.split(b':', 1)
                if not isinstance(key, str):
                    # bytes is not str on Python 3; on Python 2 it is
                    # and the key is used as is
                    key = key.decode('ASCII')
                if key in has_key:
                    has_key[key] = True
                    is_b64 = value.strip() == b'base64'
                    b64_block[key] = is_b64
            if not is_b64:
                line = next(lines, None)
                continue

            path = os.path.join(dir, key)
            # only the open() is guarded, so that later write errors
            # keep their own message
            try:
                out = open(path, 'wb')
            except IOError:
                raise IOError('unable to open %s' % path)
            with out:
                bd = None
                # stays None if the file ends inside this field
                line = None
                for candidate in lines:
                    if not candidate.startswith(b' '):
                        # first line of the next field: hand it back to
                        # the scanning loop
                        line = candidate
                        break
                    chunk = base64.b64decode(candidate)
                    if bd is None:
                        # lazy initialization of bd
                        if chunk.startswith(b'\037\213\010'):
                            # gzip format: skip the header, the payload
                            # is decompressed without zlib framing
                            bd = zlib.decompressobj(-zlib.MAX_WBITS)
                            chunk = self._strip_gzip_header(chunk)
                        else:
                            # legacy zlib-only format used default block
                            # size
                            bd = zlib.decompressobj()
                    out.write(bd.decompress(chunk))
                if bd is not None:
                    # emit anything the decompressor is still buffering
                    out.write(bd.flush())

        if False in has_key.values():
            raise KeyError('Cannot find %s in report' %
                           [item for item, element in has_key.items() if element is False])
        if False in b64_block.values():
            raise ValueError('%s has no binary content' %
                             [item for item, element in b64_block.items() if element is False])
107
256
108
191
    def has_removed_fields(self):
257
    def has_removed_fields(self):
109
192
        '''Check if the report has any keys which were not loaded.
258
        '''Check if the report has any keys which were not loaded.
110
193
259
111
194
260
112
=== modified file 'test/test_problem_report.py'
113
--- test/test_problem_report.py	2012-10-11 05:56:35 +0000
114
+++ test/test_problem_report.py	2015-02-02 14:38:34 +0000
115
@@ -1,5 +1,5 @@
116
1
# vim: set encoding=UTF-8 fileencoding=UTF-8 :
1
# vim: set encoding=UTF-8 fileencoding=UTF-8 :
118
2
import unittest, tempfile, os, email, gzip, time, sys
2
import unittest, tempfile, os, shutil, email, gzip, time, sys
119
3
3
120
4
from io import BytesIO
4
from io import BytesIO
121
5
import problem_report
5
import problem_report
122
@@ -12,6 +12,14 @@
123
12
12
124
13
13
125
14
class T(unittest.TestCase):
14
class T(unittest.TestCase):
126
15
    def setUp(self):
        '''Create a scratch directory for the files a test writes.'''
        # per-test fixture: stored on the instance, not on the class, so
        # that tests never share (or clobber) each other's directory
        self.workdir = tempfile.mkdtemp()

    def tearDown(self):
        '''Remove the scratch directory created by setUp().'''
        shutil.rmtree(self.workdir)
133
22
134
15
    def test_basic_operations(self):
23
    def test_basic_operations(self):
135
16
        '''basic creation and operation.'''
24
        '''basic creation and operation.'''
136
17
25
137
@@ -258,6 +266,52 @@
138
258
        pr.load(BytesIO(b'ProblemType: Crash'))
266
        pr.load(BytesIO(b'ProblemType: Crash'))
139
259
        self.assertEqual(list(pr.keys()), ['ProblemType'])
267
        self.assertEqual(list(pr.keys()), ['ProblemType'])
140
260
268
141
269
    def test_extract_keys(self):
        '''extract_keys() with various binary elements.'''

        # create a test report with binary elements
        large_val = b'A' * 5000000
        multiline_val = b'\1\1\1\n\2\2\n\3\3\3'

        pr = problem_report.ProblemReport()
        pr['Txt'] = 'some text'
        pr['MoreTxt'] = 'some more text'
        pr['Foo'] = problem_report.CompressedValue(b'FooFoo!')
        pr['Uncompressed'] = bin_data
        pr['Bin'] = problem_report.CompressedValue()
        pr['Bin'].set_value(bin_data)
        pr['Large'] = problem_report.CompressedValue(large_val)
        pr['Multiline'] = problem_report.CompressedValue(multiline_val)

        report = BytesIO()
        pr.write(report)
        report.seek(0)

        # a target directory that does not exist must raise IOError
        self.assertRaises(IOError, pr.extract_keys, report, 'Bin', '{}/foo'.format(self.workdir))

        # Test exception handling: non-binary and nonexistent keys.
        # This is a list of pairs rather than a dict keyed by exception
        # type: a dict literal keeps only the last value of a repeated
        # key, which would silently drop half of the cases.
        failures = [(ValueError, 'Txt'), (ValueError, ['Foo', 'Txt']),
                    (KeyError, 'Bar'), (KeyError, ['Foo', 'Bar'])]
        for (expected, keys) in failures:
            report.seek(0)
            self.assertRaises(expected, pr.extract_keys, report, keys, self.workdir)

        # Check valid single elements
        singles = {'Foo': b'FooFoo!', 'Uncompressed': bin_data, 'Bin': bin_data,
                   'Large': large_val, 'Multiline': multiline_val}
        for (key, expected) in singles.items():
            report.seek(0)
            pr.extract_keys(report, key, self.workdir)
            extracted = os.path.join(self.workdir, key)
            with open(extracted, 'rb') as element:
                self.assertEqual(element.read(), expected)
            # remove file for next pass
            os.remove(extracted)

        # Check element list
        report.seek(0)
        key_list = ['Foo', 'Uncompressed']
        expected_values = {'Foo': b'FooFoo!', 'Uncompressed': bin_data}
        pr.extract_keys(report, key_list, self.workdir)
        for key in key_list:
            with open(os.path.join(self.workdir, key), 'rb') as element:
                self.assertEqual(element.read(), expected_values[key])
186
314
187
261
    def test_write_file(self):
315
    def test_write_file(self):
188
262
        '''writing a report with binary file data.'''
316
        '''writing a report with binary file data.'''
189
263
317
Status:	Merged
Merged at revision:	2896
Proposed branch:	lp:~louis/apport/apport-unpack-extract
Merge into:	lp:~apport-hackers/apport/trunk
Diff against target:	188 lines (+132/-3) 3 files modified bin/apport-unpack (+11/-2) problem_report.py (+66/-0) test/test_problem_report.py (+55/-1)
To merge this branch:	bzr merge lp:~louis/apport/apport-unpack-extract
Related bugs:	Link a bug report
Reviewer	Review Type	Date Requested	Status
Martin Pitt (community)		2015-01-26	Approve on 2015-02-05
Review via email: mp+247591@code.launchpad.net