Merge lp:~gz/brz/py3_bencode into lp:brz

Proposed by Martin Packman
Status: Merged
Approved by: Martin Packman
Approved revision: no longer in the source branch.
Merge reported by: The Breezy Bot
Merged at revision: not available
Proposed branch: lp:~gz/brz/py3_bencode
Merge into: lp:brz
Diff against target: 396 lines (+127/-124)
2 files modified
breezy/tests/test__bencode.py (+91/-94)
breezy/util/_bencode_py.py (+36/-30)
To merge this branch: bzr merge lp:~gz/brz/py3_bencode
Reviewer | Review Type | Date Requested | Status
Jelmer Vernooij | | | Approve
Review via email: mp+325451@code.launchpad.net

Commit message

Make _bencode_py Python 3 compatible

Description of the change

It's b-time for b-encode.

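The only real thing of note is the annoyance of turning int(4) into b'4' on Python 3. There is also one change from x[0] to x[:1], so that the decode_func lookup keys are always one-character bytestrings rather than ints (indexing a bytes object on Python 3 yields an int, whereas slicing yields bytes).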

To post a comment you must log in.
Revision history for this message
Jelmer Vernooij (jelmer) :
review: Approve

Preview Diff

[H/L] Next/Prev Comment, [J/K] Next/Prev File, [N/P] Next/Prev Hunk
=== modified file 'breezy/tests/test__bencode.py'
--- breezy/tests/test__bencode.py 2017-05-23 14:08:03 +0000
+++ breezy/tests/test__bencode.py 2017-06-10 22:12:08 +0000
@@ -38,73 +38,73 @@
38 self.assertRaises(exc, self.module.bdecode, bad)38 self.assertRaises(exc, self.module.bdecode, bad)
3939
40 def test_int(self):40 def test_int(self):
41 self._check(0, 'i0e')41 self._check(0, b'i0e')
42 self._check(4, 'i4e')42 self._check(4, b'i4e')
43 self._check(123456789, 'i123456789e')43 self._check(123456789, b'i123456789e')
44 self._check(-10, 'i-10e')44 self._check(-10, b'i-10e')
45 self._check(int('1' * 1000), 'i' + ('1' * 1000) + 'e')45 self._check(int('1' * 1000), b'i' + (b'1' * 1000) + b'e')
4646
47 def test_long(self):47 def test_long(self):
48 self._check(12345678901234567890, 'i12345678901234567890e')48 self._check(12345678901234567890, b'i12345678901234567890e')
49 self._check(-12345678901234567890, 'i-12345678901234567890e')49 self._check(-12345678901234567890, b'i-12345678901234567890e')
5050
51 def test_malformed_int(self):51 def test_malformed_int(self):
52 self._run_check_error(ValueError, 'ie')52 self._run_check_error(ValueError, b'ie')
53 self._run_check_error(ValueError, 'i-e')53 self._run_check_error(ValueError, b'i-e')
54 self._run_check_error(ValueError, 'i-010e')54 self._run_check_error(ValueError, b'i-010e')
55 self._run_check_error(ValueError, 'i-0e')55 self._run_check_error(ValueError, b'i-0e')
56 self._run_check_error(ValueError, 'i00e')56 self._run_check_error(ValueError, b'i00e')
57 self._run_check_error(ValueError, 'i01e')57 self._run_check_error(ValueError, b'i01e')
58 self._run_check_error(ValueError, 'i-03e')58 self._run_check_error(ValueError, b'i-03e')
59 self._run_check_error(ValueError, 'i')59 self._run_check_error(ValueError, b'i')
60 self._run_check_error(ValueError, 'i123')60 self._run_check_error(ValueError, b'i123')
61 self._run_check_error(ValueError, 'i341foo382e')61 self._run_check_error(ValueError, b'i341foo382e')
6262
63 def test_string(self):63 def test_string(self):
64 self._check('', '0:')64 self._check(b'', b'0:')
65 self._check('abc', '3:abc')65 self._check(b'abc', b'3:abc')
66 self._check('1234567890', '10:1234567890')66 self._check(b'1234567890', b'10:1234567890')
6767
68 def test_large_string(self):68 def test_large_string(self):
69 self.assertRaises(ValueError, self.module.bdecode, "2147483639:foo")69 self.assertRaises(ValueError, self.module.bdecode, b"2147483639:foo")
7070
71 def test_malformed_string(self):71 def test_malformed_string(self):
72 self._run_check_error(ValueError, '10:x')72 self._run_check_error(ValueError, b'10:x')
73 self._run_check_error(ValueError, '10:')73 self._run_check_error(ValueError, b'10:')
74 self._run_check_error(ValueError, '10')74 self._run_check_error(ValueError, b'10')
75 self._run_check_error(ValueError, '01:x')75 self._run_check_error(ValueError, b'01:x')
76 self._run_check_error(ValueError, '00:')76 self._run_check_error(ValueError, b'00:')
77 self._run_check_error(ValueError, '35208734823ljdahflajhdf')77 self._run_check_error(ValueError, b'35208734823ljdahflajhdf')
78 self._run_check_error(ValueError, '432432432432432:foo')78 self._run_check_error(ValueError, b'432432432432432:foo')
79 self._run_check_error(ValueError, ' 1:x') # leading whitespace79 self._run_check_error(ValueError, b' 1:x') # leading whitespace
80 self._run_check_error(ValueError, '-1:x') # negative80 self._run_check_error(ValueError, b'-1:x') # negative
81 self._run_check_error(ValueError, '1 x') # space vs colon81 self._run_check_error(ValueError, b'1 x') # space vs colon
82 self._run_check_error(ValueError, '1x') # missing colon82 self._run_check_error(ValueError, b'1x') # missing colon
83 self._run_check_error(ValueError, ('1' * 1000) + ':')83 self._run_check_error(ValueError, (b'1' * 1000) + b':')
8484
85 def test_list(self):85 def test_list(self):
86 self._check([], 'le')86 self._check([], b'le')
87 self._check(['', '', ''], 'l0:0:0:e')87 self._check([b'', b'', b''], b'l0:0:0:e')
88 self._check([1, 2, 3], 'li1ei2ei3ee')88 self._check([1, 2, 3], b'li1ei2ei3ee')
89 self._check(['asd', 'xy'], 'l3:asd2:xye')89 self._check([b'asd', b'xy'], b'l3:asd2:xye')
90 self._check([['Alice', 'Bob'], [2, 3]], 'll5:Alice3:Bobeli2ei3eee')90 self._check([[b'Alice', b'Bob'], [2, 3]], b'll5:Alice3:Bobeli2ei3eee')
9191
92 def test_list_deepnested(self):92 def test_list_deepnested(self):
93 self._run_check_error(RuntimeError, ("l" * 10000) + ("e" * 10000))93 self._run_check_error(RuntimeError, (b"l" * 10000) + (b"e" * 10000))
9494
95 def test_malformed_list(self):95 def test_malformed_list(self):
96 self._run_check_error(ValueError, 'l')96 self._run_check_error(ValueError, b'l')
97 self._run_check_error(ValueError, 'l01:ae')97 self._run_check_error(ValueError, b'l01:ae')
98 self._run_check_error(ValueError, 'l0:')98 self._run_check_error(ValueError, b'l0:')
99 self._run_check_error(ValueError, 'li1e')99 self._run_check_error(ValueError, b'li1e')
100 self._run_check_error(ValueError, 'l-3:e')100 self._run_check_error(ValueError, b'l-3:e')
101101
102 def test_dict(self):102 def test_dict(self):
103 self._check({}, 'de')103 self._check({}, b'de')
104 self._check({'':3}, 'd0:i3ee')104 self._check({b'':3}, b'd0:i3ee')
105 self._check({'age': 25, 'eyes': 'blue'}, 'd3:agei25e4:eyes4:bluee')105 self._check({b'age': 25, b'eyes': b'blue'}, b'd3:agei25e4:eyes4:bluee')
106 self._check({'spam.mp3': {'author': 'Alice', 'length': 100000}},106 self._check({b'spam.mp3': {b'author': b'Alice', b'length': 100000}},
107 'd8:spam.mp3d6:author5:Alice6:lengthi100000eee')107 b'd8:spam.mp3d6:author5:Alice6:lengthi100000eee')
108108
109 def test_dict_deepnested(self):109 def test_dict_deepnested(self):
110 # The recursion here provokes CPython into emitting a warning on110 # The recursion here provokes CPython into emitting a warning on
@@ -114,30 +114,30 @@
114 # avoid distracting noise in the test output.114 # avoid distracting noise in the test output.
115 self.overrideAttr(sys, 'stderr', self._log_file)115 self.overrideAttr(sys, 'stderr', self._log_file)
116 self._run_check_error(116 self._run_check_error(
117 RuntimeError, ("d0:" * 10000) + 'i1e' + ("e" * 10000))117 RuntimeError, (b"d0:" * 10000) + b'i1e' + (b"e" * 10000))
118118
119 def test_malformed_dict(self):119 def test_malformed_dict(self):
120 self._run_check_error(ValueError, 'd')120 self._run_check_error(ValueError, b'd')
121 self._run_check_error(ValueError, 'defoobar')121 self._run_check_error(ValueError, b'defoobar')
122 self._run_check_error(ValueError, 'd3:fooe')122 self._run_check_error(ValueError, b'd3:fooe')
123 self._run_check_error(ValueError, 'di1e0:e')123 self._run_check_error(ValueError, b'di1e0:e')
124 self._run_check_error(ValueError, 'd1:b0:1:a0:e')124 self._run_check_error(ValueError, b'd1:b0:1:a0:e')
125 self._run_check_error(ValueError, 'd1:a0:1:a0:e')125 self._run_check_error(ValueError, b'd1:a0:1:a0:e')
126 self._run_check_error(ValueError, 'd0:0:')126 self._run_check_error(ValueError, b'd0:0:')
127 self._run_check_error(ValueError, 'd0:')127 self._run_check_error(ValueError, b'd0:')
128 self._run_check_error(ValueError, 'd432432432432432432:e')128 self._run_check_error(ValueError, b'd432432432432432432:e')
129129
130 def test_empty_string(self):130 def test_empty_string(self):
131 self.assertRaises(ValueError, self.module.bdecode, '')131 self.assertRaises(ValueError, self.module.bdecode, b'')
132132
133 def test_junk(self):133 def test_junk(self):
134 self._run_check_error(ValueError, 'i6easd')134 self._run_check_error(ValueError, b'i6easd')
135 self._run_check_error(ValueError, '2:abfdjslhfld')135 self._run_check_error(ValueError, b'2:abfdjslhfld')
136 self._run_check_error(ValueError, '0:0:')136 self._run_check_error(ValueError, b'0:0:')
137 self._run_check_error(ValueError, 'leanfdldjfh')137 self._run_check_error(ValueError, b'leanfdldjfh')
138138
139 def test_unknown_object(self):139 def test_unknown_object(self):
140 self.assertRaises(ValueError, self.module.bdecode, 'relwjhrlewjh')140 self.assertRaises(ValueError, self.module.bdecode, b'relwjhrlewjh')
141141
142 def test_unsupported_type(self):142 def test_unsupported_type(self):
143 self._run_check_error(TypeError, float(1.5))143 self._run_check_error(TypeError, float(1.5))
@@ -158,28 +158,28 @@
158 self.assertEqual(expected, self.module.bencode(source))158 self.assertEqual(expected, self.module.bencode(source))
159159
160 def test_int(self):160 def test_int(self):
161 self._check('i4e', 4)161 self._check(b'i4e', 4)
162 self._check('i0e', 0)162 self._check(b'i0e', 0)
163 self._check('i-10e', -10)163 self._check(b'i-10e', -10)
164164
165 def test_long(self):165 def test_long(self):
166 self._check('i12345678901234567890e', 12345678901234567890)166 self._check(b'i12345678901234567890e', 12345678901234567890)
167 self._check('i-12345678901234567890e', -12345678901234567890)167 self._check(b'i-12345678901234567890e', -12345678901234567890)
168168
169 def test_string(self):169 def test_string(self):
170 self._check('0:', '')170 self._check(b'0:', b'')
171 self._check('3:abc', 'abc')171 self._check(b'3:abc', b'abc')
172 self._check('10:1234567890', '1234567890')172 self._check(b'10:1234567890', b'1234567890')
173173
174 def test_list(self):174 def test_list(self):
175 self._check('le', [])175 self._check(b'le', [])
176 self._check('li1ei2ei3ee', [1, 2, 3])176 self._check(b'li1ei2ei3ee', [1, 2, 3])
177 self._check('ll5:Alice3:Bobeli2ei3eee', [['Alice', 'Bob'], [2, 3]])177 self._check(b'll5:Alice3:Bobeli2ei3eee', [[b'Alice', b'Bob'], [2, 3]])
178178
179 def test_list_as_tuple(self):179 def test_list_as_tuple(self):
180 self._check('le', ())180 self._check(b'le', ())
181 self._check('li1ei2ei3ee', (1, 2, 3))181 self._check(b'li1ei2ei3ee', (1, 2, 3))
182 self._check('ll5:Alice3:Bobeli2ei3eee', (('Alice', 'Bob'), (2, 3)))182 self._check(b'll5:Alice3:Bobeli2ei3eee', ((b'Alice', b'Bob'), (2, 3)))
183183
184 def test_list_deep_nested(self):184 def test_list_deep_nested(self):
185 top = []185 top = []
@@ -187,31 +187,28 @@
187 for i in range(10000):187 for i in range(10000):
188 l.append([])188 l.append([])
189 l = l[0]189 l = l[0]
190 self.assertRaises(RuntimeError, self.module.bencode, 190 self.assertRaises(RuntimeError, self.module.bencode, top)
191 top)
192191
193 def test_dict(self):192 def test_dict(self):
194 self._check('de', {})193 self._check(b'de', {})
195 self._check('d3:agei25e4:eyes4:bluee', {'age': 25, 'eyes': 'blue'})194 self._check(b'd3:agei25e4:eyes4:bluee', {b'age': 25, b'eyes': b'blue'})
196 self._check('d8:spam.mp3d6:author5:Alice6:lengthi100000eee',195 self._check(b'd8:spam.mp3d6:author5:Alice6:lengthi100000eee',
197 {'spam.mp3': {'author': 'Alice',196 {b'spam.mp3': {b'author': b'Alice', b'length': 100000}})
198 'length': 100000}})
199197
200 def test_dict_deep_nested(self):198 def test_dict_deep_nested(self):
201 d = top = {}199 d = top = {}
202 for i in range(10000):200 for i in range(10000):
203 d[''] = {}201 d[b''] = {}
204 d = d['']202 d = d[b'']
205 self.assertRaises(RuntimeError, self.module.bencode, 203 self.assertRaises(RuntimeError, self.module.bencode, top)
206 top)
207204
208 def test_bencached(self):205 def test_bencached(self):
209 self._check('i3e', self.module.Bencached(self.module.bencode(3)))206 self._check(b'i3e', self.module.Bencached(self.module.bencode(3)))
210207
211 def test_invalid_dict(self):208 def test_invalid_dict(self):
212 self.assertRaises(TypeError, self.module.bencode, {1:"foo"})209 self.assertRaises(TypeError, self.module.bencode, {1: b"foo"})
213210
214 def test_bool(self):211 def test_bool(self):
215 self._check('i1e', True)212 self._check(b'i1e', True)
216 self._check('i0e', False)213 self._check(b'i0e', False)
217214
218215
=== modified file 'breezy/util/_bencode_py.py'
--- breezy/util/_bencode_py.py 2017-05-22 00:56:52 +0000
+++ breezy/util/_bencode_py.py 2017-06-10 22:12:08 +0000
@@ -30,43 +30,43 @@
30 """30 """
31 self.yield_tuples = yield_tuples31 self.yield_tuples = yield_tuples
32 decode_func = {}32 decode_func = {}
33 decode_func['l'] = self.decode_list33 decode_func[b'l'] = self.decode_list
34 decode_func['d'] = self.decode_dict34 decode_func[b'd'] = self.decode_dict
35 decode_func['i'] = self.decode_int35 decode_func[b'i'] = self.decode_int
36 decode_func['0'] = self.decode_string36 decode_func[b'0'] = self.decode_string
37 decode_func['1'] = self.decode_string37 decode_func[b'1'] = self.decode_string
38 decode_func['2'] = self.decode_string38 decode_func[b'2'] = self.decode_string
39 decode_func['3'] = self.decode_string39 decode_func[b'3'] = self.decode_string
40 decode_func['4'] = self.decode_string40 decode_func[b'4'] = self.decode_string
41 decode_func['5'] = self.decode_string41 decode_func[b'5'] = self.decode_string
42 decode_func['6'] = self.decode_string42 decode_func[b'6'] = self.decode_string
43 decode_func['7'] = self.decode_string43 decode_func[b'7'] = self.decode_string
44 decode_func['8'] = self.decode_string44 decode_func[b'8'] = self.decode_string
45 decode_func['9'] = self.decode_string45 decode_func[b'9'] = self.decode_string
46 self.decode_func = decode_func46 self.decode_func = decode_func
4747
48 def decode_int(self, x, f):48 def decode_int(self, x, f):
49 f += 149 f += 1
50 newf = x.index('e', f)50 newf = x.index(b'e', f)
51 n = int(x[f:newf])51 n = int(x[f:newf])
52 if x[f] == '-':52 if x[f] == b'-':
53 if x[f + 1] == '0':53 if x[f + 1] == b'0':
54 raise ValueError54 raise ValueError
55 elif x[f] == '0' and newf != f+1:55 elif x[f] == b'0' and newf != f+1:
56 raise ValueError56 raise ValueError
57 return (n, newf+1)57 return (n, newf+1)
5858
59 def decode_string(self, x, f):59 def decode_string(self, x, f):
60 colon = x.index(':', f)60 colon = x.index(b':', f)
61 n = int(x[f:colon])61 n = int(x[f:colon])
62 if x[f] == '0' and colon != f+1:62 if x[f] == b'0' and colon != f+1:
63 raise ValueError63 raise ValueError
64 colon += 164 colon += 1
65 return (x[colon:colon+n], colon+n)65 return (x[colon:colon+n], colon+n)
6666
67 def decode_list(self, x, f):67 def decode_list(self, x, f):
68 r, f = [], f+168 r, f = [], f+1
69 while x[f] != 'e':69 while x[f] != b'e':
70 v, f = self.decode_func[x[f]](x, f)70 v, f = self.decode_func[x[f]](x, f)
71 r.append(v)71 r.append(v)
72 if self.yield_tuples:72 if self.yield_tuples:
@@ -76,7 +76,7 @@
76 def decode_dict(self, x, f):76 def decode_dict(self, x, f):
77 r, f = {}, f+177 r, f = {}, f+1
78 lastkey = None78 lastkey = None
79 while x[f] != 'e':79 while x[f] != b'e':
80 k, f = self.decode_string(x, f)80 k, f = self.decode_string(x, f)
81 if lastkey >= k:81 if lastkey >= k:
82 raise ValueError82 raise ValueError
@@ -88,7 +88,7 @@
88 if not isinstance(x, bytes):88 if not isinstance(x, bytes):
89 raise TypeError89 raise TypeError
90 try:90 try:
91 r, l = self.decode_func[x[0]](x, 0)91 r, l = self.decode_func[x[:1]](x, 0)
92 except (IndexError, KeyError, OverflowError) as e:92 except (IndexError, KeyError, OverflowError) as e:
93 raise ValueError(str(e))93 raise ValueError(str(e))
94 if l != len(x):94 if l != len(x):
@@ -116,30 +116,36 @@
116 encode_int(int(x), r)116 encode_int(int(x), r)
117117
118def encode_int(x, r):118def encode_int(x, r):
119 r.extend(('i', str(x), 'e'))119 r.extend((b'i', int_to_bytes(x), b'e'))
120120
121def encode_string(x, r):121def encode_string(x, r):
122 r.extend((str(len(x)), ':', x))122 r.extend((int_to_bytes(len(x)), b':', x))
123
124def encode_unicode(x, r):
125 r.extend((int_to_bytes(len(x)), b':', x))
123126
124def encode_list(x, r):127def encode_list(x, r):
125 r.append('l')128 r.append(b'l')
126 for i in x:129 for i in x:
127 encode_func[type(i)](i, r)130 encode_func[type(i)](i, r)
128 r.append('e')131 r.append(b'e')
129132
130def encode_dict(x,r):133def encode_dict(x,r):
131 r.append('d')134 r.append(b'd')
132 ilist = sorted(x.items())135 ilist = sorted(x.items())
133 for k, v in ilist:136 for k, v in ilist:
134 r.extend((str(len(k)), ':', k))137 r.extend((int_to_bytes(len(k)), b':', k))
135 encode_func[type(v)](v, r)138 encode_func[type(v)](v, r)
136 r.append('e')139 r.append(b'e')
137140
138encode_func = {}141encode_func = {}
139encode_func[type(Bencached(0))] = encode_bencached142encode_func[type(Bencached(0))] = encode_bencached
140encode_func[int] = encode_int143encode_func[int] = encode_int
141if sys.version_info < (3,):144if sys.version_info < (3,):
142 encode_func[long] = encode_int145 encode_func[long] = encode_int
146 int_to_bytes = str
147else:
148 int_to_bytes = lambda n: b"%d" % n
143encode_func[bytes] = encode_string149encode_func[bytes] = encode_string
144encode_func[list] = encode_list150encode_func[list] = encode_list
145encode_func[tuple] = encode_list151encode_func[tuple] = encode_list
@@ -159,5 +165,5 @@
159def bencode(x):165def bencode(x):
160 r = []166 r = []
161 encode_func[type(x)](x, r)167 encode_func[type(x)](x, r)
162 return ''.join(r)168 return b''.join(r)
163169

Subscribers

People subscribed via source and target branches