1
=== modified file 'lib/canonical/config/schema-lazr.conf'
2
--- lib/canonical/config/schema-lazr.conf	2010-06-14 18:32:58 +0000
3
+++ lib/canonical/config/schema-lazr.conf	2010-06-18 11:23:29 +0000
4
@@ -1132,8 +1132,8 @@
5
1132
geonames_identity:
1132
geonames_identity:
6
1133
1133
7
1134
# The maximum number of lines that should be parsed by the launchpad
1134
# The maximum number of lines that should be parsed by the launchpad
10
1135
# log parser.
1135
# log parser. The default value of None means there is no maximum.
11
1136
logparser_max_parsed_lines: 100000
1136
logparser_max_parsed_lines: None
12
1137
1137
13
1138
1138
14
1139
[launchpad_session]
1139
[launchpad_session]
15
1140
1140
16
=== modified file 'lib/canonical/launchpad/scripts/tests/test_librarian_apache_log_parser.py'
17
--- lib/canonical/launchpad/scripts/tests/test_librarian_apache_log_parser.py	2009-12-22 14:08:17 +0000
18
+++ lib/canonical/launchpad/scripts/tests/test_librarian_apache_log_parser.py	2010-06-18 11:23:29 +0000
19
@@ -95,10 +95,12 @@
20
95
        downloads, parsed_bytes = parse_file(
95
        downloads, parsed_bytes = parse_file(
21
96
            fd, start_position=0, logger=self.logger,
96
            fd, start_position=0, logger=self.logger,
22
97
            get_download_key=get_library_file_id)
97
            get_download_key=get_library_file_id)
24
98
        self.assertEqual(self.logger.buffer.getvalue(), '')
98
        self.assertEqual(
25
99
            self.logger.buffer.getvalue().strip(),
26
100
            'INFO: Parsed 1 lines resulting in 1 download stats.')
27
99
101
28
100
        date = datetime(2008, 6, 13)
102
        date = datetime(2008, 6, 13)
30
101
        self.assertEqual(downloads, 
103
        self.assertEqual(downloads,
31
102
            {'15018215': {datetime(2008, 6, 13): {'US': 1}}})
104
            {'15018215': {datetime(2008, 6, 13): {'US': 1}}})
32
103
105
33
104
        self.assertEqual(parsed_bytes, fd.tell())
106
        self.assertEqual(parsed_bytes, fd.tell())
34
@@ -112,7 +114,9 @@
35
112
        downloads, parsed_bytes = parse_file(
114
        downloads, parsed_bytes = parse_file(
36
113
            fd, start_position=0, logger=self.logger,
115
            fd, start_position=0, logger=self.logger,
37
114
            get_download_key=get_library_file_id)
116
            get_download_key=get_library_file_id)
39
115
        self.assertEqual(self.logger.buffer.getvalue(), '')
117
        self.assertEqual(
40
118
            self.logger.buffer.getvalue().strip(),
41
119
            'INFO: Parsed 1 lines resulting in 0 download stats.')
42
116
        self.assertEqual(downloads, {})
120
        self.assertEqual(downloads, {})
43
117
        self.assertEqual(parsed_bytes, fd.tell())
121
        self.assertEqual(parsed_bytes, fd.tell())
44
118
122
45
119
123
46
=== modified file 'lib/lp/services/apachelogparser/base.py'
47
--- lib/lp/services/apachelogparser/base.py	2010-06-01 14:31:13 +0000
48
+++ lib/lp/services/apachelogparser/base.py	2010-06-18 11:23:29 +0000
49
@@ -85,7 +85,7 @@
50
85
    """
85
    """
51
86
    # Seek file to given position, read all lines.
86
    # Seek file to given position, read all lines.
52
87
    fd.seek(start_position)
87
    fd.seek(start_position)
54
88
    line = fd.readline()
88
    next_line = fd.readline()
55
89
89
56
90
    parsed_bytes = start_position
90
    parsed_bytes = start_position
57
91
91
58
@@ -97,16 +97,17 @@
59
97
    max_parsed_lines = getattr(
97
    max_parsed_lines = getattr(
60
98
        config.launchpad, 'logparser_max_parsed_lines', None)
98
        config.launchpad, 'logparser_max_parsed_lines', None)
61
99
99
63
100
    while line:
100
    while next_line:
64
101
        if max_parsed_lines is not None and parsed_lines >= max_parsed_lines:
101
        if max_parsed_lines is not None and parsed_lines >= max_parsed_lines:
65
102
            break
102
            break
66
103
103
67
104
        line = next_line
68
105
69
104
        # Always skip the last line as it may be truncated since we're
106
        # Always skip the last line as it may be truncated since we're
70
105
        # rsyncing live logs, unless there is only one line for us to
107
        # rsyncing live logs, unless there is only one line for us to
71
106
        # parse, in which case This probably means we're dealing with a
108
        # parse, in which case This probably means we're dealing with a
72
107
        # logfile that has been rotated already, so it should be safe to
109
        # logfile that has been rotated already, so it should be safe to
73
108
        # parse its last line.
110
        # parse its last line.
74
109
        next_line = ''
75
110
        try:
111
        try:
76
111
            next_line = fd.next()
112
            next_line = fd.next()
77
112
        except StopIteration:
113
        except StopIteration:
78
@@ -161,7 +162,11 @@
79
161
            logger.error('Error (%s) while parsing "%s"' % (e, line))
162
            logger.error('Error (%s) while parsing "%s"' % (e, line))
80
162
            break
163
            break
81
163
164
83
164
        line = next_line
165
84
166
    if parsed_lines > 0:
85
167
        logger.info('Parsed %d lines resulting in %d download stats.' % (
86
168
            parsed_lines, len(downloads)))
87
169
88
165
    return downloads, parsed_bytes
170
    return downloads, parsed_bytes
89
166
171
90
167
172
91
168
173
92
=== modified file 'lib/lp/services/apachelogparser/tests/apache-log-files/launchpadlibrarian.net.access-log'
93
--- lib/lp/services/apachelogparser/tests/apache-log-files/launchpadlibrarian.net.access-log	2009-03-27 03:29:31 +0000
94
+++ lib/lp/services/apachelogparser/tests/apache-log-files/launchpadlibrarian.net.access-log	2010-06-18 11:23:29 +0000
95
@@ -1,3 +1,4 @@
96
1
121.44.28.210 - - [13/Jun/2008:14:55:06 +0100] "GET /9096290/me-tv-icon-14x14.png HTTP/1.1" 404 730 "https://launchpad.net/me-tv" "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9) Gecko/2008060900 Firefox/3.0"
97
1
121.44.28.210 - - [13/Jun/2008:14:55:06 +0100] "GET /9096290/me-tv-icon-14x14.png HTTP/1.1" 200 730 "https://launchpad.net/me-tv" "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9) Gecko/2008060900 Firefox/3.0"
2
121.44.28.210 - - [13/Jun/2008:14:55:06 +0100] "GET /9096290/me-tv-icon-14x14.png HTTP/1.1" 200 730 "https://launchpad.net/me-tv" "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9) Gecko/2008060900 Firefox/3.0"
98
2
121.44.28.210 - - [13/Jun/2008:14:55:13 +0100] "GET /12060796/me-tv-icon-64x64.png HTTP/1.1" 200 6378 "https://launchpad.net/me-tv" "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9) Gecko/2008060900 Firefox/3.0"
3
121.44.28.210 - - [13/Jun/2008:14:55:13 +0100] "GET /12060796/me-tv-icon-64x64.png HTTP/1.1" 200 6378 "https://launchpad.net/me-tv" "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9) Gecko/2008060900 Firefox/3.0"
99
3
157.92.18.21 - - [13/Jun/2008:14:55:15 +0100] "GET /8196569/mediumubuntulogo.png HTTP/1.1" 200 3420 "https://bugs.launchpad.net/ubuntu/+source/acpi-support/+bug/59695/comments/14" "Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9) Gecko/2008052623 Iceweasel/3.0 (Debian-3.0~rc1-1)"
4
157.92.18.21 - - [13/Jun/2008:14:55:15 +0100] "GET /8196569/mediumubuntulogo.png HTTP/1.1" 200 3420 "https://bugs.launchpad.net/ubuntu/+source/acpi-support/+bug/59695/comments/14" "Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9) Gecko/2008052623 Iceweasel/3.0 (Debian-3.0~rc1-1)"
100
4
5
101
=== modified file 'lib/lp/services/apachelogparser/tests/test_apachelogparser.py'
102
--- lib/lp/services/apachelogparser/tests/test_apachelogparser.py	2010-06-01 14:28:40 +0000
103
+++ lib/lp/services/apachelogparser/tests/test_apachelogparser.py	2010-06-18 11:23:29 +0000
104
@@ -126,7 +126,9 @@
105
126
        downloads, parsed_bytes = parse_file(
126
        downloads, parsed_bytes = parse_file(
106
127
            fd, start_position=0, logger=self.logger,
127
            fd, start_position=0, logger=self.logger,
107
128
            get_download_key=get_path_download_key)
128
            get_download_key=get_path_download_key)
109
129
        self.assertEqual(self.logger.buffer.getvalue(), '')
129
        self.assertEqual(
110
130
            self.logger.buffer.getvalue().strip(),
111
131
            'INFO: Parsed 5 lines resulting in 3 download stats.')
112
130
        date = datetime(2008, 6, 13)
132
        date = datetime(2008, 6, 13)
113
131
        self.assertContentEqual(
133
        self.assertContentEqual(
114
132
            downloads.items(),
134
            downloads.items(),
115
@@ -148,7 +150,9 @@
116
148
        downloads, parsed_bytes = parse_file(
150
        downloads, parsed_bytes = parse_file(
117
149
            fd, start_position=self._getLastLineStart(fd), logger=self.logger,
151
            fd, start_position=self._getLastLineStart(fd), logger=self.logger,
118
150
            get_download_key=get_path_download_key)
152
            get_download_key=get_path_download_key)
120
151
        self.assertEqual(self.logger.buffer.getvalue(), '')
153
        self.assertEqual(
121
154
            self.logger.buffer.getvalue().strip(),
122
155
            'INFO: Parsed 1 lines resulting in 1 download stats.')
123
152
        self.assertEqual(parsed_bytes, fd.tell())
156
        self.assertEqual(parsed_bytes, fd.tell())
124
153
157
125
154
        self.assertContentEqual(
158
        self.assertContentEqual(
126
@@ -175,7 +179,9 @@
127
175
        downloads, parsed_bytes = parse_file(
179
        downloads, parsed_bytes = parse_file(
128
176
            fd, start_position=0, logger=self.logger,
180
            fd, start_position=0, logger=self.logger,
129
177
            get_download_key=get_path_download_key)
181
            get_download_key=get_path_download_key)
131
178
        self.assertEqual(self.logger.buffer.getvalue(), '')
182
        self.assertEqual(
132
183
            self.logger.buffer.getvalue().strip(),
133
184
            'INFO: Parsed 1 lines resulting in 0 download stats.')
134
179
        self.assertEqual(downloads, {})
185
        self.assertEqual(downloads, {})
135
180
        self.assertEqual(parsed_bytes, fd.tell())
186
        self.assertEqual(parsed_bytes, fd.tell())
136
181
187
137
@@ -198,7 +204,9 @@
138
198
        downloads, parsed_bytes = parse_file(
204
        downloads, parsed_bytes = parse_file(
139
199
            fd, start_position=0, logger=self.logger,
205
            fd, start_position=0, logger=self.logger,
140
200
            get_download_key=get_path_download_key)
206
            get_download_key=get_path_download_key)
142
201
        self.assertEqual(self.logger.buffer.getvalue(), '')
207
        self.assertEqual(
143
208
            self.logger.buffer.getvalue().strip(),
144
209
            'INFO: Parsed 1 lines resulting in 0 download stats.')
145
202
        self.assertEqual(downloads, {})
210
        self.assertEqual(downloads, {})
146
203
        self.assertEqual(parsed_bytes, fd.tell())
211
        self.assertEqual(parsed_bytes, fd.tell())
147
204
212
148
@@ -214,9 +222,10 @@
149
214
        downloads, parsed_bytes = parse_file(
222
        downloads, parsed_bytes = parse_file(
150
215
            fd, start_position=0, logger=self.logger,
223
            fd, start_position=0, logger=self.logger,
151
216
            get_download_key=get_path_download_key)
224
            get_download_key=get_path_download_key)
153
217
        self.assertEqual(self.logger.buffer.getvalue(), '')
225
        self.assertEqual(
154
226
            self.logger.buffer.getvalue().strip(),
155
227
            'INFO: Parsed 1 lines resulting in 1 download stats.')
156
218
228
157
219
        date = datetime(2008, 6, 13)
158
220
        self.assertEqual(downloads,
229
        self.assertEqual(downloads,
159
221
            {'/15018215/ul_logo_64x64.png':
230
            {'/15018215/ul_logo_64x64.png':
160
222
                {datetime(2008, 6, 13): {'US': 1}}})
231
                {datetime(2008, 6, 13): {'US': 1}}})
161
@@ -232,24 +241,37 @@
162
232
                [launchpad]
241
                [launchpad]
163
233
                logparser_max_parsed_lines: 2
242
                logparser_max_parsed_lines: 2
164
234
                '''))
243
                '''))
165
244
        self.addCleanup(config.pop, 'log_parser config')
166
235
        fd = open(os.path.join(
245
        fd = open(os.path.join(
167
236
            here, 'apache-log-files', 'launchpadlibrarian.net.access-log'))
246
            here, 'apache-log-files', 'launchpadlibrarian.net.access-log'))
168
247
        self.addCleanup(fd.close)
169
248
170
237
        downloads, parsed_bytes = parse_file(
249
        downloads, parsed_bytes = parse_file(
171
238
            fd, start_position=0, logger=self.logger,
250
            fd, start_position=0, logger=self.logger,
172
239
            get_download_key=get_path_download_key)
251
            get_download_key=get_path_download_key)
173
240
        config.pop("log_parser config")
174
241
252
176
242
        self.assertEqual(self.logger.buffer.getvalue(), '')
253
        # We have initially parsed only the first two lines of data,
177
254
        # corresponding to one download (the first line is a 404 and
178
255
        # so ignored).
179
243
        date = datetime(2008, 6, 13)
256
        date = datetime(2008, 6, 13)
180
244
        self.assertContentEqual(
257
        self.assertContentEqual(
181
245
            downloads.items(),
258
            downloads.items(),
186
246
            [('/12060796/me-tv-icon-64x64.png', {date: {'AU': 1}}),
259
            [('/9096290/me-tv-icon-14x14.png', {date: {'AU': 1}})])
183
247
             ('/9096290/me-tv-icon-14x14.png', {date: {'AU': 1}})])
184
248
185
249
        # We should have parsed only the first two lines of data.
187
250
        fd.seek(0)
260
        fd.seek(0)
188
251
        lines = fd.readlines()
261
        lines = fd.readlines()
190
252
        self.assertEqual(parsed_bytes, len(lines[0]) + len(lines[1]))
262
        line_lengths = [len(line) for line in lines]
191
263
        self.assertEqual(parsed_bytes, sum(line_lengths[:2]))
192
264
193
265
        # And the subsequent parse will be for the 3rd and 4th lines,
194
266
        # corresponding to two downloads of the same file.
195
267
        downloads, parsed_bytes = parse_file(
196
268
            fd, start_position=parsed_bytes, logger=self.logger,
197
269
            get_download_key=get_path_download_key)
198
270
        self.assertContentEqual(
199
271
            downloads.items(),
200
272
            [('/12060796/me-tv-icon-64x64.png', {date: {'AU': 1}}),
201
273
             ('/8196569/mediumubuntulogo.png', {date: {'AR': 1}})])
202
274
        self.assertEqual(parsed_bytes, sum(line_lengths[:4]))
203
253
275
204
254
276
205
255
class TestParsedFilesDetection(TestCase):
277
class TestParsedFilesDetection(TestCase):
Reviewer	Review Type	Date Requested	Status
Abel Deuring (community)	code	2010-06-17	Approve on 2010-06-18
Review via email: mp+27849@code.launchpad.net
1	=== modified file 'lib/canonical/config/schema-lazr.conf'
2	--- lib/canonical/config/schema-lazr.conf 2010-06-14 18:32:58 +0000
3	+++ lib/canonical/config/schema-lazr.conf 2010-06-18 11:23:29 +0000
4	@@ -1132,8 +1132,8 @@
5	1132	geonames_identity:	1132	geonames_identity:
6	1133		1133
7	1134	# The maximum number of lines that should be parsed by the launchpad	1134	# The maximum number of lines that should be parsed by the launchpad
10	1135	# log parser.	1135	# log parser. The default value of None means there is no maximum.
11	1136	logparser_max_parsed_lines: 100000	1136	logparser_max_parsed_lines: None
12	1137		1137
13	1138		1138
14	1139	[launchpad_session]	1139	[launchpad_session]
15	1140		1140
16	=== modified file 'lib/canonical/launchpad/scripts/tests/test_librarian_apache_log_parser.py'
17	--- lib/canonical/launchpad/scripts/tests/test_librarian_apache_log_parser.py 2009-12-22 14:08:17 +0000
18	+++ lib/canonical/launchpad/scripts/tests/test_librarian_apache_log_parser.py 2010-06-18 11:23:29 +0000
19	@@ -95,10 +95,12 @@
20	95	downloads, parsed_bytes = parse_file(	95	downloads, parsed_bytes = parse_file(
21	96	fd, start_position=0, logger=self.logger,	96	fd, start_position=0, logger=self.logger,
22	97	get_download_key=get_library_file_id)	97	get_download_key=get_library_file_id)
24	98	self.assertEqual(self.logger.buffer.getvalue(), '')	98	self.assertEqual(
25			99	self.logger.buffer.getvalue().strip(),
26			100	'INFO: Parsed 1 lines resulting in 1 download stats.')
27	99		101
28	100	date = datetime(2008, 6, 13)	102	date = datetime(2008, 6, 13)
30	101	self.assertEqual(downloads,	103	self.assertEqual(downloads,
31	102	{'15018215': {datetime(2008, 6, 13): {'US': 1}}})	104	{'15018215': {datetime(2008, 6, 13): {'US': 1}}})
32	103		105
33	104	self.assertEqual(parsed_bytes, fd.tell())	106	self.assertEqual(parsed_bytes, fd.tell())
34	@@ -112,7 +114,9 @@
35	112	downloads, parsed_bytes = parse_file(	114	downloads, parsed_bytes = parse_file(
36	113	fd, start_position=0, logger=self.logger,	115	fd, start_position=0, logger=self.logger,
37	114	get_download_key=get_library_file_id)	116	get_download_key=get_library_file_id)
39	115	self.assertEqual(self.logger.buffer.getvalue(), '')	117	self.assertEqual(
40			118	self.logger.buffer.getvalue().strip(),
41			119	'INFO: Parsed 1 lines resulting in 0 download stats.')
42	116	self.assertEqual(downloads, {})	120	self.assertEqual(downloads, {})
43	117	self.assertEqual(parsed_bytes, fd.tell())	121	self.assertEqual(parsed_bytes, fd.tell())
44	118		122
45	119		123
46	=== modified file 'lib/lp/services/apachelogparser/base.py'
47	--- lib/lp/services/apachelogparser/base.py 2010-06-01 14:31:13 +0000
48	+++ lib/lp/services/apachelogparser/base.py 2010-06-18 11:23:29 +0000
49	@@ -85,7 +85,7 @@
50	85	"""	85	"""
51	86	# Seek file to given position, read all lines.	86	# Seek file to given position, read all lines.
52	87	fd.seek(start_position)	87	fd.seek(start_position)
54	88	line = fd.readline()	88	next_line = fd.readline()
55	89		89
56	90	parsed_bytes = start_position	90	parsed_bytes = start_position
57	91		91
58	@@ -97,16 +97,17 @@
59	97	max_parsed_lines = getattr(	97	max_parsed_lines = getattr(
60	98	config.launchpad, 'logparser_max_parsed_lines', None)	98	config.launchpad, 'logparser_max_parsed_lines', None)
61	99		99
63	100	while line:	100	while next_line:
64	101	if max_parsed_lines is not None and parsed_lines >= max_parsed_lines:	101	if max_parsed_lines is not None and parsed_lines >= max_parsed_lines:
65	102	break	102	break
66	103		103
67			104	line = next_line
68			105
69	104	# Always skip the last line as it may be truncated since we're	106	# Always skip the last line as it may be truncated since we're
70	105	# rsyncing live logs, unless there is only one line for us to	107	# rsyncing live logs, unless there is only one line for us to
71	106	# parse, in which case This probably means we're dealing with a	108	# parse, in which case This probably means we're dealing with a
72	107	# logfile that has been rotated already, so it should be safe to	109	# logfile that has been rotated already, so it should be safe to
73	108	# parse its last line.	110	# parse its last line.
74	109	next_line = ''
75	110	try:	111	try:
76	111	next_line = fd.next()	112	next_line = fd.next()
77	112	except StopIteration:	113	except StopIteration:
78	@@ -161,7 +162,11 @@
79	161	logger.error('Error (%s) while parsing "%s"' % (e, line))	162	logger.error('Error (%s) while parsing "%s"' % (e, line))
80	162	break	163	break
81	163		164
83	164	line = next_line	165
84			166	if parsed_lines > 0:
85			167	logger.info('Parsed %d lines resulting in %d download stats.' % (
86			168	parsed_lines, len(downloads)))
87			169
88	165	return downloads, parsed_bytes	170	return downloads, parsed_bytes
89	166		171
90	167		172
91	168		173
92	=== modified file 'lib/lp/services/apachelogparser/tests/apache-log-files/launchpadlibrarian.net.access-log'
93	--- lib/lp/services/apachelogparser/tests/apache-log-files/launchpadlibrarian.net.access-log 2009-03-27 03:29:31 +0000
94	+++ lib/lp/services/apachelogparser/tests/apache-log-files/launchpadlibrarian.net.access-log 2010-06-18 11:23:29 +0000
95	@@ -1,3 +1,4 @@
96			1	121.44.28.210 - - [13/Jun/2008:14:55:06 +0100] "GET /9096290/me-tv-icon-14x14.png HTTP/1.1" 404 730 "https://launchpad.net/me-tv" "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9) Gecko/2008060900 Firefox/3.0"
97	1	121.44.28.210 - - [13/Jun/2008:14:55:06 +0100] "GET /9096290/me-tv-icon-14x14.png HTTP/1.1" 200 730 "https://launchpad.net/me-tv" "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9) Gecko/2008060900 Firefox/3.0"	2	121.44.28.210 - - [13/Jun/2008:14:55:06 +0100] "GET /9096290/me-tv-icon-14x14.png HTTP/1.1" 200 730 "https://launchpad.net/me-tv" "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9) Gecko/2008060900 Firefox/3.0"
98	2	121.44.28.210 - - [13/Jun/2008:14:55:13 +0100] "GET /12060796/me-tv-icon-64x64.png HTTP/1.1" 200 6378 "https://launchpad.net/me-tv" "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9) Gecko/2008060900 Firefox/3.0"	3	121.44.28.210 - - [13/Jun/2008:14:55:13 +0100] "GET /12060796/me-tv-icon-64x64.png HTTP/1.1" 200 6378 "https://launchpad.net/me-tv" "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.9) Gecko/2008060900 Firefox/3.0"
99	3	157.92.18.21 - - [13/Jun/2008:14:55:15 +0100] "GET /8196569/mediumubuntulogo.png HTTP/1.1" 200 3420 "https://bugs.launchpad.net/ubuntu/+source/acpi-support/+bug/59695/comments/14" "Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9) Gecko/2008052623 Iceweasel/3.0 (Debian-3.0~rc1-1)"	4	157.92.18.21 - - [13/Jun/2008:14:55:15 +0100] "GET /8196569/mediumubuntulogo.png HTTP/1.1" 200 3420 "https://bugs.launchpad.net/ubuntu/+source/acpi-support/+bug/59695/comments/14" "Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9) Gecko/2008052623 Iceweasel/3.0 (Debian-3.0~rc1-1)"
100	4		5
101	=== modified file 'lib/lp/services/apachelogparser/tests/test_apachelogparser.py'
102	--- lib/lp/services/apachelogparser/tests/test_apachelogparser.py 2010-06-01 14:28:40 +0000
103	+++ lib/lp/services/apachelogparser/tests/test_apachelogparser.py 2010-06-18 11:23:29 +0000
104	@@ -126,7 +126,9 @@
105	126	downloads, parsed_bytes = parse_file(	126	downloads, parsed_bytes = parse_file(
106	127	fd, start_position=0, logger=self.logger,	127	fd, start_position=0, logger=self.logger,
107	128	get_download_key=get_path_download_key)	128	get_download_key=get_path_download_key)
109	129	self.assertEqual(self.logger.buffer.getvalue(), '')	129	self.assertEqual(
110			130	self.logger.buffer.getvalue().strip(),
111			131	'INFO: Parsed 5 lines resulting in 3 download stats.')
112	130	date = datetime(2008, 6, 13)	132	date = datetime(2008, 6, 13)
113	131	self.assertContentEqual(	133	self.assertContentEqual(
114	132	downloads.items(),	134	downloads.items(),
115	@@ -148,7 +150,9 @@
116	148	downloads, parsed_bytes = parse_file(	150	downloads, parsed_bytes = parse_file(
117	149	fd, start_position=self._getLastLineStart(fd), logger=self.logger,	151	fd, start_position=self._getLastLineStart(fd), logger=self.logger,
118	150	get_download_key=get_path_download_key)	152	get_download_key=get_path_download_key)
120	151	self.assertEqual(self.logger.buffer.getvalue(), '')	153	self.assertEqual(
121			154	self.logger.buffer.getvalue().strip(),
122			155	'INFO: Parsed 1 lines resulting in 1 download stats.')
123	152	self.assertEqual(parsed_bytes, fd.tell())	156	self.assertEqual(parsed_bytes, fd.tell())
124	153		157
125	154	self.assertContentEqual(	158	self.assertContentEqual(
126	@@ -175,7 +179,9 @@
127	175	downloads, parsed_bytes = parse_file(	179	downloads, parsed_bytes = parse_file(
128	176	fd, start_position=0, logger=self.logger,	180	fd, start_position=0, logger=self.logger,
129	177	get_download_key=get_path_download_key)	181	get_download_key=get_path_download_key)
131	178	self.assertEqual(self.logger.buffer.getvalue(), '')	182	self.assertEqual(
132			183	self.logger.buffer.getvalue().strip(),
133			184	'INFO: Parsed 1 lines resulting in 0 download stats.')
134	179	self.assertEqual(downloads, {})	185	self.assertEqual(downloads, {})
135	180	self.assertEqual(parsed_bytes, fd.tell())	186	self.assertEqual(parsed_bytes, fd.tell())
136	181		187
137	@@ -198,7 +204,9 @@
138	198	downloads, parsed_bytes = parse_file(	204	downloads, parsed_bytes = parse_file(
139	199	fd, start_position=0, logger=self.logger,	205	fd, start_position=0, logger=self.logger,
140	200	get_download_key=get_path_download_key)	206	get_download_key=get_path_download_key)
142	201	self.assertEqual(self.logger.buffer.getvalue(), '')	207	self.assertEqual(
143			208	self.logger.buffer.getvalue().strip(),
144			209	'INFO: Parsed 1 lines resulting in 0 download stats.')
145	202	self.assertEqual(downloads, {})	210	self.assertEqual(downloads, {})
146	203	self.assertEqual(parsed_bytes, fd.tell())	211	self.assertEqual(parsed_bytes, fd.tell())
147	204		212
148	@@ -214,9 +222,10 @@
149	214	downloads, parsed_bytes = parse_file(	222	downloads, parsed_bytes = parse_file(
150	215	fd, start_position=0, logger=self.logger,	223	fd, start_position=0, logger=self.logger,
151	216	get_download_key=get_path_download_key)	224	get_download_key=get_path_download_key)
153	217	self.assertEqual(self.logger.buffer.getvalue(), '')	225	self.assertEqual(
154			226	self.logger.buffer.getvalue().strip(),
155			227	'INFO: Parsed 1 lines resulting in 1 download stats.')
156	218		228
157	219	date = datetime(2008, 6, 13)
158	220	self.assertEqual(downloads,	229	self.assertEqual(downloads,
159	221	{'/15018215/ul_logo_64x64.png':	230	{'/15018215/ul_logo_64x64.png':
160	222	{datetime(2008, 6, 13): {'US': 1}}})	231	{datetime(2008, 6, 13): {'US': 1}}})
161	@@ -232,24 +241,37 @@
162	232	[launchpad]	241	[launchpad]
163	233	logparser_max_parsed_lines: 2	242	logparser_max_parsed_lines: 2
164	234	'''))	243	'''))
165			244	self.addCleanup(config.pop, 'log_parser config')
166	235	fd = open(os.path.join(	245	fd = open(os.path.join(
167	236	here, 'apache-log-files', 'launchpadlibrarian.net.access-log'))	246	here, 'apache-log-files', 'launchpadlibrarian.net.access-log'))
168			247	self.addCleanup(fd.close)
169			248
170	237	downloads, parsed_bytes = parse_file(	249	downloads, parsed_bytes = parse_file(
171	238	fd, start_position=0, logger=self.logger,	250	fd, start_position=0, logger=self.logger,
172	239	get_download_key=get_path_download_key)	251	get_download_key=get_path_download_key)
173	240	config.pop("log_parser config")
174	241		252
176	242	self.assertEqual(self.logger.buffer.getvalue(), '')	253	# We have initially parsed only the first two lines of data,
177			254	# corresponding to one download (the first line is a 404 and
178			255	# so ignored).
179	243	date = datetime(2008, 6, 13)	256	date = datetime(2008, 6, 13)
180	244	self.assertContentEqual(	257	self.assertContentEqual(
181	245	downloads.items(),	258	downloads.items(),
186	246	[('/12060796/me-tv-icon-64x64.png', {date: {'AU': 1}}),	259	[('/9096290/me-tv-icon-14x14.png', {date: {'AU': 1}})])
183	247	('/9096290/me-tv-icon-14x14.png', {date: {'AU': 1}})])
184	248
185	249	# We should have parsed only the first two lines of data.
187	250	fd.seek(0)	260	fd.seek(0)
188	251	lines = fd.readlines()	261	lines = fd.readlines()
190	252	self.assertEqual(parsed_bytes, len(lines[0]) + len(lines[1]))	262	line_lengths = [len(line) for line in lines]
191			263	self.assertEqual(parsed_bytes, sum(line_lengths[:2]))
192			264
193			265	# And the subsequent parse will be for the 3rd and 4th lines,
194			266	# corresponding to two downloads of the same file.
195			267	downloads, parsed_bytes = parse_file(
196			268	fd, start_position=parsed_bytes, logger=self.logger,
197			269	get_download_key=get_path_download_key)
198			270	self.assertContentEqual(
199			271	downloads.items(),
200			272	[('/12060796/me-tv-icon-64x64.png', {date: {'AU': 1}}),
201			273	('/8196569/mediumubuntulogo.png', {date: {'AR': 1}})])
202			274	self.assertEqual(parsed_bytes, sum(line_lengths[:4]))
203	253		275
204	254		276
205	255	class TestParsedFilesDetection(TestCase):	277	class TestParsedFilesDetection(TestCase):