Merge lp:~lifeless/launchpad/ppr-move into lp:launchpad
Proposed by: Robert Collins
Status: Merged
Approved by: Robert Collins
Approved revision: no longer in the source branch.
Merged at revision: 15780
Proposed branch: lp:~lifeless/launchpad/ppr-move
Merge into: lp:launchpad
Diff against target: 1955 lines (+0/-1931), 5 files modified
  lib/lp/scripts/utilities/pageperformancereport.py (+0/-1236)
  lib/lp/scripts/utilities/tests/test_pageperformancereport.py (+0/-483)
  utilities/page-performance-report-daily.sh (+0/-115)
  utilities/page-performance-report.ini (+0/-79)
  utilities/page-performance-report.py (+0/-18)
To merge this branch: bzr merge lp:~lifeless/launchpad/ppr-move
Related bugs: none
Reviewer: Robert Collins (community), status: Approve
Review via email: mp+118873@code.launchpad.net
Commit message
PPR is now in lp-dev-utils, remove it from LP so we don't have two copies.
Description of the change
PPR is now in lp-dev-utils, remove it from LP so we don't have two copies.
Preview Diff
1 | === removed file 'lib/lp/scripts/utilities/pageperformancereport.py' |
2 | --- lib/lp/scripts/utilities/pageperformancereport.py 2012-06-29 08:40:05 +0000 |
3 | +++ lib/lp/scripts/utilities/pageperformancereport.py 1970-01-01 00:00:00 +0000 |
4 | @@ -1,1236 +0,0 @@ |
5 | -# Copyright 2010 Canonical Ltd. This software is licensed under the |
6 | -# GNU Affero General Public License version 3 (see the file LICENSE). |
7 | - |
8 | -"""Page performance report generated from zserver trace logs.""" |
9 | - |
10 | -__metaclass__ = type |
11 | -__all__ = ['main'] |
12 | - |
13 | -import bz2 |
14 | -from cgi import escape as html_quote |
15 | -from ConfigParser import RawConfigParser |
16 | -import copy |
17 | -import cPickle |
18 | -import csv |
19 | -from datetime import datetime |
20 | -import gzip |
21 | -import math |
22 | -import os.path |
23 | -import re |
24 | -import textwrap |
25 | -from textwrap import dedent |
26 | -import time |
27 | - |
28 | -import simplejson as json |
29 | -import sre_constants |
30 | -import zc.zservertracelog.tracereport |
31 | - |
32 | -from lp.scripts.helpers import LPOptionParser |
33 | -from lp.services.config import config |
34 | -from lp.services.scripts.logger import log |
35 | - |
36 | - |
37 | -class Request(zc.zservertracelog.tracereport.Request): |
38 | - url = None |
39 | - pageid = None |
40 | - ticks = None |
41 | - sql_statements = None |
42 | - sql_seconds = None |
43 | - |
44 | - # Override the broken version in our superclass that always |
45 | - # returns an integer. |
46 | - @property |
47 | - def app_seconds(self): |
48 | - interval = self.app_time - self.start_app_time |
49 | - return interval.seconds + interval.microseconds / 1000000.0 |
50 | - |
51 | - # Override the broken version in our superclass that always |
52 | - # returns an integer. |
53 | - @property |
54 | - def total_seconds(self): |
55 | - interval = self.end - self.start |
56 | - return interval.seconds + interval.microseconds / 1000000.0 |
57 | - |
58 | - |
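Both overrides exist because the superclass property truncates the interval to whole seconds; a short illustration (not code from this branch) of the fractional computation they use:

```python
from datetime import datetime, timedelta

start = datetime(2012, 8, 9, 13, 45, 5)
end = start + timedelta(seconds=1, microseconds=750000)
interval = end - start
# interval.seconds alone reports 1 (the truncation being worked
# around); adding the microseconds restores the fraction.
assert interval.seconds + interval.microseconds / 1000000.0 == 1.75
```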
59 | -class Category: |
60 | - """A Category in our report. |
61 | - |
62 | - Requests belong to a Category if the URL matches a regular expression. |
63 | - """ |
64 | - |
65 | - def __init__(self, title, regexp): |
66 | - self.title = title |
67 | - self.regexp = regexp |
68 | - self._compiled_regexp = re.compile(regexp, re.I | re.X) |
69 | - self.partition = False |
70 | - |
71 | - def match(self, request): |
72 | - """Return true when the request matches this category.""" |
73 | - return self._compiled_regexp.search(request.url) is not None |
74 | - |
75 | - def __cmp__(self, other): |
76 | - return cmp(self.title.lower(), other.title.lower()) |
77 | - |
78 | - def __deepcopy__(self, memo): |
79 | - # We provide __deepcopy__ because the copy module doesn't handle |
80 | - # compiled regular expressions by default. |
81 | - return Category(self.title, self.regexp) |
82 | - |
83 | - |
84 | -class OnlineStatsCalculator: |
85 | - """Object that can compute count, sum, mean, variance and median. |
86 | - |
87 | - It computes these values incrementally, using minimal storage, |
88 | - via the Welford / Knuth algorithm described at |
89 | - http://en.wikipedia.org/wiki/Algorithms_for_calculating_variance#On-line_algorithm |
90 | - """ |
91 | - |
92 | - def __init__(self): |
93 | - self.count = 0 |
94 | - self.sum = 0 |
95 | - self.M2 = 0.0 # Sum of square difference |
96 | - self.mean = 0.0 |
97 | - |
98 | - def update(self, x): |
99 | - """Incrementally update the stats when adding x to the set. |
100 | - |
101 | - None values are ignored. |
102 | - """ |
103 | - if x is None: |
104 | - return |
105 | - self.count += 1 |
106 | - self.sum += x |
107 | - delta = x - self.mean |
108 | - self.mean = float(self.sum)/self.count |
109 | - self.M2 += delta*(x - self.mean) |
110 | - |
111 | - @property |
112 | - def variance(self): |
113 | - """Return the population variance.""" |
114 | - if self.count == 0: |
115 | - return 0 |
116 | - else: |
117 | - return self.M2/self.count |
118 | - |
119 | - @property |
120 | - def std(self): |
121 | - """Return the standard deviation.""" |
122 | - if self.count == 0: |
123 | - return 0 |
124 | - else: |
125 | - return math.sqrt(self.variance) |
126 | - |
127 | - def __add__(self, other): |
128 | - """Adds this and another OnlineStatsCalculator. |
129 | - |
130 | - The result combines the stats of the two objects. |
131 | - """ |
132 | - results = OnlineStatsCalculator() |
133 | - results.count = self.count + other.count |
134 | - results.sum = self.sum + other.sum |
135 | - if self.count > 0 and other.count > 0: |
136 | - # This is 2.1b in Chan, Tony F.; Golub, Gene H.; LeVeque, |
137 | - # Randall J. (1979), "Updating Formulae and a Pairwise Algorithm |
138 | - # for Computing Sample Variances.", |
139 | - # Technical Report STAN-CS-79-773, |
140 | - # Department of Computer Science, Stanford University, |
141 | - # ftp://reports.stanford.edu/pub/cstr/reports/cs/tr/79/773/CS-TR-79-773.pdf . |
142 | - results.M2 = self.M2 + other.M2 + ( |
143 | - (float(self.count) / (other.count * results.count)) * |
144 | - ((float(other.count) / self.count) * self.sum - other.sum)**2) |
145 | - else: |
146 | - results.M2 = self.M2 + other.M2 # One of them is 0. |
147 | - if results.count > 0: |
148 | - results.mean = float(results.sum) / results.count |
149 | - return results |
150 | - |
151 | - |
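The update() and __add__ methods above implement Welford's incremental update and the Chan/Golub/LeVeque pairwise combination. A minimal Python 3 sketch (not code from this branch) that checks both paths against the standard library's batch formula:

```python
import statistics

class Welford:
    """Incremental count / mean / population variance."""
    def __init__(self):
        self.count, self.mean, self.m2 = 0, 0.0, 0.0

    def update(self, x):
        self.count += 1
        delta = x - self.mean
        self.mean += delta / self.count
        self.m2 += delta * (x - self.mean)  # old delta times new delta

    def merge(self, other):
        # Pairwise combination (2.1b in Chan et al.); algebraically the
        # same quantity as the M2 formula used in __add__ above.
        merged = Welford()
        merged.count = self.count + other.count
        delta = other.mean - self.mean
        merged.mean = self.mean + delta * other.count / merged.count
        merged.m2 = (self.m2 + other.m2 +
                     delta ** 2 * self.count * other.count / merged.count)
        return merged

data = [4.5, 4.2, 5.5, 2.5, 3.5, 2.5]
a, b = Welford(), Welford()
for x in data[:3]:
    a.update(x)
for x in data[3:]:
    b.update(x)
merged = a.merge(b)
assert abs(merged.m2 / merged.count - statistics.pvariance(data)) < 1e-9
```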
152 | -class OnlineApproximateMedian: |
153 | - """Approximate the median of a set of elements. |
154 | - |
155 | - This implements a space-efficient algorithm which only sees each value |
156 | - once. (It holds in memory on the order of log base bucket_size of n elements.) |
157 | - |
158 | - It was described and analysed in |
159 | - D. Cantone and M. Hofri, |
160 | - "Analysis of An Approximate Median Selection Algorithm" |
161 | - ftp://ftp.cs.wpi.edu/pub/techreports/pdf/06-17.pdf |
162 | - |
163 | - This algorithm is similar to Tukey's median of medians technique. |
164 | - It computes the median among each group of bucket_size values, and |
165 | - then the median among those medians. |
166 | - """ |
167 | - |
168 | - def __init__(self, bucket_size=9): |
169 | - """Creates a new estimator. |
170 | - |
171 | - It approximates the median by finding the median among each |
172 | - successive group of bucket_size elements, and then using these |
173 | - medians for further rounds of selection. |
174 | - |
175 | - The bucket size should be a small odd integer. |
176 | - """ |
177 | - self.bucket_size = bucket_size |
178 | - # Index of the median in a completed bucket. |
179 | - self.median_idx = (bucket_size-1)//2 |
180 | - self.buckets = [] |
181 | - |
182 | - def update(self, x, order=0): |
183 | - """Update with x.""" |
184 | - if x is None: |
185 | - return |
186 | - |
187 | - i = order |
188 | - while True: |
189 | - # Create bucket on demand. |
190 | - if i >= len(self.buckets): |
191 | - for n in range((i+1)-len(self.buckets)): |
192 | - self.buckets.append([]) |
193 | - bucket = self.buckets[i] |
194 | - bucket.append(x) |
195 | - if len(bucket) == self.bucket_size: |
196 | - # Select the median in this bucket, and promote it. |
197 | - x = sorted(bucket)[self.median_idx] |
198 | - # Free the bucket for the next round. |
199 | - del bucket[:] |
200 | - i += 1 |
201 | - continue |
202 | - else: |
203 | - break |
204 | - |
205 | - @property |
206 | - def median(self): |
207 | - """Return the median.""" |
208 | - # Find the 'weighted' median by assigning a weight to each |
209 | - # element proportional to how many rounds of selection it survived. |
210 | - candidates = [] |
211 | - total_weight = 0 |
212 | - for i, bucket in enumerate(self.buckets): |
213 | - weight = self.bucket_size ** i |
214 | - for x in bucket: |
215 | - total_weight += weight |
216 | - candidates.append([x, weight]) |
217 | - if len(candidates) == 0: |
218 | - return 0 |
219 | - |
220 | - # Each weight is the equivalent of having the candidates appear |
221 | - # that number of times in the array. |
222 | - # So buckets like [[1, 2], [2, 3], [4, 2]] would be expanded to |
223 | - # [1, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 3, 3, 3, 4, 4, 4, 4, |
224 | - # 4, 4, 4, 4, 4] and we find the median of that list (2). |
225 | - # We don't expand the items to conserve memory. |
226 | - median = (total_weight-1) / 2 |
227 | - weighted_idx = 0 |
228 | - for x, weight in sorted(candidates): |
229 | - weighted_idx += weight |
230 | - if weighted_idx > median: |
231 | - return x |
232 | - |
233 | - def __add__(self, other): |
234 | - """Merge two approximators together. |
235 | - |
236 | - All candidates from the other are merged through the standard |
237 | - algorithm, starting at the same level. So an item that went through |
238 | - two rounds of selection will be compared with other items that have |
239 | - gone through the same number of rounds. |
240 | - """ |
241 | - results = OnlineApproximateMedian(self.bucket_size) |
242 | - results.buckets = copy.deepcopy(self.buckets) |
243 | - for i, bucket in enumerate(other.buckets): |
244 | - for x in bucket: |
245 | - results.update(x, i) |
246 | - return results |
247 | - |
248 | - |
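The median property above never expands the candidates by weight; a sketch (illustration only) of that weighted-median walk, matching the worked expansion in the comments above:

```python
def weighted_median(pairs):
    """Median where each (value, weight) pair stands in for `weight`
    copies of `value`, without materialising the copies."""
    total = sum(weight for _, weight in pairs)
    target = (total - 1) // 2
    seen = 0
    for value, weight in sorted(pairs):
        seen += weight
        if seen > target:
            return value

# With bucket_size 3 the weights are 3**level: the buckets
# [[1, 2], [2, 3], [4, 2]] from the comment above yield these pairs,
# and the median of the 26 expanded values is 2.
pairs = [(1, 1), (2, 1), (2, 3), (3, 3), (4, 9), (2, 9)]
assert weighted_median(pairs) == 2
```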
249 | -class Stats: |
250 | - """Bag to hold and compute request statistics. |
251 | - |
252 | - All times are in seconds. |
253 | - """ |
254 | - total_hits = 0 # Total hits. |
255 | - |
256 | - total_time = 0 # Total time spent rendering. |
257 | - mean = 0 # Mean time per hit. |
258 | - median = 0 # Median time per hit. |
259 | - std = 0 # Standard deviation per hit. |
260 | - histogram = None # Request times histogram. |
261 | - |
262 | - total_sqltime = 0 # Total time spent waiting for SQL to process. |
263 | - mean_sqltime = 0 # Mean time spent waiting for SQL to process. |
264 | - median_sqltime = 0 # Median time spent waiting for SQL to process. |
265 | - std_sqltime = 0 # Standard deviation of SQL time. |
266 | - |
267 | - total_sqlstatements = 0 # Total number of SQL statements issued. |
268 | - mean_sqlstatements = 0 |
269 | - median_sqlstatements = 0 |
270 | - std_sqlstatements = 0 |
271 | - |
272 | - @property |
273 | - def ninetyninth_percentile_time(self): |
274 | - """Time under which 99% of requests are rendered. |
275 | - |
276 | - This is estimated as 3 std deviations from the mean. Given that |
277 | - many URLs or PageIds won't have 100 requests in a daily report, this |
278 | - estimator is more useful than the exact percentile. |
279 | - """ |
280 | - return self.mean + 3*self.std |
281 | - |
282 | - @property |
283 | - def ninetyninth_percentile_sqltime(self): |
284 | - """SQL time under which 99% of requests are rendered. |
285 | - |
286 | - This is estimated as 3 std deviations from the mean. |
287 | - """ |
288 | - return self.mean_sqltime + 3*self.std_sqltime |
289 | - |
290 | - @property |
291 | - def ninetyninth_percentile_sqlstatements(self): |
292 | - """Number of SQL statements under which 99% of requests are rendered. |
293 | - |
294 | - This is estimated as 3 std deviations from the mean. |
295 | - """ |
296 | - return self.mean_sqlstatements + 3*self.std_sqlstatements |
297 | - |
298 | - def text(self): |
299 | - """Return a textual version of the stats.""" |
300 | - return textwrap.dedent(""" |
301 | - <Stats for %d requests: |
302 | - Time: total=%.2f; mean=%.2f; median=%.2f; std=%.2f |
303 | - SQL time: total=%.2f; mean=%.2f; median=%.2f; std=%.2f |
304 | - SQL stmt: total=%.f; mean=%.2f; median=%.f; std=%.2f |
305 | - >""" % ( |
306 | - self.total_hits, self.total_time, self.mean, self.median, |
307 | - self.std, self.total_sqltime, self.mean_sqltime, |
308 | - self.median_sqltime, self.std_sqltime, |
309 | - self.total_sqlstatements, self.mean_sqlstatements, |
310 | - self.median_sqlstatements, self.std_sqlstatements)) |
311 | - |
312 | - |
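A note on the mean + 3*std proxy used by the percentile properties above: if render times were normally distributed it would cover about 99.9% of requests, and even with no distributional assumption Cantelli's inequality bounds the mass above mean + 3*std at 1/(1 + 3**2) = 10%. A sketch with invented numbers:

```python
mean, std = 0.8, 0.4           # seconds, as maintained online below
ninetyninth = mean + 3 * std   # 2.0s: at least ~90% of requests fall
                               # under this whatever the distribution
```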
313 | -class OnlineStats(Stats): |
314 | - """Implementation of stats that can be computed online. |
315 | - |
316 | - You call update() for each request and the stats are updated incrementally |
317 | - with minimum storage space. |
318 | - """ |
319 | - |
320 | - def __init__(self, histogram_width, histogram_resolution): |
321 | - self.time_stats = OnlineStatsCalculator() |
322 | - self.time_median_approximate = OnlineApproximateMedian() |
323 | - self.sql_time_stats = OnlineStatsCalculator() |
324 | - self.sql_time_median_approximate = OnlineApproximateMedian() |
325 | - self.sql_statements_stats = OnlineStatsCalculator() |
326 | - self.sql_statements_median_approximate = OnlineApproximateMedian() |
327 | - self.histogram = Histogram(histogram_width, histogram_resolution) |
328 | - |
329 | - @property |
330 | - def total_hits(self): |
331 | - return self.time_stats.count |
332 | - |
333 | - @property |
334 | - def total_time(self): |
335 | - return self.time_stats.sum |
336 | - |
337 | - @property |
338 | - def mean(self): |
339 | - return self.time_stats.mean |
340 | - |
341 | - @property |
342 | - def median(self): |
343 | - return self.time_median_approximate.median |
344 | - |
345 | - @property |
346 | - def std(self): |
347 | - return self.time_stats.std |
348 | - |
349 | - @property |
350 | - def total_sqltime(self): |
351 | - return self.sql_time_stats.sum |
352 | - |
353 | - @property |
354 | - def mean_sqltime(self): |
355 | - return self.sql_time_stats.mean |
356 | - |
357 | - @property |
358 | - def median_sqltime(self): |
359 | - return self.sql_time_median_approximate.median |
360 | - |
361 | - @property |
362 | - def std_sqltime(self): |
363 | - return self.sql_time_stats.std |
364 | - |
365 | - @property |
366 | - def total_sqlstatements(self): |
367 | - return self.sql_statements_stats.sum |
368 | - |
369 | - @property |
370 | - def mean_sqlstatements(self): |
371 | - return self.sql_statements_stats.mean |
372 | - |
373 | - @property |
374 | - def median_sqlstatements(self): |
375 | - return self.sql_statements_median_approximate.median |
376 | - |
377 | - @property |
378 | - def std_sqlstatements(self): |
379 | - return self.sql_statements_stats.std |
380 | - |
381 | - def update(self, request): |
382 | - """Update the stats based on request.""" |
383 | - self.time_stats.update(request.app_seconds) |
384 | - self.time_median_approximate.update(request.app_seconds) |
385 | - self.sql_time_stats.update(request.sql_seconds) |
386 | - self.sql_time_median_approximate.update(request.sql_seconds) |
387 | - self.sql_statements_stats.update(request.sql_statements) |
388 | - self.sql_statements_median_approximate.update(request.sql_statements) |
389 | - self.histogram.update(request.app_seconds) |
390 | - |
391 | - def __add__(self, other): |
392 | - """Merge another OnlineStats with this one.""" |
393 | - results = copy.deepcopy(self) |
394 | - results.time_stats += other.time_stats |
395 | - results.time_median_approximate += other.time_median_approximate |
396 | - results.sql_time_stats += other.sql_time_stats |
397 | - results.sql_time_median_approximate += ( |
398 | - other.sql_time_median_approximate) |
399 | - results.sql_statements_stats += other.sql_statements_stats |
400 | - results.sql_statements_median_approximate += ( |
401 | - other.sql_statements_median_approximate) |
402 | - results.histogram = self.histogram + other.histogram |
403 | - return results |
404 | - |
405 | - |
406 | -class Histogram: |
407 | - """A simple object to compute the histogram of a value.""" |
408 | - |
409 | - @staticmethod |
410 | - def from_bins_data(data): |
411 | - """Create a histogram from existing bins data.""" |
412 | - assert data[0][0] == 0, "First bin should start at zero." |
413 | - |
414 | - hist = Histogram(len(data), data[1][0]) |
415 | - for idx, bin in enumerate(data): |
416 | - hist.count += bin[1] |
417 | - hist.bins[idx][1] = bin[1] |
418 | - |
419 | - return hist |
420 | - |
421 | - def __init__(self, bins_count, bins_size): |
422 | - """Create a new histogram. |
423 | - |
424 | - The histogram will count the frequency of values in bins_count bins |
425 | - of bins_size each. |
426 | - """ |
427 | - self.count = 0 |
428 | - self.bins_count = bins_count |
429 | - self.bins_size = bins_size |
430 | - self.bins = [] |
431 | - for x in range(bins_count): |
432 | - self.bins.append([x*bins_size, 0]) |
433 | - |
434 | - @property |
435 | - def bins_relative(self): |
436 | - """Return the bins with the frequency expressed as a ratio.""" |
437 | - return [[x, float(f)/self.count] for x, f in self.bins] |
438 | - |
439 | - def update(self, value): |
440 | - """Update the histogram for this value. |
441 | - |
442 | - All values higher than the last bin minimum are counted in that last |
443 | - bin. |
444 | - """ |
445 | - self.count += 1 |
446 | - idx = int(min(self.bins_count-1, value / self.bins_size)) |
447 | - self.bins[idx][1] += 1 |
448 | - |
449 | - def __repr__(self): |
450 | - """A string representation of this histogram.""" |
451 | - return "<Histogram %s>" % self.bins |
452 | - |
453 | - def __eq__(self, other): |
454 | - """Two histograms are equal if they have the same bin contents.""" |
455 | - if not isinstance(other, Histogram): |
456 | - return False |
457 | - |
458 | - if self.bins_count != other.bins_count: |
459 | - return False |
460 | - |
461 | - if self.bins_size != other.bins_size: |
462 | - return False |
463 | - |
464 | - for idx, other_bin in enumerate(other.bins): |
465 | - if self.bins[idx][1] != other_bin[1]: |
466 | - return False |
467 | - |
468 | - return True |
469 | - |
470 | - def __add__(self, other): |
471 | - """Add the frequency of the other histogram to this one. |
472 | - |
473 | - The resulting histogram has the same bins_size as this one. |
474 | - If the other one has a bigger bins_size, we'll assume an even |
475 | - distribution and distribute the frequency across the smaller bins. If |
476 | - it has a lower bins_size, we'll aggregate its bins into the larger |
477 | - ones. We only support different bins_size if the ratio can be |
478 | - expressed as the ratio between 1 and an integer. |
479 | - |
480 | - The resulting histogram is as wide as the widest one. |
481 | - """ |
482 | - ratio = float(other.bins_size) / self.bins_size |
483 | - bins_count = max(self.bins_count, math.ceil(other.bins_count * ratio)) |
484 | - total = Histogram(int(bins_count), self.bins_size) |
485 | - total.count = self.count + other.count |
486 | - |
487 | - # Copy our bins into the total |
488 | - for idx, bin in enumerate(self.bins): |
489 | - total.bins[idx][1] = bin[1] |
490 | - |
491 | - assert int(ratio) == ratio or int(1/ratio) == 1/ratio, ( |
492 | - "We only support different bins_size values when the ratio " |
493 | - "is an integer to 1: %s" |
494 | - % ratio) |
495 | - |
496 | - if ratio >= 1: |
497 | - # We distribute the frequency across the bins. |
498 | - # For example, if the ratio is 3:1, we'll add a third |
499 | - # of the lower resolution bin to 3 of the higher one. |
500 | - for other_idx, bin in enumerate(other.bins): |
501 | - f = bin[1] / ratio |
502 | - start = int(math.floor(other_idx * ratio)) |
503 | - end = int(start + ratio) |
504 | - for idx in range(start, end): |
505 | - total.bins[idx][1] += f |
506 | - else: |
507 | - # We need to collect the higher resolution bins into the |
508 | - # corresponding lower one. |
509 | - for other_idx, bin in enumerate(other.bins): |
510 | - idx = int(other_idx * ratio) |
511 | - total.bins[idx][1] += bin[1] |
512 | - |
513 | - return total |
514 | - |
515 | - |
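The ratio handling in __add__ above either spreads a coarse bin's count evenly over the finer bins it covers, or collapses fine bins into the matching coarse one. A worked sketch (values invented) of the 2:1 spread case:

```python
# Merging 1.0s-wide bins into 0.5s-wide bins (ratio 2): each coarse
# count is split evenly across the two finer bins it spans.
coarse = [[0.0, 4], [1.0, 6]]                    # bins_size = 1.0
fine = [[0.0, 0], [0.5, 0], [1.0, 0], [1.5, 0]]  # bins_size = 0.5
ratio = 2
for idx, (_, count) in enumerate(coarse):
    share = count / ratio
    for j in range(idx * ratio, (idx + 1) * ratio):
        fine[j][1] += share
assert [f for _, f in fine] == [2.0, 2.0, 3.0, 3.0]
```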
516 | -class RequestTimes: |
517 | - """Collect statistics from requests. |
518 | - |
519 | - Statistics are updated by calling the add_request() method. |
520 | - |
521 | - Statistics for mean/stddev/total/median for request times, SQL times and |
522 | - number of SQL statements are collected. |
523 | - |
524 | - They are grouped by Category, URL or PageID. |
525 | - """ |
526 | - |
527 | - def __init__(self, categories, options): |
528 | - self.by_pageids = options.pageids |
529 | - self.top_urls = options.top_urls |
530 | - # We only keep in memory 50 times the number of URLs we want to |
531 | - # return. The number of URLs can go pretty high (because of the |
532 | - # distinct query parameters). |
533 | - # |
534 | - # Keeping all in memory at once is prohibitive. On a small but |
535 | - # representative sample, keeping 50 times the possible number of |
536 | - # candidates and culling to 90% on overflow generated a report |
537 | - # identical to keeping all the candidates in memory. |
538 | - # |
539 | - # Keeping 10 times or culling at 90% generated a near-identical report |
540 | - # (it differed a little in the tail.) |
541 | - # |
542 | - # The size/cull parameters might need to change if the request |
543 | - # distribution becomes very different from what it currently is. |
544 | - self.top_urls_cache_size = self.top_urls * 50 |
545 | - |
546 | - # The histogram has one bin per resolution step up to our timeout |
547 | - # (and an extra bin). |
548 | - self.histogram_resolution = float(options.resolution) |
549 | - self.histogram_width = int( |
550 | - options.timeout / self.histogram_resolution) + 1 |
551 | - self.category_times = [ |
552 | - (category, OnlineStats( |
553 | - self.histogram_width, self.histogram_resolution)) |
554 | - for category in categories] |
555 | - self.url_times = {} |
556 | - self.pageid_times = {} |
557 | - |
558 | - def add_request(self, request): |
559 | - """Add request to the set of requests we collect stats for.""" |
560 | - matched = [] |
561 | - for category, stats in self.category_times: |
562 | - if category.match(request): |
563 | - stats.update(request) |
564 | - if category.partition: |
565 | - matched.append(category.title) |
566 | - |
567 | - if len(matched) > 1: |
568 | - log.warning( |
569 | - "Multiple partition categories matched by %s (%s)", |
570 | - request.url, ", ".join(matched)) |
571 | - elif not matched: |
572 | - log.warning("%s isn't part of the partition", request.url) |
573 | - |
574 | - if self.by_pageids: |
575 | - pageid = request.pageid or 'Unknown' |
576 | - stats = self.pageid_times.setdefault( |
577 | - pageid, OnlineStats( |
578 | - self.histogram_width, self.histogram_resolution)) |
579 | - stats.update(request) |
580 | - |
581 | - if self.top_urls: |
582 | - stats = self.url_times.setdefault( |
583 | - request.url, OnlineStats( |
584 | - self.histogram_width, self.histogram_resolution)) |
585 | - stats.update(request) |
586 | - # Whenever we have more URLs than we need, discard the 10% |
587 | - # least likely to end up in the top. |
588 | - if len(self.url_times) > self.top_urls_cache_size: |
589 | - cutoff = int(self.top_urls_cache_size*0.90) |
590 | - self.url_times = dict( |
591 | - sorted(self.url_times.items(), |
592 | - key=lambda (url, stats): stats.total_time, |
593 | - reverse=True)[:cutoff]) |
594 | - |
595 | - def get_category_times(self): |
596 | - """Return the times for each category.""" |
597 | - return self.category_times |
598 | - |
599 | - def get_top_urls_times(self): |
600 | - """Return the times for the top URLs by total time.""" |
601 | - # Sort the result by total time |
602 | - return sorted( |
603 | - self.url_times.items(), |
604 | - key=lambda (url, stats): stats.total_time, |
605 | - reverse=True)[:self.top_urls] |
606 | - |
607 | - def get_pageid_times(self): |
608 | - """Return the times for the pageids.""" |
609 | - # Sort the result by pageid |
610 | - return sorted(self.pageid_times.items()) |
611 | - |
612 | - def __add__(self, other): |
613 | - """Merge two RequestTimes together.""" |
614 | - results = copy.deepcopy(self) |
615 | - for other_category, other_stats in other.category_times: |
616 | - for i, (category, stats) in enumerate(self.category_times): |
617 | - if category.title == other_category.title: |
618 | - results.category_times[i] = ( |
619 | - category, stats + other_stats) |
620 | - break |
621 | - else: |
622 | - results.category_times.append( |
623 | - (other_category, copy.deepcopy(other_stats))) |
624 | - |
625 | - url_times = results.url_times |
626 | - for url, stats in other.url_times.items(): |
627 | - if url in url_times: |
628 | - url_times[url] += stats |
629 | - else: |
630 | - url_times[url] = copy.deepcopy(stats) |
631 | - # Only keep top_urls_cache_size entries. |
632 | - if len(self.url_times) > self.top_urls_cache_size: |
633 | - self.url_times = dict( |
634 | - sorted( |
635 | - url_times.items(), |
636 | - key=lambda (url, stats): stats.total_time, |
637 | - reverse=True)[:self.top_urls_cache_size]) |
638 | - |
639 | - pageid_times = results.pageid_times |
640 | - for pageid, stats in other.pageid_times.items(): |
641 | - if pageid in pageid_times: |
642 | - pageid_times[pageid] += stats |
643 | - else: |
644 | - pageid_times[pageid] = copy.deepcopy(stats) |
645 | - |
646 | - return results |
647 | - |
648 | - |
649 | -def main(): |
650 | - parser = LPOptionParser("%prog [args] tracelog [...]") |
651 | - |
652 | - parser.add_option( |
653 | - "-c", "--config", dest="config", |
654 | - default=os.path.join( |
655 | - config.root, "utilities", "page-performance-report.ini"), |
656 | - metavar="FILE", help="Load configuration from FILE") |
657 | - parser.add_option( |
658 | - "--from", dest="from_ts", type="datetime", |
659 | - default=None, metavar="TIMESTAMP", |
660 | - help="Ignore log entries before TIMESTAMP") |
661 | - parser.add_option( |
662 | - "--until", dest="until_ts", type="datetime", |
663 | - default=None, metavar="TIMESTAMP", |
664 | - help="Ignore log entries after TIMESTAMP") |
665 | - parser.add_option( |
666 | - "--no-partition", dest="partition", |
667 | - action="store_false", default=True, |
668 | - help="Do not produce partition report") |
669 | - parser.add_option( |
670 | - "--no-categories", dest="categories", |
671 | - action="store_false", default=True, |
672 | - help="Do not produce categories report") |
673 | - parser.add_option( |
674 | - "--no-pageids", dest="pageids", |
675 | - action="store_false", default=True, |
676 | - help="Do not produce pageids report") |
677 | - parser.add_option( |
678 | - "--top-urls", dest="top_urls", type=int, metavar="N", |
679 | - default=50, help="Generate report for top N URLs by total time.") |
680 | - parser.add_option( |
681 | - "--directory", dest="directory", |
682 | - default=os.getcwd(), metavar="DIR", |
683 | - help="Output reports in DIR directory") |
684 | - parser.add_option( |
685 | - "--timeout", dest="timeout", |
686 | - # Default to 9: our production timeout. |
687 | - default=9, type="int", metavar="SECONDS", |
688 | - help="The configured timeout value: used to determine high risk " + |
689 | - "page ids, i.e. pages whose 99%-under render time is " |
690 | - "greater than timeout - 2s. Default is %default.") |
691 | - parser.add_option( |
692 | - "--histogram-resolution", dest="resolution", |
693 | - # Default to 0.5s |
694 | - default=0.5, type="float", metavar="SECONDS", |
695 | - help="The resolution of the histogram bin width. Default is " |
696 | - "%default.") |
697 | - parser.add_option( |
698 | - "--merge", dest="merge", |
699 | - default=False, action='store_true', |
700 | - help="Files are interpreted as pickled stats and are aggregated " + |
701 | - "for the report.") |
702 | - |
703 | - options, args = parser.parse_args() |
704 | - |
705 | - if not os.path.isdir(options.directory): |
706 | - parser.error("Directory %s does not exist" % options.directory) |
707 | - |
708 | - if len(args) == 0: |
709 | - parser.error("At least one zserver tracelog file must be provided") |
710 | - |
711 | - if options.from_ts is not None and options.until_ts is not None: |
712 | - if options.from_ts > options.until_ts: |
713 | - parser.error( |
714 | - "--from timestamp %s is after --until timestamp %s" |
715 | - % (options.from_ts, options.until_ts)) |
716 | - if options.from_ts is not None or options.until_ts is not None: |
717 | - if options.merge: |
718 | - parser.error('--from and --until cannot be used with --merge') |
719 | - |
720 | - for filename in args: |
721 | - if not os.path.exists(filename): |
722 | - parser.error("Tracelog file %s not found." % filename) |
723 | - |
724 | - if not os.path.exists(options.config): |
725 | - parser.error("Config file %s not found." % options.config) |
726 | - |
727 | - # Need a better config mechanism as ConfigParser doesn't preserve order. |
728 | - script_config = RawConfigParser() |
729 | - script_config.optionxform = str # Make keys case sensitive. |
730 | - script_config.readfp(open(options.config)) |
731 | - |
732 | - categories = [] # A list of Category, in report order. |
733 | - for option in script_config.options('categories'): |
734 | - regexp = script_config.get('categories', option) |
735 | - try: |
736 | - categories.append(Category(option, regexp)) |
737 | - except sre_constants.error as x: |
738 | - log.fatal("Unable to compile regexp %r (%s)" % (regexp, x)) |
739 | - return 1 |
740 | - categories.sort() |
741 | - |
742 | - if len(categories) == 0: |
743 | - parser.error("No data in [categories] section of configuration.") |
744 | - |
745 | - # Determine the categories making a partition of the requests |
746 | - for option in script_config.options('partition'): |
747 | - for category in categories: |
748 | - if category.title == option: |
749 | - category.partition = True |
750 | - break |
751 | - else: |
752 | - log.warning( |
753 | - "In partition definition: %s isn't a defined category", |
754 | - option) |
755 | - |
756 | - times = RequestTimes(categories, options) |
757 | - |
758 | - if options.merge: |
759 | - for filename in args: |
760 | - log.info('Merging %s...' % filename) |
761 | - f = bz2.BZ2File(filename, 'r') |
762 | - times += cPickle.load(f) |
763 | - f.close() |
764 | - else: |
765 | - parse(args, times, options) |
766 | - |
767 | - category_times = times.get_category_times() |
768 | - |
769 | - pageid_times = [] |
770 | - url_times = [] |
771 | - if options.top_urls: |
772 | - url_times = times.get_top_urls_times() |
773 | - if options.pageids: |
774 | - pageid_times = times.get_pageid_times() |
775 | - |
776 | - def _report_filename(filename): |
777 | - return os.path.join(options.directory, filename) |
778 | - |
779 | - # Partition report |
780 | - if options.partition: |
781 | - report_filename = _report_filename('partition.html') |
782 | - log.info("Generating %s", report_filename) |
783 | - partition_times = [ |
784 | - category_time |
785 | - for category_time in category_times |
786 | - if category_time[0].partition] |
787 | - html_report( |
788 | - open(report_filename, 'w'), partition_times, None, None, |
789 | - histogram_resolution=options.resolution, |
790 | - category_name='Partition') |
791 | - |
792 | - # Category only report. |
793 | - if options.categories: |
794 | - report_filename = _report_filename('categories.html') |
795 | - log.info("Generating %s", report_filename) |
796 | - html_report( |
797 | - open(report_filename, 'w'), category_times, None, None, |
798 | - histogram_resolution=options.resolution) |
799 | - |
800 | - # Pageid only report. |
801 | - if options.pageids: |
802 | - report_filename = _report_filename('pageids.html') |
803 | - log.info("Generating %s", report_filename) |
804 | - html_report( |
805 | - open(report_filename, 'w'), None, pageid_times, None, |
806 | - histogram_resolution=options.resolution) |
807 | - |
808 | - # Top URL only report. |
809 | - if options.top_urls: |
810 | - report_filename = _report_filename('top%d.html' % options.top_urls) |
811 | - log.info("Generating %s", report_filename) |
812 | - html_report( |
813 | - open(report_filename, 'w'), None, None, url_times, |
814 | - histogram_resolution=options.resolution) |
815 | - |
816 | - # Combined report. |
817 | - if options.categories and options.pageids: |
818 | - report_filename = _report_filename('combined.html') |
819 | - html_report( |
820 | - open(report_filename, 'w'), |
821 | - category_times, pageid_times, url_times, |
822 | - histogram_resolution=options.resolution) |
823 | - |
824 | - # Report of likely timeout candidates |
825 | - report_filename = _report_filename('timeout-candidates.html') |
826 | - log.info("Generating %s", report_filename) |
827 | - html_report( |
828 | - open(report_filename, 'w'), None, pageid_times, None, |
829 | - options.timeout - 2, |
830 | - histogram_resolution=options.resolution) |
831 | - |
832 | - # Save the times cache for later merging. |
833 | - report_filename = _report_filename('stats.pck.bz2') |
834 | - log.info("Saving times database in %s", report_filename) |
835 | - stats_file = bz2.BZ2File(report_filename, 'w') |
836 | - cPickle.dump(times, stats_file, protocol=cPickle.HIGHEST_PROTOCOL) |
837 | - stats_file.close() |
838 | - |
839 | - # Output metrics for selected categories. |
840 | - report_filename = _report_filename('metrics.dat') |
841 | - log.info('Saving category_metrics %s', report_filename) |
842 | - metrics_file = open(report_filename, 'w') |
843 | - writer = csv.writer(metrics_file, delimiter=':') |
844 | - date = options.until_ts or options.from_ts or datetime.utcnow() |
845 | - date = time.mktime(date.timetuple()) |
846 | - |
847 | - for option in script_config.options('metrics'): |
848 | - name = script_config.get('metrics', option) |
849 | - for category, stats in category_times: |
850 | - if category.title == name: |
851 | - writer.writerows([ |
852 | - ("%s_99" % option, "%f@%d" % ( |
853 | - stats.ninetyninth_percentile_time, date)), |
854 | - ("%s_hits" % option, "%d@%d" % (stats.total_hits, date))]) |
855 | - break |
856 | - else: |
857 | - log.warning("Can't find category %s for metric %s" % ( |
858 | - name, option)) |
859 | - metrics_file.close() |
860 | - |
861 | - return 0 |
862 | - |
863 | - |
864 | -def smart_open(filename, mode='r'): |
865 | - """Open a file, transparently handling compressed files. |
866 | - |
867 | - Compressed files are detected by file extension. |
868 | - """ |
869 | - ext = os.path.splitext(filename)[1] |
870 | - if ext == '.bz2': |
871 | - return bz2.BZ2File(filename, 'r') |
872 | - elif ext == '.gz': |
873 | - return gzip.GzipFile(filename, 'r') |
874 | - else: |
875 | - return open(filename, mode) |
876 | - |
877 | - |
878 | -class MalformedLine(Exception): |
879 | - """A malformed line was found in the trace log.""" |
880 | - |
881 | - |
882 | -_ts_re = re.compile( |
883 | - '^(\d{4})-(\d\d)-(\d\d)\s(\d\d):(\d\d):(\d\d)(?:\.(\d{6}))?$') |
884 | - |
885 | - |
886 | -def parse_timestamp(ts_string): |
887 | - match = _ts_re.search(ts_string) |
888 | - if match is None: |
889 | - raise ValueError("Invalid timestamp") |
890 | - return datetime( |
891 | - *(int(elem) for elem in match.groups() if elem is not None)) |
892 | - |
893 | - |
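For illustration, the two timestamp shapes the regexp above accepts, with and without the six-digit fractional part (using parse_timestamp as defined above):

```python
from datetime import datetime

assert parse_timestamp('2012-08-09 13:45:05.123456') == datetime(
    2012, 8, 9, 13, 45, 5, 123456)
assert parse_timestamp('2012-08-09 13:45:05') == datetime(
    2012, 8, 9, 13, 45, 5)
```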
894 | -def parse(tracefiles, times, options): |
895 | - requests = {} |
896 | - total_requests = 0 |
897 | - for tracefile in tracefiles: |
898 | - log.info('Processing %s', tracefile) |
899 | - for line in smart_open(tracefile): |
900 | - line = line.rstrip() |
901 | - try: |
902 | - record = line.split(' ', 7) |
903 | - try: |
904 | - record_type, request_id, date, time_ = record[:4] |
905 | - except ValueError: |
906 | - raise MalformedLine() |
907 | - |
908 | - if record_type == 'S': |
909 | - # Short circuit - we don't care about these entries. |
910 | - continue |
911 | - |
912 | - # Parse the timestamp. |
913 | - ts_string = '%s %s' % (date, time_) |
914 | - try: |
915 | - dt = parse_timestamp(ts_string) |
916 | - except ValueError: |
917 | - raise MalformedLine( |
918 | - 'Invalid timestamp %s' % repr(ts_string)) |
919 | - |
920 | - # Filter entries by command line date range. |
921 | - if options.from_ts is not None and dt < options.from_ts: |
922 | - continue # Skip to next line. |
923 | - if options.until_ts is not None and dt > options.until_ts: |
924 | - break # Skip to next log file. |
925 | - |
926 | - args = record[4:] |
927 | - |
928 | - def require_args(count): |
929 | - if len(args) < count: |
930 | - raise MalformedLine() |
931 | - |
932 | - if record_type == 'B': # Request begins. |
933 | - require_args(2) |
934 | - requests[request_id] = Request(dt, args[0], args[1]) |
935 | - continue |
936 | - |
937 | - request = requests.get(request_id, None) |
938 | - if request is None: # Just ignore partial records. |
939 | - continue |
940 | - |
941 | - # Old style extension record from Launchpad. Just |
942 | - # contains the URL. |
943 | - if (record_type == '-' and len(args) == 1 |
944 | - and args[0].startswith('http')): |
945 | - request.url = args[0] |
946 | - |
947 | - # New style extension record with a prefix. |
948 | - elif record_type == '-': |
949 | - # Launchpad outputs several things as tracelog |
950 | - # extension records. We include a prefix to tell |
951 | - # them apart. |
952 | - require_args(1) |
953 | - |
954 | - parse_extension_record(request, args) |
955 | - |
956 | - elif record_type == 'I': # Got request input. |
957 | - require_args(1) |
958 | - request.I(dt, args[0]) |
959 | - |
960 | - elif record_type == 'C': # Entered application thread. |
961 | - request.C(dt) |
962 | - |
963 | - elif record_type == 'A': # Application done. |
964 | - require_args(2) |
965 | - request.A(dt, args[0], args[1]) |
966 | - |
967 | - elif record_type == 'E': # Request done. |
968 | - del requests[request_id] |
969 | - request.E(dt) |
970 | - total_requests += 1 |
971 | - if total_requests % 10000 == 0: |
972 | - log.debug("Parsed %d requests", total_requests) |
973 | - |
974 | - # Add the request to any matching categories. |
975 | - times.add_request(request) |
976 | - else: |
977 | - raise MalformedLine('Unknown record type %s' % record_type) |
978 | - except MalformedLine as x: |
979 | - log.error( |
980 | - "Malformed line %s (%s)" % (repr(line), x)) |
981 | - |
982 | - |
983 | -def parse_extension_record(request, args): |
984 | - """Decode a ZServer extension record and annotate the request.""" |
985 | - prefix = args[0] |
986 | - |
987 | - if prefix == 'u': |
988 | - request.url = ' '.join(args[1:]) or None |
989 | - elif prefix == 'p': |
990 | - request.pageid = ' '.join(args[1:]) or None |
991 | - elif prefix == 't': |
992 | - if len(args) != 4: |
993 | - raise MalformedLine("Wrong number of arguments %s" % (args,)) |
994 | - request.sql_statements = int(args[2]) |
995 | - request.sql_seconds = float(args[3]) / 1000 |
996 | - else: |
997 | - raise MalformedLine( |
998 | - "Unknown extension prefix %s" % prefix) |
999 | - |
1000 | - |
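A sketch of how the extension records above annotate a request; the concrete field values are invented, but the shapes follow the parser: 'u' carries the URL, 'p' the pageid, and 't' a statement count and SQL time in milliseconds.

```python
class FakeReq:
    """Stand-in exposing just the attributes the parser sets."""
    url = None
    pageid = None
    sql_statements = None
    sql_seconds = None

req = FakeReq()
parse_extension_record(req, ['u', 'https://launchpad.net/bugs/1'])
parse_extension_record(req, ['p', '+bug'])
parse_extension_record(req, ['t', '0', '56', '3000'])
assert req.url == 'https://launchpad.net/bugs/1'
assert req.pageid == '+bug'
assert req.sql_statements == 56 and req.sql_seconds == 3.0
```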
1001 | -def html_report( |
1002 | - outf, category_times, pageid_times, url_times, |
1003 | - ninetyninth_percentile_threshold=None, histogram_resolution=0.5, |
1004 | - category_name='Category'): |
1005 | - """Write an html report to outf. |
1006 | - |
1007 | - :param outf: A file object to write the report to. |
1008 | - :param category_times: The time statistics for categories. |
1009 | - :param pageid_times: The time statistics for pageids. |
1010 | - :param url_times: The time statistics for the top N URLs. |
1011 | - :param ninetyninth_percentile_threshold: Lower threshold for inclusion of |
1012 | - pages in the pageid section; pages where 99 percent of the requests are |
1013 | - served under this threshold will not be included. |
1014 | - :param histogram_resolution: used as the histogram bar width |
1015 | - :param category_name: The name to use for category report. Defaults to |
1016 | - 'Category'. |
1017 | - """ |
1018 | - |
1019 | - print >> outf, dedent('''\ |
1020 | - <!DOCTYPE html> |
1021 | - <html> |
1022 | - <head> |
1023 | - <meta http-equiv="Content-Type" content="text/html; charset=utf-8"> |
1024 | - <title>Launchpad Page Performance Report %(date)s</title> |
1025 | - <script language="javascript" type="text/javascript" |
1026 | - src="https://devpad.canonical.com/~lpqateam/ppr/js/flot/jquery.min.js" |
1027 | - ></script> |
1028 | - <script language="javascript" type="text/javascript" |
1029 | - src="https://devpad.canonical.com/~lpqateam/ppr/js/jquery.appear-1.1.1.min.js" |
1030 | - ></script> |
1031 | - <script language="javascript" type="text/javascript" |
1032 | - src="https://devpad.canonical.com/~lpqateam/ppr/js/flot/jquery.flot.min.js" |
1033 | - ></script> |
1034 | - <script language="javascript" type="text/javascript" |
1035 | - src="https://devpad.canonical.com/~lpqateam/ppr/js/sorttable.js"></script> |
1036 | - <style type="text/css"> |
1037 | - h3 { font-weight: normal; font-size: 1em; } |
1038 | - thead th { padding-left: 1em; padding-right: 1em; } |
1039 | - .category-title { text-align: right; padding-right: 2em; |
1040 | - max-width: 25em; } |
1041 | - .regexp { font-size: x-small; font-weight: normal; } |
1042 | - .mean { text-align: right; padding-right: 1em; } |
1043 | - .median { text-align: right; padding-right: 1em; } |
1044 | - .standard-deviation { text-align: right; padding-right: 1em; } |
1045 | - .histogram { padding: 0.5em 1em; width:400px; height:250px; } |
1046 | - .odd-row { background-color: #eeeeff; } |
1047 | - .even-row { background-color: #ffffee; } |
1048 | - table.sortable thead { |
1049 | - background-color:#eee; |
1050 | - color:#666666; |
1051 | - font-weight: bold; |
1052 | - cursor: default; |
1053 | - } |
1054 | - td.numeric { |
1055 | - font-family: monospace; |
1056 | - text-align: right; |
1057 | - padding: 1em; |
1058 | - } |
1059 | - .clickable { cursor: hand; } |
1060 | - .total-hits, .histogram, .median-sqltime, |
1061 | - .median-sqlstatements { border-right: 1px dashed #000000; } |
1062 | - </style> |
1063 | - </head> |
1064 | - <body> |
1065 | - <h1>Launchpad Page Performance Report</h1> |
1066 | - <h3>%(date)s</h3> |
1067 | - ''' % {'date': time.ctime()}) |
1068 | - |
1069 | - table_header = dedent('''\ |
1070 | - <table class="sortable page-performance-report"> |
1071 | - <caption align="top">Click on column headings to sort.</caption> |
1072 | - <thead> |
1073 | - <tr> |
1074 | - <th class="clickable">Name</th> |
1075 | - |
1076 | - <th class="clickable">Total Hits</th> |
1077 | - |
1078 | - <th class="clickable">99% Under Time (secs)</th> |
1079 | - |
1080 | - <th class="clickable">Mean Time (secs)</th> |
1081 | - <th class="clickable">Time Standard Deviation</th> |
1082 | - <th class="clickable">Median Time (secs)</th> |
1083 | - <th class="sorttable_nosort">Time Distribution</th> |
1084 | - |
1085 | - <th class="clickable">99% Under SQL Time (secs)</th> |
1086 | - <th class="clickable">Mean SQL Time (secs)</th> |
1087 | - <th class="clickable">SQL Time Standard Deviation</th> |
1088 | - <th class="clickable">Median SQL Time (secs)</th> |
1089 | - |
1090 | - <th class="clickable">99% Under SQL Statements</th> |
1091 | - <th class="clickable">Mean SQL Statements</th> |
1092 | - <th class="clickable">SQL Statement Standard Deviation</th> |
1093 | - <th class="clickable">Median SQL Statements</th> |
1094 | - |
1095 | - <th class="clickable">Hits * 99% Under SQL Statement</th> |
1096 | - </tr> |
1097 | - </thead> |
1098 | - <tbody> |
1099 | - ''') |
1100 | - table_footer = "</tbody></table>" |
1101 | - |
1102 | - # Store our generated histograms to output Javascript later. |
1103 | - histograms = [] |
1104 | - |
1105 | - def handle_times(html_title, stats): |
1106 | - histograms.append(stats.histogram) |
1107 | - print >> outf, dedent("""\ |
1108 | - <tr> |
1109 | - <th class="category-title">%s</th> |
1110 | - <td class="numeric total-hits">%d</td> |
1111 | - <td class="numeric 99pc-under-time">%.2f</td> |
1112 | - <td class="numeric mean-time">%.2f</td> |
1113 | - <td class="numeric std-time">%.2f</td> |
1114 | - <td class="numeric median-time">%.2f</td> |
1115 | - <td> |
1116 | - <div class="histogram" id="histogram%d"></div> |
1117 | - </td> |
1118 | - <td class="numeric 99pc-under-sqltime">%.2f</td> |
1119 | - <td class="numeric mean-sqltime">%.2f</td> |
1120 | - <td class="numeric std-sqltime">%.2f</td> |
1121 | - <td class="numeric median-sqltime">%.2f</td> |
1122 | - |
1123 | - <td class="numeric 99pc-under-sqlstatement">%.f</td> |
1124 | - <td class="numeric mean-sqlstatements">%.2f</td> |
1125 | - <td class="numeric std-sqlstatements">%.2f</td> |
1126 | - <td class="numeric median-sqlstatements">%.2f</td> |
1127 | - |
1128 | - <td class="numeric high-db-usage">%.f</td> |
1129 | - </tr> |
1130 | - """ % ( |
1131 | - html_title, |
1132 | - stats.total_hits, stats.ninetyninth_percentile_time, |
1133 | - stats.mean, stats.std, stats.median, |
1134 | - len(histograms) - 1, |
1135 | - stats.ninetyninth_percentile_sqltime, stats.mean_sqltime, |
1136 | - stats.std_sqltime, stats.median_sqltime, |
1137 | - stats.ninetyninth_percentile_sqlstatements, |
1138 | - stats.mean_sqlstatements, |
1139 | - stats.std_sqlstatements, stats.median_sqlstatements, |
1140 | - stats.ninetyninth_percentile_sqlstatements * stats.total_hits, |
1141 | - )) |
1142 | - |
1143 | - # Table of contents |
1144 | - print >> outf, '<ol>' |
1145 | - if category_times: |
1146 | - print >> outf, '<li><a href="#catrep">%s Report</a></li>' % ( |
1147 | - category_name) |
1148 | - if pageid_times: |
1149 | - print >> outf, '<li><a href="#pageidrep">Pageid Report</a></li>' |
1150 | - if url_times: |
1151 | - print >> outf, '<li><a href="#topurlrep">Top URL Report</a></li>' |
1152 | - print >> outf, '</ol>' |
1153 | - |
1154 | - if category_times: |
1155 | - print >> outf, '<h2 id="catrep">%s Report</h2>' % ( |
1156 | - category_name) |
1157 | - print >> outf, table_header |
1158 | - for category, times in category_times: |
1159 | - html_title = '%s<br/><span class="regexp">%s</span>' % ( |
1160 | - html_quote(category.title), html_quote(category.regexp)) |
1161 | - handle_times(html_title, times) |
1162 | - print >> outf, table_footer |
1163 | - |
1164 | - if pageid_times: |
1165 | - print >> outf, '<h2 id="pageidrep">Pageid Report</h2>' |
1166 | - print >> outf, table_header |
1167 | - for pageid, times in pageid_times: |
1168 | - if (ninetyninth_percentile_threshold is not None and |
1169 | - (times.ninetyninth_percentile_time < |
1170 | - ninetyninth_percentile_threshold)): |
1171 | - continue |
1172 | - handle_times(html_quote(pageid), times) |
1173 | - print >> outf, table_footer |
1174 | - |
1175 | - if url_times: |
1176 | - print >> outf, '<h2 id="topurlrep">Top URL Report</h2>' |
1177 | - print >> outf, table_header |
1178 | - for url, times in url_times: |
1179 | - handle_times(html_quote(url), times) |
1180 | - print >> outf, table_footer |
1181 | - |
1182 | - # Output the JavaScript to render our histograms nicely, replacing |
1183 | - # the placeholder <div> tags output earlier. |
1184 | - print >> outf, dedent("""\ |
1185 | - <script language="javascript" type="text/javascript"> |
1186 | - $(function () { |
1187 | - var options = { |
1188 | - series: { |
1189 | - bars: {show: true, barWidth: %s} |
1190 | - }, |
1191 | - xaxis: { |
1192 | - tickFormatter: function (val, axis) { |
1193 | - return val.toFixed(axis.tickDecimals) + "s"; |
1194 | - } |
1195 | - }, |
1196 | - yaxis: { |
1197 | - min: 0, |
1198 | - max: 1, |
1199 | - transform: function (v) { |
1200 | - return Math.pow(Math.log(v*100+1)/Math.LN2, 0.5); |
1201 | - }, |
1202 | - inverseTransform: function (v) { |
1203 | - return (Math.pow(2, v*v) - 1) / 100; |
1204 | - }, |
1205 | - tickDecimals: 1, |
1206 | - tickFormatter: function (val, axis) { |
1207 | - return (val * 100).toFixed(axis.tickDecimals) + "%%"; |
1208 | - }, |
1209 | - ticks: [0.001,0.01,0.10,0.50,1.0] |
1210 | - }, |
1211 | - grid: { |
1212 | - aboveData: true, |
1213 | - labelMargin: 15 |
1214 | - } |
1215 | - }; |
1216 | - """ % histogram_resolution) |
1217 | - |
1218 | - for i, histogram in enumerate(histograms): |
1219 | - if histogram.count == 0: |
1220 | - continue |
1221 | - print >> outf, dedent("""\ |
1222 | - function plot_histogram_%(id)d() { |
1223 | - var d = %(data)s; |
1224 | - |
1225 | - $.plot( |
1226 | - $("#histogram%(id)d"), |
1227 | - [{data: d}], options); |
1228 | - } |
1229 | - $('#histogram%(id)d').appear(function() { |
1230 | - plot_histogram_%(id)d(); |
1231 | - }); |
1232 | - |
1233 | - """ % {'id': i, 'data': json.dumps(histogram.bins_relative)}) |
1234 | - |
1235 | - print >> outf, dedent("""\ |
1236 | - }); |
1237 | - </script> |
1238 | - </body> |
1239 | - </html> |
1240 | - """) |
1241 | |
1242 | === removed file 'lib/lp/scripts/utilities/tests/test_pageperformancereport.py' |
1243 | --- lib/lp/scripts/utilities/tests/test_pageperformancereport.py 2011-08-12 11:37:08 +0000 |
1244 | +++ lib/lp/scripts/utilities/tests/test_pageperformancereport.py 1970-01-01 00:00:00 +0000 |
1245 | @@ -1,483 +0,0 @@ |
1246 | -# Copyright 2010 Canonical Ltd. This software is licensed under the |
1247 | -# GNU Affero General Public License version 3 (see the file LICENSE). |
1248 | - |
1249 | -"""Test the pageperformancereport script.""" |
1250 | - |
1251 | -__metaclass__ = type |
1252 | - |
1253 | -from lp.scripts.utilities.pageperformancereport import ( |
1254 | - Category, |
1255 | - Histogram, |
1256 | - OnlineApproximateMedian, |
1257 | - OnlineStats, |
1258 | - OnlineStatsCalculator, |
1259 | - RequestTimes, |
1260 | - Stats, |
1261 | - ) |
1262 | -from lp.testing import TestCase |
1263 | - |
1264 | - |
1265 | -class FakeOptions: |
1266 | - timeout = 5 |
1267 | - db_file = None |
1268 | - pageids = True |
1269 | - top_urls = 3 |
1270 | - resolution = 1 |
1271 | - |
1272 | - def __init__(self, **kwargs): |
1273 | - """Assign all arguments as attributes.""" |
1274 | - self.__dict__.update(kwargs) |
1275 | - |
1276 | - |
1277 | -class FakeRequest: |
1278 | - |
1279 | - def __init__(self, url, app_seconds, sql_statements=None, |
1280 | - sql_seconds=None, pageid=None): |
1281 | - self.url = url |
1282 | - self.pageid = pageid |
1283 | - self.app_seconds = app_seconds |
1284 | - self.sql_statements = sql_statements |
1285 | - self.sql_seconds = sql_seconds |
1286 | - |
1287 | - |
1288 | -class FakeStats(Stats): |
1289 | - |
1290 | - def __init__(self, **kwargs): |
1291 | - # Override the constructor to just store the values. |
1292 | - self.__dict__.update(kwargs) |
1293 | - |
1294 | - |
1295 | -FAKE_REQUESTS = [ |
1296 | - FakeRequest('/', 0.5, pageid='+root'), |
1297 | - FakeRequest('/bugs', 4.5, 56, 3.0, pageid='+bugs'), |
1298 | - FakeRequest('/bugs', 4.2, 56, 2.2, pageid='+bugs'), |
1299 | - FakeRequest('/bugs', 5.5, 76, 4.0, pageid='+bugs'), |
1300 | - FakeRequest('/ubuntu', 2.5, 6, 2.0, pageid='+distribution'), |
1301 | - FakeRequest('/launchpad', 3.5, 3, 3.0, pageid='+project'), |
1302 | - FakeRequest('/bzr', 2.5, 4, 2.0, pageid='+project'), |
1303 | - FakeRequest('/bugs/1', 20.5, 567, 14.0, pageid='+bug'), |
1304 | - FakeRequest('/bugs/1', 15.5, 567, 9.0, pageid='+bug'), |
1305 | - FakeRequest('/bugs/5', 1.5, 30, 1.2, pageid='+bug'), |
1306 | - FakeRequest('/lazr', 1.0, 16, 0.3, pageid='+project'), |
1307 | - FakeRequest('/drizzle', 0.9, 11, 1.3, pageid='+project'), |
1308 | - ] |
1309 | - |
1310 | - |
1311 | -# The category stats computed for the above 12 requests. |
1312 | -CATEGORY_STATS = [ |
1313 | - # Median is an approximation. |
1314 | - # Real values are: 2.50, 2.20, 30 |
1315 | - (Category('All', ''), FakeStats( |
1316 | - total_hits=12, total_time=62.60, mean=5.22, median=4.20, std=5.99, |
1317 | - total_sqltime=42, mean_sqltime=3.82, median_sqltime=3.0, |
1318 | - std_sqltime=3.89, |
1319 | - total_sqlstatements=1392, mean_sqlstatements=126.55, |
1320 | - median_sqlstatements=56, std_sqlstatements=208.94, |
1321 | - histogram=[[0, 2], [1, 2], [2, 2], [3, 1], [4, 2], [5, 3]], |
1322 | - )), |
1323 | - (Category('Test', ''), FakeStats( |
1324 | - histogram=[[0, 0], [1, 0], [2, 0], [3, 0], [4, 0], [5, 0]])), |
1325 | - (Category('Bugs', ''), FakeStats( |
1326 | - total_hits=6, total_time=51.70, mean=8.62, median=4.5, std=6.90, |
1327 | - total_sqltime=33.40, mean_sqltime=5.57, median_sqltime=3, |
1328 | - std_sqltime=4.52, |
1329 | - total_sqlstatements=1352, mean_sqlstatements=225.33, |
1330 | - median_sqlstatements=56, std_sqlstatements=241.96, |
1331 | - histogram=[[0, 0], [1, 1], [2, 0], [3, 0], [4, 2], [5, 3]], |
1332 | - )), |
1333 | - ] |
1334 | - |
1335 | - |
1336 | -# The top 3 URL stats computed for the above 12 requests. |
1337 | -TOP_3_URL_STATS = [ |
1338 | - ('/bugs/1', FakeStats( |
1339 | - total_hits=2, total_time=36.0, mean=18.0, median=15.5, std=2.50, |
1340 | - total_sqltime=23.0, mean_sqltime=11.5, median_sqltime=9.0, |
1341 | - std_sqltime=2.50, |
1342 | - total_sqlstatements=1134, mean_sqlstatements=567.0, |
1343 | - median_sqlstatements=567, std_sqlstatements=0, |
1344 | - histogram=[[0, 0], [1, 0], [2, 0], [3, 0], [4, 0], [5, 2]], |
1345 | - )), |
1346 | - ('/bugs', FakeStats( |
1347 | - total_hits=3, total_time=14.2, mean=4.73, median=4.5, std=0.56, |
1348 | - total_sqltime=9.2, mean_sqltime=3.07, median_sqltime=3, |
1349 | - std_sqltime=0.74, |
1350 | - total_sqlstatements=188, mean_sqlstatements=62.67, |
1351 | - median_sqlstatements=56, std_sqlstatements=9.43, |
1352 | - histogram=[[0, 0], [1, 0], [2, 0], [3, 0], [4, 2], [5, 1]], |
1353 | - )), |
1354 | - ('/launchpad', FakeStats( |
1355 | - total_hits=1, total_time=3.5, mean=3.5, median=3.5, std=0, |
1356 | - total_sqltime=3.0, mean_sqltime=3, median_sqltime=3, std_sqltime=0, |
1357 | - total_sqlstatements=3, mean_sqlstatements=3, |
1358 | - median_sqlstatements=3, std_sqlstatements=0, |
1359 | - histogram=[[0, 0], [1, 0], [2, 0], [3, 1], [4, 0], [5, 0]], |
1360 | - )), |
1361 | - ] |
1362 | - |
1363 | - |
1364 | -# The pageid stats computed for the above 12 requests. |
1365 | -PAGEID_STATS = [ |
1366 | - ('+bug', FakeStats( |
1367 | - total_hits=3, total_time=37.5, mean=12.5, median=15.5, std=8.04, |
1368 | - total_sqltime=24.2, mean_sqltime=8.07, median_sqltime=9, |
1369 | - std_sqltime=5.27, |
1370 | - total_sqlstatements=1164, mean_sqlstatements=388, |
1371 | - median_sqlstatements=567, std_sqlstatements=253.14, |
1372 | - histogram=[[0, 0], [1, 1], [2, 0], [3, 0], [4, 0], [5, 2]], |
1373 | - )), |
1374 | - ('+bugs', FakeStats( |
1375 | - total_hits=3, total_time=14.2, mean=4.73, median=4.5, std=0.56, |
1376 | - total_sqltime=9.2, mean_sqltime=3.07, median_sqltime=3, |
1377 | - std_sqltime=0.74, |
1378 | - total_sqlstatements=188, mean_sqlstatements=62.67, |
1379 | - median_sqlstatements=56, std_sqlstatements=9.43, |
1380 | - histogram=[[0, 0], [1, 0], [2, 0], [3, 0], [4, 2], [5, 1]], |
1381 | - )), |
1382 | - ('+distribution', FakeStats( |
1383 | - total_hits=1, total_time=2.5, mean=2.5, median=2.5, std=0, |
1384 | - total_sqltime=2.0, mean_sqltime=2, median_sqltime=2, std_sqltime=0, |
1385 | - total_sqlstatements=6, mean_sqlstatements=6, |
1386 | - median_sqlstatements=6, std_sqlstatements=0, |
1387 | - histogram=[[0, 0], [1, 0], [2, 1], [3, 0], [4, 0], [5, 0]], |
1388 | - )), |
1389 | - ('+project', FakeStats( |
1390 | - total_hits=4, total_time=7.9, mean=1.98, median=1, std=1.08, |
1391 | - total_sqltime=6.6, mean_sqltime=1.65, median_sqltime=1.3, |
1392 | - std_sqltime=0.99, |
1393 | - total_sqlstatements=34, mean_sqlstatements=8.5, |
1394 | - median_sqlstatements=4, std_sqlstatements=5.32, |
1395 | - histogram=[[0, 1], [1, 1], [2, 1], [3, 1], [4, 0], [5, 0]], |
1396 | - )), |
1397 | - ('+root', FakeStats( |
1398 | - total_hits=1, total_time=0.5, mean=0.5, median=0.5, std=0, |
1399 | - histogram=[[0, 1], [1, 0], [2, 0], [3, 0], [4, 0], [5, 0]], |
1400 | - )), |
1401 | - ] |
1402 | - |
1403 | - |
1404 | -class TestRequestTimes(TestCase): |
1405 | - """Tests the RequestTimes backend.""" |
1406 | - |
1407 | - def setUp(self): |
1408 | - TestCase.setUp(self) |
1409 | - self.categories = [ |
1410 | - Category('All', '.*'), Category('Test', '.*test.*'), |
1411 | - Category('Bugs', '.*bugs.*')] |
1412 | - self.db = RequestTimes(self.categories, FakeOptions()) |
1413 | - |
1414 | - def setUpRequests(self): |
1415 | - """Insert some requests into the db.""" |
1416 | - for r in FAKE_REQUESTS: |
1417 | - self.db.add_request(r) |
1418 | - |
1419 | - def assertStatsAreEquals(self, expected, results): |
1420 | - self.assertEquals( |
1421 | - len(expected), len(results), 'Wrong number of results') |
1422 | - for idx in range(len(results)): |
1423 | - self.assertEquals(expected[idx][0], results[idx][0], |
1424 | - "Wrong key for results %d" % idx) |
1425 | - key = results[idx][0] |
1426 | - self.assertEquals(expected[idx][1].text(), results[idx][1].text(), |
1427 | - "Wrong stats for results %d (%s)" % (idx, key)) |
1428 | - self.assertEquals( |
1429 | - Histogram.from_bins_data(expected[idx][1].histogram), |
1430 | - results[idx][1].histogram, |
1431 | - "Wrong histogram for results %d (%s)" % (idx, key)) |
1432 | - |
1433 | - def test_get_category_times(self): |
1434 | - self.setUpRequests() |
1435 | - category_times = self.db.get_category_times() |
1436 | - self.assertStatsAreEquals(CATEGORY_STATS, category_times) |
1437 | - |
1438 | - def test_get_url_times(self): |
1439 | - self.setUpRequests() |
1440 | - url_times = self.db.get_top_urls_times() |
1441 | - self.assertStatsAreEquals(TOP_3_URL_STATS, url_times) |
1442 | - |
1443 | - def test_get_pageid_times(self): |
1444 | - self.setUpRequests() |
1445 | - pageid_times = self.db.get_pageid_times() |
1446 | - self.assertStatsAreEquals(PAGEID_STATS, pageid_times) |
1447 | - |
1448 | - def test___add__(self): |
1449 | - # Ensure that adding two RequestTimes together results in
1450 | - # a merge of their constituents.
1451 | - db1 = self.db |
1452 | - db2 = RequestTimes(self.categories, FakeOptions()) |
1453 | - db1.add_request(FakeRequest('/', 1.5, 5, 1.0, '+root')) |
1454 | - db1.add_request(FakeRequest('/bugs', 3.5, 15, 1.0, '+bugs')) |
1455 | - db2.add_request(FakeRequest('/bugs/1', 5.0, 30, 4.0, '+bug')) |
1456 | - results = db1 + db2 |
1457 | - self.assertEquals(3, results.category_times[0][1].total_hits) |
1458 | - self.assertEquals(0, results.category_times[1][1].total_hits) |
1459 | - self.assertEquals(2, results.category_times[2][1].total_hits) |
1460 | - self.assertEquals(1, results.pageid_times['+root'].total_hits) |
1461 | - self.assertEquals(1, results.pageid_times['+bugs'].total_hits) |
1462 | - self.assertEquals(1, results.pageid_times['+bug'].total_hits) |
1463 | - self.assertEquals(1, results.url_times['/'].total_hits) |
1464 | - self.assertEquals(1, results.url_times['/bugs'].total_hits) |
1465 | - self.assertEquals(1, results.url_times['/bugs/1'].total_hits) |
1466 | - |
1467 | - def test_histogram_init_with_resolution(self): |
1468 | - # Test that the resolution parameter increases the number of bins.
1469 | - db = RequestTimes( |
1470 | - self.categories, FakeOptions(timeout=4, resolution=1)) |
1471 | - self.assertEquals(5, db.histogram_width) |
1472 | - self.assertEquals(1, db.histogram_resolution) |
1473 | - db = RequestTimes( |
1474 | - self.categories, FakeOptions(timeout=4, resolution=0.5)) |
1475 | - self.assertEquals(9, db.histogram_width) |
1476 | - self.assertEquals(0.5, db.histogram_resolution) |
1477 | - db = RequestTimes( |
1478 | - self.categories, FakeOptions(timeout=4, resolution=2)) |
1479 | - self.assertEquals(3, db.histogram_width) |
1480 | - self.assertEquals(2, db.histogram_resolution) |
1481 | - |
1482 | - |
1483 | -class TestOnlineStats(TestCase): |
1484 | - """Tests for the OnlineStats class.""" |
1485 | - |
1486 | - def test___add__(self): |
1487 | - # Ensure that adding two OnlineStats merges all their constituents.
1488 | - stats1 = OnlineStats(4, 1) |
1489 | - stats1.update(FakeRequest('/', 2.0, 5, 1.5)) |
1490 | - stats2 = OnlineStats(4, 1) |
1491 | - stats2.update(FakeRequest('/', 1.5, 2, 3.0)) |
1492 | - stats2.update(FakeRequest('/', 5.0, 2, 2.0)) |
1493 | - results = stats1 + stats2 |
1494 | - self.assertEquals(3, results.total_hits) |
1495 | - self.assertEquals(2, results.median) |
1496 | - self.assertEquals(9, results.total_sqlstatements) |
1497 | - self.assertEquals(2, results.median_sqlstatements) |
1498 | - self.assertEquals(6.5, results.total_sqltime) |
1499 | - self.assertEquals(2.0, results.median_sqltime) |
1500 | - self.assertEquals( |
1501 | - Histogram.from_bins_data([[0, 0], [1, 1], [2, 1], [3, 1]]), |
1502 | - results.histogram) |
1503 | - |
1504 | - |
1505 | -class TestOnlineStatsCalculator(TestCase): |
1506 | - """Tests for the online stats calculator.""" |
1507 | - |
1508 | - def setUp(self): |
1509 | - TestCase.setUp(self) |
1510 | - self.stats = OnlineStatsCalculator() |
1511 | - |
1512 | - def test_stats_for_empty_set(self): |
1513 | - # Test the stats when there is no input. |
1514 | - self.assertEquals(0, self.stats.count) |
1515 | - self.assertEquals(0, self.stats.sum) |
1516 | - self.assertEquals(0, self.stats.mean) |
1517 | - self.assertEquals(0, self.stats.variance) |
1518 | - self.assertEquals(0, self.stats.std) |
1519 | - |
1520 | - def test_stats_for_one_value(self): |
1521 | - # Test the stats when adding one element. |
1522 | - self.stats.update(5) |
1523 | - self.assertEquals(1, self.stats.count) |
1524 | - self.assertEquals(5, self.stats.sum) |
1525 | - self.assertEquals(5, self.stats.mean) |
1526 | - self.assertEquals(0, self.stats.variance) |
1527 | - self.assertEquals(0, self.stats.std) |
1528 | - |
1529 | - def test_None_are_ignored(self): |
1530 | - self.stats.update(None) |
1531 | - self.assertEquals(0, self.stats.count) |
1532 | - |
1533 | - def test_stats_for_3_values(self): |
1534 | - for x in [3, 6, 9]: |
1535 | - self.stats.update(x) |
1536 | - self.assertEquals(3, self.stats.count) |
1537 | - self.assertEquals(18, self.stats.sum) |
1538 | - self.assertEquals(6, self.stats.mean) |
1539 | - self.assertEquals(6, self.stats.variance) |
1540 | - self.assertEquals("2.45", "%.2f" % self.stats.std) |
1541 | - |
1542 | - def test___add___two_empty_together(self): |
1543 | - stats2 = OnlineStatsCalculator() |
1544 | - results = self.stats + stats2 |
1545 | - self.assertEquals(0, results.count) |
1546 | - self.assertEquals(0, results.sum) |
1547 | - self.assertEquals(0, results.mean) |
1548 | - self.assertEquals(0, results.variance) |
1549 | - |
1550 | - def test___add___one_empty(self): |
1551 | - stats2 = OnlineStatsCalculator() |
1552 | - for x in [1, 2, 3]: |
1553 | - self.stats.update(x) |
1554 | - results = self.stats + stats2 |
1555 | - self.assertEquals(3, results.count) |
1556 | - self.assertEquals(6, results.sum) |
1557 | - self.assertEquals(2, results.mean) |
1558 | - self.assertEquals(2, results.M2) |
1559 | - |
1560 | - def test___add__(self): |
1561 | - stats2 = OnlineStatsCalculator() |
1562 | - for x in [3, 6, 9]: |
1563 | - self.stats.update(x) |
1564 | - for x in [1, 2, 3]: |
1565 | - stats2.update(x) |
1566 | - results = self.stats + stats2 |
1567 | - self.assertEquals(6, results.count) |
1568 | - self.assertEquals(24, results.sum) |
1569 | - self.assertEquals(4, results.mean) |
1570 | - self.assertEquals(44, results.M2) |
1571 | - |
1572 | - |
1573 | -SHUFFLE_RANGE_100 = [ |
1574 | - 25, 79, 99, 76, 60, 63, 87, 77, 51, 82, 42, 96, 93, 58, 32, 66, 75, |
1575 | - 2, 26, 22, 11, 73, 61, 83, 65, 68, 44, 81, 64, 3, 33, 34, 15, 1, |
1576 | - 92, 27, 90, 74, 46, 57, 59, 31, 13, 19, 89, 29, 56, 94, 50, 49, 62, |
1577 | - 37, 21, 35, 5, 84, 88, 16, 8, 23, 40, 6, 48, 10, 97, 0, 53, 17, 30, |
1578 | - 18, 43, 86, 12, 71, 38, 78, 36, 7, 45, 47, 80, 54, 39, 91, 98, 24, |
1579 | - 55, 14, 52, 20, 69, 85, 95, 28, 4, 9, 67, 70, 41, 72, |
1580 | - ] |
1581 | - |
1582 | - |
1583 | -class TestOnlineApproximateMedian(TestCase): |
1584 | - """Tests for the approximate median computation.""" |
1585 | - |
1586 | - def setUp(self): |
1587 | - TestCase.setUp(self) |
1588 | - self.estimator = OnlineApproximateMedian() |
1589 | - |
1590 | - def test_median_is_0_when_no_input(self): |
1591 | - self.assertEquals(0, self.estimator.median) |
1592 | - |
1593 | - def test_median_is_true_median_for_n_lower_than_bucket_size(self): |
1594 | - for x in range(9): |
1595 | - self.estimator.update(x) |
1596 | - self.assertEquals(4, self.estimator.median) |
1597 | - |
1598 | - def test_None_input_is_ignored(self): |
1599 | - self.estimator.update(1) |
1600 | - self.estimator.update(None) |
1601 | - self.assertEquals(1, self.estimator.median) |
1602 | - |
1603 | - def test_approximate_median_is_good_enough(self): |
1604 | - for x in SHUFFLE_RANGE_100: |
1605 | - self.estimator.update(x) |
1606 | - # True median is 50; 49 is good enough :-)
1607 | - self.assertIn(self.estimator.median, range(49, 52))
1608 | - |
1609 | - def test___add__(self): |
1610 | - median1 = OnlineApproximateMedian(3) |
1611 | - median1.buckets = [[1, 3], [4, 5], [6, 3]] |
1612 | - median2 = OnlineApproximateMedian(3) |
1613 | - median2.buckets = [[], [3, 6], [3, 7]] |
1614 | - results = median1 + median2 |
1615 | - self.assertEquals([[1, 3], [6], [3, 7], [4]], results.buckets) |
1616 | - |
1617 | - |
1618 | -class TestHistogram(TestCase): |
1619 | - """Test the histogram computation.""" |
1620 | - |
1621 | - def test__init__(self): |
1622 | - hist = Histogram(4, 1) |
1623 | - self.assertEquals(4, hist.bins_count) |
1624 | - self.assertEquals(1, hist.bins_size) |
1625 | - self.assertEquals([[0, 0], [1, 0], [2, 0], [3, 0]], hist.bins) |
1626 | - |
1627 | - def test__init__bins_size_float(self): |
1628 | - hist = Histogram(9, 0.5) |
1629 | - self.assertEquals(9, hist.bins_count) |
1630 | - self.assertEquals(0.5, hist.bins_size) |
1631 | - self.assertEquals( |
1632 | - [[0, 0], [0.5, 0], [1.0, 0], [1.5, 0], |
1633 | - [2.0, 0], [2.5, 0], [3.0, 0], [3.5, 0], [4.0, 0]], hist.bins) |
1634 | - |
1635 | - def test_update(self): |
1636 | - hist = Histogram(4, 1) |
1637 | - hist.update(1) |
1638 | - self.assertEquals(1, hist.count) |
1639 | - self.assertEquals([[0, 0], [1, 1], [2, 0], [3, 0]], hist.bins) |
1640 | - |
1641 | - hist.update(1.3) |
1642 | - self.assertEquals(2, hist.count) |
1643 | - self.assertEquals([[0, 0], [1, 2], [2, 0], [3, 0]], hist.bins) |
1644 | - |
1645 | - def test_update_float_bin_size(self): |
1646 | - hist = Histogram(4, 0.5) |
1647 | - hist.update(1.3) |
1648 | - self.assertEquals([[0, 0], [0.5, 0], [1.0, 1], [1.5, 0]], hist.bins) |
1649 | - hist.update(0.5) |
1650 | - self.assertEquals([[0, 0], [0.5, 1], [1.0, 1], [1.5, 0]], hist.bins) |
1651 | - hist.update(0.6) |
1652 | - self.assertEquals([[0, 0], [0.5, 2], [1.0, 1], [1.5, 0]], hist.bins) |
1653 | - |
1654 | - def test_update_max_goes_in_last_bin(self): |
1655 | - hist = Histogram(4, 1) |
1656 | - hist.update(9) |
1657 | - self.assertEquals([[0, 0], [1, 0], [2, 0], [3, 1]], hist.bins) |
1658 | - |
1659 | - def test_bins_relative(self): |
1660 | - hist = Histogram(4, 1) |
1661 | - for x in range(4): |
1662 | - hist.update(x) |
1663 | - self.assertEquals( |
1664 | - [[0, 0.25], [1, 0.25], [2, 0.25], [3, 0.25]], hist.bins_relative) |
1665 | - |
1666 | - def test_from_bins_data(self): |
1667 | - hist = Histogram.from_bins_data([[0, 1], [1, 3], [2, 1], [3, 1]]) |
1668 | - self.assertEquals(4, hist.bins_count) |
1669 | - self.assertEquals(1, hist.bins_size) |
1670 | - self.assertEquals(6, hist.count) |
1671 | - self.assertEquals([[0, 1], [1, 3], [2, 1], [3, 1]], hist.bins) |
1672 | - |
1673 | - def test___repr__(self): |
1674 | - hist = Histogram.from_bins_data([[0, 1], [1, 3], [2, 1], [3, 1]]) |
1675 | - self.assertEquals( |
1676 | - "<Histogram [[0, 1], [1, 3], [2, 1], [3, 1]]>", repr(hist)) |
1677 | - |
1678 | - def test___eq__(self): |
1679 | - hist1 = Histogram(4, 1) |
1680 | - hist2 = Histogram(4, 1) |
1681 | - self.assertEquals(hist1, hist2) |
1682 | - |
1683 | - def test__eq___with_data(self): |
1684 | - hist1 = Histogram.from_bins_data([[0, 1], [1, 3], [2, 1], [3, 1]]) |
1685 | - hist2 = Histogram.from_bins_data([[0, 1], [1, 3], [2, 1], [3, 1]]) |
1686 | - self.assertEquals(hist1, hist2) |
1687 | - |
1688 | - def test___add__(self): |
1689 | - hist1 = Histogram.from_bins_data([[0, 1], [1, 3], [2, 1], [3, 1]]) |
1690 | - hist2 = Histogram.from_bins_data([[0, 1], [1, 3], [2, 1], [3, 1]]) |
1691 | - hist3 = Histogram.from_bins_data([[0, 2], [1, 6], [2, 2], [3, 2]]) |
1692 | - total = hist1 + hist2 |
1693 | - self.assertEquals(hist3, total) |
1694 | - self.assertEquals(12, total.count) |
1695 | - |
1696 | - def test___add___uses_widest(self): |
1697 | - # Make sure that the resulting histogram is as wide as the widest one. |
1698 | - hist1 = Histogram.from_bins_data([[0, 1], [1, 3], [2, 1], [3, 1]]) |
1699 | - hist2 = Histogram.from_bins_data( |
1700 | - [[0, 1], [1, 3], [2, 1], [3, 1], [4, 2], [5, 3]]) |
1701 | - hist3 = Histogram.from_bins_data( |
1702 | - [[0, 2], [1, 6], [2, 2], [3, 2], [4, 2], [5, 3]]) |
1703 | - self.assertEquals(hist3, hist1 + hist2) |
1704 | - |
1705 | - def test___add___interpolate_lower_resolution(self): |
1706 | - # Make sure that when the other histogram has a bigger bin_size |
1707 | - # the frequency is correctly split across the different bins. |
1708 | - hist1 = Histogram.from_bins_data( |
1709 | - [[0, 1], [0.5, 3], [1.0, 1], [1.5, 1]]) |
1710 | - hist2 = Histogram.from_bins_data( |
1711 | - [[0, 1], [1, 2], [2, 3], [3, 1], [4, 1]]) |
1712 | - |
1713 | - hist3 = Histogram.from_bins_data( |
1714 | - [[0, 1.5], [0.5, 3.5], [1.0, 2], [1.5, 2], |
1715 | - [2.0, 1.5], [2.5, 1.5], [3.0, 0.5], [3.5, 0.5], |
1716 | - [4.0, 0.5], [4.5, 0.5]]) |
1717 | - self.assertEquals(hist3, hist1 + hist2) |
1718 | - |
1719 | - def test___add___higher_resolution(self): |
1720 | - # Make sure that when the other histogram has a smaller bin_size |
1721 | - # the frequency is correctly added. |
1722 | - hist1 = Histogram.from_bins_data([[0, 1], [1, 2], [2, 3]]) |
1723 | - hist2 = Histogram.from_bins_data( |
1724 | - [[0, 1], [0.5, 3], [1.0, 1], [1.5, 1], [2.0, 3], [2.5, 1], |
1725 | - [3, 4], [3.5, 2]]) |
1726 | - |
1727 | - hist3 = Histogram.from_bins_data([[0, 5], [1, 4], [2, 7], [3, 6]]) |
1728 | - self.assertEquals(hist3, hist1 + hist2) |
1729 | |
1730 | === removed file 'utilities/page-performance-report-daily.sh' |
1731 | --- utilities/page-performance-report-daily.sh 2011-05-04 17:32:17 +0000 |
1732 | +++ utilities/page-performance-report-daily.sh 1970-01-01 00:00:00 +0000 |
1733 | @@ -1,115 +0,0 @@ |
1734 | -#!/bin/sh |
1735 | - |
1736 | -#TZ=UTC # trace logs are still BST - blech |
1737 | - |
1738 | -CATEGORY=lpnet |
1739 | -LOGS_ROOTS="/srv/launchpad.net-logs/production /srv/launchpad.net-logs/edge" |
1740 | -OUTPUT_ROOT=${HOME}/public_html/ppr/lpnet |
1741 | -DAY_FMT="+%Y-%m-%d" |
1742 | - |
1743 | -find_logs() { |
1744 | - from=$1 |
1745 | - until=$2 |
1746 | - |
1747 | - end_mtime_switch= |
1748 | - days_to_end="$(expr `date +%j` - `date -d $until +%j` - 1)" |
1749 | - if [ $days_to_end -gt 0 ]; then |
1750 | - end_mtime_switch="-daystart -mtime +$days_to_end" |
1751 | - fi |
1752 | - |
1753 | - find ${LOGS_ROOTS} \ |
1754 | - -maxdepth 2 -type f -newermt "$from - 1 day" $end_mtime_switch \ |
1755 | - -name launchpad-trace\* \ |
1756 | - | sort | xargs -x |
1757 | -} |
1758 | - |
1759 | -# Find all the daily stats.pck.bz2 $from $until |
1760 | -find_stats() { |
1761 | - from=$1 |
1762 | - until=$2 |
1763 | - |
1764 | - # Build a string of all the days within range. |
1765 | - local dates |
1766 | - local day |
1767 | - day=$from |
1768 | - while [ $day != $until ]; do |
1769 | - dates="$dates $day" |
1770 | - day=`date $DAY_FMT -d "$day + 1 day"` |
1771 | - done |
1772 | - |
1773 | - # Use that to build a regex that will be used to select |
1774 | - # the files to use. |
1775 | - local regex |
1776 | - regex="daily_(`echo $dates |sed -e 's/ /|/g'`)" |
1777 | - |
1778 | - find ${OUTPUT_ROOT} -name 'stats.pck.bz2' | egrep $regex |
1779 | -} |
1780 | - |
1781 | -report() { |
1782 | - type=$1 |
1783 | - from=$2 |
1784 | - until=$3 |
1785 | - link=$4 |
1786 | - |
1787 | - local files |
1788 | - local options |
1789 | - if [ "$type" = "daily" ]; then |
1790 | - files=`find_logs $from $until` |
1791 | - options="--from=$from --until=$until" |
1792 | - else |
1793 | - files=`find_stats $from $until` |
1794 | - options="--merge" |
1795 | - fi |
1796 | - |
1797 | - local dir |
1798 | - dir=${OUTPUT_ROOT}/`date -d $from +%Y-%m`/${type}_${from}_${until} |
1799 | - mkdir -p ${dir} |
1800 | - |
1801 | - echo Generating report from $from until $until into $dir `date` |
1802 | - |
1803 | - ./page-performance-report.py -v --top-urls=200 --directory=${dir} \ |
1804 | - $options $files |
1805 | - |
1806 | - # Only do the linking if requested. |
1807 | - if [ "$link" = "link" ]; then |
1808 | - ln -sf ${dir}/partition.html \ |
1809 | - ${OUTPUT_ROOT}/latest-${type}-partition.html |
1810 | - ln -sf ${dir}/categories.html \ |
1811 | - ${OUTPUT_ROOT}/latest-${type}-categories.html |
1812 | - ln -sf ${dir}/pageids.html \ |
1813 | - ${OUTPUT_ROOT}/latest-${type}-pageids.html |
1814 | - ln -sf ${dir}/combined.html \ |
1815 | - ${OUTPUT_ROOT}/latest-${type}-combined.html |
1816 | - ln -sf ${dir}/metrics.dat ${OUTPUT_ROOT}/latest-${type}-metrics.dat |
1817 | - ln -sf ${dir}/top200.html ${OUTPUT_ROOT}/latest-${type}-top200.html |
1818 | - ln -sf ${dir}/timeout-candidates.html \ |
1819 | - ${OUTPUT_ROOT}/latest-${type}-timeout-candidates.html |
1820 | - fi |
1821 | - |
1822 | - return 0 |
1823 | -} |
1824 | - |
1825 | -link=""  # 'local' is only valid inside a function in sh
1826 | -if [ "$3" = "-l" ]; then |
1827 | - link="link" |
1828 | -fi |
1829 | - |
1830 | -if [ "$1" = '-d' ]; then |
1831 | - report daily `date -d $2 $DAY_FMT` `date -d "$2 + 1 day" $DAY_FMT` $link |
1832 | -elif [ "$1" = '-w' ]; then |
1833 | - report weekly `date -d $2 $DAY_FMT` `date -d "$2 + 1 week" $DAY_FMT` $link |
1834 | -elif [ "$1" = '-m' ]; then |
1835 | - report monthly `date -d $2 $DAY_FMT` `date -d "$2 + 1 month" $DAY_FMT` $link |
1836 | -else |
1837 | - # Default invocation used from cron to generate latest one. |
1838 | - now=`date $DAY_FMT` |
1839 | - report daily `date -d yesterday $DAY_FMT` $now link |
1840 | - |
1841 | - if [ `date +%a` = 'Sun' ]; then |
1842 | - report weekly `date -d 'last week' $DAY_FMT` $now link |
1843 | - fi |
1844 | - |
1845 | - if [ `date +%d` = '01' ]; then |
1846 | - report monthly `date -d 'last month' $DAY_FMT` $now link |
1847 | - fi |
1848 | -fi |
1849 | |
1850 | === removed file 'utilities/page-performance-report.ini' |
1851 | --- utilities/page-performance-report.ini 2011-09-21 21:12:02 +0000 |
1852 | +++ utilities/page-performance-report.ini 1970-01-01 00:00:00 +0000 |
1853 | @@ -1,79 +0,0 @@ |
1854 | -[categories] |
1855 | -# Category -> Python regular expression. |
1856 | -# Remember to quote ?, ., + & ? characters to match literally.
1857 | -# 'kodos' is useful for interactively testing regular expressions. |
1858 | -All Launchpad=. |
1859 | -All Launchpad except operational pages=(?<!\+opstats|\+haproxy)$ |
1860 | - |
1861 | -API=(^https?://api\.|/\+access-token$) |
1862 | -Operational=(\+opstats|\+haproxy)$ |
1863 | -Web (Non API/non operational/non XML-RPC)=^https?://(?!api\.) |
1864 | - [^/]+($|/ |
1865 | - (?!\+haproxy|\+opstats|\+access-token |
1866 | - |((authserver|bugs|bazaar|codehosting| |
1867 | - codeimportscheduler|mailinglists|softwarecenteragent| |
1868 | - featureflags)/\w+$))) |
1869 | -Other=^/ |
1870 | - |
1871 | -Launchpad Frontpage=^https?://launchpad\.[^/]+(/index\.html)?$ |
1872 | - |
1873 | -# Note that the bug text dump is served on the main launchpad domain |
1874 | -# and we need to exclude it from the registry stats.
1875 | -Registry=^https?://launchpad\..*(?<!/\+text)(?<!/\+access-token)$ |
1876 | -Registry - Person Index=^https?://launchpad\.[^/]+/%7E[^/]+(/\+index)?$ |
1877 | -Registry - Pillar Index=^https?://launchpad\.[^/]+/\w[^/]*(/\+index)?$ |
1878 | - |
1879 | -Answers=^https?://answers\. |
1880 | -Answers - Front page=^https?://answers\.[^/]+(/questions/\+index)?$ |
1881 | - |
1882 | -Blueprints=^https?://blueprints\. |
1883 | -Blueprints - Front page=^https?://blueprints\.[^/]+(/specs/\+index)?$ |
1884 | - |
1885 | -# Note that the bug text dump is not served on the bugs domain, |
1886 | -# probably for hysterical reasons. This is why the bugs regexp is |
1887 | -# confusing. |
1888 | -Bugs=^https?://(bugs\.|.+/bugs/\d+/\+text$) |
1889 | -Bugs - Front page=^https?://bugs\.[^/]+(/bugs/\+index)?$ |
1890 | -Bugs - Bug Page=^https?://bugs\.[^/]+/.+/\+bug/\d+(/\+index)?$ |
1891 | -Bugs - Pillar Index=^https?://bugs\.[^/]+/\w[^/]*(/\+bugs-index)?$ |
1892 | -Bugs - Search=^https?://bugs\.[^/]+/.+/\+bugs$ |
1893 | -Bugs - Text Dump=^https?://launchpad\..+/\+text$ |
1894 | - |
1895 | -Code=^https?://code\. |
1896 | -Code - Front page=^https?://code\.[^/]+(/\+code/\+index)?$ |
1897 | -Code - Pillar Branches=^https?://code\.[^/]+/\w[^/]*(/\+code-index)?$ |
1898 | -Code - Branch Page=^https?://code\.[^/]+/%7E[^/]+/[^/]+/[^/]+(/\+index)?$ |
1899 | -Code - Merge Proposal=^https?://code\.[^/]+/.+/\+merge/\d+(/\+index)$ |
1900 | - |
1901 | -Soyuz - PPA Index=^https?://launchpad\.[^/]+/.+/\+archive/[^/]+(/\+index)?$ |
1902 | - |
1903 | -Translations=^https?://translations\. |
1904 | -Translations - Front page=^https?://translations\.[^/]+/translations/\+index$ |
1905 | -Translations - Overview=^https?://translations\..*/\+lang/\w+(/\+index)?$ |
1906 | - |
1907 | -Public XML-RPC=^https://(launchpad|xmlrpc)[^/]+/bazaar/\w+$ |
1908 | -Private XML-RPC=^https://(launchpad|xmlrpc)[^/]+/ |
1909 | - (authserver|bugs|codehosting| |
1910 | - codeimportscheduler|mailinglists| |
1911 | - softwarecenteragent|featureflags)/\w+$ |
1912 | - |
1913 | -[metrics] |
1914 | -ppr_all=All Launchpad except operational pages |
1915 | -ppr_web=Web (Non API/non operational/non XML-RPC) |
1916 | -ppr_operational=Operational |
1917 | -ppr_bugs=Bugs |
1918 | -ppr_api=API |
1919 | -ppr_code=Code |
1920 | -ppr_public_xmlrpc=Public XML-RPC |
1921 | -ppr_private_xmlrpc=Private XML-RPC |
1922 | -ppr_translations=Translations |
1923 | -ppr_registry=Registry |
1924 | -ppr_other=Other |
1925 | - |
1926 | -[partition] |
1927 | -API= |
1928 | -Operational= |
1929 | -Private XML-RPC= |
1930 | -Public XML-RPC= |
1931 | -Web (Non API/non operational/non XML-RPC)= |
1932 | -Other= |
1933 | |
1934 | === removed file 'utilities/page-performance-report.py' |
1935 | --- utilities/page-performance-report.py 2010-04-27 19:48:39 +0000 |
1936 | +++ utilities/page-performance-report.py 1970-01-01 00:00:00 +0000 |
1937 | @@ -1,18 +0,0 @@ |
1938 | -#!/usr/bin/python -S |
1939 | -# |
1940 | -# Copyright 2010 Canonical Ltd. This software is licensed under the |
1941 | -# GNU Affero General Public License version 3 (see the file LICENSE). |
1942 | - |
1943 | -"""Page performance report generated from zserver tracelogs.""" |
1944 | - |
1945 | -__metaclass__ = type |
1946 | - |
1947 | -import _pythonpath |
1948 | - |
1949 | -import sys |
1950 | - |
1951 | -from lp.scripts.utilities.pageperformancereport import main |
1952 | - |
1953 | - |
1954 | -if __name__ == '__main__': |
1955 | - sys.exit(main()) |
Self review; nothing to see here. We might want to bring the ini file back, I suppose, but lp-dev-utils is still LP-focused, so for now keep it all together.
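
For anyone following the code over to lp-dev-utils: the TestOnlineApproximateMedian tests above exercise a cascading-bucket median estimator. The sketch below illustrates that general technique only; the class name and the weighted final collapse are assumptions for illustration, not the removed Launchpad implementation.

    class CascadingMedian:
        """Approximate a running median with fixed-size buckets.

        When a bucket fills, its exact median is promoted to the next
        level, so memory stays bounded by bucket_size times the number
        of levels rather than growing with the stream.
        """

        def __init__(self, bucket_size=9):
            self.bucket_size = bucket_size
            self.buckets = [[]]

        def update(self, value):
            # Mirror the tests above: None inputs are ignored.
            if value is None:
                return
            self._insert(value, 0)

        def _insert(self, value, level):
            if level == len(self.buckets):
                self.buckets.append([])
            bucket = self.buckets[level]
            bucket.append(value)
            if len(bucket) == self.bucket_size:
                bucket.sort()
                median = bucket[self.bucket_size // 2]
                del bucket[:]
                self._insert(median, level + 1)

        @property
        def median(self):
            # A leftover value at level L stands in for roughly
            # bucket_size**L inputs, so weight it accordingly before
            # taking the median. Returns 0 when no input has been seen,
            # matching test_median_is_0_when_no_input.
            weighted = []
            for level, bucket in enumerate(self.buckets):
                weight = self.bucket_size ** level
                for value in bucket:
                    weighted.extend([value] * weight)
            if not weighted:
                return 0
            weighted.sort()
            return weighted[len(weighted) // 2]

With bucket_size=9 this gives the exact median for small inputs (the median of range(9) is 4, as the tests expect) and degrades gracefully to an approximation on longer streams such as SHUFFLE_RANGE_100.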