debian-django-cachalot/benchmark.py

#!/usr/bin/env python
# coding: utf-8
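"""
Benchmark script for django-cachalot.

Builds a small test database on every configured database connection, then
times a set of read queries under three conditions: cachalot disabled
(control), cold cache, and hot cache.  Results are written to the
``benchmark/`` directory as CSV data, reST condition/result files and
SVG charts.
"""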
from __future__ import unicode_literals, print_function
from collections import OrderedDict
import io
import os
import platform
from random import choice
import re
import sqlite3
from subprocess import check_output
from time import time


os.environ.setdefault('DJANGO_SETTINGS_MODULE', 'settings')

import django
django.setup()

from django.conf import settings
from django.contrib.auth.models import User, Group
from django.core.cache import caches
from django.db import connections, connection
from django.test.utils import CaptureQueriesContext, override_settings
from django.utils.encoding import force_text
import matplotlib.pyplot as plt
import _mysql
import pandas as pd
import psycopg2

import cachalot
from cachalot.api import invalidate
from cachalot.tests.models import Test


RESULTS_PATH = 'benchmark/'
DATA_PATH = '/var/lib/'

CONTEXTS = ('Control', 'Cold cache', 'Hot cache')
DIVIDER = 'divider'

DISK_DATA_RE = re.compile(r'^MODEL="(.*)" MOUNTPOINT="(.*)"$')


def get_disk_model_for_path(path):
    # `lsblk -P` prints one KEY="value" line per block device; remember the
    # last non-empty model, pair it with each mount point, then pick the
    # most specific (longest) mount point containing `path`.
    out = force_text(check_output(['lsblk', '-Po', 'MODEL,MOUNTPOINT']))
    mount_points = []
    previous_model = None
    for model, mount_point in [DISK_DATA_RE.match(line).groups()
                               for line in out.split('\n') if line]:
        if model:
            previous_model = model.strip()
        if mount_point:
            mount_points.append((previous_model, mount_point))
    mount_points = sorted(mount_points, key=lambda t: -len(t[1]))
    for model, mount_point in mount_points:
        if path.startswith(mount_point):
            return model
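
# Illustrative `lsblk -Po MODEL,MOUNTPOINT` output matched by DISK_DATA_RE
# above (values are machine-dependent, shown here only as an example):
#   MODEL="Samsung SSD 850 " MOUNTPOINT=""
#   MODEL="" MOUNTPOINT="/"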


def write_conditions():
    versions = OrderedDict()
    # CPU
    with open('/proc/cpuinfo') as f:
        versions['CPU'] = re.search(r'^model name\s+: (.+)$', f.read(),
                                    flags=re.MULTILINE).group(1)
    # RAM
    with open('/proc/meminfo') as f:
        versions['RAM'] = re.search(r'^MemTotal:\s+(.+)$', f.read(),
                                    flags=re.MULTILINE).group(1)
    versions.update((
        ('Disk', get_disk_model_for_path(DATA_PATH)),
    ))
    # OS
    linux_dist = ' '.join(platform.linux_distribution()).strip()
    if linux_dist:
        versions['Linux distribution'] = linux_dist
    else:
        versions['OS'] = platform.system() + ' ' + platform.release()
    versions.update((
        ('Python', platform.python_version()),
        ('Django', django.__version__),
        ('cachalot', cachalot.__version__),
        ('sqlite', sqlite3.sqlite_version),
    ))
    # PostgreSQL
    with connections['postgresql'].cursor() as cursor:
        cursor.execute('SELECT version();')
        versions['PostgreSQL'] = re.match(r'^PostgreSQL ([\d\.]+) on .+$',
                                          cursor.fetchone()[0]).group(1)
    # MySQL
    with connections['mysql'].cursor() as cursor:
        cursor.execute('SELECT version();')
        versions['MySQL'] = cursor.fetchone()[0].split('-')[0]
    # Redis
    out = force_text(
        check_output(['redis-cli', 'INFO', 'server'])).replace('\r', '')
    versions['Redis'] = re.search(r'^redis_version:([\d\.]+)$', out,
                                  flags=re.MULTILINE).group(1)
    # memcached
    out = force_text(check_output(['memcached', '-h']))
    versions['memcached'] = re.match(r'^memcached ([\d\.]+)$', out,
                                     flags=re.MULTILINE).group(1)
    versions.update((
        ('psycopg2', psycopg2.__version__.split()[0]),
        ('mysqlclient', _mysql.__version__),
    ))

    with io.open(os.path.join('benchmark', 'conditions.rst'), 'w') as f:
        f.write('In this benchmark, a small database is generated, '
                'and each test is executed %s times '
                'under the following conditions:\n\n' % Benchmark.n)

        def write_table_sep(char='='):
            f.write((char * 20) + ' ' + (char * 50) + '\n')

        write_table_sep()
        for k, v in versions.items():
            f.write(k.ljust(20) + ' ' + v + '\n')
        write_table_sep()


class AssertNumQueries(CaptureQueriesContext):
    """Capture queries on a connection and warn if the count is unexpected."""
    def __init__(self, n, using=None):
        self.n = n
        self.using = using
        super(AssertNumQueries, self).__init__(self.get_connection())

    def get_connection(self):
        if self.using is None:
            return connection
        return connections[self.using]

    def __exit__(self, exc_type, exc_val, exc_tb):
        super(AssertNumQueries, self).__exit__(exc_type, exc_val, exc_tb)
        if len(self) != self.n:
            print('The number of queries should be %s, but %s were captured.'
                  % (self.n, len(self)))
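
# Example usage (the database alias here is hypothetical and depends on the
# settings module):
#   with AssertNumQueries(1, using='postgresql'):
#       list(Test.objects.using('postgresql')[:10])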


class Benchmark(object):
    n = 20  # number of timed runs per query and per context

    def __init__(self):
        self.data = []

    def bench_once(self, context, num_queries, invalidate_before=False):
        for _ in range(self.n):
            if invalidate_before:
                invalidate(db_alias=self.db_alias)
            with AssertNumQueries(num_queries, using=self.db_alias):
                start = time()
                self.query_function(self.db_alias)
                end = time()
            self.data.append(
                {'query': self.query_name,
                 'time': end - start,
                 'context': context,
                 'db': self.db_vendor,
                 'cache': self.cache_name})

    def benchmark(self, query_str, to_list=True, num_queries=1):
        # Clear the cache before each benchmark so that every benchmark
        # starts under the same conditions.
        caches[settings.CACHALOT_CACHE].clear()

        self.query_name = query_str
        query_str = 'Test.objects.using(using)' + query_str
        if to_list:
            query_str = 'list(%s)' % query_str
        # For query_str == '[:10]' this builds, in effect:
        #   lambda using: list(Test.objects.using(using)[:10])
        self.query_function = eval('lambda using: ' + query_str)

        with override_settings(CACHALOT_ENABLED=False):
            self.bench_once(CONTEXTS[0], num_queries)
        self.bench_once(CONTEXTS[1], num_queries, invalidate_before=True)
        # Hot cache: all queries should be served from the cache.
        self.bench_once(CONTEXTS[2], 0)

    def execute_benchmark(self):
        self.benchmark('.count()', to_list=False)
        self.benchmark('.first()', to_list=False)
        self.benchmark('[:10]')
        self.benchmark('[5000:5010]')
        self.benchmark(".filter(name__icontains='e')[0:10]")
        self.benchmark(".filter(name__icontains='e')[5000:5010]")
        self.benchmark(".order_by('owner')[0:10]")
        self.benchmark(".order_by('owner')[5000:5010]")
        self.benchmark(".select_related('owner')[0:10]")
        self.benchmark(".select_related('owner')[5000:5010]")
        self.benchmark(".prefetch_related('owner__groups')[0:10]",
                       num_queries=3)
        self.benchmark(".prefetch_related('owner__groups')[5000:5010]",
                       num_queries=3)
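
    # Note: .prefetch_related('owner__groups') needs 3 SQL queries on an
    # uncached run (the tests, their owners, and the owners' groups),
    # hence num_queries=3 above.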

    def run(self):
        for db_alias in settings.DATABASES:
            self.db_alias = db_alias
            self.db_vendor = connections[self.db_alias].vendor
            print('Benchmarking %s' % self.db_vendor)
            for cache_alias in settings.CACHES:
                cache = caches[cache_alias]
                # Strip the trailing 'Cache' from the backend class name,
                # e.g. LocMemCache -> 'locmem'.
                self.cache_name = cache.__class__.__name__[:-5].lower()
                with override_settings(CACHALOT_CACHE=cache_alias):
                    self.execute_benchmark()

        self.df = pd.DataFrame.from_records(self.data)
        if not os.path.exists(RESULTS_PATH):
            os.mkdir(RESULTS_PATH)
        self.df.to_csv(os.path.join(RESULTS_PATH, 'data.csv'))

        self.xlim = (0, self.df['time'].max() * 1.01)
        self.output('db')
        self.output('cache')

    def output(self, param):
        # Mean/min/max times per context, query and `param` ('db' or
        # 'cache'); errors use matplotlib's asymmetric [lower, upper] format.
        gp = self.df.groupby(('context', 'query', param))['time']
        self.means = gp.mean().unstack().unstack().reindex(CONTEXTS)
        los = self.means - gp.min().unstack().unstack().reindex(CONTEXTS)
        ups = gp.max().unstack().unstack().reindex(CONTEXTS) - self.means
        self.errors = dict(
            (key, dict(
                (subkey,
                 [[los[key][subkey][context] for context in self.means.index],
                  [ups[key][subkey][context] for context in self.means.index]])
                for subkey in self.means.columns.levels[1]))
            for key in self.means.columns.levels[0])

        self.get_perfs(param)
        self.plot_detail(param)

        # Same aggregation, but per context and `param` only.
        gp = self.df.groupby(('context', param))['time']
        self.means = gp.mean().unstack().reindex(CONTEXTS)
        los = self.means - gp.min().unstack().reindex(CONTEXTS)
        ups = gp.max().unstack().reindex(CONTEXTS) - self.means
        self.errors = [
            [[los[key][context] for context in self.means.index],
             [ups[key][context] for context in self.means.index]]
            for key in self.means]
        self.plot_general(param)

    def get_perfs(self, param):
        with io.open(os.path.join(RESULTS_PATH, param + '_results.rst'),
                     'w') as f:
            for v in self.means.columns.levels[0]:
                g = self.means[v].mean(axis=1)
                # Cold cache slowdown vs control, then hot cache speedup.
                perf = ('%s is %.1f× slower, then %.1f× faster'
                        % (v.ljust(10), g[CONTEXTS[1]] / g[CONTEXTS[0]],
                           g[CONTEXTS[0]] / g[CONTEXTS[2]]))
                print(perf)
                f.write('- %s\n' % perf)

    def plot_detail(self, param):
        for v in self.means.columns.levels[0]:
            plt.figure()
            axes = self.means[v].plot(
                kind='barh', xerr=self.errors[v],
                xlim=self.xlim, figsize=(15, 15), subplots=True,
                layout=(6, 2), sharey=True, legend=False)
            plt.gca().invert_yaxis()
            for row in axes:
                for ax in row:
                    ax.xaxis.grid(True)
                    ax.set_ylabel('')
                    ax.set_xlabel('Time (s)')
            plt.savefig(os.path.join(RESULTS_PATH, '%s_%s.svg' % (param, v)))

    def plot_general(self, param):
        plt.figure()
        ax = self.means.plot(kind='barh', xerr=self.errors, xlim=self.xlim)
        ax.invert_yaxis()
        ax.xaxis.grid(True)
        ax.set_ylabel('')
        ax.set_xlabel('Time (s)')
        plt.savefig(os.path.join(RESULTS_PATH, '%s.svg' % param))


def create_data(using):
    # Populate the test database: 50 users, 10 groups (2 random groups per
    # user) and 10,000 Test objects with random owners.
    User.objects.using(using).bulk_create(
        [User(username='user%d' % i) for i in range(50)])
    Group.objects.using(using).bulk_create(
        [Group(name='test%d' % i) for i in range(10)])
    groups = list(Group.objects.using(using))
    for u in User.objects.using(using):
        u.groups.add(choice(groups), choice(groups))
    users = list(User.objects.using(using))
    Test.objects.using(using).bulk_create(
        [Test(name='test%d' % i, owner=choice(users)) for i in range(10000)])
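

# Typical invocation, assuming a `settings` module that defines the default,
# 'postgresql' and 'mysql' databases plus the caches benchmarked above:
#   $ python benchmark.py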
if __name__ == '__main__':
    if not os.path.exists(RESULTS_PATH):
        os.mkdir(RESULTS_PATH)

    write_conditions()

    old_db_names = {}
    for alias in connections:
        conn = connections[alias]
        old_db_names[alias] = conn.settings_dict['NAME']
        conn.creation.create_test_db(autoclobber=True)
        print("Populating %s" % connections[alias].vendor)
        create_data(alias)

    Benchmark().run()

    for alias in connections:
        connections[alias].creation.destroy_test_db(old_db_names[alias])