summaryrefslogtreecommitdiff
path: root/speed-test
blob: 42d4cf2b28aa7755d8a8687fe25fd6295a3216ca (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
#!/usr/bin/python
# Copyright 2010  Lars Wirzenius
# 
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
# 
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
# 
# You should have received a copy of the GNU General Public License
# along with this program.  If not, see <http://www.gnu.org/licenses/>.

# Excercise my btree implementation, for simple benchmarking purposes.
# The benchmark gets a location and an operation count as command line
# arguments.
#
# If the location is the empty string, an in-memory node store is used.
# Otherwise it must be a non-existent directory name.
#
# The benchmark will do the given number of insertions into the tree, and
# measure the speed of that. Then it will look up each of those, and measure
# the lookups.


import cProfile
import os
import random
import shutil
import sys
import time

import btree


def measure(keys, func, final):
    start = time.clock()
    for key in keys:
        func(key)
    final()
    end = time.clock()
    return end - start


def profile(keys, func, final, basename):
    def helper():
        for key in keys:
            func(key)
        final()
    globaldict = globals().copy()
    localdict = locals().copy()
    cProfile.runctx('helper()', globaldict, localdict, '%s.prof' % basename)


def main():
    if False:
        import logging
        logging.basicConfig(filename='btree.log', level=logging.DEBUG)

    location = sys.argv[1]
    n = int(sys.argv[2])
    do_profile = True if sys.argv[3] == 'yes' else False

    key_size = 19
    value_size = 128
    node_size = 64*1024

    codec = btree.NodeCodec(key_size)

    if location == '':
        ns = btree.NodeStoreMemory(node_size, codec)
    else:
        if os.path.exists(location):
            raise Exception('%s exists already' % location)
        os.mkdir(location)
        ns = btree.NodeStoreDisk(location, node_size, codec)

    forest = btree.Forest(ns)
    tree = forest.new_tree()
    
    # Create list of keys.
    keys = ['%0*d' % (key_size, i) for i in xrange(n)]
    
    # Calibrate.
    looptime = measure(keys, lambda key: None, lambda: None)

    # Measure inserts.
    random.shuffle(keys)
    value = 'x' * value_size
    if do_profile:
        profile(keys, lambda key: tree.insert(key, value), 
                lambda: forest.commit(), 'insert')
    else:
        insert_time = measure(keys, lambda key: tree.insert(key, value),
                              lambda: forest.commit())
        
    # Measure lookups.
    random.shuffle(keys)
    if do_profile:
        profile(keys, tree.lookup, lambda: None, 'lookup')
    else:
        lookup_time = measure(keys, lambda key: tree.lookup(key),
                              lambda: None) - looptime

    # Report
    if do_profile:
        print 'See insert.prof, lookup.prof for profiling data (try viewprof)'
    else:
        print 'num_operations: %d' % n
        print 'insert: %.3f s (%.1f/s)' % (insert_time, n/insert_time)
        print 'lookup-time: %.3f s (%.1f/s)' % (lookup_time, n/lookup_time)

    # Clean up
    if location:
        shutil.rmtree(location)

if __name__ == '__main__':
    main()