1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
|
# Copyright 2010 Lars Wirzenius
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
import hashlib
import os
import sys
import larch
def compute(filename):
    """Return the MD5 checksum of a file as a hexadecimal string.

    The file is opened in binary mode so the digest reflects the exact
    bytes stored on disk, and it is read in 1024-byte chunks so the
    whole file never has to be held in memory at once.

    Arguments:
    filename -- path of the file to checksum.

    Raises whatever open() or read() raise if the file cannot be
    opened or read.
    """
    md5 = hashlib.md5()
    # The with-statement closes the file even if a read fails part way.
    with open(filename, 'rb') as f:
        while True:
            data = f.read(1024)
            if not data:
                # An empty read means end of file.
                break
            md5.update(data)
    return md5.hexdigest()
def open_tree(allow_writes, dirname):
    """Open the larch forest stored in dirname and return (forest, tree).

    Arguments:
    allow_writes -- passed through to larch.open_forest.
    dirname -- directory holding the forest; passed to larch.open_forest.

    The returned tree is the first tree of the forest when the forest
    already has trees; otherwise a new tree is created in the forest.
    """
    # Keys are MD5 hex digests. Ask hashlib for their length directly
    # instead of hashing /dev/null, which needs file I/O and does not
    # exist on every platform.
    key_size = len(hashlib.md5().hexdigest())
    node_size = 4096
    forest = larch.open_forest(
        allow_writes=allow_writes, key_size=key_size, node_size=node_size,
        dirname=dirname)
    if forest.trees:
        tree = forest.trees[0]
    else:
        tree = forest.new_tree()
    return forest, tree
def add(filenames):
    """Insert every file in filenames into the tree in 'example.tree'.

    Each file is stored with its checksum (from compute) as the key and
    its name as the value. The forest is committed once, after all
    files have been inserted.
    """
    forest, tree = open_tree(allow_writes=True, dirname='example.tree')
    for path in filenames:
        tree.insert(compute(path), path)
    forest.commit()
def find(checksums):
    """Look up each checksum in 'example.tree' and print the result.

    For every checksum, one line is printed containing the checksum and
    the value returned by the tree's lookup, separated by a space.
    """
    forest, tree = open_tree(allow_writes=False, dirname='example.tree')
    for wanted in checksums:
        # Single formatted expression: same output as a two-item print.
        print('%s %s' % (wanted, tree.lookup(wanted)))
def list_checksums():
    """Print every (checksum, filename) pair stored in 'example.tree'.

    The tree is scanned with lookup_range from the all-'0' key to the
    all-'f' key, which brackets every lowercase hexadecimal digest of
    the key length. One line is printed per pair, with the checksum and
    the filename separated by a space.
    """
    forest, tree = open_tree(allow_writes=False, dirname='example.tree')
    # Derive the key length from hashlib rather than hashing /dev/null,
    # which needs file I/O and does not exist on every platform.
    key_size = len(hashlib.md5().hexdigest())
    minkey = '0' * key_size
    maxkey = 'f' * key_size
    for checksum, filename in tree.lookup_range(minkey, maxkey):
        print('%s %s' % (checksum, filename))
def main():
    """Dispatch on the operation named by the first command-line argument.

    Supported operations:
    add FILE...      -- pass the remaining arguments to add().
    find CHECKSUM... -- pass the remaining arguments to find().
    list             -- call list_checksums().

    Raises Exception if the operation is missing or not recognised.
    """
    # Without this check a bare invocation dies with an unhelpful
    # IndexError from sys.argv[1].
    if len(sys.argv) < 2:
        raise Exception('Missing operation: expected add, find, or list')
    operation = sys.argv[1]
    if operation == 'add':
        add(sys.argv[2:])
    elif operation == 'find':
        find(sys.argv[2:])
    elif operation == 'list':
        list_checksums()
    else:
        raise Exception('Unknown operation %s' % operation)
# Run the command-line interface only when this file is executed as a
# script, not when it is imported as a module.
if __name__ == '__main__':
    main()
|