X-Git-Url: https://arthur.barton.de/gitweb/?a=blobdiff_plain;f=cmd%2Fmemtest-cmd.py;h=88ee06d92cd919700dacd31467a1e0257b0f7d64;hb=aeafe13a9330e7deca3dc6b9c0496937d904663a;hp=745550c3cd483f397ba029669c63a63f305acaf4;hpb=8d350c66622ec8a2c3ee75d1fd2ed60f249d78a8;p=bup.git diff --git a/cmd/memtest-cmd.py b/cmd/memtest-cmd.py index 745550c..88ee06d 100755 --- a/cmd/memtest-cmd.py +++ b/cmd/memtest-cmd.py @@ -1,29 +1,72 @@ -#!/usr/bin/env python -import sys, re, struct, mmap -from bup import git, options -from bup.helpers import * +#!/bin/sh +"""": # -*-python-*- +bup_python="$(dirname "$0")/bup-python" || exit $? +exec "$bup_python" "$0" ${1+"$@"} +""" +# end of bup preamble + +from __future__ import absolute_import, print_function +import sys, re, struct, time, resource + +from bup import git, bloom, midx, options, _helpers +from bup.helpers import handle_ctrl_c + handle_ctrl_c() -def s_from_bytes(bytes): - clist = [chr(b) for b in bytes] - return ''.join(clist) + +_linux_warned = 0 +def linux_memstat(): + global _linux_warned + #fields = ['VmSize', 'VmRSS', 'VmData', 'VmStk', 'ms'] + d = {} + try: + f = open('/proc/self/status') + except IOError as e: + if not _linux_warned: + log('Warning: %s\n' % e) + _linux_warned = 1 + return {} + for line in f: + # Note that on Solaris, this file exists but is binary. If that + # happens, this split() might not return two elements. We don't + # really need to care about the binary format since this output + # isn't used for much and report() can deal with missing entries. + t = re.split(r':\s*', line.strip(), 1) + if len(t) == 2: + k,v = t + d[k] = v + return d +last = last_u = last_s = start = 0 def report(count): - fields = ['VmSize', 'VmRSS', 'VmData', 'VmStk'] - d = {} - for line in open('/proc/self/status').readlines(): - l = re.split(r':\s*', line.strip(), 1) - d[l[0]] = l[1] + global last, last_u, last_s, start + headers = ['RSS', 'MajFlt', 'user', 'sys', 'ms'] + ru = resource.getrusage(resource.RUSAGE_SELF) + now = time.time() + rss = int(ru.ru_maxrss/1024) + if not rss: + rss = linux_memstat().get('VmRSS', '??') + fields = [rss, + ru.ru_majflt, + int((ru.ru_utime - last_u) * 1000), + int((ru.ru_stime - last_s) * 1000), + int((now - last) * 1000)] + fmt = '%9s ' + ('%10s ' * len(fields)) if count >= 0: - e1 = count - fields = [d[k] for k in fields] + print(fmt % tuple([count] + fields)) else: - e1 = '' - print ('%9s ' + ('%10s ' * len(fields))) % tuple([e1] + fields) + start = now + print(fmt % tuple([''] + headers)) sys.stdout.flush() + # don't include time to run report() in usage counts + ru = resource.getrusage(resource.RUSAGE_SELF) + last_u = ru.ru_utime + last_s = ru.ru_stime + last = time.time() + optspec = """ bup memtest [-n elements] [-c cycles] @@ -31,8 +74,9 @@ bup memtest [-n elements] [-c cycles] n,number= number of objects per cycle [10000] c,cycles= number of cycles to run [100] ignore-midx ignore .midx files, use only .idx files +existing test with existing objects instead of fake ones """ -o = options.Options('bup memtest', optspec) +o = options.Options(optspec) (opt, flags, extra) = o.parse(sys.argv[1:]) if extra: @@ -44,20 +88,41 @@ git.check_repo_or_die() m = git.PackIdxList(git.repo('objects/pack')) report(-1) -f = open('/dev/urandom') -a = mmap.mmap(-1, 20) +_helpers.random_sha() report(0) + +if opt.existing: + def foreverit(mi): + while 1: + for e in mi: + yield e + objit = iter(foreverit(m)) + for c in xrange(opt.cycles): for n in xrange(opt.number): - b = f.read(3) - if 0: - bytes = list(struct.unpack('!BBB', b)) + [0]*17 - bytes[2] &= 0xf0 - bin = struct.pack('!20s', s_from_bytes(bytes)) + if opt.existing: + bin = next(objit) + assert(m.exists(bin)) else: - a[0:2] = b[0:2] - a[2] = chr(ord(b[2]) & 0xf0) - bin = str(a[0:20]) - #print bin.encode('hex') - m.exists(bin) + bin = _helpers.random_sha() + + # technically, a randomly generated object id might exist. + # but the likelihood of that is the likelihood of finding + # a collision in sha-1 by accident, which is so unlikely that + # we don't care. + assert(not m.exists(bin)) report((c+1)*opt.number) + +if bloom._total_searches: + print('bloom: %d objects searched in %d steps: avg %.3f steps/object' + % (bloom._total_searches, bloom._total_steps, + bloom._total_steps*1.0/bloom._total_searches)) +if midx._total_searches: + print('midx: %d objects searched in %d steps: avg %.3f steps/object' + % (midx._total_searches, midx._total_steps, + midx._total_steps*1.0/midx._total_searches)) +if git._total_searches: + print('idx: %d objects searched in %d steps: avg %.3f steps/object' + % (git._total_searches, git._total_steps, + git._total_steps*1.0/git._total_searches)) +print('Total time: %.3fs' % (time.time() - start))