md5sum.py 2.45 KB
Newer Older
1
#! /usr/bin/env python3
2 3 4 5 6

"""Python utility to print MD5 checksums of argument files.
"""


7 8
bufsize = 8096
fnfilter = None
9
rmode = 'rb'
10

11
usage = """
12
usage: md5sum.py [-b] [-t] [-l] [-s bufsize] [file ...]
13 14
-b        : read files in binary mode (default)
-t        : read files in text mode (you almost certainly don't want this!)
15 16 17 18 19
-l        : print last pathname component only
-s bufsize: read buffer size (default %d)
file ...  : files to sum; '-' or no files means stdin
""" % bufsize

20
import io
21 22 23
import sys
import os
import getopt
24
from hashlib import md5
25 26 27

def sum(*files):
    sts = 0
28
    if files and isinstance(files[-1], io.IOBase):
29 30 31 32 33 34 35 36 37 38 39 40 41 42 43
        out, files = files[-1], files[:-1]
    else:
        out = sys.stdout
    if len(files) == 1 and not isinstance(files[0], str):
        files = files[0]
    for f in files:
        if isinstance(f, str):
            if f == '-':
                sts = printsumfp(sys.stdin, '<stdin>', out) or sts
            else:
                sts = printsum(f, out) or sts
        else:
            sts = sum(f, out) or sts
    return sts

44
def printsum(filename, out=sys.stdout):
45 46
    try:
        fp = open(filename, rmode)
47
    except IOError as msg:
48 49 50 51 52 53 54 55
        sys.stderr.write('%s: Can\'t open: %s\n' % (filename, msg))
        return 1
    if fnfilter:
        filename = fnfilter(filename)
    sts = printsumfp(fp, filename, out)
    fp.close()
    return sts

56
def printsumfp(fp, filename, out=sys.stdout):
57
    m = md5()
58
    try:
59
        while 1:
60
            data = fp.read(bufsize)
61 62
            if not data:
                break
63 64
            if isinstance(data, str):
                data = data.encode(fp.encoding)
65
            m.update(data)
66
    except IOError as msg:
67 68 69 70 71
        sys.stderr.write('%s: I/O error: %s\n' % (filename, msg))
        return 1
    out.write('%s %s\n' % (m.hexdigest(), filename))
    return 0

72
def main(args = sys.argv[1:], out=sys.stdout):
73 74 75
    global fnfilter, rmode, bufsize
    try:
        opts, args = getopt.getopt(args, 'blts:')
76
    except getopt.error as msg:
77 78 79 80 81
        sys.stderr.write('%s: %s\n%s' % (sys.argv[0], msg, usage))
        return 2
    for o, a in opts:
        if o == '-l':
            fnfilter = os.path.basename
82
        elif o == '-b':
83
            rmode = 'rb'
84
        elif o == '-t':
85
            rmode = 'r'
86
        elif o == '-s':
87 88 89 90 91 92 93
            bufsize = int(a)
    if not args:
        args = ['-']
    return sum(args, out)

if __name__ == '__main__' or __name__ == sys.argv[0]:
    sys.exit(main(sys.argv[1:], sys.stdout))