minigzip.py 3.75 KB
Newer Older
1
#!/usr/bin/env python
2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33
# Demo program for zlib; it compresses or decompresses files, but *doesn't*
# delete the original.  This doesn't support all of gzip's options.

FTEXT, FHCRC, FEXTRA, FNAME, FCOMMENT = 1, 2, 4, 8, 16

def write32(output, value):
    output.write(chr(value & 255)) ; value=value / 256
    output.write(chr(value & 255)) ; value=value / 256
    output.write(chr(value & 255)) ; value=value / 256
    output.write(chr(value & 255))
    
def read32(input):
    v=ord(input.read(1))
    v=v+ (ord(input.read(1))<<8 )
    v=v+ (ord(input.read(1))<<16)
    v=v+ (ord(input.read(1))<<24)
    return v

import zlib, sys
if len(sys.argv)!=2:
   print 'Usage: minigzip.py <filename>'
   print '  The file will be compressed or decompressed.'
   sys.exit(0)

filename=sys.argv[1]
compressing=1 ; outputname=filename+'.gz'
if filename[-3:]=='.gz':
    compressing=0 ; outputname=filename[:-3]
input=open(filename) ; output=open(outputname, 'w')

if compressing:
    output.write('\037\213\010')        # Write the header, ...
Guido van Rossum's avatar
Guido van Rossum committed
34
    output.write(chr(FNAME))            # ... flag byte ...
35

Guido van Rossum's avatar
Guido van Rossum committed
36
    import os                           # ... modification time ...
37 38 39
    statval=os.stat(filename)
    mtime=statval[8]
    write32(output, mtime)
Guido van Rossum's avatar
Guido van Rossum committed
40 41 42
    output.write('\002')                # ... slowest compression alg. ...
    output.write('\377')                # ... OS (=unknown) ...
    output.write(filename+'\000')       # ... original filename ...
43 44 45

    crcval=zlib.crc32("")
    compobj=zlib.compressobj(9, zlib.DEFLATED, -zlib.MAX_WBITS,
Guido van Rossum's avatar
Guido van Rossum committed
46
                             zlib.DEF_MEM_LEVEL, 0)
47
    while (1):
Guido van Rossum's avatar
Guido van Rossum committed
48 49 50 51
        data=input.read(1024)
        if data=="": break
        crcval=zlib.crc32(data, crcval)
        output.write(compobj.compress(data))
52
    output.write(compobj.flush())
Guido van Rossum's avatar
Guido van Rossum committed
53 54
    write32(output, crcval)             # ... the CRC ...
    write32(output, statval[6])         # and the file size.
55 56 57 58

else:
    magic=input.read(2)
    if magic!='\037\213':
Guido van Rossum's avatar
Guido van Rossum committed
59
        print 'Not a gzipped file' ; sys.exit(0)
60
    if ord(input.read(1))!=8:
Guido van Rossum's avatar
Guido van Rossum committed
61
        print 'Unknown compression method' ; sys.exit(0)
62
    flag=ord(input.read(1))
Guido van Rossum's avatar
Guido van Rossum committed
63 64
    input.read(4+1+1)                   # Discard modification time,
                                        # extra flags, and OS byte.
65
    if flag & FEXTRA:
Guido van Rossum's avatar
Guido van Rossum committed
66 67 68 69
        # Read & discard the extra field, if present
        xlen=ord(input.read(1))         
        xlen=xlen+256*ord(input.read(1))
        input.read(xlen)
70
    if flag & FNAME:
Guido van Rossum's avatar
Guido van Rossum committed
71 72 73 74
        # Read and discard a null-terminated string containing the filename
        while (1):
            s=input.read(1)
            if s=='\000': break
75
    if flag & FCOMMENT:
Guido van Rossum's avatar
Guido van Rossum committed
76 77 78 79
        # Read and discard a null-terminated string containing a comment
        while (1):
            s=input.read(1)
            if s=='\000': break
80
    if flag & FHCRC:
Guido van Rossum's avatar
Guido van Rossum committed
81
        input.read(2)                   # Read & discard the 16-bit header CRC
82 83 84 85
    decompobj=zlib.decompressobj(-zlib.MAX_WBITS)
    crcval=zlib.crc32("")
    length=0
    while (1):
Guido van Rossum's avatar
Guido van Rossum committed
86 87 88 89 90 91
        data=input.read(1024)
        if data=="": break
        decompdata=decompobj.decompress(data)
        print len(decompdata)
        output.write(decompdata) ; length=length+len(decompdata)
        crcval=zlib.crc32(decompdata, crcval)
92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107
    decompdata=decompobj.flush()
    output.write(decompdata) ; length=length+len(decompdata)
    crcval=zlib.crc32(decompdata, crcval)
    
    # We've read to the end of the file, so we have to rewind in order
    # to reread the 8 bytes containing the CRC and the file size.  The
    # decompressor is smart and knows when to stop, so feeding it
    # extra data is harmless.  
    input.seek(-8, 2)
    crc32=read32(input)
    isize=read32(input)
    if crc32!=crcval: print 'CRC check failed.'
    if isize!=length: print 'Incorrect length of data produced'

input.close() ; output.close()