cmpcsyms 4.47 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157
#! /usr/bin/env python
from __future__ import with_statement
import errno
import os
import re
import sys
import string

if __name__ == "__main__":
    _base = sys.argv[0]
else:
    _base = __file__

_script_home = os.path.abspath(os.path.dirname(_base))

srcdir = os.path.dirname(os.path.dirname(_script_home))

EXCLUDES = ["bitset.h", "cStringIO.h", "graminit.h", "grammar.h",
            "longintrepr.h", "metagrammar.h",
            "node.h", "opcode.h", "osdefs.h", "pgenheaders.h",
            "py_curses.h", "parsetok.h", "symtable.h", "token.h"]


def list_headers():
    """Return a list of headers."""
    incdir = os.path.join(srcdir, "Include")
    return [os.path.join(incdir, fn) for fn in os.listdir(incdir)
            if fn.endswith(".h") and fn not in EXCLUDES]


def matcher(pattern):
    return re.compile(pattern).search

MATCHERS = [
    # XXX this should also deal with ctypedesc, cvardesc and cmemberdesc
    matcher(r"\\begin\{cfuncdesc\}\{(?P<result>[^}]*)\}\{(?P<sym>[^}]*)\}{(?P<params>[^}]*)\}"),
    matcher(r"\\cfuncline\{(?P<result>[^})]*)\}\{(?P<sym>[^}]*)\}{(?P<params>[^}]*)\}"),
    ]

def list_documented_items():
    """Return a list of everything that's already documented."""
    apidir = os.path.join(srcdir, "Doc", "api")
    files = [fn for fn in os.listdir(apidir) if fn.endswith(".tex")]
    L = []
    for fn in files:
        fullname = os.path.join(apidir, fn)
	data = open(fullname).read()
        for matcher in MATCHERS:
            pos = 0
            while 1:
                m = matcher(data, pos)
                if not m: break
                pos = m.end()
                sym = m.group("sym")
                result = m.group("result")
                params = m.group("params")
		# replace all whitespace with a single one
		params = " ".join(params.split()) 
                L.append((sym, result, params, fn))
    return L

def normalize_type(t):
    t = t.strip()
    s = t.rfind("*")
    if s != -1:
        # strip everything after the pointer name
        t = t[:s+1]
    # Drop the variable name
    s = t.split()
    typenames = 1
    if len(s)>1 and s[0]=='unsigned' and s[1]=='int':
        typenames = 2
    if len(s) > typenames and s[-1][0] in string.letters:
        del s[-1]
    if not s:
       print "XXX", t
       return ""
    # Drop register
    if s[0] == "register":
        del s[0]
    # discard all spaces
    return ''.join(s)
    
def compare_type(t1, t2):
    t1 = normalize_type(t1)
    t2 = normalize_type(t2)
    if t1 == r'\moreargs' and t2 == '...':
        return False
    if t1 != t2:
        #print "different:", t1, t2
        return False
    return True


def compare_types(ret, params, hret, hparams):
    if not compare_type(ret, hret):
        return False
    params = params.split(",")
    hparams = hparams.split(",")
    if not params and hparams == ['void']:
        return True
    if not hparams and params == ['void']:
        return True
    if len(params) != len(hparams):
        return False
    for p1, p2 in zip(params, hparams):
        if not compare_type(p1, p2):
            return False
    return True

def main():
    headers = list_headers()
    documented = list_documented_items()

    lines = []
    for h in headers:
        data = open(h).read()
        data, n = re.subn(r"PyAPI_FUNC\(([^)]*)\)", r"\1", data)
        name = os.path.basename(h)
        with open(name, "w") as f:
            f.write(data)
        cmd = ("ctags -f - --file-scope=no --c-kinds=p --fields=S "
               "-Istaticforward -Istatichere=static " + name)
        with os.popen(cmd) as f:
            lines.extend(f.readlines())
        os.unlink(name)
    L = {}
    prevsym = None
    for line in lines:
        if not line:
            break
        sym, filename, signature = line.split(None, 2)
        if sym == prevsym:
            continue
	expr = "\^(.*)%s" % sym
	m = re.search(expr, signature)
        if not m:
    	    print "Could not split",signature, "using",expr
	rettype = m.group(1).strip()
	m = re.search("signature:\(([^)]*)\)", signature)
	if not m:
	    print "Could not get signature from", signature
	params = m.group(1)
	L[sym] = (rettype, params)

    for sym, ret, params, fn in documented:
        if sym not in L:
           print "No declaration for '%s'" % sym
           continue
        hret, hparams = L[sym]
        if not compare_types(ret, params, hret, hparams):
           print "Declaration error for %s (%s):" % (sym, fn)
           print ret+": "+params
           print hret+": "+hparams

if __name__ == "__main__":
    main()