": parseSection() elif len(line) >= 1 and line[0] == "<": print "unhandled %s" % (line) print "Parsed: %d files %d identifiers" % (len(files), len(identifiers_file.keys())) ################################################################## # # Parsing: xml/*.xml # To enrich the existing info with extracted comments # ################################################################## nbcomments = 0 def insertParameterComment(id, name, value, is_param): global nbcomments indexString(id, value) if functions.has_key(id): if is_param == 1: args = functions[id][1] found = 0 for arg in args: if arg[1] == name: arg[2] = value found = 1 break if found == 0 and name != '...': print "Arg %s not found on function %s description" % (name, id) return else: ret = functions[id][0] ret[1] = value elif user_functions.has_key(id): if is_param == 1: args = user_functions[id][1] found = 0 for arg in args: if arg[1] == name: arg[2] = value found = 1 break if found == 0 and name != '...': print "Arg %s not found on functype %s description" % (name, id) print args return else: ret = user_functions[id][0] ret[1] = value elif macros.has_key(id): if is_param == 1: args = macros[id][0] found = 0 for arg in args: if arg[0] == name: arg[1] = value found = 1 break if found == 0: args.append([name, value]) else: print "Return info for macro %s: %s" % (id, value) # ret = macros[id][0] # ret[1] = value else: print "lost specific comment %s: %s: %s" % (id, name, value) return nbcomments = nbcomments + 1 def insertComment(name, title, value, id): global nbcomments ids[name] = id indexString(name, value) if functions.has_key(name): functions[name][2] = value return "function" elif typedefs.has_key(name): typedefs[name] = value return "typedef" elif macros.has_key(name): macros[name][1] = value return "macro" elif variables.has_key(name): variables[name][1] = value return "variable" elif structs.has_key(name): structs[name] = value return "struct" elif enums.has_key(name): enums[name][1] = value return 
"enum" elif user_functions.has_key(name): user_functions[name][2] = value return "user_function" else: print "lost comment %s: %s" % (name, value) return "unknown" nbcomments = nbcomments + 1 import libxml2 import os def analyzeXMLDescriptionRow(doc, desc, id, row): if doc == None or desc == None or id == None or row == None: return ctxt = doc.xpathNewContext() ctxt.setContextNode(row) param = ctxt.xpathEval("entry[1]/parameter") entries = ctxt.xpathEval("entry") if param == []: is_param = 0 name = None else: name = param[0].content is_param = 1 str = entries[1].content str = string.replace(str, '\n', ' ') str = string.replace(str, '\r', ' ') str = string.replace(str, ' ', ' ') str = string.replace(str, ' ', ' ') str = string.replace(str, ' ', ' ') while len(str) >= 1 and str[0] == ' ': str=str[1:] insertParameterComment(id, name, str, is_param) def analyzeXMLDescription(doc, desc): if doc == None or desc == None: return ctxt = doc.xpathNewContext() ctxt.setContextNode(desc) # # get the function name # try: title = ctxt.xpathEval("title")[0].content except: return old_id = ctxt.xpathEval("string(title/anchor/@id)") id = string.replace(title, '(', ' '); id = string.replace(id, ')', ' '); id = string.split(id) [0] # # get the function comments # comment = "" paras = ctxt.xpathEval("para") for para in paras: str = para.content str = string.replace(str, '\n', ' ') str = string.replace(str, '\r', ' ') str = string.replace(str, ' ', ' ') str = string.replace(str, ' ', ' ') str = string.replace(str, ' ', ' ') while len(str) >= 1 and str[0] == ' ': str=str[1:] comment = comment + str insertComment(id, title, comment, old_id) rows = ctxt.xpathEval("informaltable/tgroup/tbody/row") for row in rows: analyzeXMLDescriptionRow(doc, desc, id, row) def analyzeXMLDoc(doc): if doc == None: return ctxt = doc.xpathNewContext() descriptions = ctxt.xpathEval("//refsect2") print len(descriptions) for description in descriptions: analyzeXMLDescription(doc, description) xmlfiles = 0 
filenames = os.listdir("xml") for filename in filenames: print filename try: doc = libxml2.parseFile("xml/" + filename) analyzeXMLDoc(doc) doc.freeDoc() xmlfiles = xmlfiles + 1 except: print "failed to parse XML description %s" % ("xml/" + filename) continue print "Parsed: %d XML files collexting %d comments" % (xmlfiles, nbcomments) ################################################################## # # Saving: libxslt-api.xml # ################################################################## def escape(raw): raw = string.replace(raw, '&', '&') raw = string.replace(raw, '<', '<') raw = string.replace(raw, '>', '>') raw = string.replace(raw, "'", ''') raw = string.replace(raw, '"', '"') return raw print "Saving XML description libxslt-api.xml" output = open("libxslt-api.xml", "w") output.write('\n') output.write("\n") output.write(" \n") for file in files.keys(): output.write(" \n" % file) for symbol in files[file]: output.write(" \n" % (symbol)) output.write(" \n") output.write(" \n") output.write(" \n") symbols=macros.keys() for i in structs.keys(): symbols.append(i) for i in variables.keys(): variables.append(i) for i in typedefs.keys(): symbols.append(i) for i in enums.keys(): symbols.append(i) for j in enums[i][0]: symbols.append(j) for i in functions.keys(): symbols.append(i) for i in user_functions.keys(): symbols.append(i) symbols.sort() prev = None for i in symbols: if i == prev: # print "Symbol %s redefined" % (i) continue else: prev = i if identifiers_type.has_key(i): type = identifiers_type[i] if identifiers_file.has_key(i): file = identifiers_file[i] else: file = None output.write(" <%s name='%s'" % (type, i)) if file != None: output.write(" file='%s'" % (file)) if type == "function": output.write(">\n"); (ret, args, doc) = functions[i] if doc != None and doc != '': output.write(" %s\n" % (escape(doc))) if ret[1] != None and ret[1] != '': output.write(" \n" % ( ret[0], escape(ret[1]))) else: if ret[0] != 'void' and\ ret[0][0:4] != 'void': # This one 
is actually a bug in GTK Doc print "Description for return on %s is missing" % (i) output.write(" \n" % (ret[0])) for arg in args: if arg[2] != None and arg[2] != '': output.write(" \n" % (arg[1], arg[0], escape(arg[2]))) else: if arg[0] != '...': print "Description for %s on %s is missing" % (arg[1], i) output.write(" \n" % ( arg[1], arg[0])) output.write(" \n" % (type)); elif type == 'functype': output.write(">\n"); (ret, args, doc) = user_functions[i] if doc != None and doc != '': output.write(" %s\n" % (escape(doc))) if ret[1] != None and ret[1] != '': output.write(" \n" % ( ret[0], escape(ret[1]))) else: if ret[0] != 'void' and\ ret[0][0:4] != 'void': # This one is actually a bug in GTK Doc print "Description for return on %s is missing" % (i) output.write(" \n" % (ret[0])) for arg in args: if arg[2] != None and arg[2] != '': output.write(" \n" % (arg[1], arg[0], escape(arg[2]))) else: if arg[0] != '...': print "Description for %s on %s is missing" % (arg[1], i) output.write(" \n" % ( arg[1], arg[0])) output.write(" \n" % (type)); elif type == 'macro': output.write(">\n"); if macros[i][1] != None and macros[i][1] != '': output.write(" %s\n" % (escape(macros[i][1]))) else: print "Description for %s is missing" % (i) args = macros[i][0] for arg in args: if arg[1] != None and arg[1] != '': output.write(" \n" % (arg[0], escape(arg[1]))) else: print "Description for %s on %s is missing" % (arg[1], i) output.write(" \n" % (arg[0])) output.write(" \n" % (type)); elif type == 'struct': if structs[i] != None and structs[i] != '': output.write(" info='%s'/>\n" % (escape(structs[i]))) else: output.write("/>\n"); elif type == 'variable': if variables[i][1] != None and variables[i][1] != '': output.write(" info='%s'/>\n" % (escape(variables[i]))) else: output.write("/>\n"); elif type == 'typedef': if typedefs[i] != None and typedefs[i] != '': output.write(" info='%s'/>\n" % (escape(typedefs[i]))) else: output.write("/>\n"); else: output.write("/>\n"); else: print "Symbol 
%s not found in identifiers list" % (i) output.write(" \n") output.write("\n") output.close() print "generated XML for %d symbols" % (len(symbols)) ################################################################## # # Saving: libxslt-api.xml # ################################################################## hash = {} for file in files.keys(): for symbol in files[file]: hash[symbol] = file def link(id): if ids.has_key(id): target = string.upper(ids[id]) else: target = string.upper(id) if hash.has_key(id): module = string.lower(hash[id]) else: module = 'index' file = 'html/libxslt-' + module + '.html'; return file + '#' + target print "Saving XML crossreferences libxslt-refs.xml" output = open("libxslt-refs.xml", "w") output.write('\n') output.write("\n") output.write(" \n") typ = ids.keys() typ.sort() for id in typ: output.write(" \n" % (id, link(id))) output.write(" \n") output.write(" \n") letter = None ids = ids.keys() ids.sort() for id in ids: if id[0] != letter: if letter != None: output.write(" \n") letter = id[0] output.write(" \n" % (letter)) output.write(" \n" % (id)) if letter != None: output.write(" \n") output.write(" \n") output.write(" \n") typ = ret_types.keys() typ.sort() for type in typ: if type == '' or type == 'void' or type == "int" or type == "char *" or \ type == "const char *" : continue output.write(" \n" % (type)) ids = ret_types[type] for id in ids: output.write(" \n" % (id)) output.write(" \n") output.write(" \n") output.write(" \n") typ = types.keys() typ.sort() for type in typ: if type == '' or type == 'void' or type == "int" or type == "char *" or \ type == "const char *" : continue output.write(" \n" % (type)) ids = types[type] for id in ids: output.write(" \n" % (id)) output.write(" \n") output.write(" \n") output.write(" \n") typ = files.keys() typ.sort() for file in typ: output.write(" \n" % (file)) for id in files[file]: output.write(" \n" % (id)) output.write(" \n") output.write(" \n") output.write(" \n") typ = index.keys() 
# Write the word index of libxslt-refs.xml: words are grouped by first
# letter and letters are grouped into chunks; a new chunk is started at a
# letter change once more than 200 references were written to the current
# one.  Words with more than 30 references are left out.
# NOTE(review): the element names (chunk, letter, word, ref, chunks) were
# reconstructed; the literals had lost their tags and could not be
# formatted.  Verify them against the consumers of libxslt-refs.xml.
typ.sort()
letter = None
count = 0
chunk = 0
chunks = []
try:
    for word in typ:
        tokens = index[word]
        if len(tokens) > 30:
            continue
        if word[0] != letter:
            if letter is None or count > 200:
                if letter is not None:
                    # Close the previous chunk and remember its range.
                    output.write("      </letter>\n")
                    output.write("    </chunk>\n")
                    count = 0
                    chunks.append(["chunk%s" % (chunk - 1), first_letter, letter])
                output.write("    <chunk name='chunk%s'>\n" % (chunk))
                first_letter = word[0]
                chunk = chunk + 1
            else:
                output.write("      </letter>\n")
            letter = word[0]
            output.write("      <letter name='%s'>\n" % (letter))
        output.write("        <word name='%s'>\n" % (word))
        # Sorting puts equal references side by side so that duplicates
        # can be skipped with a single look-behind.
        tokens.sort()
        tok = None
        for token in tokens:
            if tok == token:
                continue
            tok = token
            output.write("          <ref name='%s'/>\n" % (token))
            count = count + 1
        output.write("        </word>\n")
    if letter is not None:
        output.write("      </letter>\n")
        output.write("    </chunk>\n")
        # The chunk still open at the end belongs to the summary too; it
        # used to be left out.
        chunks.append(["chunk%s" % (chunk - 1), first_letter, letter])
        output.write("    <chunks>\n")
        for ch in chunks:
            output.write("      <chunk name='%s' start='%s' end='%s'/>\n" % (
                         ch[0], ch[1], ch[2]))
        output.write("    </chunks>\n")
    output.write("  </index>\n")
    output.write("</apirefs>\n")
finally:
    output.close()