": parseSection() elif len(line) >= 1 and line[0] == "<": print "unhandled %s" % (line) print "Parsed: %d files %d identifiers" % (len(files), len(identifiers_file.keys())) ################################################################## # # Parsing: xml/*.xml # To enrich the existing info with extracted comments # ################################################################## nbcomments = 0 def insertParameterComment(id, name, value, is_param): global nbcomments indexString(id, value) if functions.has_key(id): if is_param == 1: args = functions[id][1] found = 0 for arg in args: if arg[1] == name: arg[2] = value found = 1 break if found == 0 and name != '...': print "Arg %s not found on function %s description" % (name, id) return else: ret = functions[id][0] ret[1] = value elif user_functions.has_key(id): if is_param == 1: args = user_functions[id][1] found = 0 for arg in args: if arg[1] == name: arg[2] = value found = 1 break if found == 0 and name != '...': print "Arg %s not found on functype %s description" % (name, id) print args return else: ret = user_functions[id][0] ret[1] = value elif macros.has_key(id): if is_param == 1: args = macros[id][0] found = 0 for arg in args: if arg[0] == name: arg[1] = value found = 1 break if found == 0: args.append([name, value]) else: print "Return info for macro %s: %s" % (id, value) # ret = macros[id][0] # ret[1] = value else: print "lost specific comment %s: %s: %s" % (id, name, value) return nbcomments = nbcomments + 1 def insertComment(name, title, value, id): global nbcomments ids[name] = id indexString(name, value) if functions.has_key(name): functions[name][2] = value return "function" elif typedefs.has_key(name): typedefs[name] = value return "typedef" elif macros.has_key(name): macros[name][1] = value return "macro" elif variables.has_key(name): variables[name][1] = value return "variable" elif structs.has_key(name): structs[name] = value return "struct" elif enums.has_key(name): enums[name][1] = value return "enum" elif user_functions.has_key(name): user_functions[name][2] = value return "user_function" else: print "lost comment %s: %s" % (name, value) return "unknown" nbcomments = nbcomments + 1 import os import xmllib try: import sgmlop except ImportError: sgmlop = None # accelerator not available debug = 0 if sgmlop: class FastParser: """sgmlop based XML parser. this is typically 15x faster than SlowParser...""" def __init__(self, target): # setup callbacks self.finish_starttag = target.start self.finish_endtag = target.end self.handle_data = target.data # activate parser self.parser = sgmlop.XMLParser() self.parser.register(self) self.feed = self.parser.feed self.entity = { "amp": "&", "gt": ">", "lt": "<", "apos": "'", "quot": '"' } def close(self): try: self.parser.close() finally: self.parser = self.feed = None # nuke circular reference def handle_entityref(self, entity): # entity try: self.handle_data(self.entity[entity]) except KeyError: self.handle_data("&%s;" % entity) else: FastParser = None class SlowParser(xmllib.XMLParser): """slow but safe standard parser, based on the XML parser in Python's standard library.""" def __init__(self, target): self.unknown_starttag = target.start self.handle_data = target.data self.unknown_endtag = target.end xmllib.XMLParser.__init__(self) def getparser(target = None): # get the fastest available parser, and attach it to an # unmarshalling object. return both objects. if target == None: target = docParser() if FastParser: return FastParser(target), target return SlowParser(target), target class docParser: def __init__(self): self._methodname = None self._data = [] self.id = None self.title = None self.descr = None self.string = None def close(self): if debug: print "close" def getmethodname(self): return self._methodname def data(self, text): if debug: print "data %s" % text self._data.append(text) def start(self, tag, attrs): if debug: print "start %s, %s" % (tag, attrs) if tag == 'refsect2': self.id = None self.title = None self.descr = None self.string = None self.type = None self.in_parameter = 0 self.is_parameter = 0 self.parameter = None self.parameter_info = None self.entry = 0 elif tag == 'para': self._data = [] elif tag == 'title': self._data = [] elif tag == 'tgroup': self.in_parameter = 1 elif tag == 'row': self._data = [] self.entry = 0 elif tag == 'entry': self.entry = self.entry + 1 elif tag == 'parameter' and self.in_parameter == 1: self._data = [] elif tag == 'anchor' and self.id == None: if attrs.has_key('id'): self.orig_id = attrs['id'] self.id = string.replace(self.orig_id, '-CAPS', '') self.id = string.replace(self.id, '-', '_') def end(self, tag): if debug: print "end %s" % tag if tag == 'refsect2': self.type = insertComment(self.id, self.title, self.string, self.orig_id) self.string = None elif tag == 'row': if self.parameter_info != None and self.parameter_info != '': insertParameterComment(self.id, self.parameter, self.parameter_info, self.is_parameter) self.parameter_info = None self.parameter = 0 self.is_parameter = 0 elif tag == 'parameter' and self.in_parameter == 1 and self.entry == 1: str = '' for c in self._data: str = str + c str = string.replace(str, '\n', ' ') str = string.replace(str, '\r', ' ') str = string.replace(str, ' ', ' ') str = string.replace(str, ' ', ' ') str = string.replace(str, ' ', ' ') while len(str) >= 1 and str[0] == ' ': str=str[1:] self.parameter = str self.is_parameter = 1 self._data = [] elif tag == 'para' or tag == 'entry': str = '' for c in self._data: str = str + c str = string.replace(str, '\n', ' ') str = string.replace(str, '\r', ' ') str = string.replace(str, ' ', ' ') str = string.replace(str, ' ', ' ') str = string.replace(str, ' ', ' ') while len(str) >= 1 and str[0] == ' ': str=str[1:] if self.string == None: self.string = str elif self.in_parameter == 1: self.parameter_info = str self._data = [] elif tag == 'title': str = '' for c in self._data: str = str + c str = string.replace(str, '\n', ' ') str = string.replace(str, '\r', ' ') str = string.replace(str, ' ', ' ') str = string.replace(str, ' ', ' ') str = string.replace(str, ' ', ' ') while len(str) >= 1 and str[0] == ' ': str=str[1:] self.title = str xmlfiles = 0 filenames = os.listdir("xml") for filename in filenames: try: f = open("xml/" + filename, 'r') except IOError, msg: print file, ":", msg continue data = f.read() (parser, target) = getparser() parser.feed(data) parser.close() xmlfiles = xmlfiles + 1 print "Parsed: %d XML files collexting %d comments" % (xmlfiles, nbcomments) ################################################################## # # Saving: libxml2-api.xml # ################################################################## def escape(raw): raw = string.replace(raw, '&', '&') raw = string.replace(raw, '<', '<') raw = string.replace(raw, '>', '>') raw = string.replace(raw, "'", ''') raw = string.replace(raw, '"', '"') return raw print "Saving XML description libxml2-api.xml" output = open("libxml2-api.xml", "w") output.write('\n') output.write("\n") output.write(" \n") for file in files.keys(): output.write(" \n" % file) for symbol in files[file]: output.write(" \n" % (symbol)) output.write(" \n") output.write(" \n") output.write(" \n") symbols=macros.keys() for i in structs.keys(): symbols.append(i) for i in variables.keys(): variables.append(i) for i in typedefs.keys(): symbols.append(i) for i in enums.keys(): symbols.append(i) for j in enums[i][0]: symbols.append(j) for i in functions.keys(): symbols.append(i) for i in user_functions.keys(): symbols.append(i) symbols.sort() prev = None for i in symbols: if i == prev: # print "Symbol %s redefined" % (i) continue else: prev = i if identifiers_type.has_key(i): type = identifiers_type[i] if identifiers_file.has_key(i): file = identifiers_file[i] else: file = None output.write(" <%s name='%s'" % (type, i)) if file != None: output.write(" file='%s'" % (file)) if type == "function": output.write(">\n"); (ret, args, doc) = functions[i] if doc != None and doc != '': output.write(" %s\n" % (escape(doc))) if ret[1] != None and ret[1] != '': output.write(" \n" % ( ret[0], escape(ret[1]))) else: if ret[0] != 'void' and\ ret[0][0:4] != 'void': # This one is actually a bug in GTK Doc print "Description for return on %s is missing" % (i) output.write(" \n" % (ret[0])) for arg in args: if arg[2] != None and arg[2] != '': output.write(" \n" % (arg[1], arg[0], escape(arg[2]))) else: if arg[0] != '...': print "Description for %s on %s is missing" % (arg[1], i) output.write(" \n" % ( arg[1], arg[0])) output.write(" \n" % (type)); elif type == 'functype': output.write(">\n"); (ret, args, doc) = user_functions[i] if doc != None and doc != '': output.write(" %s\n" % (escape(doc))) if ret[1] != None and ret[1] != '': output.write(" \n" % ( ret[0], escape(ret[1]))) else: if ret[0] != 'void' and\ ret[0][0:4] != 'void': # This one is actually a bug in GTK Doc print "Description for return on %s is missing" % (i) output.write(" \n" % (ret[0])) for arg in args: if arg[2] != None and arg[2] != '': output.write(" \n" % (arg[1], arg[0], escape(arg[2]))) else: if arg[0] != '...': print "Description for %s on %s is missing" % (arg[1], i) output.write(" \n" % ( arg[1], arg[0])) output.write(" \n" % (type)); elif type == 'macro': output.write(">\n"); if macros[i][1] != None and macros[i][1] != '': output.write(" %s\n" % (escape(macros[i][1]))) else: print "Description for %s is missing" % (i) args = macros[i][0] for arg in args: if arg[1] != None and arg[1] != '': output.write(" \n" % (arg[0], escape(arg[1]))) else: print "Description for %s on %s is missing" % (arg[1], i) output.write(" \n" % (arg[0])) output.write(" \n" % (type)); elif type == 'struct': if structs[i] != None and structs[i] != '': output.write(" info='%s'/>\n" % (escape(structs[i]))) else: output.write("/>\n"); elif type == 'variable': if variables[i][1] != None and variables[i][1] != '': output.write(" info='%s'/>\n" % (escape(variables[i]))) else: output.write("/>\n"); elif type == 'typedef': if typedefs[i] != None and typedefs[i] != '': output.write(" info='%s'/>\n" % (escape(typedefs[i]))) else: output.write("/>\n"); else: output.write("/>\n"); else: print "Symbol %s not found in identifiers list" % (i) output.write(" \n") output.write("\n") output.close() print "generated XML for %d symbols" % (len(symbols)) ################################################################## # # Saving: libxml2-api.xml # ################################################################## hash = {} for file in files.keys(): for symbol in files[file]: hash[symbol] = file def link(id): if ids.has_key(id): target = string.upper(ids[id]) else: target = string.upper(id) if hash.has_key(id): module = string.lower(hash[id]) else: module = 'index' file = 'html/libxml-' + module + '.html'; return file + '#' + target print "Saving XML crossreferences libxml2-refs.xml" output = open("libxml2-refs.xml", "w") output.write('\n') output.write("\n") output.write(" \n") typ = ids.keys() typ.sort() for id in typ: output.write(" \n" % (id, link(id))) output.write(" \n") output.write(" \n") letter = None ids = ids.keys() ids.sort() for id in ids: if id[0] != letter: if letter != None: output.write(" \n") letter = id[0] output.write(" \n" % (letter)) output.write(" \n" % (id)) if letter != None: output.write(" \n") output.write(" \n") output.write(" \n") typ = ret_types.keys() typ.sort() for type in typ: if type == '' or type == 'void' or type == "int" or type == "char *" or \ type == "const char *" : continue output.write(" \n" % (type)) ids = ret_types[type] for id in ids: output.write(" \n" % (id)) output.write(" \n") output.write(" \n") output.write(" \n") typ = types.keys() typ.sort() for type in typ: if type == '' or type == 'void' or type == "int" or type == "char *" or \ type == "const char *" : continue output.write(" \n" % (type)) ids = types[type] for id in ids: output.write(" \n" % (id)) output.write(" \n") output.write(" \n") output.write(" \n") typ = files.keys() typ.sort() for file in typ: output.write(" \n" % (file)) for id in files[file]: output.write(" \n" % (id)) output.write(" \n") output.write(" \n") output.write(" \n") typ = index.keys() typ.sort() letter = None count = 0 chunk = 0 chunks = [] for id in typ: if len(index[id]) > 30: continue if id[0] != letter: if letter == None or count > 200: if letter != None: output.write(" \n") output.write(" \n") count = 0 chunks.append(["chunk%s" % (chunk -1), first_letter, letter]) output.write(" \n" % (chunk)) first_letter = id[0] chunk = chunk + 1 elif letter != None: output.write(" \n") letter = id[0] output.write(" \n" % (letter)) output.write(" \n" % (id)) tokens = index[id]; tokens.sort() tok = None for token in index[id]: if tok == token: continue tok = token output.write(" \n" % (token)) count = count + 1 output.write(" \n") if letter != None: output.write(" \n") output.write(" \n") output.write(" \n") for ch in chunks: output.write(" \n" % ( ch[0], ch[1], ch[2])) output.write(" \n") output.write(" \n") output.write("\n") output.close()