3 # This file is part of the GROMACS molecular simulation package.
5 # Copyright (c) 2014, by the GROMACS development team, led by
6 # Mark Abraham, David van der Spoel, Berk Hess, and Erik Lindahl,
7 # and including many others, as listed in the AUTHORS file in the
8 # top-level source directory and at http://www.gromacs.org.
10 # GROMACS is free software; you can redistribute it and/or
11 # modify it under the terms of the GNU Lesser General Public License
12 # as published by the Free Software Foundation; either version 2.1
13 # of the License, or (at your option) any later version.
15 # GROMACS is distributed in the hope that it will be useful,
16 # but WITHOUT ANY WARRANTY; without even the implied warranty of
17 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18 # Lesser General Public License for more details.
20 # You should have received a copy of the GNU Lesser General Public
21 # License along with GROMACS; if not, see
22 # http://www.gnu.org/licenses, or write to the Free Software Foundation,
23 # Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
25 # If you want to redistribute modifications to GROMACS, please
26 # consider that scientific software is very special. Version
27 # control is crucial - bugs must be traceable. We will be happy to
28 # consider code for inclusion in the official distribution, but
29 # derived work must not be called official GROMACS. Details are found
30 # in the README & COPYING files - if they are missing, get the
31 # official version at http://www.gromacs.org.
33 # To help us fund GROMACS development, we humbly ask that you cite
34 # the research papers on the package. Check out http://www.gromacs.org.
36 """Doxygen XML output parser.
38 This module implements a parser for the Doxygen XML output, converting it into
39 an object model that can be used to navigate the documentation. It also uses
40 knowledge from how Doxygen works to provide access to things like visibility of
41 individual member documentation (e.g., based on what is the visibility of its
42 parent compound objects).
44 The object model is rooted at a DocumentationSet object. Each documented
45 entity is modeled as an Entity, and this has subclasses Member and Compound to
46 correspond to the two categories of items that Doxygen handles. These classes
47 are further subclassed to match each kind of entity that Doxygen produces.
48 Only kinds produced by Doxygen from C/C++ code are modeled. Everything else
49 is ignored after a warning.
51 Currently the member entities are not completely parsed from the XML files, and
52 the interface may need additional work to provide convenient access to all
53 member types and their common properties. For now, focus is in modeling the
56 The implementation is mostly independent of any GROMACS-specific rules, except
58 - DocType.library is a GROMACS-specific construct that is deduced from the
59 contents of the detailed description (presence of a \libinternal command in
60 the Doxygen comment triggers it).
61 - DocType.internal is deduced from the presence of a \internal command that
62 covers the whole detailed description.
63 - List of extensions for determining whether a file is a source file only
64 contains extensions actually used by GROMACS.
65 It would be possible to move these out from this file, but that would require
66 exposing the XML representation for the descriptions, which is not nice either.
68 The module can also be run as a script that can dump out different parts of the
69 object model. This can be used to debug the parser, as well as check what is
70 actually in the XML documentation.
74 import xml.etree.ElementTree as ET
78 #####################################################################
79 # Helper functions and classes
81 def _show_list(title, objlist):
82 """Helper function for formatting a list of objects for debug output."""
84 print '{0}:'.format(title)
class DocType(object):

    """Documentation visibility in the generated documentation.

    Each instance wraps an integer that indexes into ``_names``.  Instances
    compare, order and hash by that integer, so a larger value means a more
    visible documentation type.
    """

    # Mapping to string representations for the internal integer values
    _names = ['undocumented', 'internal', 'library', 'public']

    def __init__(self, value):
        """Initialize a DocType instance.

        DocType.{none,internal,library,public} should be used outside the class
        instead of calling the constructor.
        """
        self._value = value

    def __str__(self):
        """Return string representation for the documentation type."""
        return self._names[self._value]

    # Rich comparisons are spelled out explicitly because Python 3 never
    # calls __cmp__; without them max() and != on DocType values would not
    # order by visibility there.

    def __eq__(self, other):
        """Return True if both types have the same visibility."""
        if not isinstance(other, DocType):
            return NotImplemented
        return self._value == other._value

    def __ne__(self, other):
        """Return True if the types have different visibility."""
        if not isinstance(other, DocType):
            return NotImplemented
        return self._value != other._value

    def __lt__(self, other):
        """Return True if this type is less visible than the other."""
        if not isinstance(other, DocType):
            return NotImplemented
        return self._value < other._value

    def __le__(self, other):
        """Return True if this type is at most as visible as the other."""
        if not isinstance(other, DocType):
            return NotImplemented
        return self._value <= other._value

    def __gt__(self, other):
        """Return True if this type is more visible than the other."""
        if not isinstance(other, DocType):
            return NotImplemented
        return self._value > other._value

    def __ge__(self, other):
        """Return True if this type is at least as visible as the other."""
        if not isinstance(other, DocType):
            return NotImplemented
        return self._value >= other._value

    def __hash__(self):
        """Hash consistently with __eq__."""
        return hash(self._value)

    def __cmp__(self, other):
        """Order documentation types in the order of visibility.

        Only consulted by Python 2; written without the cmp() builtin so
        that the method body is also valid on Python 3.
        """
        return (self._value > other._value) - (self._value < other._value)

# Static values for documentation types.
DocType.none = DocType(0)
DocType.internal = DocType(1)
DocType.library = DocType(2)
DocType.public = DocType(3)
class Location(object):

    """Position of a Doxygen entity, read from a <location> XML element.

    Used directly for entities where no body location is expected, and as
    the main-location half of a LocationWithBody.
    """

    def __init__(self, elem):
        """Read file, line and column from the attributes of elem.

        The line is converted to an integer; the column is stored as found
        in the XML attribute.
        """
        attributes = elem.attrib
        self.filepath = attributes['file']
        self.line = int(attributes['line'])
        self.column = attributes['column']

    def __str__(self):
        """Return the location as file:line."""
        parts = (self.filepath, self.line)
        return '{0}:{1}'.format(*parts)

    def get_reporter_location(self):
        """Return a reporter.Location built from the file path and line."""
        path, lineno = self.filepath, self.line
        return reporter.Location(path, lineno)

    def get_full_string(self):
        """Return the location as file:line:column."""
        parts = (self.filepath, self.line, self.column)
        return '{0}:{1}:{2}'.format(*parts)
class BodyLocation(object):

    """Body location of a Doxygen entity.

    This class contains the logic to parse a body location from a <location>
    tag in Doxygen XML.  Not all entities have these attributes.
    This is only used as part of a LocationWithBody, which handles cases where
    the body location is optional.

    The body location can be compared and hashed so that it can be used in
    a dictionary for DocumentationSet.merge_duplicates().  Comparison and
    hashing both use the (file path, start line, end line) triple.
    """

    def __init__(self, elem):
        """Initialize body location from a <location> element."""
        self.filepath = elem.attrib['bodyfile']
        self.startline = int(elem.attrib['bodystart'])
        self.endline = int(elem.attrib['bodyend'])

    def _key(self):
        """Return the tuple that defines identity and ordering."""
        return (self.filepath, self.startline, self.endline)

    # Rich comparisons are defined explicitly because Python 3 ignores
    # __cmp__; without __eq__, equal body locations would be distinct
    # dictionary keys there even though their hashes match.

    def __eq__(self, other):
        if not isinstance(other, BodyLocation):
            return NotImplemented
        return self._key() == other._key()

    def __ne__(self, other):
        if not isinstance(other, BodyLocation):
            return NotImplemented
        return self._key() != other._key()

    def __lt__(self, other):
        if not isinstance(other, BodyLocation):
            return NotImplemented
        return self._key() < other._key()

    def __le__(self, other):
        if not isinstance(other, BodyLocation):
            return NotImplemented
        return self._key() <= other._key()

    def __gt__(self, other):
        if not isinstance(other, BodyLocation):
            return NotImplemented
        return self._key() > other._key()

    def __ge__(self, other):
        if not isinstance(other, BodyLocation):
            return NotImplemented
        return self._key() >= other._key()

    def __cmp__(self, other):
        """Three-way comparison by file path, then start line, then end line.

        Only consulted by Python 2; written without the cmp() builtin.
        """
        mine, theirs = self._key(), other._key()
        return (mine > theirs) - (mine < theirs)

    def __hash__(self):
        return hash(self.filepath) ^ hash(self.startline) ^ hash(self.endline)

    def __str__(self):
        """Return the body location as file:startline."""
        return '{0}:{1}'.format(self.filepath, self.startline)

    def get_full_string(self):
        """Return file:start-end, or file:start when the end line is negative."""
        # NOTE(review): a negative end line is taken to mean that no end was
        # recorded for the body -- confirm against the Doxygen XML output.
        if self.endline < 0:
            return self.__str__()
        return '{0}:{1}-{2}'.format(self.filepath, self.startline, self.endline)
class LocationWithBody(object):

    """Location for a Doxygen entity that can have a body location.

    This class is used to represent the location of a Doxygen entity that can
    have a body location.  The body location is None when the <location>
    element carries no 'bodyfile' attribute.
    """

    def __init__(self, elem):
        """Initialize location from a <location> element."""
        self._location = Location(elem)
        if 'bodyfile' in elem.attrib:
            self._bodylocation = BodyLocation(elem)
        else:
            self._bodylocation = None

    def __str__(self):
        """Return the main location, followed by the body location if any."""
        if self._bodylocation is None:
            return '{0} (no body)'.format(self._location)
        return '{0} / {1}'.format(self._location, self._bodylocation)

    def get_reporter_location(self):
        """Return reporter location for this location.

        All issues are reported at the main location, which should match with
        the declaration, where most of the documentation typically is.
        """
        return self._location.get_reporter_location()

    def get_location(self):
        """Return the main Location."""
        return self._location

    def get_body_location(self):
        """Return the BodyLocation, or None if there is no body location."""
        return self._bodylocation

    def has_same_body_location(self):
        """Check whether main location matches body location.

        If the main location is different, then it likely points to the
        declaration of the function.

        Returns False when there is no body location at all, since there is
        then nothing for the main location to match.
        """
        body = self._bodylocation
        if body is None:
            # Previously this dereferenced None and raised AttributeError.
            return False
        return (self._location.filepath == body.filepath and
                self._location.line == body.startline)
224 class MemberSection(object):
226 """Section of members within a compound entity."""
228 def __init__(self, kind):
235 def add_member(self, member):
236 self._members.append(member)
238 def replace_member(self, old, new):
240 pos = self._members.index(old)
243 self._members[pos] = new
245 #####################################################################
246 # Documentation entities
248 class Entity(object):
250 """Doxygen documentation entity.
252 This class represents common properties of an entity that can contain
253 Doxygen documentation.
256 def __init__(self, name, refid):
260 self._has_brief_description = False
261 self._has_detailed_description = False
262 self._has_inbody_description = False
263 self._visibility = DocType.none
268 def _get_reporter(self):
269 """Return reporter to use for parsing issues."""
270 return self._docset.get_reporter()
272 def set_documentation_set(self, docset):
273 """Set the documentation set this entity belongs to.
275 The documentation set parent provides access to a common reporter
276 object, and also allows the entity to resolve references to other
277 entities while loading XML information.
279 assert self._docset is None
280 self._docset = docset
288 def get_reporter_location(self):
289 return reporter.Location('<{0}>'.format(self._name), None)
291 def get_visibility(self):
292 return self._visibility
294 def is_documented(self):
295 return self._visibility != DocType.none
297 def has_brief_description(self):
298 return self._has_brief_description
300 def has_inbody_description(self):
301 return self._has_inbody_description
303 def _process_descriptions(self, briefelem, detailselem, inbodyelem):
304 reporter = self._get_reporter()
305 if briefelem is not None and len(briefelem) > 0:
306 self._has_brief_description = True
307 self._visibility = DocType.public
308 if detailselem is not None and len(detailselem) > 0:
309 self._visibility = DocType.public
311 # \internal is used at the beginning of a comment block to
312 # mark the block internal to the module.
313 # \libinternal is used similarly, and inserts custom XML
315 if detailselem[0].tag == 'internal':
316 if len(detailselem) == 1:
317 self._visibility = DocType.internal
319 # TODO: Should we also check if internal appears elsewhere?
320 reporter.doc_note(self, '\internal does not cover whole documentation')
321 if detailselem[0].find('libinternal') is not None:
322 if self._visibility == DocType.public:
323 self._visibility = DocType.library
325 reporter.doc_error(self, '\libinternal should not be used inside \internal')
326 self._has_detailed_description = True
327 if inbodyelem is not None:
328 self._has_inbody_description = (len(inbodyelem) > 0)
331 """Format information for common properties.
333 This is called from subclass show() methods to show base information
336 print 'ID: {0}'.format(self._id)
337 print 'Name: {0}'.format(self._name)
338 print 'Location: {0}'.format(self.get_reporter_location())
340 if self._has_brief_description:
341 doctype.append('brief')
342 if self._has_detailed_description:
343 doctype.append('details')
344 if self._has_inbody_description:
345 doctype.append('in-body')
347 doctype.append('none')
348 print 'Doc: {0}'.format(', '.join(doctype))
349 print 'Visibility: {0}'.format(self._visibility)
353 class Member(Entity):
357 In Doxygen, a member entity is an entity such as a function or an enum that
358 cannot contain other documented entities (an enum is a slight exception, as
359 enum values are still nested within the enum member). A member always
360 belongs to one (or more) compounds, which means that the detailed
361 documentation for the member appears on the documentation page for that
362 compound. If none of the parent compounds are documented, the member
363 doesn't appear anywhere, even if it is documented.
365 Member information is loaded from a parent compound's XML file. If there
366 is more than one parent, the first one encountered will be used
367 (presumably, Doxygen duplicates the information into each XML file).
370 def __init__(self, name, refid):
371 Entity.__init__(self, name, refid)
372 self._parents = set()
374 self._namespace = None
377 self._location = None
378 self._alternates = set()
380 # TODO: Move to Entity?
383 def add_parent_compound(self, compound):
384 """Add a compound that contains this member."""
385 self._parents.add(compound)
386 if isinstance(compound, Class):
387 assert self._class is None
388 self._class = compound
389 elif isinstance(compound, Namespace):
390 assert self._namespace is None
391 self._namespace = compound
392 elif isinstance(compound, File):
393 self._files.add(compound)
394 elif isinstance(compound, Group):
395 assert self._group is None
396 self._group = compound
400 def merge_definition(self, definition):
401 """Merge another member into this.
403 See DocumentationSet.merge_duplicates().
405 assert self._class is None
406 assert definition._class is None
407 assert self._group == definition._group
408 assert self._namespace == definition._namespace
409 self._parents.update(definition._parents)
410 self._files.update(definition._files)
411 self._alternates.add(definition)
413 def load_details_from_element(self, rootelem, xmlpath):
414 """Load details for the member from a given XML element.
416 This method is called when encountering member definitions while
417 processing a compound XML file to load the information for that member.
418 It processes common properties for a member, and delegates other
419 elements to _load_element().
422 # TODO: It would be nice to verify that the same information
423 # is present in all instances
425 self._xmlpath = xmlpath
426 # TODO: Process the attributes
427 reporter = self._get_reporter()
431 for elem in rootelem:
432 if elem.tag == 'name':
433 if elem.text != self.get_name():
434 reporter.xml_assert(xmlpath,
435 "member name mismatch: '{0}' (in index.xml) vs. '{1}'".format(
436 self.get_name(), elem.text))
437 elif elem.tag == 'briefdescription':
439 elif elem.tag == 'detaileddescription':
441 elif elem.tag == 'inbodydescription':
442 # TODO: in-body description is probably only possible for
443 # functions; move it there.
445 elif elem.tag == 'location':
446 self._location = LocationWithBody(elem)
448 if not self._load_element(elem):
449 # TODO Process the rest of the elements so that we can check this
450 #reporter.xml_assert(xmlpath,
451 # "unknown member child element '{0}'".format(elem.tag))
453 self._process_descriptions(briefelem, detailselem, inbodyelem)
456 def _load_element(self, element):
457 """Load data from a child XML element.
459 This method is called for all XML elements under the <memberdef>
460 element that are not handled directly by the Member class.
461 Derived classes should return True if they process the element.
465 def _get_raw_location(self):
466 """Returns the BodyLocation object associated with this member.
468 This is necessary so that EnumValue can override it report a non-empty
469 location: Doxygen doesn't provide any location for <enumvalue>.
471 return self._location
473 def get_reporter_location(self):
474 return self._get_raw_location().get_reporter_location()
476 def get_location(self):
477 """Return main location for the member.
479 This typically corresponds to the declaration.
481 return self._get_raw_location().get_location()
483 def get_body_location(self):
484 """Return location of the body for the member.
486 Some types of members do not have a body location, in which case this
489 return self._get_raw_location().get_body_location()
491 def has_same_body_location(self):
492 """Check whether the main location is the same as body location."""
493 return self._get_raw_location().has_same_body_location()
495 def get_namespace(self):
496 return self._namespace
498 def get_parent_compounds(self):
501 def get_inherited_visibility(self):
502 return max([parent.get_visibility() for parent in self._parents])
507 idlist = [x.get_id() for x in self._alternates]
508 print 'Alt. IDs: {0}'.format(', '.join(idlist))
509 print 'Parent vis: {0}'.format(self.get_inherited_visibility())
510 print 'Location: {0}'.format(self.get_location().get_full_string())
511 print 'Body loc: {0}'.format(self.get_body_location().get_full_string())
512 _show_list('Parents', self._parents)
514 class Define(Member):
517 class Variable(Member):
520 class Typedef(Member):
524 def __init__(self, name, refid):
525 Member.__init__(self, name, refid)
528 def _load_element(self, elem):
529 if elem.tag == 'enumvalue':
530 refid = elem.attrib['id']
531 # Doxygen seems to sometimes assign the same ID to a singleton enum
532 # value (this already triggers a warning in loading index.xml).
533 if refid == self.get_id():
535 member = self._docset.get_member(refid)
536 member.set_enum(self)
537 member.load_details_from_element(elem, self._xmlpath)
538 self._values.add(member)
542 def get_values(self):
545 class EnumValue(Member):
546 def __init__(self, name, refid):
547 Member.__init__(self, name, refid)
550 def set_enum(self, member):
551 assert self._enum is None
554 def _get_raw_location(self):
555 return self._enum._get_raw_location()
557 class Function(Member):
560 class FriendDeclaration(Member):
565 class Compound(Entity):
569 In Doxygen, a compound entity is an entity that has its own documentation
570 page, and can contain other documented entities (either members, or other
571 compounds). Examples of compounds are files and classes.
572 A compound entity always appears in the documentation, even if it is
573 contained in another compound that is not documented.
575 The list of members for a compound is initialized when the XML index file
576 is read. All other information is loaded from an XML file that is specific
577 to the compound. In addition to describing the compound, this XML file
578 contains references to contained compounds, and details of all members
582 def __init__(self, name, refid):
583 Entity.__init__(self, name, refid)
584 self._members = dict()
585 self._children = set()
590 def _get_xml_path(self):
591 """Return path to the details XML file for this compound."""
592 return os.path.join(self._docset.get_xmlroot(), self.get_id() + '.xml')
594 def add_member(self, member):
595 """Add a contained member."""
596 self._members[member.get_id()] = member
598 def add_group(self, compound):
599 """Add a group (a compound entity) that contains this entity."""
600 self._groups.add(compound)
602 def replace_member(self, old, new):
603 if old.get_id() not in self._members:
604 raise ValueError("Trying to replace a non-existent member")
605 elif new.get_id() in self._members:
606 raise ValueError("Trying to replace with an existing member")
607 self._members[old.get_id()] = new
608 for section in self._sections:
609 section.replace_member(old, new)
611 def load_details(self):
612 """Load details for the compound from its details XML file.
614 This method processes common properties for a compound.
615 References to inner compounds are delegated to _load_inner_*() methods,
616 and all members encountered in the XML file are loaded with
617 Member.load_details_from_element().
618 Other elements are delegated to _load_element().
622 reporter = self._get_reporter()
623 xmlpath = self._get_xml_path()
624 compoundtree = ET.parse(xmlpath)
625 root = compoundtree.getroot()
627 reporter.xml_assert(xmlpath, "more than one compound in a file")
628 if root[0].tag != 'compounddef':
629 reporter.xml_assert(xmlpath, "expected <compounddef> as the first tag")
633 missing_members = set(self._members.values())
635 if elem.tag == 'compoundname':
636 if elem.text != self.get_name():
637 reporter.xml_assert(xmlpath,
638 "compound name mismatch: '{0}' (in index.xml) vs. '{1}'"
639 .format(self.get_name(), elem.text))
640 elif elem.tag == 'briefdescription':
642 elif elem.tag == 'detaileddescription':
644 elif elem.tag in ('includes', 'includedby', 'incdepgraph',
645 'invincdepgraph', 'inheritancegraph', 'collaborationgraph',
646 'programlisting', 'templateparamlist', 'listofallmembers'):
648 elif elem.tag.startswith('inner'):
649 refid = elem.attrib['refid']
650 reftype = elem.tag[5:]
651 # TODO: Handle 'prot' attribute?
652 refcompound = self._docset.get_compound(refid)
653 self._children.add(refcompound)
654 if reftype == 'file':
655 self._load_inner_file(refcompound)
656 elif reftype == 'dir':
657 self._load_inner_dir(refcompound)
658 elif reftype == 'group':
659 self._load_inner_group(refcompound)
660 elif reftype == 'namespace':
661 self._load_inner_namespace(refcompound)
662 elif reftype == 'class':
663 self._load_inner_class(refcompound)
665 reporter.xml_assert(xmlpath,
666 "unknown inner compound type '{0}'".format(reftype))
667 elif elem.tag == 'sectiondef':
668 # TODO: Handle header and description elements
669 kind = elem.attrib['kind']
670 section = MemberSection(kind)
671 self._sections.append(section)
672 for memberelem in elem.iter('memberdef'):
673 refid = memberelem.attrib['id']
674 member = self._members[refid]
675 member.load_details_from_element(memberelem, xmlpath)
676 section.add_member(member)
677 if member in missing_members:
678 missing_members.remove(member)
679 # Enum values need special handling, but are not worth
680 # extra generalization.
681 if isinstance(member, Enum):
682 missing_members.difference_update(member.get_values())
684 if not self._load_element(elem):
685 reporter.xml_assert(xmlpath,
686 "unknown compound child element '{0}'".format(elem.tag))
688 reporter.xml_assert(xmlpath, 'members without section')
689 self._process_descriptions(briefelem, detailselem, None)
692 def _unexpected_inner_compound(self, typename, compound):
693 """Report a parsing error for an unexpected inner compound reference."""
694 reporter = self._get_reporter()
695 xmlpath = self._get_xml_path()
696 reporter.xml_assert(xmlpath,
697 "unexpected inner {0}: {1}".format(typename, compound))
699 def _load_inner_file(self, compound):
700 """Process a reference to an inner file.
702 Derived classes should override the method if the compound type can
703 contain files as nested compounds.
705 self._unexpected_inner_compound("file", compound)
707 def _load_inner_dir(self, compound):
708 """Process a reference to an inner directory.
710 Derived classes should override the method if the compound type can
711 contain directories as nested compounds.
713 self._unexpected_inner_compound("dir", compound)
715 def _load_inner_group(self, compound):
716 """Process a reference to an inner group.
718 Derived classes should override the method if the compound type can
719 contain groups as nested compounds.
721 self._unexpected_inner_compound("group", compound)
723 def _load_inner_namespace(self, compound):
724 """Process a reference to an inner namespace.
726 Derived classes should override the method if the compound type can
727 contain namespaces as nested compounds.
729 self._unexpected_inner_compound("namespace", compound)
731 def _load_inner_class(self, compound):
732 """Process a reference to an inner class.
734 Derived classes should override the method if the compound type can
735 contain classes as nested compounds.
737 self._unexpected_inner_compound("class", compound)
739 def _load_element(self, element):
740 """Load data from a child XML element.
742 This method is called for all XML elements under the <compounddef>
743 element that are not handled directly by the Compound class.
744 Derived classes should return True if they process the element.
748 def get_groups(self):
752 """Format information for common properties.
754 This extends Entity.show_base() by adding properties that are common to
757 Entity.show_base(self)
759 print 'Groups: {0}'.format(', '.join(map(str, self._groups)))
761 def show_members(self):
762 """Show list of members.
764 This method is provided for use in show() methods of derived classes
765 to print the list of members.
767 for section in self._sections:
768 print 'Member section: {0}'.format(section)
769 for member in section._members:
772 class File(Compound):
773 def __init__(self, name, refid):
774 Compound.__init__(self, name, refid)
776 self._directory = None
777 self._classes = set()
778 self._namespaces = set()
779 self._is_source_file = None
781 def _load_inner_class(self, compound):
782 compound.add_file(self)
783 self._classes.add(compound)
785 def _load_inner_namespace(self, compound):
786 compound.add_file(self)
787 self._namespaces.add(compound)
789 def _load_element(self, elem):
790 if elem.tag == 'location':
791 self._path = elem.attrib['file']
792 extension = os.path.splitext(self._path)[1]
793 self._is_source_file = (extension in ('.c', '.cpp', '.cu'))
797 def set_directory(self, directory):
798 self._directory = directory
800 def get_reporter_location(self):
801 return reporter.Location(self._path, None)
806 def get_directory(self):
807 return self._directory
809 def is_source_file(self):
810 return self._is_source_file
814 print 'Path: {0}'.format(self._path)
815 print 'Directory: {0}'.format(self._directory)
816 print 'Source: {0}'.format(self._is_source_file)
817 _show_list('Namespaces', self._namespaces)
818 _show_list('Classes', self._classes)
821 class Directory(Compound):
822 def __init__(self, name, refid):
823 Compound.__init__(self, name, refid)
826 self._subdirs = set()
829 def _load_inner_file(self, compound):
830 compound.set_directory(self)
831 self._files.add(compound)
833 def _load_inner_dir(self, compound):
834 compound._parent = self
835 self._subdirs.add(compound)
837 def _load_element(self, elem):
838 if elem.tag == 'location':
839 self._path = elem.attrib['file']
843 def get_reporter_location(self):
844 return reporter.Location(self._path, None)
849 def get_parent(self):
852 def get_subdirectories(self):
857 print 'Path: {0}'.format(self._path)
859 print 'Parent: {0}'.format(self._parent)
860 _show_list('Subdirectories', self._subdirs)
861 _show_list('Files', self._files)
863 class Group(Compound):
864 def __init__(self, name, refid):
865 Compound.__init__(self, name, refid)
868 self._nestedgroups = set()
869 self._namespaces = set()
870 self._classes = set()
872 def _load_inner_file(self, compound):
873 compound.add_group(self)
874 self._files.add(compound)
876 # Doxygen 1.8.5 doesn't seem to put the directories into the XML output,
877 # even though they are in the HTML output as group members...
879 def _load_inner_group(self, compound):
880 compound.add_group(self)
881 self._nestedgroups.add(compound)
883 def _load_inner_namespace(self, compound):
884 compound.add_group(self)
885 self._namespaces.add(compound)
887 def _load_inner_class(self, compound):
888 compound.add_group(self)
889 self._classes.add(compound)
891 def _load_element(self, elem):
892 if elem.tag == 'title':
893 self._title = elem.text
899 print 'Title: {0}'.format(self._title)
900 print 'Inner compounds:'
901 for compound in self._children:
905 class Namespace(Compound):
906 def __init__(self, name, refid):
907 Compound.__init__(self, name, refid)
908 self._doclocation = None
911 self._innernamespaces = set()
912 self._classes = set()
914 def _load_inner_namespace(self, compound):
915 compound._parent = self
916 self._innernamespaces.add(compound)
918 def _load_inner_class(self, compound):
919 compound.set_namespace(self)
920 self._classes.add(compound)
922 def _load_element(self, elem):
923 if elem.tag == 'location':
924 self._doclocation = Location(elem)
928 def add_file(self, compound):
929 self._files.add(compound)
931 def get_reporter_location(self):
932 return self._doclocation.get_reporter_location()
934 def is_anonymous(self):
935 return 'anonymous_namespace{' in self.get_name()
939 print 'Doc. loc.: {0}'.format(self._doclocation.get_full_string())
940 _show_list('Inner namespaces', self._innernamespaces)
941 _show_list('Classes', self._classes)
944 class Class(Compound):
945 def __init__(self, name, refid):
946 Compound.__init__(self, name, refid)
947 self._location = None
948 self._namespace = None
950 self._baseclasses = []
951 self._derivedclasses = set()
952 self._outerclass = None
953 self._innerclasses = set()
955 def _load_inner_class(self, compound):
956 compound.set_outer_class(self)
957 self._innerclasses.add(compound)
959 def _load_element(self, elem):
960 if elem.tag == 'basecompoundref':
961 # TODO: Handle unknown bases?
962 if 'refid' in elem.attrib:
963 refid = elem.attrib['refid']
964 # TODO: Handle prot and virt attributes, check name?
965 base = self._docset.get_compound(refid)
966 self._baseclasses.append(base)
968 if elem.tag == 'derivedcompoundref':
969 refid = elem.attrib['refid']
970 # TODO: Handle prot and virt attributes, check name?
971 derived = self._docset.get_compound(refid)
972 self._derivedclasses.add(derived)
974 elif elem.tag == 'location':
975 self._location = LocationWithBody(elem)
979 def add_file(self, compound):
980 self._files.add(compound)
982 def set_namespace(self, compound):
983 self._namespace = compound
985 def set_outer_class(self, compound):
986 self._outerclass = compound
988 def get_reporter_location(self):
989 return self._location.get_reporter_location()
995 if len(self._files) > 1:
997 for fileobj in self._files:
998 if not fileobj.is_source_file():
1004 print 'Namespace: {0}'.format(self._namespace)
1005 if self._outerclass:
1006 print 'Outer cls: {0}'.format(self._outerclass)
1007 location = self._location
1008 print 'Location: {0}'.format(location.get_location().get_full_string())
1009 print 'Body loc: {0}'.format(location.get_body_location().get_full_string())
1010 _show_list('Inner classes', self._innerclasses)
1013 #####################################################################
1014 # Top-level container class
1016 def _get_compound_type_from_kind(kind):
1017 """Map compound kinds from Doxygen XML to internal class types."""
1022 elif kind == 'group':
1024 elif kind == 'namespace':
1026 elif kind in ('class', 'struct', 'union'):
def _get_member_type_from_kind(kind):
    """Return the member class that models the given Doxygen member kind.

    The kind is the string found in the 'kind' attribute of a member in the
    Doxygen XML.  None is returned for kinds that have no matching class.
    """
    # The table is built on each call so that the class names are resolved
    # at call time, exactly as the names in a chain of comparisons would be.
    member_types = {
        'define': Define,
        'variable': Variable,
        'typedef': Typedef,
        'enum': Enum,
        'enumvalue': EnumValue,
        'function': Function,
        'friend': FriendDeclaration,
    }
    return member_types.get(kind)
class DocumentationSet(object):

    """Root object for Doxygen XML documentation tree.

    On initialization, it reads the index.xml file from the Doxygen XML output,
    which contains the list of entities.  Only the ID and name for the entities,
    and the parent compounds for members, are available from this file.

    load_details() can be called to load the detailed compound XML files.
    This constructs relations between compound entities, and initializes other
    attributes for the entities.

    load_file_details() does the same as load_details(), except that it leaves
    those compound XML files unloaded that do not affect file objects or their
    parent hierarchy.  This saves some time if details for actual code
    constructs like namespaces, classes or members are not necessary.

    merge_duplicates() can then be called to remove members with different IDs,
    but that actually reference the same code entity.  For some reason, Doxygen
    seems to produce these in certain cases.
    """

    def __init__(self, xmlroot, reporter):
        """Initialize the documentation set and read index data.

        Args:
            xmlroot: Directory that contains the Doxygen XML output; the
                file index.xml is parsed from this directory.
            reporter: Object used for reporting issues.  Its xml_assert()
                method is called for unknown or inconsistent entity kinds.
        """
        self._xmlroot = xmlroot
        self._reporter = reporter
        xmlpath = os.path.join(xmlroot, 'index.xml')
        indextree = ET.parse(xmlpath)
        self._compounds = dict()
        self._members = dict()
        self._files = dict()
        for compoundelem in indextree.getroot():
            name = compoundelem.find('name').text
            refid = compoundelem.attrib['refid']
            kind = compoundelem.attrib['kind']
            if kind in ('page', 'example'):
                # TODO: Model these types as well
                continue
            compoundtype = _get_compound_type_from_kind(kind)
            if compoundtype is None:
                reporter.xml_assert(xmlpath,
                        "unknown compound kind '{0}'".format(kind))
                continue
            compound = compoundtype(name, refid)
            compound.set_documentation_set(self)
            self._compounds[refid] = compound
            for memberelem in compoundelem.iter('member'):
                self._add_index_member(xmlpath, compound, memberelem)

    def _add_index_member(self, xmlpath, compound, memberelem):
        """Register one <member> element from index.xml under a compound.

        A member ID can be listed under several compounds; the member object
        is created on first sight and reused afterwards.
        """
        name = memberelem.find('name').text
        refid = memberelem.attrib['refid']
        kind = memberelem.attrib['kind']
        membertype = _get_member_type_from_kind(kind)
        # Check for an unknown kind before anything else: isinstance() below
        # would raise a TypeError if it was handed None as the type.
        if membertype is None:
            self._reporter.xml_assert(xmlpath,
                    "unknown member kind '{0}'".format(kind))
            return
        member = self._members.get(refid)
        if member is None:
            member = membertype(name, refid)
            member.set_documentation_set(self)
            self._members[refid] = member
        elif not isinstance(member, membertype):
            self._reporter.xml_assert(xmlpath,
                    "id '{0}' used for multiple kinds of members"
                    .format(refid))
            return
        member.add_parent_compound(compound)
        compound.add_member(member)

    def load_file_details(self):
        """Load detailed XML files for all files and possible parents of files."""
        # values() instead of itervalues() keeps this working on Python 3.
        for compound in self._compounds.values():
            if isinstance(compound, (File, Directory, Group)):
                compound.load_details()
                if isinstance(compound, File):
                    self._files[compound.get_path()] = compound

    def load_details(self):
        """Load detailed XML files for each compound."""
        for compound in self._compounds.values():
            compound.load_details()
            if isinstance(compound, File):
                self._files[compound.get_path()] = compound
        # TODO: Add links to files using location

    def merge_duplicates(self):
        """Merge duplicate member definitions based on body location.

        At least for some functions that are declared in a header, but have
        their body in a source file, Doxygen seems to create two different IDs,
        but the contents of the members are the same, except for the location
        attribute.  This method merges members that have identical name and
        body location into a single member that keeps the information from both
        instances (they should only differ in the location attribute and in
        parent compounds).  Both IDs point to the merged member after this
        call.

        Groups that cannot be merged unambiguously (several declarations, or
        several definitions without any declaration) are reported through the
        reporter and left untouched.
        """
        members_by_body = dict()
        for member in self._members.values():
            bodyloc = member.get_body_location()
            if bodyloc:
                index = (bodyloc, type(member), member.get_name())
                members_by_body.setdefault(index, []).append(member)
        for memberlist in members_by_body.values():
            if len(memberlist) < 2:
                continue
            declaration = None
            otherdeclarations = []
            definition = None
            for member in memberlist:
                if member.has_same_body_location():
                    if definition is not None:
                        self._reporter.xml_assert(None,
                                "duplicate definition for a member '{0}'"
                                .format(definition))
                        continue
                    definition = member
                elif declaration is None:
                    declaration = member
                else:
                    otherdeclarations.append(member)
            if otherdeclarations:
                # TODO: gmx_cpuid.c produces some false positives
                details = []
                for otherdeclaration in otherdeclarations:
                    details.append('{0}: another declaration is here'
                            .format(otherdeclaration.get_reporter_location()))
                details.append('{0}: definition is here'
                        .format(declaration.get_body_location()))
                text = "duplicate declarations for a member '{0}'".format(declaration)
                self._reporter.code_issue(declaration, text, details)
                continue
            if declaration is None or definition is None:
                # Only duplicate definitions were found (already reported
                # above); there is no declaration/definition pair to merge.
                continue
            self._members[definition.get_id()] = declaration
            declaration.merge_definition(definition)
            for compound in definition.get_parent_compounds():
                compound.replace_member(definition, declaration)

    def get_reporter(self):
        """Return reporter object to use for reporting issues.

        This method is used in the entity classes to access the reporter when
        they are parsing the XML files.
        """
        return self._reporter

    def get_xmlroot(self):
        """Return root of the Doxygen XML directory."""
        return self._xmlroot

    def get_compound(self, refid):
        """Return the compound with the given ID (KeyError if unknown)."""
        return self._compounds[refid]

    def get_member(self, refid):
        """Return the member with the given ID (KeyError if unknown)."""
        return self._members[refid]

    def get_compounds(self, types, predicate=None):
        """Return a list of compounds of the given type(s).

        Args:
            types: Class or tuple of classes, as accepted by isinstance().
            predicate: Optional callable taking a compound; when given, only
                compounds for which it returns a true value are included.
        """
        return [compound for compound in self._compounds.values()
                if isinstance(compound, types)
                and (predicate is None or predicate(compound))]

    def get_members(self, types=None, predicate=None):
        """Return a list of distinct members, optionally filtered.

        Args:
            types: Class or tuple of classes to select, or None for all.
            predicate: Optional callable taking a member; when given, only
                members for which it returns a true value are included.

        The order of the returned list is unspecified.
        """
        # self._members can contain duplicates because of merge_duplicates()
        result = set()
        for member in self._members.values():
            if (types is None or isinstance(member, types)) and \
                    (predicate is None or predicate(member)):
                result.add(member)
        return list(result)

    def get_files(self, paths=None):
        """Return File compounds, optionally only those matching paths.

        Args:
            paths: Suffix or tuple of suffixes passed to endswith() on the
                file name; all files are returned if empty or None.
        """
        if paths:
            return self.get_compounds(File, lambda x: x.get_name().endswith(paths))
        return self.get_compounds(File)

    def get_directories(self, paths):
        """Return Directory compounds whose name ends with one of paths.

        Args:
            paths: Suffix or tuple of suffixes passed to endswith().
        """
        return self.get_compounds(Directory, lambda x: x.get_name().endswith(paths))

    def get_groups(self, name):
        """Return Group compounds whose name is contained in name.

        Args:
            name: Container of names tested with the 'in' operator.  Pass a
                tuple or list; a plain string would do substring matching.
        """
        return self.get_compounds(Group, lambda x: x.get_name() in name)

    def get_namespaces(self, name=None):
        """Return Namespace compounds, optionally only those listed in name.

        Args:
            name: Container of names tested with the 'in' operator; all
                namespaces are returned if empty or None.
        """
        if name:
            return self.get_compounds(Namespace, lambda x: x.get_name() in name)
        return self.get_compounds(Namespace)

    def get_classes(self, name=None):
        """Return Class compounds, optionally only those listed in name.

        Args:
            name: Container of names tested with the 'in' operator; all
                classes are returned if empty or None.
        """
        if name:
            return self.get_compounds(Class, lambda x: x.get_name() in name)
        return self.get_compounds(Class)

    def get_functions(self, name):
        """Return members whose name is contained in name.

        The selection is done on Member, so any kind of member with a
        matching name is returned, not only functions.

        Args:
            name: Container of names tested with the 'in' operator.
        """
        return self.get_members(Member, lambda x: x.get_name() in name)
1251 #####################################################################
1252 # Code for running in script mode
def main():
    """Run the script for debugging/Doxygen XML output inspection.

    Parses the command line, loads the Doxygen XML tree from the directory
    given with -R/--root-dir, merges duplicate members, and collects the
    entities selected with the --show-* options.
    """
    import sys

    from optparse import OptionParser

    from reporter import Reporter

    parser = OptionParser()
    parser.add_option('-R', '--root-dir',
                      help='Doxygen XML root directory')
    parser.add_option('-F', '--show-file', action='append',
                      help='Show contents of given file')
    parser.add_option('-d', '--show-dir', action='append',
                      help='Show contents of given directory')
    parser.add_option('-g', '--show-group', action='append',
                      help='Show contents of given group')
    parser.add_option('-n', '--show-namespace', action='append',
                      help='Show contents of given namespace')
    parser.add_option('-c', '--show-class', action='append',
                      help='Show contents of given class')
    # TODO: Add option for other types, and make them work
    parser.add_option('-f', '--show-function', action='append',
                      help='Show details of given function')
    options, args = parser.parse_args()
    if not options.root_dir:
        # Without this, a missing -R surfaces as a traceback from
        # os.path.join() inside DocumentationSet instead of a usage error.
        parser.error('Doxygen XML root directory must be given with -R/--root-dir')

    reporter = Reporter()

    sys.stderr.write('Loading index.xml...\n')
    docset = DocumentationSet(options.root_dir, reporter)
    reporter.write_pending()
    sys.stderr.write('Loading details...\n')
    docset.load_details()
    reporter.write_pending()
    sys.stderr.write('Processing...\n')
    docset.merge_duplicates()
    reporter.write_pending()

    # The lookup methods expect tuples (endswith() and 'in' matching).
    objlist = []
    if options.show_file:
        objlist.extend(docset.get_files(tuple(options.show_file)))
    if options.show_dir:
        objlist.extend(docset.get_directories(tuple(options.show_dir)))
    if options.show_group:
        objlist.extend(docset.get_groups(tuple(options.show_group)))
    if options.show_namespace:
        # TODO: Replace file names with anonymous_namespace{filename}
        objlist.extend(docset.get_namespaces(tuple(options.show_namespace)))
    if options.show_class:
        objlist.extend(docset.get_classes(tuple(options.show_class)))
    if options.show_function:
        objlist.extend(docset.get_functions(tuple(options.show_function)))
    # NOTE(review): the display loop is reconstructed; it assumes every
    # entity class provides a show() method -- confirm against the entity
    # definitions earlier in this file.
    for obj in objlist:
        obj.show()
1309 if __name__ == '__main__':