1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
|
"""
Copyright 2008-2011 Free Software Foundation, Inc.
This file is part of GNU Radio
GNU Radio Companion is free software; you can redistribute it and/or
modify it under the terms of the GNU General Public License
as published by the Free Software Foundation; either version 2
of the License, or (at your option) any later version.
GNU Radio Companion is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA
"""
from Constants import DOCS_DIR
from lxml import etree
import os
import re
#xpath expressions that _extract evaluates against each parsed doxygen xml file
#name of the documented compound, used as the heading of its docs
DOXYGEN_NAME_XPATH = '/doxygen/compounddef/compoundname'
#brief and detailed descriptions of the compound
DOXYGEN_BRIEFDESC_GR_XPATH = '/doxygen/compounddef/briefdescription'
DOXYGEN_DETAILDESC_GR_XPATH = '/doxygen/compounddef/detaileddescription'
def extract_txt(xml):
    """
    Flatten an xml element and all of its descendants into plain text.
    Newlines in the element's own text and tail are dropped.
    A para tag is followed by a blank line, a linebreak tag yields a newline
    and a parametername tag is followed by a colon and a space.
    @param xml the xml element to flatten
    @return a string
    """
    body = xml.text
    body = body.replace('\n', '') if body else ''
    trailer = xml.tail
    trailer = trailer.replace('\n', '') if trailer else ''
    tag = xml.tag
    if tag == 'para':
        #separate paragraphs with a blank line
        trailer += '\n\n'
    elif tag == 'linebreak':
        body += '\n'
    elif tag == 'parametername':
        #separate the parameter name from the text that follows it
        body += ': '
    #own text first, then every child in document order, then the tail
    pieces = [body]
    for child in xml:
        pieces.append(extract_txt(child))
    pieces.append(trailer)
    return ''.join(pieces)
def _extract(key):
    """
    Extract the documentation from the doxygen generated xml files.
    If multiple files match, combine the docs in file name order.
    Files that cannot be parsed or that lack an expected element are skipped.
    @param key the block key
    @return a string with documentation, empty when nothing was found
    """
    docs_dir = os.path.join(DOCS_DIR, 'xml')
    if not os.path.isdir(docs_dir): return ''
    #extract matches: an underscore in the key matches any run of underscores
    #(including none) and an 'x' in the key matches any single word character
    pattern = key.replace('_', '_*').replace('x', r'\w')
    class_file_matcher = re.compile(r'^class%s\..*$'%pattern) #xml or xml.gz
    #sorted because os.listdir makes no promise about the order of its result
    matches = sorted(f for f in os.listdir(docs_dir) if class_file_matcher.match(f))
    #descriptions are only pulled for keys with one of these prefixes,
    #the check does not depend on the file so it is done once up front
    with_descriptions = re.match('(gr|usrp2|trellis|noaa)_.*', key) is not None
    #combine all matches
    doc_strs = list()
    for match in matches:
        try:
            xml = etree.parse(os.path.join(docs_dir, match))
            #extract descriptions
            comp_name = extract_txt(xml.xpath(DOXYGEN_NAME_XPATH)[0]).strip()
            if with_descriptions:
                brief_desc = extract_txt(xml.xpath(DOXYGEN_BRIEFDESC_GR_XPATH)[0]).strip()
                detailed_desc = extract_txt(xml.xpath(DOXYGEN_DETAILDESC_GR_XPATH)[0]).strip()
            else:
                brief_desc = ''
                detailed_desc = ''
        except (IndexError, etree.XMLSyntaxError): continue #bad format
        #combine
        comp_name = ' --- ' + comp_name + ' --- '
        doc_strs.append('\n\n'.join([comp_name, brief_desc, detailed_desc]).strip())
    return '\n\n'.join(doc_strs)
#documentation strings that were already extracted, indexed by block key
_docs_cache = dict()
def extract(key):
    """
    Call the private extract and cache the result.
    The private extract runs at most once per key, later calls with the
    same key are answered from the cache.
    @param key the block key
    @return a string with documentation
    """
    #the in operator replaces dict.has_key, which python 3 no longer has
    if key not in _docs_cache:
        _docs_cache[key] = _extract(key)
    return _docs_cache[key]
if __name__ == '__main__':
    #command line use: print the documentation for the block key given as
    #the first argument
    import sys
    if len(sys.argv) < 2:
        #exit with a usage message rather than an IndexError traceback
        sys.exit('usage: %s <block key>'%sys.argv[0])
    #the parenthesized form works as a print statement and as a print function
    print(extract(sys.argv[1]))
|