summaryrefslogtreecommitdiff
path: root/grc/base/ParseXML.py
blob: 56097395dd35199fcfa585f919df070688b7b861 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
"""
Copyright 2008 Free Software Foundation, Inc.
This file is part of GNU Radio

GNU Radio Companion is free software; you can redistribute it and/or
modify it under the terms of the GNU General Public License
as published by the Free Software Foundation; either version 2
of the License, or (at your option) any later version.

GNU Radio Companion is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA
"""

from lxml import etree
from . import odict

class XMLSyntaxError(Exception):
    """
    Exception carrying an error log produced while parsing or validating xml.

    The string form of the exception is the error-level entries of the log,
    one entry per line.
    """

    def __init__(self, error_log):
        #keep the log itself; the message is only rendered on demand
        self._error_log = error_log

    def __str__(self):
        error_entries = self._error_log.filter_from_errors()
        return '\n'.join(str(entry) for entry in error_entries)

def validate_dtd(xml_file, dtd_file=None):
    """
    Parse an xml file and check it against a dtd.

    When no dtd file is given, the parser itself is created with dtd
    validation switched on (presumably validating against the dtd that the
    document declares). When a dtd file is given, the document is parsed
    without validation and then checked against that dtd explicitly.

    Args:
        xml_file: the xml file
        dtd_file: the optional dtd file

    Raises:
        XMLSyntaxError: the parser logged errors, or the given dtd rejected
            the document
    """
    #the parser only validates on its own when no explicit dtd was supplied
    validate_while_parsing = not dtd_file
    xml_parser = etree.XMLParser(dtd_validation=validate_while_parsing)
    tree = etree.parse(xml_file, parser=xml_parser)
    if xml_parser.error_log:
        raise XMLSyntaxError(xml_parser.error_log)
    #an explicit dtd file is applied as a separate step after parsing
    if dtd_file:
        external_dtd = etree.DTD(dtd_file)
        if not external_dtd.validate(tree.getroot()):
            raise XMLSyntaxError(external_dtd.error_log)

def from_file(xml_file):
    """
    Load an xml file and convert it into nested data.

    The file is parsed and its root element is handed to the _from_file
    helper, whose result is returned unchanged.

    Args:
        xml_file: the xml file path

    Returns:
        the nested data
    """
    return _from_file(etree.parse(xml_file).getroot())

def _from_file(xml):
    """
    Recursively convert an xml element into the nested data format.

    An element without children maps its tag to its text. An element with
    children maps its tag to an odict of child tags; a child tag that occurs
    once maps directly to its data, a tag that occurs several times maps to
    a list of the data in document order.

    Args:
        xml: the xml element to convert

    Returns:
        a single-entry odict mapping the element's tag to its data
    """
    tag = xml.tag
    has_children = len(xml) > 0
    if not has_children:
        #leaf element: a missing text (None) is stored as an empty string
        leaf_text = xml.text or ''
        return odict({tag: leaf_text})
    children = odict()
    for child in xml:
        #every recursive result holds exactly one (tag, data) pair
        child_tag, child_data = _from_file(child).items()[0]
        if not children.has_key(child_tag):
            children[child_tag] = [child_data]
        else:
            children[child_tag].append(child_data)
    #tags that occurred only once are unwrapped from their one-item list
    for child_tag, collected in children.iteritems():
        if len(collected) == 1:
            children[child_tag] = collected[0]

    return odict({tag: children})

def to_file(nested_data, xml_file):
    """
    Serialize nested data to an xml file.

    The nested data is converted into xml elements by the _to_file helper;
    the first element it returns is used as the document root and is written
    with an xml declaration and pretty printing.

    Args:
        nested_data: the nested data
        xml_file: the xml file path
    """
    root = _to_file(nested_data)[0]
    #serialize before opening, so a serialization error cannot leave a truncated file behind
    xml_data = etree.tostring(root, xml_declaration=True, pretty_print=True)
    #the with block closes (and thereby flushes) the file even if the write fails
    with open(xml_file, 'w') as xml_fd:
        xml_fd.write(xml_data)

def _to_file(nested_data):
    """
    Recursively convert nested data into xml elements.

    Every key becomes an element tag. A list, set or tuple value yields one
    element per item, any other value yields a single element. String items
    become the element's text; any other item is converted recursively and
    its elements are attached as children.

    Args:
        nested_data: the nested data

    Returns:
        a list of xml elements, one per value found in the nested data
    """
    elements = []
    for tag, entries in nested_data.iteritems():
        #a lone value is handled like a one-item list
        if isinstance(entries, (list, set, tuple)):
            items = entries
        else:
            items = [entries]
        for item in items:
            element = etree.Element(tag)
            if isinstance(item, (str, unicode)):
                element.text = item
            else:
                #non-string items are nested data themselves
                element.extend(_to_file(item))
            elements.append(element)
    return elements

if __name__ == '__main__':
    #placeholder: no self-test is implemented, running this module as a script does nothing
    """Use the main method to test parse xml's functions."""
    pass