/
xml.py
64 lines (59 loc) · 1.37 KB
/
xml.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
from __future__ import division, print_function, absolute_import
import petl as etl
# Example 1: data values stored as element text.
# Set up a file to demonstrate with.
d = '''<table>
<tr>
<td>foo</td><td>bar</td>
</tr>
<tr>
<td>a</td><td>1</td>
</tr>
<tr>
<td>b</td><td>2</td>
</tr>
<tr>
<td>c</td><td>2</td>
</tr>
</table>'''
# The write must sit inside the ``with`` body so the file is closed (and
# flushed) before it is read back below.
with open('example1.xml', 'w') as f:
    f.write(d)
# Read the file back, passing 'tr' and 'td' as the element names to match.
table1 = etl.fromxml('example1.xml', 'tr', 'td')
# Bare expression: echoes the table in an interactive session; it has no
# visible effect when the file is run as a script.
table1
# Example 2: data values stored in an attribute.
# If the data values are stored in an attribute, provide the attribute name
# as an extra positional argument.
d = '''<table>
<tr>
<td v='foo'/><td v='bar'/>
</tr>
<tr>
<td v='a'/><td v='1'/>
</tr>
<tr>
<td v='b'/><td v='2'/>
</tr>
<tr>
<td v='c'/><td v='2'/>
</tr>
</table>'''
# The write must sit inside the ``with`` body so the file is closed (and
# flushed) before it is read back below.
with open('example2.xml', 'w') as f:
    f.write(d)
# Same element names as before, plus 'v' as the attribute holding each value.
table2 = etl.fromxml('example2.xml', 'tr', 'td', 'v')
# Bare expression: echoes the table in an interactive session; it has no
# visible effect when the file is run as a script.
table2
# Example 3: explicit field mapping.
# Data values can also be extracted by providing a mapping of field
# names to element paths.
# Note that the first <row> below holds two <bar> elements under <baz>,
# while the other rows hold one.
d = '''<table>
<row>
<foo>a</foo><baz><bar v='1'/><bar v='3'/></baz>
</row>
<row>
<foo>b</foo><baz><bar v='2'/></baz>
</row>
<row>
<foo>c</foo><baz><bar v='2'/></baz>
</row>
</table>'''
# The write must sit inside the ``with`` body so the file is closed (and
# flushed) before it is read back below.
with open('example3.xml', 'w') as f:
    f.write(d)
# 'row' names the element to match; the dict maps each output field name to
# where its value lives: 'foo' to the path 'foo', and 'bar' to a
# (path, attribute name) pair, i.e. the 'v' attribute of 'baz/bar' elements.
table3 = etl.fromxml('example3.xml', 'row',
                     {'foo': 'foo', 'bar': ('baz/bar', 'v')})
# Bare expression: echoes the table in an interactive session; it has no
# visible effect when the file is run as a script.
table3