1
|
|
|
# |
2
|
|
|
# Copyright (c) 2015 SUSE Linux GmbH |
3
|
|
|
# |
4
|
|
|
# This program is free software; you can redistribute it and/or |
5
|
|
|
# modify it under the terms of version 3 of the GNU General Public License as |
6
|
|
|
# published by the Free Software Foundation. |
7
|
|
|
# |
8
|
|
|
# This program is distributed in the hope that it will be useful, |
9
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of |
10
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
11
|
|
|
# GNU General Public License for more details. |
12
|
|
|
# |
13
|
|
|
# You should have received a copy of the GNU General Public License |
14
|
|
|
# along with this program; if not, contact SUSE LLC. |
15
|
|
|
# |
16
|
|
|
# To contact SUSE about this file by physical or electronic mail, |
17
|
|
|
# you may find current contact information at www.suse.com |
18
|
|
|
|
19
|
|
|
import sys |
20
|
|
|
from collections import OrderedDict |
21
|
|
|
from docmanager.core import DEFAULT_DM_PROPERTIES, \ |
22
|
|
|
NS, ReturnCodes, VALIDROOTS, BT_ELEMENTLIST |
23
|
|
|
from docmanager.exceptions import * |
24
|
|
|
from docmanager.fileutil import FileUtil |
25
|
|
|
from docmanager.logmanager import log, logmgr_flog |
26
|
|
|
from docmanager.xmlutil import check_root_element, compilestarttag, \ |
27
|
|
|
ensurefileobj, findprolog, get_namespace, localname, recover_entities, \ |
28
|
|
|
replaceinstream, preserve_entities, findinfo_pos, xml_indent, \ |
29
|
|
|
get_property_xpath |
30
|
|
|
from lxml import etree |
31
|
|
|
from xml.sax._exceptions import SAXParseException |
32
|
|
|
|
33
|
|
|
class XmlHandler(object):
    """An XmlHandler instance represents an XML tree of a file.

    On construction the file is loaded into a buffer, its prolog is
    recorded, the buffer is passed through ``replaceinstream`` with
    ``preserve_entities`` and the result is parsed with lxml. Properties
    live as child elements of a ``dm:docmanager`` element.
    """

    def __init__(self, filename, stoponerror=True):
        """Initializes the XmlHandler class

        :param str filename: filename of XML file
        :param bool stoponerror: if true, problems found while parsing are
            raised as exceptions; otherwise they are only recorded in
            ``invalidfile`` and ``fileerror``
        """
        logmgr_flog()
        log.debug("Initialized a new XML Handler for file %r.", filename)

        # general
        self._filename = ""
        self._buffer = None  # file-like object returned by ensurefileobj()

        # file util
        self._fileutil = FileUtil(filename)

        # prolog
        self._offset = 0
        self._header = ""
        self._root = ""
        # parse() and write() use ``_roottag``; it has to exist even if the
        # prolog could not be read (stoponerror=False on a broken file).
        self._roottag = ""
        # kept for backward compatibility with code reading ``roottag``
        self.roottag = ""

        # parser
        self.__xmlparser = None
        self.invalidfile = False
        self.fileerror = ""
        self.xmlerrorstring = ""
        self.stoponerror = stoponerror

        # lxml
        self.__tree = None
        self.__root = None
        self.__docmanager = None

        # load the file into a buffer
        self._filename = filename
        self._buffer = ensurefileobj(self._filename)

        # log
        self.xmllogerrorstring = ""

        # parse the given file with lxml
        self.parse()

    def parse(self):
        """This function parses the whole XML file

        Every stage that fails sets ``invalidfile`` and ``fileerror`` and
        stops further processing; if ``stoponerror`` is true the failure is
        raised instead.

        :raises DMXmlParseError: prolog, syntax or root element problem
        :raises DMNotDocBook5File: root element is not in the DocBook 5
            namespace
        """
        logmgr_flog()

        # find the prolog of the XML file (everything before the start tag)
        try:
            prolog = findprolog(self._buffer)
        except SAXParseException as err:
            self.invalidfile = True
            self.fileerror = "<{}:{}> {} in {!r}.".format(
                err.getLineNumber(),
                err.getColumnNumber(),
                err.getMessage(),
                self.filename)

            if self.stoponerror:
                raise DMXmlParseError(self.fileerror,
                                      ReturnCodes.E_XML_PARSE_ERROR)

        if self.invalidfile:
            return

        # save prolog details
        self._offset = prolog['offset']
        self._header = prolog['header']
        self._root = prolog['root']
        self._roottag = prolog['roottag']

        # replace any entities
        self.replace_entities()

        self.__xmlparser = etree.XMLParser(remove_blank_text=False,
                                           resolve_entities=False,
                                           dtd_validation=False)

        # load the file
        try:
            self.__tree = etree.parse(self._buffer, self.__xmlparser)
        except etree.XMLSyntaxError as err:
            self.invalidfile = True
            self.fileerror = err.msg

            if self.stoponerror:
                raise DMXmlParseError(err, ReturnCodes.E_XML_PARSE_ERROR)

        if self.invalidfile:
            return

        self.__root = self.__tree.getroot()

        # This is the module level check_root_element() helper, not the
        # method of the same name defined below.
        try:
            check_root_element(self.__root, etree)
        except ValueError as err:
            self.invalidfile = True
            # NOTE(review): unlike the other branches this stores the
            # exception object itself, not a string - confirm callers.
            self.fileerror = err

            if self.stoponerror:
                raise DMXmlParseError(err, ReturnCodes.E_XML_PARSE_ERROR)

        if self.invalidfile:
            return

        try:
            # check for DocBook 5 namespace in start tag
            self.check_docbook5_ns()

            # check for docmanager element and set a reference to it
            self.__docmanager = self.__tree.find("//dm:docmanager",
                                                 namespaces=NS)

            if self.__docmanager is None:
                log.info("No docmanager element found")
                self.create_group()
            else:
                log.debug("Found docmanager element %s",
                          self.__docmanager.getparent())
        except DMNotDocBook5File:
            # invalidfile/fileerror were already set by check_docbook5_ns()
            if self.stoponerror:
                raise

    def check_docbook5_ns(self):
        """Checks if the current file is a valid DocBook 5 file.

        :raises DMNotDocBook5File: namespace of the root element differs
            from ``NS['d']``
        """
        rootns = get_namespace(self.__root.tag)
        if rootns != NS['d']:
            self.invalidfile = True
            self.fileerror = "The document is not a valid DocBook 5 document."
            raise DMNotDocBook5File(self.fileerror,
                                    ReturnCodes.E_NOT_DOCBOOK5_FILE)

    def replace_entities(self):
        """This function replaces entities in the buffer

        The buffer is positioned at the offset recorded from the prolog and
        replaced by the stream ``replaceinstream`` returns.
        """
        logmgr_flog()

        self._buffer.seek(self._offset)
        self._buffer = replaceinstream(self._buffer, preserve_entities)

    def init_default_props(self, force=False, bugtracker=False):
        """Initializes the default properties for the given XML files

        :param bool force: Ignore if there are already properties in an
                           XML - just overwrite them
        :param bool bugtracker: also initialize the properties listed in
                           ``BT_ELEMENTLIST``
        :return: number of properties which were left untouched
        :rtype: int
        """
        logmgr_flog()

        props = list(DEFAULT_DM_PROPERTIES)
        if bugtracker:
            props.extend(BT_ELEMENTLIST)

        untouched = 0
        for prop in props:
            # get() reports a missing property as None
            if force or self.get(prop).get(prop) is None:
                self.set({prop: ""})
            else:
                untouched += 1
        return untouched

    def check_root_element(self):
        """Checks if root element is valid

        :raises DMInvalidXMLRootElement: local name of the root element is
            not listed in ``VALIDROOTS``
        """
        logmgr_flog()

        tag = etree.QName(self.__root.tag)
        if tag.localname not in VALIDROOTS:
            # NOTE(review): the message is handed over printf-style, i.e.
            # unformatted plus its arguments - confirm that the exception
            # class expects this signature.
            raise DMInvalidXMLRootElement("Cannot add info element to file %r. "
                                          "This file does not contain a valid "
                                          "DocBook 5 root element. Found %s",
                                          self._filename, localname(self.__root.tag),
                                          ReturnCodes.E_INVALID_ROOT_ELEMENT)

    def create_group(self):
        """Creates the docmanager group element

        If the tree has no ``d:info`` element, one is inserted into the
        root element at the position ``findinfo_pos`` returns.
        """
        logmgr_flog()

        # search the info element; create it if it does not exist
        info = self.__tree.find("//d:info", namespaces=NS)
        # TODO: We need to check for a --force option
        if info is None:
            log.debug("No <info> element found!")
            pos = findinfo_pos(self.__root)
            log.debug("Using position %d", pos)
            info = etree.Element("{%s}info" % NS["d"])
            info.tail = '\n'
            info.text = '\n'
            self.__root.insert(pos, info)

            log.debug("Adding <info> element in '%s'", self.filename)

        log.debug("Adding <dm:docmanager> to <info>")
        self.__docmanager = etree.SubElement(info,
                                             "{{{dm}}}docmanager".format(**NS),
                                             nsmap={'dm': NS['dm']},
                                             )

    def set(self, pairs):
        """Sets the keys as elements and the values as their content

        :param dict pairs: maps property names to values; a name may be a
            path like "foo/bar", missing elements on the way are created

        If pairs is {"foo": "bar"} you will get:
        <foo>bar</foo>
        whereas foo belongs to the DocManager namespace
        """
        logmgr_flog()

        dm = self.__docmanager

        for key in pairs:
            # Every key starts again at the docmanager element; carrying
            # the path over would nest this key below the previous one.
            path = []
            parent = dm

            for name in key.split("/"):
                path.append("dm:" + name)
                node = dm.find("/".join(path), namespaces=NS)

                if node is None:
                    node = etree.SubElement(
                        parent, "{{{dm}}}{key}".format(key=name, **NS))

                parent = node
                node.text = ""

            node.text = pairs[key]

    def is_set(self, key, values):
        """Checks if element 'key' exists with 'values'

        :param str key: the element to search for
        :param str values: the value inside the element

        :return: if conditions are met
        :rtype: bool
        """
        logmgr_flog()

        # check if the key has one of the given values
        element = self.__docmanager.find("./dm:"+key,
                                         namespaces=NS)
        return element is not None and element.text in values

    def is_prop_set(self, prop):
        """
        Checks if a property is set in an XML element

        :param str prop: the property

        :return: if property is set
        :rtype: bool
        """
        logmgr_flog()

        element = self.__docmanager.find("./dm:{}".format(prop), namespaces=NS)
        return element is not None

    def set_attr(self, prop, data):
        """Sets an attribute for a property
        :param str prop: The property
        :param dict data: A dictionary of attributes and values
                          example: {"attr1": "val1", "attr2": "val2"}
        :raises DMPropertyNotFound: the property does not exist
        """
        node = self.find_elem(prop)

        if node is None:
            raise DMPropertyNotFound(self.filename, prop)

        for name in data:
            node.set(name, data[name])

    def del_attr(self, prop, data):
        """Deletes one or more attributes of a property
        :param str prop: The property
        :param list data: A list of all attributes
        :return: the attributes which could not be deleted because the
                 element does not have them
        :rtype: list
        :raises DMPropertyNotFound: the property does not exist
        """
        node = self.find_elem(prop)

        if node is None:
            raise DMPropertyNotFound(self.filename, prop)

        errors = []
        for name in data:
            try:
                del node.attrib[name]
            except KeyError:
                errors.append(name)

        return errors

    def get_attr(self, props, data):
        """Gets one or more attributes of a property
        :param list props: The properties; if empty, all elements below
                           the docmanager element are used
        :param list data: A list of all attributes; if empty, all
                          attributes of an element are returned
        :return: maps each property to a dictionary of its attributes
        :rtype: OrderedDict
        """
        attrs = OrderedDict()
        nodes = []

        if props:
            for prop in props:
                attrs[prop] = OrderedDict()
                node = self.find_elem(prop)

                if node is not None:
                    # Use the requested name as key: for a nested property
                    # like "a/b" the local name of the element ("b") is
                    # not the key which was just created in attrs.
                    nodes.append((prop, node))
        else:
            for idx, elem in enumerate(self.__docmanager.iter()):
                # this is needed because otherwise we also get the
                # "docmanager" element
                if idx:
                    xpath = get_property_xpath(elem)

                    attrs[xpath] = OrderedDict()
                    nodes.append((xpath, elem))

        for prop, elem in nodes:
            if data:
                for name in data:
                    if name in elem.attrib:
                        attrs[prop][name] = elem.attrib[name]
            else:
                for name in elem.attrib:
                    attrs[prop][name] = elem.attrib[name]

        return attrs

    def get(self, keys=None):
        """Returns all matching values for a key in docmanager element

        :param keys: localname of element(s) to search for; if None or
                     empty, all properties are returned
        :type keys: string, list, tuple, or None
        :return: the values; a property which does not exist has the
                 value None
        :rtype: dict
        """
        logmgr_flog()

        # covers the default (None) as well as empty strings and sequences
        if not keys:
            return self.get_all()

        dm = self.__docmanager
        values = OrderedDict()

        if not isinstance(keys, (list, tuple)):
            keys = [keys]

        for key in keys:
            path = []

            for name in key.split("/"):
                path.append("dm:" + name)
                node = dm.find("/".join(path), namespaces=NS)

                if node is None:
                    break

            values[key] = None if node is None else node.text

        return values

    def get_all(self):
        """Returns all keys and values in a docmanager xml file
        """
        logmgr_flog()

        ret = OrderedDict()
        for idx, elem in enumerate(self.__docmanager.iter()):
            # we want to skip the "docmanager" element here
            if idx:
                ret[get_property_xpath(elem)] = elem.text

        return ret

    def delete(self, key, condition=None):
        """Deletes an element inside docmanager element

        :param str key: element name to delete
        :param str condition: the condition for the deletion (the var condition has to be equal with the property value)
        :return boolean: True = success | False = no property has been deleted
        """
        logmgr_flog()

        node = self.find_elem(key)
        if node is None:
            return False

        if condition is not None and condition != node.text:
            return False

        node.getparent().remove(node)
        return True

    def find_elem(self, prop):
        """Searches for an XML element
        :param str prop: The property, optionally a path like "foo/bar"
        :return lxml.etree._Element: the element or None if it (or one of
                                     its parents in the path) is missing
        """
        node = self.__docmanager

        for name in prop.split("/"):
            node = node.find("dm:{}".format(name), namespaces=NS)

            if node is None:
                return None

        return node

    def get_indentation(self, node, indentation=""):
        """Calculates indentation level

        The tails of all ancestors of node are concatenated with their
        newlines removed.

        :param lxml.etree._Element node: node where to start
        :param str indentation: Additional indentation
        :return: the indentation string
        :rtype: str
        """
        logmgr_flog()

        indent = ""
        if node is not None:
            indent = "".join(["".join(n.tail.split("\n"))
                              for n in node.iterancestors()
                              if n.tail is not None])
        return indent+indentation

    def indent_dm(self):
        """Indents only dm:docmanager element and its children"""
        logmgr_flog()

        # NOTE(review): both indentation literals below are a single space
        # in the reviewed source - confirm against the intended indent.
        dmindent = ' '
        dm = self.__tree.find("//dm:docmanager",
                              namespaces=NS)
        log.debug("dm is %s", dm)
        if dm is None:
            return
        log.debug("-----")
        info = dm.getparent()
        log.info("info: %s", info)
        prev = info.getprevious()
        log.info("prev: %s", prev)
        parent = info.getparent()
        log.info("parent of info: %s", parent)
        log.info("child of info: %s", info.getchildren())

        if info.tail is None:
            info.tail = ""

        # whitespace following </info> without its newlines
        infoindent = "".join(info.tail.split('\n'))
        prev = dm.getprevious()
        if prev is not None:
            log.info("prev: %s", prev)
            prev.tail = '\n' + infoindent
        indent = self.get_indentation(dm.getprevious())
        dm.text = '\n' + indent + ' '
        dm.tail = '\n' + infoindent
        for node in dm.iterchildren():
            # the last child gets no extra indentation in its tail
            i = dmindent if node.getnext() is not None else ''
            node.tail = '\n' + indent + i

    def write(self):
        """Write XML tree to original filename

        The serialized tree gets its entities recovered, its start tag is
        replaced by the root recorded from the prolog, and the recorded
        header is put in front of it.
        """
        logmgr_flog()

        # Only indent docmanager child elements
        self.indent_dm()

        log.debug("root: %s", repr(self._root))

        info = self.__root.find("d:info", namespaces=NS)
        xml_indent(info, 2)

        # Build the complete content before the file is opened: mode 'w'
        # truncates the file, so a failure while serializing must not
        # happen after that point.
        content = recover_entities(etree.tostring(self.__tree,
                                                  encoding='unicode'))
        starttag = compilestarttag(self._roottag)
        # a callable is used as replacement so that backslashes in the
        # start tag are not interpreted as escapes by re
        content = starttag.sub(lambda _: self._root.rstrip(), content, 1)

        with open(self._filename, 'w') as f:
            f.write(self._header.rstrip()+"\n" + content)

    @property
    def filename(self):
        """Returns filename of the input source

        :return: filename
        :rtype:  str
        """
        return self._filename

    @filename.setter
    def filename(self, _):
        raise ValueError("filename is only readable")

    @filename.deleter
    def filename(self):
        raise ValueError("filename cannot be deleted")

    @property
    def tree(self):
        """Return our parsed tree object

        :return: tree object
        :rtype:  lxml.etree._ElementTree
        """
        return self.__tree

    @tree.setter
    def tree(self, _):
        raise ValueError("tree is only readable")

    @tree.deleter
    def tree(self):
        raise ValueError("tree cannot be deleted")

    @property
    def root(self):
        """Returns the root element of the XML tree

        :return: root element
        :rtype:  lxml.etree._Element
        """
        return self.__root

    @root.setter
    def root(self, _):
        raise ValueError("root is only readable")

    @root.deleter
    def root(self):
        raise ValueError("root cannot be deleted")

    @property
    def dm(self):
        """Returns the dm:docmanager element (None if not available)"""
        return self.__docmanager

    @property
    def fileutil(self):
        """Returns the FileUtil instance created for the filename"""
        return self._fileutil
614
|
|
|
|