1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
|
# Copyright (C) 2009 Canonical Ltd
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
"""Python implementation of _read_stanza_*."""
import re
from bzrlib.rio import (
Stanza,
)
_tag_re = re.compile(r'^[-a-zA-Z0-9_]+$')
def _valid_tag(tag):
if type(tag) != str:
raise TypeError(tag)
return bool(_tag_re.match(tag))
def _read_stanza_utf8(line_iter):
    """Read a stanza from an iterable of UTF-8 encoded ``str`` lines.

    Lines are decoded from UTF-8 one at a time, as they are consumed, and
    the decoded lines are passed to _read_stanza_unicode.

    :param line_iter: Iterable of lines; every consumed line must be exactly
        of type ``str``.
    :return: The result of _read_stanza_unicode for the decoded lines.
    :raises TypeError: If a consumed line is not exactly of type ``str``.
    """
    def decoded_lines():
        # Generator, so type checking and decoding happen lazily and stop
        # as soon as the unicode reader stops asking for lines.
        for raw_line in line_iter:
            if type(raw_line) != str:
                raise TypeError(raw_line)
            yield raw_line.decode('utf-8')

    unicode_lines = decoded_lines()
    return _read_stanza_unicode(unicode_lines)
def _read_stanza_unicode(unicode_iter):
    """Read one stanza from an iterable of unicode lines.

    Reading stops at the first line that is None, empty (end of file) or a
    bare newline (end of stanza).  Every other line is either a
    ``tag: value`` line or, when it starts with a tab, a continuation of the
    previous value.  The last character of each such line is dropped
    (presumably the line's trailing newline -- it is not checked).

    :param unicode_iter: Iterable yielding the lines to parse.
    :return: A Stanza holding the tag/value pairs read, or None if no
        tag line was seen before reading stopped.
    :raises ValueError: On a continuation line with no preceding tag, a
        line without a ``': '`` separator, or an invalid tag.
    """
    result = Stanza()
    current_tag = None
    value_parts = None

    # TODO: jam 20060922 This code should raise real errors rather than
    #       using 'assert' to process user input, or raising ValueError
    #       rather than a more specific error.

    for line in unicode_iter:
        # None / empty string: end of file.  Bare newline: end of stanza.
        if line is None or line == u'' or line == u'\n':
            break

        if line[0] != u'\t':
            # New "tag: value" line; flush the pair collected so far first.
            if current_tag is not None:
                result.add(current_tag, u''.join(value_parts))
            try:
                separator_at = line.index(u': ')
            except ValueError:
                raise ValueError('tag/value separator not found in line %r'
                                 % line)
            current_tag = str(line[:separator_at])
            if not _valid_tag(current_tag):
                raise ValueError("invalid rio tag %r" % (current_tag,))
            # Skip the two-character separator and drop the last character.
            value_parts = [line[separator_at + 2:-1]]
            continue

        # Tab-prefixed line: continues the value of the current tag.
        if current_tag is None:
            raise ValueError('invalid continuation line %r' % line)
        value_parts.append(u'\n' + line[1:-1])

    if current_tag is None:
        # Didn't see any content.
        return None
    # Add the last tag/value pair, which is still pending.
    result.add(current_tag, u''.join(value_parts))
    return result
|