~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/_rio_pyx.pyx

Committer: Robert J. Tanner
Date: 2009-06-10 03:56:49 UTC
mfrom: (4423 +trunk)
mto: This revision was merged to the branch mainline in revision 4425.
Revision ID: tanner@real-time.com-20090610035649-7rfx4cls4550zc3c

Merge 1.15.1 back to trunk

files added:
bzrlib/_bencode_pyx.h

bzrlib/_bencode_pyx.pyx

bzrlib/_rio_py.py

bzrlib/_rio_pyx.pyx

bzrlib/benchmarks/bench_tags.py

bzrlib/bencode.py

bzrlib/send.py

bzrlib/tests/per_repository_reference/test_fetch.py

bzrlib/tests/per_repository_reference/test_initialize.py

bzrlib/tests/per_repository_reference/test_unlock.py

bzrlib/tests/test__rio.py

bzrlib/tests/test_bencode.py

bzrlib/tests/test_chk_serializer.py

bzrlib/util/bencode.py

files removed:
bzrlib/util/tests/test_bencode.py

files renamed:
bzrlib/tests/workingtree_implementations/test_get_file_with_stat.py => bzrlib/tests/tree_implementations/test_get_file_with_stat.py

bzrlib/util/bencode.py => bzrlib/util/_bencode_py.py

files modified:
.bzrignore

Makefile

NEWS

bzrlib/__init__.py

bzrlib/_groupcompress_pyx.pyx

bzrlib/benchmarks/__init__.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/serializer/v4.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/chk_serializer.py

bzrlib/commands.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/foreign.py

bzrlib/graph.py

bzrlib/groupcompress.py

bzrlib/index.py

bzrlib/inventory.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/mail_client.py

bzrlib/multiparent.py

bzrlib/mutabletree.py

bzrlib/osutils.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/python-compat.h

bzrlib/reconcile.py

bzrlib/remote.py

bzrlib/repofmt/groupcompress_repo.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/pack_repo.py

bzrlib/repository.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/serializer.py

bzrlib/shelf.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/server.py

bzrlib/tag.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_dpush.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_send.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_switch.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_check.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_reconcile.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/inventory_implementations/basics.py

bzrlib/tests/per_repository/test_fetch.py

bzrlib/tests/per_repository/test_fileid_involved.py

bzrlib/tests/per_repository/test_iter_reverse_revision_history.py

bzrlib/tests/per_repository/test_reconcile.py

bzrlib/tests/per_repository/test_revision.py

bzrlib/tests/per_repository/test_write_group.py

bzrlib/tests/per_repository_reference/__init__.py

bzrlib/tests/per_repository_reference/test_default_stacking.py

bzrlib/tests/test__groupcompress.py

bzrlib/tests/test_config.py

bzrlib/tests/test_foreign.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_groupcompress.py

bzrlib/tests/test_http.py

bzrlib/tests/test_mail_client.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_pack_repository.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_serializer.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_source.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_ui.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/ui/__init__.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

doc/en/user-guide/svn_plugin.txt

setup.py

Show diffs side-by-side

added added

removed removed

bzrlib/_rio_pyx.pyx

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

"""Pyrex implementation of _read_stanza_*."""

# Python 2.4 support.  Nothing is declared from this header: the empty extern
# block exists only so that the header is included in the generated C file.
cdef extern from "python-compat.h":
    pass

# C heap routines.  The stanza readers in this file use them to manage the
# buffer in which the current value is accumulated.
# NOTE(review): sizes are declared as plain int here rather than size_t.
cdef extern from "stdlib.h":
    void *malloc(int)
    void *realloc(void *, int)
    void free(void *)

# CPython C API entry points used by this module.  Declarations marked
# "except -1" tell Pyrex that a return value of -1 signals a raised exception.
# NOTE(review): PyUnicode_Join, PyUnicode_AsUnicode and Py_UNICODE_COPY are
# declared here but are not referenced by the code visible in this file.
cdef extern from "Python.h":
    ctypedef int Py_ssize_t # Required for older pyrex versions
    ctypedef int Py_UNICODE
    char *PyString_AS_STRING(object s)
    Py_ssize_t PyString_GET_SIZE(object t) except -1
    object PyUnicode_DecodeUTF8(char *string, Py_ssize_t length, char *errors)
    object PyString_FromStringAndSize(char *s, Py_ssize_t len)
    int PyString_CheckExact(object)
    int PyUnicode_CheckExact(object)
    object PyUnicode_Join(object, object)
    object PyUnicode_EncodeASCII(Py_UNICODE *, int, char *)
    Py_UNICODE *PyUnicode_AS_UNICODE(object)
    Py_UNICODE *PyUnicode_AsUnicode(object)
    Py_ssize_t PyUnicode_GET_SIZE(object) except -1
    int PyList_Append(object, object) except -1
    int Py_UNICODE_ISLINEBREAK(Py_UNICODE)
    object PyUnicode_FromUnicode(Py_UNICODE *, int)
    void *Py_UNICODE_COPY(Py_UNICODE *, Py_UNICODE *, int)

# Raw memory copy, used to move value text into the accumulation buffers.
cdef extern from "string.h":
    void *memcpy(void *, void *, int)

from bzrlib.rio import Stanza

cdef int _valid_tag_char(char c):
    """Return 1 if c may appear in a rio tag, 0 otherwise.

    Accepted characters are ASCII letters, ASCII digits, '_' and '-'.
    """
    if c >= c'a' and c <= c'z':
        return 1
    if c >= c'A' and c <= c'Z':
        return 1
    if c >= c'0' and c <= c'9':
        return 1
    if c == c'_' or c == c'-':
        return 1
    return 0

def _valid_tag(tag):
    """Check whether tag is a well-formed rio tag.

    :param tag: The candidate tag; must be an exact str.
    :return: True if tag is non-empty and every byte is accepted by
        _valid_tag_char, False otherwise.
    :raises TypeError: if tag is not an exact str.
    """
    cdef char *tag_bytes
    cdef Py_ssize_t tag_size
    cdef int pos

    if not PyString_CheckExact(tag):
        raise TypeError(tag)
    tag_size = PyString_GET_SIZE(tag)
    if tag_size < 1:
        # An empty tag is never valid.
        return False
    tag_bytes = PyString_AS_STRING(tag)
    pos = 0
    while pos < tag_size:
        if not _valid_tag_char(tag_bytes[pos]):
            return False
        pos = pos + 1
    return True

cdef object _split_first_line_utf8(char *line, int len,
                                   char *value, Py_ssize_t *value_len):
    """Split a 'tag: value' line held in a byte buffer.

    The first ':' within the first len bytes of line marks the end of the
    tag and must be followed by a space.  Everything after that space is
    copied to the start of value and its length is stored in value_len[0].
    No bounds check is made on value here; the caller supplies the buffer.

    :return: The bytes before the ':' as a str.
    :raises ValueError: if there is no ':' in the line, or the ':' is not
        followed by a space.
    """
    cdef int colon
    cdef int tail

    # Locate the first colon, if any.
    colon = 0
    while colon < len and line[colon] != c':':
        colon = colon + 1
    if colon >= len:
        raise ValueError('tag/value separator not found in line %r' % line)
    if line[colon+1] != c' ':
        raise ValueError("invalid tag in line %r" % line)
    # Skip the ': ' separator itself.
    tail = len - colon - 2
    memcpy(value, line+colon+2, tail)
    value_len[0] = tail
    return PyString_FromStringAndSize(line, colon)

cdef object _split_first_line_unicode(Py_UNICODE *line, int len,
                                      Py_UNICODE *value, Py_ssize_t *value_len):
    """Split a 'tag: value' line held in a Py_UNICODE buffer.

    The first ':' within the first len characters of line marks the end of
    the tag and must be followed by a space.  Everything after that space is
    copied to the start of value and its length (in characters) is stored in
    value_len[0].  No bounds check is made on value here; the caller supplies
    the buffer.

    :return: The characters before the ':' encoded as an ASCII str.
    :raises ValueError: if there is no ':' in the line, or the ':' is not
        followed by a space.
    """
    cdef int colon
    cdef int tail

    # Locate the first colon, if any.
    colon = 0
    while colon < len and line[colon] != c':':
        colon = colon + 1
    if colon >= len:
        raise ValueError("tag/value separator not found in line %r" %
                         PyUnicode_FromUnicode(line, len))
    if line[colon+1] != c' ':
        raise ValueError("invalid tag in line %r" %
                         PyUnicode_FromUnicode(line, len))
    # Skip the ': ' separator itself.
    tail = len - colon - 2
    memcpy(value, &line[colon+2], tail * sizeof(Py_UNICODE))
    value_len[0] = tail
    return PyUnicode_EncodeASCII(line, colon, "strict")

def _read_stanza_utf8(line_iter):
    """Read one stanza from an iterator of UTF-8 encoded lines.

    Reading stops at the first item that is None, an empty string, or a line
    consisting of a single newline.

    :param line_iter: Iterable yielding exact str lines.
    :return: The result of Stanza.from_pairs() for the (tag, value) pairs
        read, with each value decoded from UTF-8, or None if no tag line
        was seen.
    :raises TypeError: if a line is not an exact str.
    :raises ValueError: on a continuation line before any tag, a missing or
        malformed ': ' separator, or an invalid tag.
    :raises MemoryError: if the accumulation buffer cannot be (re)allocated.
    """
    cdef char *c_line
    cdef Py_ssize_t c_len
    cdef char *accum_value, *new_accum_value
    cdef Py_ssize_t accum_len, accum_size
    cdef Py_ssize_t value_len
    pairs = []
    tag = None
    accum_len = 0
    accum_size = 4096
    accum_value = <char *>malloc(accum_size)
    if accum_value == NULL:
        raise MemoryError
    try:
        for line in line_iter:
            if line is None:
                break # end of file
            if not PyString_CheckExact(line):
                # Wrap in a tuple so that a tuple 'line' is formatted as one
                # value instead of being unpacked by the % operator.
                raise TypeError("%r is not a plain string" % (line,))
            c_line = PyString_AS_STRING(line)
            c_len = PyString_GET_SIZE(line)
            if c_len < 1:
                break # end of file
            if c_len == 1 and c_line[0] == c"\n":
                break # end of stanza
            # Make sure the buffer can hold what is accumulated so far plus
            # the whole of this line, whichever branch below is taken.
            if accum_len + c_len > accum_size:
                accum_size = (accum_len + c_len)
                new_accum_value = <char *>realloc(accum_value, accum_size)
                if new_accum_value == NULL:
                    raise MemoryError
                else:
                    accum_value = new_accum_value
            if c_line[0] == c'\t': # continues previous value
                if tag is None:
                    raise ValueError('invalid continuation line %r' % line)
                # Skip the leading tab.  The previous line's trailing newline
                # is still in the buffer and separates the two lines.
                memcpy(accum_value+accum_len, c_line+1, c_len-1)
                accum_len = accum_len + c_len-1
            else: # new tag:value line
                if tag is not None:
                    # Drop the final character (the trailing newline).  An
                    # empty value on a line without a newline leaves
                    # accum_len at 0, so never pass a negative length on.
                    value_len = accum_len - 1
                    if value_len < 0:
                        value_len = 0
                    PyList_Append(pairs,
                        (tag, PyUnicode_DecodeUTF8(accum_value, value_len,
                                                   "strict")))
                # Overwrites the buffer from the start with the new value.
                tag = _split_first_line_utf8(c_line, c_len, accum_value,
                                             &accum_len)
                if not _valid_tag(tag):
                    raise ValueError("invalid rio tag %r" % (tag,))
        if tag is not None: # add last tag-value
            value_len = accum_len - 1
            if value_len < 0:
                value_len = 0
            PyList_Append(pairs,
                (tag, PyUnicode_DecodeUTF8(accum_value, value_len, "strict")))
            return Stanza.from_pairs(pairs)
        else:     # didn't see any content
            return None
    finally:
        # Release the buffer on every exit path, including exceptions.
        free(accum_value)

def _read_stanza_unicode(unicode_iter):
    """Read one stanza from an iterator of unicode lines.

    Reading stops at the first item that is None, an empty string, or a line
    whose first character is a line break.

    :param unicode_iter: Iterable yielding exact unicode lines.
    :return: The result of Stanza.from_pairs() for the (tag, value) pairs
        read, or None if no tag line was seen.
    :raises TypeError: if a line is not an exact unicode object.
    :raises ValueError: on a continuation line before any tag, a missing or
        malformed ': ' separator, or an invalid tag.
    :raises MemoryError: if the accumulation buffer cannot be (re)allocated.
    """
    cdef Py_UNICODE *c_line
    cdef int c_len
    cdef Py_UNICODE *accum_value, *new_accum_value
    cdef Py_ssize_t accum_len, accum_size
    cdef Py_ssize_t value_len
    pairs = []
    tag = None
    accum_len = 0
    accum_size = 4096
    # accum_size and accum_len count characters, not bytes.
    accum_value = <Py_UNICODE *>malloc(accum_size*sizeof(Py_UNICODE))
    if accum_value == NULL:
        raise MemoryError
    try:
        for line in unicode_iter:
            if line is None:
                break       # end of file
            if not PyUnicode_CheckExact(line):
                # Wrap in a tuple so that a tuple 'line' is formatted as one
                # value instead of being unpacked by the % operator.
                raise TypeError("%r is not a unicode string" % (line,))
            c_line = PyUnicode_AS_UNICODE(line)
            c_len = PyUnicode_GET_SIZE(line)
            if c_len < 1:
                break       # end of file
            if Py_UNICODE_ISLINEBREAK(c_line[0]):
                break       # end of stanza
            # Make sure the buffer can hold what is accumulated so far plus
            # the whole of this line, whichever branch below is taken.
            if accum_len + c_len > accum_size:
                accum_size = accum_len + c_len
                new_accum_value = <Py_UNICODE *>realloc(accum_value,
                    accum_size*sizeof(Py_UNICODE))
                if new_accum_value == NULL:
                    raise MemoryError
                else:
                    accum_value = new_accum_value
            if c_line[0] == c'\t': # continues previous value,
                if tag is None:
                    raise ValueError('invalid continuation line %r' % line)
                # Skip the leading tab.  The previous line's trailing newline
                # is still in the buffer and separates the two lines.
                memcpy(&accum_value[accum_len], &c_line[1],
                    (c_len-1)*sizeof(Py_UNICODE))
                accum_len = accum_len + (c_len-1)
            else: # new tag:value line
                if tag is not None:
                    # Drop the final character (the trailing newline).  An
                    # empty value on a line without a newline leaves
                    # accum_len at 0, so never pass a negative length on.
                    value_len = accum_len - 1
                    if value_len < 0:
                        value_len = 0
                    PyList_Append(pairs,
                        (tag, PyUnicode_FromUnicode(accum_value, value_len)))
                # Overwrites the buffer from the start with the new value.
                tag = _split_first_line_unicode(c_line, c_len, accum_value,
                                                &accum_len)
                if not _valid_tag(tag):
                    raise ValueError("invalid rio tag %r" % (tag,))
        if tag is not None: # add last tag-value
            value_len = accum_len - 1
            if value_len < 0:
                value_len = 0
            PyList_Append(pairs,
                    (tag, PyUnicode_FromUnicode(accum_value, value_len)))
            return Stanza.from_pairs(pairs)
        else:     # didn't see any content
            return None
    finally:
        # Release the buffer on every exit path, including exceptions.
        free(accum_value)

Older »