~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/rio.py

Committer: John Arbash Meinel
Date: 2006-03-08 14:31:23 UTC
mfrom: (1598 +trunk)
mto: (1685.1.1 bzr-encoding)
mto: This revision was merged to the branch mainline in revision 1752.
Revision ID: john@arbash-meinel.com-20060308143123-448308b0db4de410

[merge] bzr.dev 1573, lots of updates

files added:
BRANCH.TODO

HACKING

INSTALL

Makefile

NEWS.developers

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/builtins.py

bzrlib/bzrdir.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/glob_matcher.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_log.py.moved

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_status.py.moved

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_basis_inventory.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_glob_matcher.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_reweave.py.moved

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_source.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/win32console.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/add-bzr-to-baz

contrib/bash/bzr

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

generate_docs.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files removed:
bzrlib/mdiff.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/tests.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/faq.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quickref.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes/new-inventory-sample.xml

notes/performance.txt

test.sh

testbzr

files renamed:
bzrlib/store.py => bzrlib/store/__init__.py

elementtree/ => bzrlib/util/elementtree/

urlgrabber/ => bzrlib/util/urlgrabber/

bzrlib/xml.py => bzrlib/xml_serializer.py

contrib/bash/bzr => contrib/bash/bzr.simple

bzrlib/newinventory.py => contrib/newinventory.py

files modified:
.bzrignore

.rsyncexclude

NEWS

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/osutils.py

bzrlib/revision.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/util/urlgrabber/keepalive.py

contrib/zsh/_bzr

setup.py *

Show diffs side-by-side

added added

removed removed

bzrlib/rio.py

# Distributed under the GNU General Public Licence v2

# \subsection{\emph{rio} - simple text metaformat}

# \emph{r} stands for `restricted', `reproducible', or `rfc822-like'.

# The stored data consists of a series of \emph{stanzas}, each of which contains

# \emph{fields} identified by an ascii name, with Unicode or string contents.

# The field tag is constrained to ASCII alphanumeric characters, '-' and '_'.

# There may be more than one field in a stanza with the same name.

# The format itself does not deal with character encoding issues, though

# the result will normally be written in Unicode.

# The format is intended to be simple enough that there is exactly one character

# stream representation of an object and vice versa, and that this relation

# will continue to hold for future versions of bzr.

import re

# XXX: there is some redundancy in allowing stanzas to be written in

# isolation as well as through a writer object.

class RioWriter(object):
    """Write a series of stanzas to a file, separated by blank lines.

    :param to_file: Destination object.  It must provide ``write`` and is
        also handed to each stanza's own ``write`` method.
    """

    def __init__(self, to_file):
        # Becomes True after the first stanza, meaning a blank separator
        # line is owed before the next one is written.
        self._soft_nl = False
        self._to_file = to_file

    def write_stanza(self, stanza):
        """Write one stanza, preceded by a blank line unless it is the first.

        :param stanza: Object providing ``write(to_file)``.
        """
        if self._soft_nl:
            # Written explicitly instead of with the ``print >>file``
            # statement, which only exists as a statement in Python 2.
            self._to_file.write('\n')
        stanza.write(self._to_file)
        self._soft_nl = True

class RioReader(object):
    """Read stanzas from a file as a sequence.

    from_file can be anything that can be enumerated as a sequence of
    lines (with newlines.)
    """

    def __init__(self, from_file):
        self._from_file = from_file

    def __iter__(self):
        """Yield each stanza in turn until read_stanza returns None."""
        # Obtain a single iterator up front.  read_stanza runs its own
        # ``for`` loop over whatever it is given, so passing a list (or any
        # other re-iterable object) directly would restart at the first
        # line on every call and yield the first stanza forever.  For
        # objects that are their own iterator this changes nothing.
        line_iter = iter(self._from_file)
        while True:
            stanza = read_stanza(line_iter)
            if stanza is None:
                return
            yield stanza

def read_stanzas(from_file):
    """Generate the stanzas found in from_file, one after another.

    :param from_file: Any iterable of lines (with newlines), such as an
        open file or a list of lines.
    :return: A generator of the objects returned by read_stanza; it stops
        the first time read_stanza returns None.
    """
    # Share one iterator across all read_stanza calls.  Passing a list
    # through unchanged would make every call start again at its first
    # line, so the generator would never terminate.  Objects that are
    # their own iterator are unaffected.
    line_iter = iter(from_file)
    while True:
        stanza = read_stanza(line_iter)
        if stanza is None:
            return
        yield stanza

class Stanza(object):
    """One stanza for rio: an ordered list of (tag, value) fields.

    Tags are checked with valid_tag when added.  The same tag may occur
    more than once, tags are compared case-sensitively, and fields keep
    the order in which they were added.

    Values are stored as unicode.  A str value is converted on the way in;
    any other type (including int) is rejected with TypeError.
    """

    __slots__ = ['items']

    def __init__(self, **kwargs):
        """Construct a new Stanza.

        Keyword arguments, if any, become fields, added in sorted order.
        """
        self.items = []
        for name, val in sorted(kwargs.items()):
            self.add(name, val)

    def add(self, tag, value):
        """Append a (tag, value) field to the end of the stanza.

        Raises TypeError if value is neither str nor unicode.
        """
        assert valid_tag(tag), \
            ("invalid tag %r" % tag)
        # Integers are deliberately not converted here, so they are
        # reported as a TypeError like every other unsupported type.
        if not isinstance(value, (str, unicode)):
            raise TypeError("invalid type for rio value: %r of type %s"
                            % (value, type(value)))
        if isinstance(value, str):
            value = unicode(value)
        self.items.append((tag, value))

    def __contains__(self, find_tag):
        """True if there is any field in this stanza with the given tag."""
        for pair in self.items:
            if pair[0] == find_tag:
                return True
        return False

    def __len__(self):
        """Return the number of fields in the stanza."""
        return len(self.items)

    def __eq__(self, other):
        """Stanzas are equal when the other is a Stanza with equal items."""
        return isinstance(other, Stanza) and self.items == other.items

    def __ne__(self, other):
        return not self.__eq__(other)

    def __repr__(self):
        return "Stanza(%r)" % self.items

    def iter_pairs(self):
        """Return an iterator over the (tag, value) pairs."""
        return iter(self.items)

    def to_lines(self):
        """Generate the list of lines for the external form of this stanza.

        The lines are always utf-8 encoded strings, each ending in a
        newline.  The first line of a value follows "tag: "; every further
        line of a multi-line value is written on its own line prefixed with
        a tab.
        """
        lines = []
        for tag, value in self.items:
            assert isinstance(tag, str)
            assert isinstance(value, unicode)
            # split('\n') rather than splitlines(): empty lines inside the
            # value must be kept, and an empty value still yields one piece.
            pieces = value.split('\n')
            lines.append(tag + ': ' + pieces[0].encode('utf-8') + '\n')
            for extra in pieces[1:]:
                lines.append('\t' + extra.encode('utf-8') + '\n')
        return lines

    def to_string(self):
        """Return the stanza as a single string."""
        return ''.join(self.to_lines())

    def write(self, to_file):
        """Write the stanza's lines to to_file using writelines."""
        to_file.writelines(self.to_lines())

    def get(self, tag):
        """Return the value for a field with the given tag.

        If there is more than one value, only the first is returned.  If
        the tag is not present, KeyError is raised.
        """
        for name, val in self.items:
            if name == tag:
                return val
        raise KeyError(tag)

    __getitem__ = get

    def get_all(self, tag):
        """Return a list of every value stored under tag, in order."""
        return [val for name, val in self.items if name == tag]

    def as_dict(self):
        """Return a dict mapping each tag to its value.

        Every tag is asserted to occur only once in the stanza.
        """
        mapping = {}
        for tag, value in self.items:
            assert tag not in mapping
            mapping[tag] = value
        return mapping

189

190

# ``\Z`` anchors at the very end of the string.  ``$`` would also match just
# before a trailing newline, and so would accept a tag such as "name\n".
_tag_re = re.compile(r'^[-a-zA-Z0-9_]+\Z')


def valid_tag(tag):
    """Return True if tag is a legal rio field name.

    A legal tag is a non-empty string consisting only of ASCII letters,
    digits, '-' and '_'.
    """
    return bool(_tag_re.match(tag))

193

194

195

def read_stanza(line_iter):
    """Return new Stanza read from list of lines or a file

    Returns one Stanza that was read, or returns None if no field was read
    before the input ended or a blank line was met (so a blank line at the
    very start of the input gives None).  If a blank line follows the
    stanza, it is consumed.  It's not an error for there to be no blank at
    end of file.

    Only the stanza lines and the trailing blank (if any) are consumed
    from the line_iter.

    The raw lines must be in utf-8 encoding, and each one must end with a
    newline.

    Raises ValueError for a continuation line with no preceding field, or
    for a field line without a ': ' separator.
    """
    stanza = Stanza()
    tag = None
    accum_value = None
    for line in line_iter:
        if line is None or line == '':
            break       # end of file
        if line == '\n':
            break       # end of stanza
        line = line.decode('utf-8')
        assert line[-1] == '\n'
        if line[0] == '\t': # continues previous value
            if tag is None:
                raise ValueError('invalid continuation line %r' % line)
            # drop the leading tab and the trailing newline
            accum_value += '\n' + line[1:-1]
        else: # new tag:value line
            if tag is not None:
                stanza.add(tag, accum_value)
            try:
                colon_index = line.index(': ')
            except ValueError:
                raise ValueError('tag/value separator not found in line %r' % line)
            tag = line[:colon_index]
            assert valid_tag(tag), \
                "invalid rio tag %r" % tag
            # The decoded line is unicode, but Stanza.to_lines asserts that
            # tags are plain str; convert so that a stanza that was read
            # can also be written back out.
            tag = str(tag)
            accum_value = line[colon_index+2:-1]
    if tag is not None: # add last tag-value
        stanza.add(tag, accum_value)
        return stanza
    else:     # didn't see any content
        return None

Older »