~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/urlutils.py

Committer: Aaron Bentley
Date: 2006-09-27 21:25:21 UTC
mfrom: (2049 +trunk)
mto: (1731.2.9 nested-trees) (2234.6.1 bzr.0.14) (2229.2.4 reserved-ids) (2323.6.9 0.15-integration) (1551.19.24 Aaron's mergeable stuff)
mto: This revision was merged to the branch mainline in revision 2054.
Revision ID: abentley@panoramicfeedback.com-20060927212521-2306c9722b5eb4d0

merge bzr.dev

files added:
NEWS.developers

build-api

bzrlib/tests/test_doc_generate.py

files removed:
bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/dirstate.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/help_topics.py

bzrlib/hooks.py

bzrlib/lazy_regex.py

bzrlib/merge_directive.py

bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/weaverepo.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/strace.py

bzrlib/tag.py

bzrlib/tests/HttpServer.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_help.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/timestamp.py

bzrlib/transport/chroot.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/wsgi.py

bzrlib/util/bencode.py

bzrlib/workingtree_4.py

bzrlib/xml7.py

doc/bazaar-vcs.org.kid

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/bundle-creation.txt

doc/developers/container-format.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/initial-push-pull.txt

doc/developers/merge-scaling.txt

doc/developers/performance-commit.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-performance-changes.txt

doc/developers/revert.txt

doc/http_smart_server.txt

doc/shared_repository_layouts.txt

man1

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/rst2prettyhtml.py

tools/win32/info.txt

files renamed:
doc/developers/HACKING => HACKING

bzrlib/tests/test_commands.py => bzrlib/tests/test_command.py

bzrlib/transport/remote.py => bzrlib/transport/smart.py

bzrlib/win32utils.py => bzrlib/win32console.py

files modified:
.bzrignore

BRANCH.TODO

INSTALL

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/ftp.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/response.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml_serializer.py

contrib/bash/bzr.simple

doc/centralized_workflow.txt

doc/configuration.txt

doc/default.css

doc/index.txt

doc/plugins.txt

doc/server.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

doc/version_info.txt

profile_imports.py

setup.py *

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/start_bzr.bat

Show diffs side-by-side

added added

removed removed

bzrlib/urlutils.py

# Bazaar -- distributed version control

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

"""A collection of function for handling URL operations."""

import os

from posixpath import split as _posix_split, normpath as _posix_normpath

import re

import sys

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from posixpath import split as _posix_split, normpath as _posix_normpath

import urllib

from bzrlib import (

errors,

osutils,

)

""")

import bzrlib.errors as errors

import bzrlib.osutils

def basename(url, exclude_trailing_slash=True):

base = local_path_from_url(base)

path = local_path_from_url(path)

return escape(osutils.relpath(base, path))

return escape(bzrlib.osutils.relpath(base, path))

def _find_scheme_and_separator(url):

117

111

join('http://foo', 'bar') => 'http://foo/bar'

118

112

join('http://foo', 'bar', '../baz') => 'http://foo/baz'

119

113

"""

120

if not args:

121

return base

122

match = _url_scheme_re.match(base)

114

m = _url_scheme_re.match(base)

123

115

scheme = None

124

if match:

125

scheme = match.group('scheme')

126

path = match.group('path').split('/')

116

if m:

117

scheme = m.group('scheme')

118

path = m.group('path').split('/')

127

119

if path[-1:] == ['']:

128

120

# Strip off a trailing slash

129

121

# This helps both when we are at the root, and when

132

124

else:

133

125

path = base.split('/')

134

126

135

if scheme is not None and len(path) >= 1:

136

host = path[:1]

137

# the path should be represented as an abs path.

138

# we know this must be absolute because of the presence of a URL scheme.

139

remove_root = True

140

path = [''] + path[1:]

141

else:

142

# create an empty host, but don't alter the path - this might be a

143

# relative url fragment.

144

host = []

145

remove_root = False

146

147

127

for arg in args:

148

match = _url_scheme_re.match(arg)

149

if match:

128

m = _url_scheme_re.match(arg)

129

if m:

150

130

# Absolute URL

151

scheme = match.group('scheme')

131

scheme = m.group('scheme')

152

132

# this skips .. normalisation, making http://host/../../..

153

133

# be rather strange.

154

path = match.group('path').split('/')

155

# set the host and path according to new absolute URL, discarding

156

# any previous values.

157

# XXX: duplicates mess from earlier in this function. This URL

158

# manipulation code needs some cleaning up.

159

if scheme is not None and len(path) >= 1:

160

host = path[:1]

161

path = path[1:]

162

# url scheme implies absolute path.

163

path = [''] + path

164

else:

165

# no url scheme, so we take the path as is.

166

host = []

134

path = m.group('path').split('/')

167

135

else:

168

path = '/'.join(path)

169

path = joinpath(path, arg)

170

path = path.split('/')

171

if remove_root and path[0:1] == ['']:

172

del path[0]

173

if host:

174

# Remove the leading slash from the path, so long as it isn't also the

175

# trailing slash, which we want to keep if present.

176

if path and path[0] == '' and len(path) > 1:

177

del path[0]

178

path = host + path

136

for chunk in arg.split('/'):

137

if chunk == '.':

138

continue

139

elif chunk == '..':

140

if len(path) >= 2:

141

# Don't pop off the host portion

142

path.pop()

143

else:

144

raise errors.InvalidURLJoin('Cannot go above root',

145

base, args)

146

else:

147

path.append(chunk)

179

148

180

149

if scheme is None:

181

150

return '/'.join(path)

182

151

return scheme + '://' + '/'.join(path)

183

152

184

153

185

def joinpath(base, *args):

186

"""Join URL path segments to a URL path segment.

187

188

This is somewhat like osutils.joinpath, but intended for URLs.

189

190

XXX: this duplicates some normalisation logic, and also duplicates a lot of

191

path handling logic that already exists in some Transport implementations.

192

We really should try to have exactly one place in the code base responsible

193

for combining paths of URLs.

194

"""

195

path = base.split('/')

196

if len(path) > 1 and path[-1] == '':

197

# If the path ends with a trailing /, remove it.

198

path.pop()

199

for arg in args:

200

if arg.startswith('/'):

201

path = []

202

for chunk in arg.split('/'):

203

if chunk == '.':

204

continue

205

elif chunk == '..':

206

if path == ['']:

207

raise errors.InvalidURLJoin('Cannot go above root',

208

base, args)

209

path.pop()

210

else:

211

path.append(chunk)

212

if path == ['']:

213

return '/'

214

else:

215

return '/'.join(path)

216

217

218

154

# jam 20060502 Sorted to 'l' because the final target is 'local_path_from_url'

219

155

def _posix_local_path_from_url(url):

220

156

"""Convert a url like file:///path/to/foo into /path/to/foo"""

232

168

# importing directly from posixpath allows us to test this

233

169

# on non-posix platforms

234

170

return 'file://' + escape(_posix_normpath(

235

osutils._posix_abspath(path)))

171

bzrlib.osutils._posix_abspath(path)))

236

172

237

173

238

174

def _win32_local_path_from_url(url):

239

175

"""Convert a url like file:///C:/path/to/foo into C:/path/to/foo"""

240

if not url.startswith('file://'):

241

raise errors.InvalidURL(url, 'local urls must start with file:///, '

242

'UNC path urls must start with file://')

176

if not url.startswith('file:///'):

177

raise errors.InvalidURL(url, 'local urls must start with file:///')

243

178

# We strip off all 3 slashes

244

win32_url = url[len('file:'):]

245

# check for UNC path: //HOST/path

246

if not win32_url.startswith('///'):

247

if (win32_url[2] == '/'

248

or win32_url[3] in '|:'):

249

raise errors.InvalidURL(url, 'Win32 UNC path urls'

250

' have form file://HOST/path')

251

return unescape(win32_url)

252

# usual local path with drive letter

253

if (win32_url[3] not in ('abcdefghijklmnopqrstuvwxyz'

179

win32_url = url[len('file:///'):]

180

if (win32_url[0] not in ('abcdefghijklmnopqrstuvwxyz'

254

181

'ABCDEFGHIJKLMNOPQRSTUVWXYZ')

255

or win32_url[4] not in '|:'

256

or win32_url[5] != '/'):

182

or win32_url[1] not in '|:'

183

or win32_url[2] != '/'):

257

184

raise errors.InvalidURL(url, 'Win32 file urls start with'

258

185

' file:///x:/, where x is a valid drive letter')

259

return win32_url[3].upper() + u':' + unescape(win32_url[5:])

186

return win32_url[0].upper() + u':' + unescape(win32_url[2:])

260

187

261

188

262

189

def _win32_local_path_to_url(path):

270

197

# which actually strips trailing space characters.

271

198

# The worst part is that under linux ntpath.abspath has different

272

199

# semantics, since 'nt' is not an available module.

273

win32_path = osutils._win32_abspath(path)

274

# check for UNC path \\HOST\path

275

if win32_path.startswith('//'):

276

return 'file:' + escape(win32_path)

200

win32_path = bzrlib.osutils._nt_normpath(

201

bzrlib.osutils._win32_abspath(path)).replace('\\', '/')

277

202

return 'file:///' + win32_path[0].upper() + ':' + escape(win32_path[2:])

278

203

279

204

290

215

291

216

292

217

_url_scheme_re = re.compile(r'^(?P<scheme>[^:/]{2,})://(?P<path>.*)$')

293

_url_hex_escapes_re = re.compile(r'(%[0-9a-fA-F]{2})')

294

295

296

def _unescape_safe_chars(matchobj):

297

"""re.sub callback to convert hex-escapes to plain characters (if safe).

298

299

e.g. '%7E' will be converted to '~'.

300

"""

301

hex_digits = matchobj.group(0)[1:]

302

char = chr(int(hex_digits, 16))

303

if char in _url_dont_escape_characters:

304

return char

305

else:

306

return matchobj.group(0).upper()

307

218

308

219

309

220

def normalize_url(url):

310

221

"""Make sure that a path string is in fully normalized URL form.

311

222

312

This handles URLs which have unicode characters, spaces,

223

This handles URLs which have unicode characters, spaces,

313

224

special characters, etc.

314

225

315

226

It has two basic modes of operation, depending on whether the

328

239

m = _url_scheme_re.match(url)

329

240

if not m:

330

241

return local_path_to_url(url)

331

scheme = m.group('scheme')

332

path = m.group('path')

333

242

if not isinstance(url, unicode):

334

243

for c in url:

335

244

if c not in _url_safe_characters:

336

245

raise errors.InvalidURL(url, 'URLs can only contain specific'

337

246

' safe characters (not %r)' % c)

338

path = _url_hex_escapes_re.sub(_unescape_safe_chars, path)

339

return str(scheme + '://' + ''.join(path))

340

247

return url

341

248

# We have a unicode (hybrid) url

342

path_chars = list(path)

249

scheme = m.group('scheme')

250

path = list(m.group('path'))

343

251

344

for i in xrange(len(path_chars)):

345

if path_chars[i] not in _url_safe_characters:

346

chars = path_chars[i].encode('utf-8')

347

path_chars[i] = ''.join(

348

['%%%02X' % ord(c) for c in path_chars[i].encode('utf-8')])

349

path = ''.join(path_chars)

350

path = _url_hex_escapes_re.sub(_unescape_safe_chars, path)

351

return str(scheme + '://' + path)

252

for i in xrange(len(path)):

253

if path[i] not in _url_safe_characters:

254

chars = path[i].encode('utf-8')

255

path[i] = ''.join(['%%%02X' % ord(c) for c in path[i].encode('utf-8')])

256

return scheme + '://' + ''.join(path)

352

257

353

258

354

259

def relative_url(base, other):

482

387

if not url.endswith('/'):

483

388

# Nothing to do

484

389

return url

485

if sys.platform == 'win32' and url.startswith('file://'):

390

if sys.platform == 'win32' and url.startswith('file:///'):

486

391

return _win32_strip_local_trailing_slash(url)

487

392

488

393

scheme_loc, first_path_slash = _find_scheme_and_separator(url)

534

439

#These entries get mapped to themselves

535

440

_hex_display_map.update((hex,'%'+hex) for hex in _no_decode_hex)

536

441

537

# These characters shouldn't be percent-encoded, and it's always safe to

538

# unencode them if they are.

539

_url_dont_escape_characters = set(

540

"abcdefghijklmnopqrstuvwxyz" # Lowercase alpha

541

"ABCDEFGHIJKLMNOPQRSTUVWXYZ" # Uppercase alpha

542

"0123456789" # Numbers

543

"-._~" # Unreserved characters

544

)

545

546

442

# These characters should not be escaped

547

_url_safe_characters = set(

548

"abcdefghijklmnopqrstuvwxyz" # Lowercase alpha

549

"ABCDEFGHIJKLMNOPQRSTUVWXYZ" # Uppercase alpha

550

"0123456789" # Numbers

551

"_.-!~*'()" # Unreserved characters

552

"/;?:@&=+$," # Reserved characters

553

"%#" # Extra reserved characters

554

)

443

_url_safe_characters = set('abcdefghijklmnopqrstuvwxyz'

444

'ABCDEFGHIJKLMNOPQRSTUVWXYZ'

445

'0123456789' '_.-/'

446

';?:@&=+$,%#')

447

555

448

556

449

def unescape_for_display(url, encoding):

557

450

"""Decode what you can for a URL, so that we get a nice looking path.

608

501

# Otherwise take the url decoded one

609

502

res[i] = decoded

610

503

return u'/'.join(res)

611

612

613

def derive_to_location(from_location):

614

"""Derive a TO_LOCATION given a FROM_LOCATION.

615

616

The normal case is a FROM_LOCATION of http://foo/bar => bar.

617

The Right Thing for some logical destinations may differ though

618

because no / may be present at all. In that case, the result is

619

the full name without the scheme indicator, e.g. lp:foo-bar => foo-bar.

620

This latter case also applies when a Windows drive

621

is used without a path, e.g. c:foo-bar => foo-bar.

622

If no /, path separator or : is found, the from_location is returned.

623

"""

624

if from_location.find("/") >= 0 or from_location.find(os.sep) >= 0:

625

return os.path.basename(from_location.rstrip("/\\"))

626

else:

627

sep = from_location.find(":")

628

if sep > 0:

629

return from_location[sep+1:]

630

else:

631

return from_location

Older »