~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/urlutils.py

Committer: Robert Collins
Date: 2007-07-04 08:08:13 UTC
mfrom: (2572 +trunk)
mto: This revision was merged to the branch mainline in revision 2587.
Revision ID: robertc@robertcollins.net-20070704080813-wzebx0r88fvwj5rq

Merge bzr.dev.

files added:
bzrlib/api.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/dirstate.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/graph.py

bzrlib/help_topics.py

bzrlib/hooks.py

bzrlib/lazy_regex.py

bzrlib/merge_directive.py

bzrlib/pack.py

bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/weaverepo.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/strace.py

bzrlib/tag.py

bzrlib/tests/HttpServer.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_info.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/timestamp.py

bzrlib/transport/chroot.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/wsgi.py

bzrlib/util/bencode.py

bzrlib/workingtree_4.py

bzrlib/xml7.py

doc/bazaar-vcs.org.kid

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/bundle-creation.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/initial-push-pull.txt

doc/developers/merge-scaling.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/profiling.txt

doc/developers/revert.txt

doc/developers/scratch.txt

doc/developers/uncommit.txt

doc/http_smart_server.txt

doc/shared_repository_layouts.txt

man1

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/rst2prettyhtml.py

tools/win32/info.txt

files removed:
NEWS.developers

build-api

bzrlib/tests/test_doc_generate.py

files renamed:
bzrlib/graph.py => bzrlib/deprecated_graph.py

bzrlib/tests/test_command.py => bzrlib/tests/test_commands.py

bzrlib/tests/test_graph.py => bzrlib/tests/test_deprecated_graph.py

bzrlib/transport/smart.py => bzrlib/transport/remote.py

bzrlib/win32console.py => bzrlib/win32utils.py

HACKING => doc/developers/HACKING

files modified:
.bzrignore

BRANCH.TODO

INSTALL

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/check.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/doc/__init__.py

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/info.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/inventory.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/ftp.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/response.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml_serializer.py

contrib/bash/bzr.simple

doc/centralized_workflow.txt

doc/configuration.txt

doc/default.css

doc/index.txt

doc/plugins.txt

doc/server.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

doc/version_info.txt

profile_imports.py

setup.py *

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/start_bzr.bat

Show diffs side-by-side

added added

removed removed

bzrlib/urlutils.py

# Bazaar -- distributed version control

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

"""A collection of function for handling URL operations."""

import os

from posixpath import split as _posix_split, normpath as _posix_normpath

import re

import sys

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from posixpath import split as _posix_split, normpath as _posix_normpath

import urllib

import bzrlib.errors as errors

import bzrlib.osutils

from bzrlib import (

errors,

osutils,

)

""")

def basename(url, exclude_trailing_slash=True):

base = local_path_from_url(base)

path = local_path_from_url(path)

return escape(bzrlib.osutils.relpath(base, path))

return escape(osutils.relpath(base, path))

def _find_scheme_and_separator(url):

111

117

join('http://foo', 'bar') => 'http://foo/bar'

112

118

join('http://foo', 'bar', '../baz') => 'http://foo/baz'

113

119

"""

114

m = _url_scheme_re.match(base)

120

if not args:

121

return base

122

match = _url_scheme_re.match(base)

115

123

scheme = None

116

if m:

117

scheme = m.group('scheme')

118

path = m.group('path').split('/')

124

if match:

125

scheme = match.group('scheme')

126

path = match.group('path').split('/')

119

127

if path[-1:] == ['']:

120

128

# Strip off a trailing slash

121

129

# This helps both when we are at the root, and when

124

132

else:

125

133

path = base.split('/')

126

134

135

if scheme is not None and len(path) >= 1:

136

host = path[:1]

137

# the path should be represented as an abs path.

138

# we know this must be absolute because of the presence of a URL scheme.

139

remove_root = True

140

path = [''] + path[1:]

141

else:

142

# create an empty host, but don't alter the path - this might be a

143

# relative url fragment.

144

host = []

145

remove_root = False

146

127

147

for arg in args:

128

m = _url_scheme_re.match(arg)

129

if m:

148

match = _url_scheme_re.match(arg)

149

if match:

130

150

# Absolute URL

131

scheme = m.group('scheme')

151

scheme = match.group('scheme')

132

152

# this skips .. normalisation, making http://host/../../..

133

153

# be rather strange.

134

path = m.group('path').split('/')

154

path = match.group('path').split('/')

155

# set the host and path according to new absolute URL, discarding

156

# any previous values.

157

# XXX: duplicates mess from earlier in this function. This URL

158

# manipulation code needs some cleaning up.

159

if scheme is not None and len(path) >= 1:

160

host = path[:1]

161

path = path[1:]

162

# url scheme implies absolute path.

163

path = [''] + path

164

else:

165

# no url scheme, so we take the path as is.

166

host = []

135

167

else:

136

for chunk in arg.split('/'):

137

if chunk == '.':

138

continue

139

elif chunk == '..':

140

if len(path) >= 2:

141

# Don't pop off the host portion

142

path.pop()

143

else:

144

raise errors.InvalidURLJoin('Cannot go above root',

145

base, args)

146

else:

147

path.append(chunk)

168

path = '/'.join(path)

169

path = joinpath(path, arg)

170

path = path.split('/')

171

if remove_root and path[0:1] == ['']:

172

del path[0]

173

if host:

174

# Remove the leading slash from the path, so long as it isn't also the

175

# trailing slash, which we want to keep if present.

176

if path and path[0] == '' and len(path) > 1:

177

del path[0]

178

path = host + path

148

179

149

180

if scheme is None:

150

181

return '/'.join(path)

151

182

return scheme + '://' + '/'.join(path)

152

183

153

184

185

def joinpath(base, *args):

186

"""Join URL path segments to a URL path segment.

187

188

This is somewhat like osutils.joinpath, but intended for URLs.

189

190

XXX: this duplicates some normalisation logic, and also duplicates a lot of

191

path handling logic that already exists in some Transport implementations.

192

We really should try to have exactly one place in the code base responsible

193

for combining paths of URLs.

194

"""

195

path = base.split('/')

196

if len(path) > 1 and path[-1] == '':

197

#If the path ends in a trailing /, remove it.

198

path.pop()

199

for arg in args:

200

if arg.startswith('/'):

201

path = []

202

for chunk in arg.split('/'):

203

if chunk == '.':

204

continue

205

elif chunk == '..':

206

if path == ['']:

207

raise errors.InvalidURLJoin('Cannot go above root',

208

base, args)

209

path.pop()

210

else:

211

path.append(chunk)

212

if path == ['']:

213

return '/'

214

else:

215

return '/'.join(path)

216

217

154

218

# jam 20060502 Sorted to 'l' because the final target is 'local_path_from_url'

155

219

def _posix_local_path_from_url(url):

156

220

"""Convert a url like file:///path/to/foo into /path/to/foo"""

168

232

# importing directly from posixpath allows us to test this

169

233

# on non-posix platforms

170

234

return 'file://' + escape(_posix_normpath(

171

bzrlib.osutils._posix_abspath(path)))

235

osutils._posix_abspath(path)))

172

236

173

237

174

238

def _win32_local_path_from_url(url):

175

239

"""Convert a url like file:///C:/path/to/foo into C:/path/to/foo"""

176

if not url.startswith('file:///'):

177

raise errors.InvalidURL(url, 'local urls must start with file:///')

240

if not url.startswith('file://'):

241

raise errors.InvalidURL(url, 'local urls must start with file:///, '

242

'UNC path urls must start with file://')

178

243

# We strip off all 3 slashes

179

win32_url = url[len('file:///'):]

180

if (win32_url[0] not in ('abcdefghijklmnopqrstuvwxyz'

244

win32_url = url[len('file:'):]

245

# check for UNC path: //HOST/path

246

if not win32_url.startswith('///'):

247

if (win32_url[2] == '/'

248

or win32_url[3] in '|:'):

249

raise errors.InvalidURL(url, 'Win32 UNC path urls'

250

' have form file://HOST/path')

251

return unescape(win32_url)

252

# usual local path with drive letter

253

if (win32_url[3] not in ('abcdefghijklmnopqrstuvwxyz'

181

254

'ABCDEFGHIJKLMNOPQRSTUVWXYZ')

182

or win32_url[1] not in '|:'

183

or win32_url[2] != '/'):

255

or win32_url[4] not in '|:'

256

or win32_url[5] != '/'):

184

257

raise errors.InvalidURL(url, 'Win32 file urls start with'

185

258

' file:///x:/, where x is a valid drive letter')

186

return win32_url[0].upper() + u':' + unescape(win32_url[2:])

259

return win32_url[3].upper() + u':' + unescape(win32_url[5:])

187

260

188

261

189

262

def _win32_local_path_to_url(path):

197

270

# which actually strips trailing space characters.

198

271

# The worst part is that under linux ntpath.abspath has different

199

272

# semantics, since 'nt' is not an available module.

200

win32_path = bzrlib.osutils._nt_normpath(

201

bzrlib.osutils._win32_abspath(path)).replace('\\', '/')

273

win32_path = osutils._win32_abspath(path)

274

# check for UNC path \\HOST\path

275

if win32_path.startswith('//'):

276

return 'file:' + escape(win32_path)

202

277

return 'file:///' + win32_path[0].upper() + ':' + escape(win32_path[2:])

203

278

204

279

215

290

216

291

217

292

_url_scheme_re = re.compile(r'^(?P<scheme>[^:/]{2,})://(?P<path>.*)$')

293

_url_hex_escapes_re = re.compile(r'(%[0-9a-fA-F]{2})')

294

295

296

def _unescape_safe_chars(matchobj):

297

"""re.sub callback to convert hex-escapes to plain characters (if safe).

298

299

e.g. '%7E' will be converted to '~'.

300

"""

301

hex_digits = matchobj.group(0)[1:]

302

char = chr(int(hex_digits, 16))

303

if char in _url_dont_escape_characters:

304

return char

305

else:

306

return matchobj.group(0).upper()

218

307

219

308

220

309

def normalize_url(url):

221

310

"""Make sure that a path string is in fully normalized URL form.

222

311

223

This handles URLs which have unicode characters, spaces,

312

This handles URLs which have unicode characters, spaces,

224

313

special characters, etc.

225

314

226

315

It has two basic modes of operation, depending on whether the

239

328

m = _url_scheme_re.match(url)

240

329

if not m:

241

330

return local_path_to_url(url)

331

scheme = m.group('scheme')

332

path = m.group('path')

242

333

if not isinstance(url, unicode):

243

334

for c in url:

244

335

if c not in _url_safe_characters:

245

336

raise errors.InvalidURL(url, 'URLs can only contain specific'

246

337

' safe characters (not %r)' % c)

247

return url

338

path = _url_hex_escapes_re.sub(_unescape_safe_chars, path)

339

return str(scheme + '://' + ''.join(path))

340

248

341

# We have a unicode (hybrid) url

249

scheme = m.group('scheme')

250

path = list(m.group('path'))

342

path_chars = list(path)

251

343

252

for i in xrange(len(path)):

253

if path[i] not in _url_safe_characters:

254

chars = path[i].encode('utf-8')

255

path[i] = ''.join(['%%%02X' % ord(c) for c in path[i].encode('utf-8')])

256

return scheme + '://' + ''.join(path)

344

for i in xrange(len(path_chars)):

345

if path_chars[i] not in _url_safe_characters:

346

chars = path_chars[i].encode('utf-8')

347

path_chars[i] = ''.join(

348

['%%%02X' % ord(c) for c in path_chars[i].encode('utf-8')])

349

path = ''.join(path_chars)

350

path = _url_hex_escapes_re.sub(_unescape_safe_chars, path)

351

return str(scheme + '://' + path)

257

352

258

353

259

354

def relative_url(base, other):

387

482

if not url.endswith('/'):

388

483

# Nothing to do

389

484

return url

390

if sys.platform == 'win32' and url.startswith('file:///'):

485

if sys.platform == 'win32' and url.startswith('file://'):

391

486

return _win32_strip_local_trailing_slash(url)

392

487

393

488

scheme_loc, first_path_slash = _find_scheme_and_separator(url)

439

534

#These entries get mapped to themselves

440

535

_hex_display_map.update((hex,'%'+hex) for hex in _no_decode_hex)

441

536

537

# These characters shouldn't be percent-encoded, and it's always safe to

538

# unencode them if they are.

539

_url_dont_escape_characters = set(

540

"abcdefghijklmnopqrstuvwxyz" # Lowercase alpha

541

"ABCDEFGHIJKLMNOPQRSTUVWXYZ" # Uppercase alpha

542

"0123456789" # Numbers

543

"-._~" # Unreserved characters

544

)

545

442

546

# These characters should not be escaped

443

_url_safe_characters = set('abcdefghijklmnopqrstuvwxyz'

444

'ABCDEFGHIJKLMNOPQRSTUVWXYZ'

445

'0123456789' '_.-/'

446

';?:@&=+$,%#')

447

547

_url_safe_characters = set(

548

"abcdefghijklmnopqrstuvwxyz" # Lowercase alpha

549

"ABCDEFGHIJKLMNOPQRSTUVWXYZ" # Uppercase alpha

550

"0123456789" # Numbers

551

"_.-!~*'()" # Unreserved characters

552

"/;?:@&=+$," # Reserved characters

553

"%#" # Extra reserved characters

554

)

448

555

449

556

def unescape_for_display(url, encoding):

450

557

"""Decode what you can for a URL, so that we get a nice looking path.

501

608

# Otherwise take the url decoded one

502

609

res[i] = decoded

503

610

return u'/'.join(res)

611

612

613

def derive_to_location(from_location):

614

"""Derive a TO_LOCATION given a FROM_LOCATION.

615

616

The normal case is a FROM_LOCATION of http://foo/bar => bar.

617

The Right Thing for some logical destinations may differ though

618

because no / may be present at all. In that case, the result is

619

the full name without the scheme indicator, e.g. lp:foo-bar => foo-bar.

620

This latter case also applies when a Windows drive

621

is used without a path, e.g. c:foo-bar => foo-bar.

622

If no /, path separator or : is found, the from_location is returned.

623

"""

624

if from_location.find("/") >= 0 or from_location.find(os.sep) >= 0:

625

return os.path.basename(from_location.rstrip("/\\"))

626

else:

627

sep = from_location.find(":")

628

if sep > 0:

629

return from_location[sep+1:]

630

else:

631

return from_location

Older »