~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/urlutils.py

Committer: John Arbash Meinel
Date: 2006-11-10 15:38:16 UTC
mto: This revision was merged to the branch mainline in revision 2129.
Revision ID: john@arbash-meinel.com-20061110153816-46acf76fc86a512b

use try/finally to clean up a nested progress bar during weave fetching

files added:
NEWS.developers

build-api

bzrlib/tests/test_doc_generate.py

files removed:
bzrlib/api.py

bzrlib/branchbuilder.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/counted_lock.py

bzrlib/dirstate.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/graph.py

bzrlib/hooks.py

bzrlib/merge_directive.py

bzrlib/pack.py

bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/weaverepo.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/smtp_connection.py

bzrlib/strace.py

bzrlib/tag.py

bzrlib/tests/HttpServer.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_lsprof.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_sprout.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_branchbuilder.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_help.py

bzrlib/tests/test_hooks.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_info.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_pack.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smtp_connection.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/timestamp.py

bzrlib/transport/brokenrename.py

bzrlib/transport/chroot.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/wsgi.py

bzrlib/util/bencode.py

bzrlib/workingtree_4.py

bzrlib/xml7.py

doc/developers

doc/developers/add.txt

doc/developers/annotate.txt

doc/developers/api-versioning.txt

doc/developers/bundle-creation.txt

doc/developers/bundles.txt

doc/developers/commit.txt

doc/developers/container-format.txt

doc/developers/dirstate.txt

doc/developers/gc.txt

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/initial-push-pull.txt

doc/developers/merge-scaling.txt

doc/developers/performance-contributing.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/performance.dot

doc/developers/planned-change-integration.txt

doc/developers/planned-performance-changes.txt

doc/developers/profiling.txt

doc/developers/revert.txt

doc/developers/scratch.txt

doc/developers/status.txt

doc/developers/uncommit.txt

doc/http_smart_server.txt

doc/shared_repository_layouts.txt

man1

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

files renamed:
doc/developers/HACKING => HACKING

bzrlib/deprecated_graph.py => bzrlib/graph.py

bzrlib/tests/test_commands.py => bzrlib/tests/test_command.py

bzrlib/tests/test_deprecated_graph.py => bzrlib/tests/test_graph.py

bzrlib/transport/remote.py => bzrlib/transport/smart.py

bzrlib/win32utils.py => bzrlib/win32console.py

files modified:
.bzrignore

BRANCH.TODO

INSTALL

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/cmd_version_info.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/help_topics.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/info.py

bzrlib/inter.py

bzrlib/inventory.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/log.py

bzrlib/lsprof.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patches.py

bzrlib/plugin.py

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/repository.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/trace.py

bzrlib/transform.py

bzrlib/transport/__init__.py

bzrlib/transport/decorator.py

bzrlib/transport/ftp.py

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/response.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/transport/ssh.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/version.py

bzrlib/version_info_formats/__init__.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/workingtree.py

bzrlib/xml5.py

bzrlib/xml6.py

contrib/bash/bzr.simple

doc/centralized_workflow.txt

doc/configuration.txt

doc/default.css

doc/index.txt

doc/plugins.txt

doc/server.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

doc/version_info.txt

setup.py *

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/start_bzr.bat

Show diffs side-by-side

added added

removed removed

bzrlib/urlutils.py

117

join('http://foo', 'bar') => 'http://foo/bar'

118

join('http://foo', 'bar', '../baz') => 'http://foo/baz'

119

"""

120

if not args:

121

return base

122

match = _url_scheme_re.match(base)

120

m = _url_scheme_re.match(base)

123

121

scheme = None

124

if match:

125

scheme = match.group('scheme')

126

path = match.group('path').split('/')

122

if m:

123

scheme = m.group('scheme')

124

path = m.group('path').split('/')

127

125

if path[-1:] == ['']:

128

126

# Strip off a trailing slash

129

127

# This helps both when we are at the root, and when

132

130

else:

133

131

path = base.split('/')

134

132

135

if scheme is not None and len(path) >= 1:

136

host = path[:1]

137

# the path should be represented as an abs path.

138

# we know this must be absolute because of the presence of a URL scheme.

139

remove_root = True

140

path = [''] + path[1:]

141

else:

142

# create an empty host, but dont alter the path - this might be a

143

# relative url fragment.

144

host = []

145

remove_root = False

146

147

133

for arg in args:

148

match = _url_scheme_re.match(arg)

149

if match:

134

m = _url_scheme_re.match(arg)

135

if m:

150

136

# Absolute URL

151

scheme = match.group('scheme')

137

scheme = m.group('scheme')

152

138

# this skips .. normalisation, making http://host/../../..

153

139

# be rather strange.

154

path = match.group('path').split('/')

155

# set the host and path according to new absolute URL, discarding

156

# any previous values.

157

# XXX: duplicates mess from earlier in this function. This URL

158

# manipulation code needs some cleaning up.

159

if scheme is not None and len(path) >= 1:

160

host = path[:1]

161

path = path[1:]

162

# url scheme implies absolute path.

163

path = [''] + path

164

else:

165

# no url scheme we take the path as is.

166

host = []

140

path = m.group('path').split('/')

167

141

else:

168

path = '/'.join(path)

169

path = joinpath(path, arg)

170

path = path.split('/')

171

if remove_root and path[0:1] == ['']:

172

del path[0]

173

if host:

174

# Remove the leading slash from the path, so long as it isn't also the

175

# trailing slash, which we want to keep if present.

176

if path and path[0] == '' and len(path) > 1:

177

del path[0]

178

path = host + path

142

for chunk in arg.split('/'):

143

if chunk == '.':

144

continue

145

elif chunk == '..':

146

if len(path) >= 2:

147

# Don't pop off the host portion

148

path.pop()

149

else:

150

raise errors.InvalidURLJoin('Cannot go above root',

151

base, args)

152

else:

153

path.append(chunk)

179

154

180

155

if scheme is None:

181

156

return '/'.join(path)

182

157

return scheme + '://' + '/'.join(path)

183

158

184

159

185

def joinpath(base, *args):
    """Join URL path segments to a URL path segment.

    This is somewhat like osutils.joinpath, but intended for URLs.

    XXX: this duplicates some normalisation logic, and also duplicates a lot of
    path handling logic that already exists in some Transport implementations.
    We really should try to have exactly one place in the code base responsible
    for combining paths of URLs.

    :param base: The starting path. It is split on '/', and a single
        trailing slash is dropped before anything is joined to it.
    :param args: Further path segments, applied left to right. A segment
        starting with '/' discards everything accumulated so far; '.'
        chunks are skipped and '..' chunks remove the last chunk.
    :return: The joined path, or '/' when only the root remains.
    :raises errors.InvalidURLJoin: if a '..' chunk would climb above the
        root, or past the start of a relative path.
    """
    path = base.split('/')
    if len(path) > 1 and path[-1] == '':
        # If the path ends in a trailing /, remove it.
        path.pop()
    for arg in args:
        if arg.startswith('/'):
            # An absolute segment replaces whatever was built so far; the
            # leading '' chunk produced by the split below restores the root.
            path = []
        for chunk in arg.split('/'):
            if chunk == '.':
                continue
            elif chunk == '..':
                # [''] is the root; [] means a relative path has already
                # been consumed entirely. Popping in the latter case used
                # to escape as a bare IndexError.
                if not path or path == ['']:
                    raise errors.InvalidURLJoin('Cannot go above root',
                                                base, args)
                path.pop()
            else:
                path.append(chunk)
    if path == ['']:
        return '/'
    else:
        return '/'.join(path)

216

217

218

160

# jam 20060502 Sorted to 'l' because the final target is 'local_path_from_url'

219

161

def _posix_local_path_from_url(url):

220

162

"""Convert a url like file:///path/to/foo into /path/to/foo"""

237

179

238

180

def _win32_local_path_from_url(url):

239

181

"""Convert a url like file:///C:/path/to/foo into C:/path/to/foo"""

240

if not url.startswith('file://'):

241

raise errors.InvalidURL(url, 'local urls must start with file:///, '

242

'UNC path urls must start with file://')

182

if not url.startswith('file:///'):

183

raise errors.InvalidURL(url, 'local urls must start with file:///')

243

184

# We strip off all 3 slashes

244

win32_url = url[len('file:'):]

245

# check for UNC path: //HOST/path

246

if not win32_url.startswith('///'):

247

if (win32_url[2] == '/'

248

or win32_url[3] in '|:'):

249

raise errors.InvalidURL(url, 'Win32 UNC path urls'

250

' have form file://HOST/path')

251

return unescape(win32_url)

252

# usual local path with drive letter

253

if (win32_url[3] not in ('abcdefghijklmnopqrstuvwxyz'

185

win32_url = url[len('file:///'):]

186

if (win32_url[0] not in ('abcdefghijklmnopqrstuvwxyz'

254

187

'ABCDEFGHIJKLMNOPQRSTUVWXYZ')

255

or win32_url[4] not in '|:'

256

or win32_url[5] != '/'):

188

or win32_url[1] not in '|:'

189

or win32_url[2] != '/'):

257

190

raise errors.InvalidURL(url, 'Win32 file urls start with'

258

191

' file:///x:/, where x is a valid drive letter')

259

return win32_url[3].upper() + u':' + unescape(win32_url[5:])

192

return win32_url[0].upper() + u':' + unescape(win32_url[2:])

260

193

261

194

262

195

def _win32_local_path_to_url(path):

270

203

# which actually strips trailing space characters.

271

204

# The worst part is that under linux ntpath.abspath has different

272

205

# semantics, since 'nt' is not an available module.

273

win32_path = osutils._win32_abspath(path)

274

# check for UNC path \\HOST\path

275

if win32_path.startswith('//'):

276

return 'file:' + escape(win32_path)

206

win32_path = osutils._nt_normpath(

207

osutils._win32_abspath(path)).replace('\\', '/')

277

208

return 'file:///' + win32_path[0].upper() + ':' + escape(win32_path[2:])

278

209

279

210

290

221

291

222

292

223

_url_scheme_re = re.compile(r'^(?P<scheme>[^:/]{2,})://(?P<path>.*)$')

293

_url_hex_escapes_re = re.compile(r'(%[0-9a-fA-F]{2})')

294

295

296

def _unescape_safe_chars(matchobj):
    """re.sub callback that decodes a hex-escape when that is safe.

    The matched text is a '%XX' escape. If the character it encodes is in
    _url_dont_escape_characters the plain character is returned (e.g. '%7E'
    becomes '~'); otherwise the escape is kept, with its hex digits
    upper-cased.
    """
    escaped = matchobj.group(0)
    # Drop the leading '%' and interpret the remainder as a base-16 code.
    decoded = chr(int(escaped[1:], 16))
    if decoded not in _url_dont_escape_characters:
        return escaped.upper()
    return decoded

307

224

308

225

309

226

def normalize_url(url):

310

227

"""Make sure that a path string is in fully normalized URL form.

311

228

312

This handles URLs which have unicode characters, spaces,

229

This handles URLs which have unicode characters, spaces,

313

230

special characters, etc.

314

231

315

232

It has two basic modes of operation, depending on whether the

328

245

m = _url_scheme_re.match(url)

329

246

if not m:

330

247

return local_path_to_url(url)

331

scheme = m.group('scheme')

332

path = m.group('path')

333

248

if not isinstance(url, unicode):

334

249

for c in url:

335

250

if c not in _url_safe_characters:

336

251

raise errors.InvalidURL(url, 'URLs can only contain specific'

337

252

' safe characters (not %r)' % c)

338

path = _url_hex_escapes_re.sub(_unescape_safe_chars, path)

339

return str(scheme + '://' + ''.join(path))

340

253

return url

341

254

# We have a unicode (hybrid) url

342

path_chars = list(path)

255

scheme = m.group('scheme')

256

path = list(m.group('path'))

343

257

344

for i in xrange(len(path_chars)):

345

if path_chars[i] not in _url_safe_characters:

346

chars = path_chars[i].encode('utf-8')

347

path_chars[i] = ''.join(

348

['%%%02X' % ord(c) for c in path_chars[i].encode('utf-8')])

349

path = ''.join(path_chars)

350

path = _url_hex_escapes_re.sub(_unescape_safe_chars, path)

351

return str(scheme + '://' + path)

258

for i in xrange(len(path)):

259

if path[i] not in _url_safe_characters:

260

chars = path[i].encode('utf-8')

261

path[i] = ''.join(['%%%02X' % ord(c) for c in path[i].encode('utf-8')])

262

return scheme + '://' + ''.join(path)

352

263

353

264

354

265

def relative_url(base, other):

482

393

if not url.endswith('/'):

483

394

# Nothing to do

484

395

return url

485

if sys.platform == 'win32' and url.startswith('file://'):

396

if sys.platform == 'win32' and url.startswith('file:///'):

486

397

return _win32_strip_local_trailing_slash(url)

487

398

488

399

scheme_loc, first_path_slash = _find_scheme_and_separator(url)

534

445

#These entries get mapped to themselves

535

446

_hex_display_map.update((hex,'%'+hex) for hex in _no_decode_hex)

536

447

537

# These characters shouldn't be percent-encoded, and it's always safe to

538

# unencode them if they are.

539

_url_dont_escape_characters = set(

540

"abcdefghijklmnopqrstuvwxyz" # Lowercase alpha

541

"ABCDEFGHIJKLMNOPQRSTUVWXYZ" # Uppercase alpha

542

"0123456789" # Numbers

543

"-._~" # Unreserved characters

544

)

545

546

448

# These characters should not be escaped

547

_url_safe_characters = set(

548

"abcdefghijklmnopqrstuvwxyz" # Lowercase alpha

549

"ABCDEFGHIJKLMNOPQRSTUVWXYZ" # Uppercase alpha

550

"0123456789" # Numbers

551

"_.-!~*'()" # Unreserved characters

552

"/;?:@&=+$," # Reserved characters

553

"%#" # Extra reserved characters

554

)

449

_url_safe_characters = set('abcdefghijklmnopqrstuvwxyz'

450

'ABCDEFGHIJKLMNOPQRSTUVWXYZ'

451

'0123456789' '_.-/'

452

';?:@&=+$,%#')

453

555

454

556

455

def unescape_for_display(url, encoding):

557

456

"""Decode what you can for a URL, so that we get a nice looking path.

608

507

# Otherwise take the url decoded one

609

508

res[i] = decoded

610

509

return u'/'.join(res)

611

612

613

def derive_to_location(from_location):
    """Work out a TO_LOCATION name from a FROM_LOCATION.

    Usually the result is the last path component, so http://foo/bar
    gives bar. Some locations contain no '/' or os.sep at all; for those
    the text after the first ':' is used, which covers scheme-style names
    (lp:foo-bar => foo-bar) and a Windows drive given without a path
    (c:foo-bar => foo-bar). When there is no separator and no ':' past
    the first character, from_location is returned unchanged.
    """
    has_separator = "/" in from_location or os.sep in from_location
    if has_separator:
        # Trailing slashes of either flavour are dropped first so that
        # basename sees the final component rather than an empty string.
        return os.path.basename(from_location.rstrip("/\\"))
    colon = from_location.find(":")
    if colon <= 0:
        # No ':' at all, or one in the very first position.
        return from_location
    return from_location[colon + 1:]

Older »