~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/urlutils.py

Committer: Martin Pool
Date: 2005-11-22 04:30:14 UTC
mto: (1508.1.15) (1185.74.1 bzr.dev (Main development branch)) (1505.1.19 bzr-bound-branch) (1526.1.3 run_tests_twice_for_i18n) (1540.1.3 bzr.dev (Main development branch)) (1685.1.1 bzr-encoding) (1534.1.1 integration) (1553.5.1 bzr.dev (Main development branch)) (1608.2.1 bzr.mbp.escape-stores)
mto: This revision was merged to the branch mainline in revision 1510.
Revision ID: mbp@sourcefrog.net-20051122043014-6df209fd93033b59

Exclude more files from dumb-rsync upload

files added:
NEWS.developers

build-api

bzrlib/clone.py

bzrlib/merge_core.py

bzrlib/selftest/testreweave.py

bzrlib/util/configobj/validate.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/split-join-files.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/performance.txt

notes/revfile.txt

notes/schemas.xml

patches

files removed:
BRANCH.TODO

COPYING.txt

bzr.ico

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/breakin.py

bzrlib/bugtracker.py

bzrlib/bundle

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/cmd_version_info.py

bzrlib/counted_lock.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/help_topics.py

bzrlib/hooks.py

bzrlib/ignores.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lsprof.py

bzrlib/memorytree.py

bzrlib/merge_directive.py

bzrlib/mutabletree.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/reconcile.py

bzrlib/registry.py

bzrlib/remote.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/sign_my_commits.py

bzrlib/smart

bzrlib/smart/__init__.py

bzrlib/smart/branch.py

bzrlib/smart/bzrdir.py

bzrlib/smart/client.py

bzrlib/smart/medium.py

bzrlib/smart/protocol.py

bzrlib/smart/repository.py

bzrlib/smart/request.py

bzrlib/smart/server.py

bzrlib/smart/vfs.py

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/versioned

bzrlib/strace.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HttpServer.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_breakin.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_cat_revision.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_create_checkout.py

bzrlib/tests/branch_implementations/test_get_revision_id_to_revno_map.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_revision_history.py

bzrlib/tests/branch_implementations/test_revision_id_to_revno.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/per_lock/test_temporary_write_lock.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bugtracker.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_counted_lock.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_help.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_lsprof.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_remote.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_smart.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_strace.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_file_mtime.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_remove.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/transform.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/http

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/readonly.py

bzrlib/transport/remote.py

bzrlib/transport/ssh.py

bzrlib/treebuilder.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/urlutils.py

bzrlib/util/bencode.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave_commands.py

bzrlib/workingtree_4.py

bzrlib/xml6.py

bzrlib/xml7.py

doc/README.1st

doc/bazaar-vcs.org.kid

doc/centralized_workflow.txt

doc/configuration.txt

doc/default.css

doc/developers

doc/developers/incremental-push-pull.txt

doc/developers/index.txt

doc/developers/performance-roadmap-rationale.txt

doc/developers/performance-roadmap.txt

doc/developers/performance-use-case-analysis.txt

doc/developers/profiling.txt

doc/http_smart_server.txt

doc/index.txt

doc/plugins.txt

doc/server.txt

doc/setting_up_email.txt

doc/shared_repository_layouts.txt

doc/specifying_revisions.txt

doc/using_aliases.txt

doc/version_info.txt

generate_docs.py

man1

profile_imports.py

tools/__init__.py

tools/biobench.py

tools/bzr_epydoc

tools/bzr_epydoc_uid.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_rstx.py

tools/riodemo.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/start_bzr.bat

files renamed:
doc/developers/HACKING => HACKING

tools/doc_generate/autodoc_man.py => bzr_man.py

bzrlib/bundle/__init__.py => bzrlib/changeset.py

bzrlib/tests/ => bzrlib/selftest/

bzrlib/tests/blackbox/test_too_much.py => bzrlib/selftest/blackbox.py

bzrlib/tests/test_commands.py => bzrlib/selftest/test_command.py

bzrlib/tests/branch_implementations/test_parent.py => bzrlib/selftest/test_parent.py

bzrlib/tests/blackbox/test_revision_info.py => bzrlib/selftest/test_revision_info.py

bzrlib/tests/blackbox/test_annotate.py => bzrlib/selftest/testannotate.py

bzrlib/tests/test_api.py => bzrlib/selftest/testapi.py

bzrlib/tests/branch_implementations/test_branch.py => bzrlib/selftest/testbranch.py

bzrlib/tests/test_config.py => bzrlib/selftest/testconfig.py

bzrlib/tests/test_diff.py => bzrlib/selftest/testdiff.py

bzrlib/tests/test_fetch.py => bzrlib/selftest/testfetch.py

bzrlib/tests/test_gpg.py => bzrlib/selftest/testgpg.py

bzrlib/tests/test_graph.py => bzrlib/selftest/testgraph.py

bzrlib/tests/test_hashcache.py => bzrlib/selftest/testhashcache.py

bzrlib/tests/test_http.py => bzrlib/selftest/testhttp.py

bzrlib/tests/test_identitymap.py => bzrlib/selftest/testidentitymap.py

bzrlib/tests/test_inv.py => bzrlib/selftest/testinv.py

bzrlib/tests/test_log.py => bzrlib/selftest/testlog.py

bzrlib/tests/test_merge.py => bzrlib/selftest/testmerge.py

bzrlib/tests/test_merge3.py => bzrlib/selftest/testmerge3.py

bzrlib/tests/test_nonascii.py => bzrlib/selftest/testnonascii.py

bzrlib/tests/test_options.py => bzrlib/selftest/testoptions.py

bzrlib/tests/test_plugins.py => bzrlib/selftest/testplugins.py

bzrlib/tests/test_revision.py => bzrlib/selftest/testrevision.py

bzrlib/tests/test_revisionnamespaces.py => bzrlib/selftest/testrevisionnamespaces.py

bzrlib/tests/repository_implementations/test_revision.py => bzrlib/selftest/testrevprops.py

bzrlib/tests/test_sampler.py => bzrlib/selftest/testsampler.py

bzrlib/tests/test_sftp_transport.py => bzrlib/selftest/testsftp.py

bzrlib/tests/blackbox/test_status.py => bzrlib/selftest/teststatus.py

bzrlib/tests/test_store.py => bzrlib/selftest/teststore.py

bzrlib/tests/test_testament.py => bzrlib/selftest/testtestament.py

bzrlib/tests/test_trace.py => bzrlib/selftest/testtrace.py

bzrlib/tests/test_transactions.py => bzrlib/selftest/testtransactions.py

bzrlib/tests/test_transport.py => bzrlib/selftest/testtransport.py

bzrlib/tests/test_tsort.py => bzrlib/selftest/testtsort.py

bzrlib/tests/test_workingtree.py => bzrlib/selftest/testworkingtree.py

bzrlib/tests/blackbox/test_versioning.py => bzrlib/selftest/versioning.py

bzrlib/tests/test_whitebox.py => bzrlib/selftest/whitebox.py

bzrlib/store/versioned/__init__.py => bzrlib/store/weave.py

bzrlib/transport/http/__init__.py => bzrlib/transport/http.py

bzrlib/ui/__init__.py => bzrlib/ui.py

bzrlib/win32utils.py => bzrlib/win32console.py

bzrlib/xml_serializer.py => bzrlib/xml.py

doc/tutorial.txt => tutorial.txt

files modified:
.bzrignore

INSTALL

Makefile

NEWS

README

TODO

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/identitymap.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/option.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/selftest/HTTPTestUtil.py

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/stub_sftp.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_bad_files.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_commit_merge.py

bzrlib/selftest/test_conflicts.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_upgrade.py

bzrlib/selftest/test_weave.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/treeshape.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/testament.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/transactions.py

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/tree.py

bzrlib/tsort.py

bzrlib/upgrade.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/elementtree/ElementTree.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/newinventory.py

contrib/pwk

setup.py

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/weavebench.py

Show diffs side-by-side

added added

removed removed

bzrlib/urlutils.py

# Bazaar -- distributed version control

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""A collection of functions for handling URL operations."""

import os

import re

import sys

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

from posixpath import split as _posix_split, normpath as _posix_normpath

import urllib

from bzrlib import (

errors,

osutils,

)

""")

def basename(url, exclude_trailing_slash=True):
    """Return the final component of a URL.

    :param url: The URL to take apart.
    :param exclude_trailing_slash: When true, a URL that looks like
        "path/to/foo/" has its final slash ignored, so 'foo' is returned
        rather than ''.
    :return: The second element of ``split(url, ...)``, i.e. only the last
        component of the URL.  This can be '' when trailing slashes are
        not excluded, or when the URL is already at its root.
    """
    pieces = split(url, exclude_trailing_slash=exclude_trailing_slash)
    return pieces[1]

def dirname(url, exclude_trailing_slash=True):
    """Return the parent portion of a URL.

    :param url: Relative or absolute URL.
    :param exclude_trailing_slash: Drop a final slash before splitting
        (http://host/foo/ is treated as http://host/foo, while
        http://host/ stays http://host/).
    :return: The first element of ``split(url, ...)``, i.e. everything in
        the URL except the last path chunk.
    """
    # TODO: jam 20060502 This was named dirname to be consistent
    #       with the os functions, but maybe "parent" would be better
    pieces = split(url, exclude_trailing_slash=exclude_trailing_slash)
    return pieces[0]

def escape(relpath):
    """Percent-quote ``relpath`` so it can be used as part of a URL.

    :param relpath: The path to quote.  Unicode input is first encoded
        as UTF-8; any other input is handed to ``urllib.quote`` unchanged.
    :return: The quoted path as a plain ``str``.
    """
    raw = relpath
    if isinstance(raw, unicode):
        raw = raw.encode('utf-8')
    quoted = urllib.quote(raw)
    # Once encoded and quoted the result should be pure ASCII;
    # passing it through str() simply enforces that.
    return str(quoted)

def file_relpath(base, path):
    """Compute the escaped path of ``path`` relative to ``base``.

    Both arguments are assumed to already be fully specified file:// URLs.

    :param base: The file:// URL to measure from.  It must be at least
        MIN_ABS_FILEURL_LENGTH characters long.
    :param path: The file:// URL to express relative to ``base``.
    :return: ``osutils.relpath`` of the two local paths, passed through
        ``escape``.
    """
    # NOTE(review): this check is an assert, so it disappears when Python
    # runs with -O; kept as-is so the exception type stays unchanged.
    assert len(base) >= MIN_ABS_FILEURL_LENGTH, ('Length of base must be equal or'
        ' exceed the platform minimum url length (which is %d)' %
        MIN_ABS_FILEURL_LENGTH)

    local_base = local_path_from_url(base)
    local_target = local_path_from_url(path)
    relative = osutils.relpath(local_base, local_target)
    return escape(relative)

def _find_scheme_and_separator(url):
    """Locate the scheme separator (://) and the first path separator.

    This is only a helper function for the other path utilities.
    It could probably be replaced by urlparse.

    :param url: The URL to inspect.
    :return: A 2-tuple ``(scheme_end, first_slash)``.  ``scheme_end`` is
        the length of the scheme (the index at which '://' starts) and
        ``first_slash`` is the index in ``url`` of the first '/' after the
        '://', or None when there is none.  ``(None, None)`` is returned
        when ``url`` does not match ``_url_scheme_re``.
    """
    found = _url_scheme_re.match(url)
    if found is None:
        return None, None

    scheme_len = len(found.group('scheme'))
    # Position of the first slash after the '://', relative to the path part
    slash_in_path = found.group('path').find('/')
    if slash_in_path == -1:
        return scheme_len, None
    # The 3 accounts for the '://' sitting between the scheme and the path
    return scheme_len, slash_in_path + scheme_len + 3

106

107

108

def join(base, *args):
    """Create a URL by joining sections.

    This will normalize '..', assuming that paths are absolute
    (it assumes no symlinks in either path).

    If any of *args is an absolute URL, it replaces everything that was
    accumulated before it.
    Example:
        join('http://foo', 'http://bar') => 'http://bar'
        join('http://foo', 'bar') => 'http://foo/bar'
        join('http://foo', 'bar', '../baz') => 'http://foo/baz'

    :param base: The URL (or relative URL fragment) to start from.
    :param args: Further sections, applied left to right.
    :return: The joined URL; ``base`` itself when no sections are given.
    """
    if not args:
        return base

    scheme = None
    base_match = _url_scheme_re.match(base)
    if base_match is None:
        segments = base.split('/')
    else:
        scheme = base_match.group('scheme')
        segments = base_match.group('path').split('/')
        if segments[-1:] == ['']:
            # Drop a trailing slash.  This helps both when we are at the
            # root, and when 'base' has an extra slash at the end.
            segments = segments[:-1]

    # Decided once, from 'base' only; absolute URLs met later in args
    # do not change it.
    remove_root = scheme is not None and len(segments) >= 1
    if remove_root:
        # The presence of a URL scheme means the path must be absolute, so
        # peel off the host and represent the rest as an absolute path.
        host = segments[:1]
        segments = [''] + segments[1:]
    else:
        # Empty host, path left untouched - this might be a relative
        # url fragment.
        host = []

    for arg in args:
        arg_match = _url_scheme_re.match(arg)
        if arg_match is None:
            # Relative section: let joinpath resolve it against what we have
            segments = joinpath('/'.join(segments), arg).split('/')
            continue

        # Absolute URL: adopt its scheme, host and path, discarding any
        # previous values.  This skips .. normalisation, making
        # http://host/../../.. be rather strange.
        # XXX: duplicates mess from earlier in this function.  This URL
        # manipulation code needs some cleaning up.
        scheme = arg_match.group('scheme')
        segments = arg_match.group('path').split('/')
        if scheme is not None and len(segments) >= 1:
            host = segments[:1]
            # url scheme implies absolute path.
            segments = [''] + segments[1:]
        else:
            # no url scheme we take the path as is.
            host = []

    if remove_root and segments[:1] == ['']:
        del segments[0]
    if host:
        # Remove the leading slash from the path, so long as it isn't also
        # the trailing slash, which we want to keep if present.
        if len(segments) > 1 and segments[0] == '':
            del segments[0]
        segments = host + segments

    joined = '/'.join(segments)
    if scheme is None:
        return joined
    return scheme + '://' + joined

183

184

185

def joinpath(base, *args):
    """Join URL path segments to a URL path segment.

    This is somewhat like osutils.joinpath, but intended for URLs.

    XXX: this duplicates some normalisation logic, and also duplicates a lot of
    path handling logic that already exists in some Transport implementations.
    We really should try to have exactly one place in the code base responsible
    for combining paths of URLs.

    :param base: The path to start from.  A single trailing '/' is ignored.
    :param args: Further path sections, applied left to right.  A section
        starting with '/' discards everything accumulated so far; '.'
        chunks are skipped and '..' chunks remove the previous chunk.
    :return: The joined path, or '/' when the result is the root.
    :raises errors.InvalidURLJoin: if a '..' chunk would climb above the
        root of an absolute path, or above the start of a relative one.
    """
    path = base.split('/')
    if len(path) > 1 and path[-1] == '':
        # If the path ends in a trailing /, remove it.
        path.pop()
    for arg in args:
        if arg.startswith('/'):
            # Absolute section: start over.  The leading '' chunk produced
            # by the split below re-creates the root marker.
            path = []
        for chunk in arg.split('/'):
            if chunk == '.':
                continue
            elif chunk == '..':
                # [''] is the root of an absolute path; [] is a relative
                # path that has already been consumed completely.  Popping
                # from the latter used to leak a bare IndexError.
                if not path or path == ['']:
                    raise errors.InvalidURLJoin('Cannot go above root',
                                                base, args)
                path.pop()
            else:
                path.append(chunk)
    if path == ['']:
        return '/'
    return '/'.join(path)

216

217

218

# jam 20060502 Sorted to 'l' because the final target is 'local_path_from_url'

219

def _posix_local_path_from_url(url):
    """Convert a url like file:///path/to/foo into /path/to/foo

    :param url: A URL that must start with 'file:///'.
    :return: ``unescape`` applied to the URL with 'file://' removed.
    :raises errors.InvalidURL: if ``url`` does not start with 'file:///'.
    """
    prefix = 'file://'
    if url.startswith(prefix + '/'):
        # Only two of the three slashes are stripped; the third one is the
        # leading slash of the resulting path.
        return unescape(url[len(prefix):])
    raise errors.InvalidURL(url, 'local urls must start with file:///')

225

226

227

def _posix_local_path_to_url(path):
    """Convert a local path like ./foo into a URL like file:///path/to/foo

    The path is made absolute, normalized and then escaped, which also
    takes care of unicode characters.

    :param path: A local path.
    :return: 'file://' followed by the escaped, normalized absolute path.
    """
    # _posix_normpath comes straight from posixpath, which allows this to
    # be tested on non-posix platforms.
    absolute = osutils._posix_abspath(path)
    normalized = _posix_normpath(absolute)
    return 'file://' + escape(normalized)

236

237

238

def _win32_local_path_from_url(url):
    """Convert a url like file:///C:/path/to/foo into C:/path/to/foo

    Two forms are accepted:

    * file:///X:/path  -- a local path with a drive letter ('|' is accepted
      in place of ':'); the drive letter is upper-cased in the result.
    * file://HOST/path -- a UNC path, returned as //HOST/path.

    :param url: The file URL to convert.
    :return: The unescaped local path.
    :raises errors.InvalidURL: if ``url`` does not start with 'file://',
        or is too short or otherwise malformed for either accepted form.
    """
    if not url.startswith('file://'):
        raise errors.InvalidURL(url, 'local urls must start with file:///, '
                                     'UNC path urls must start with file://')
    # Only 'file:' is removed here; the slashes are inspected below.
    win32_url = url[len('file:'):]
    # check for UNC path: //HOST/path
    if not win32_url.startswith('///'):
        # The length guard keeps truncated urls such as 'file://' or
        # 'file://h' from leaking an IndexError out of the index checks.
        if (len(win32_url) < 4
            or win32_url[2] == '/'
            or win32_url[3] in '|:'):
            raise errors.InvalidURL(url, 'Win32 UNC path urls'
                                         ' have form file://HOST/path')
        return unescape(win32_url)
    # usual local path with drive letter; '///X:/' needs at least 6
    # characters, so anything shorter is rejected before indexing.
    if (len(win32_url) < 6
        or win32_url[3] not in ('abcdefghijklmnopqrstuvwxyz'
                                'ABCDEFGHIJKLMNOPQRSTUVWXYZ')
        or win32_url[4] not in '|:'
        or win32_url[5] != '/'):
        raise errors.InvalidURL(url, 'Win32 file urls start with'
                                     ' file:///x:/, where x is a valid drive letter')
    # All three slashes are stripped; the path resumes at the slash that
    # follows the drive separator.
    return win32_url[3].upper() + u':' + unescape(win32_url[5:])

260

261

262

def _win32_local_path_to_url(path):
    """Build a file:// URL from a local win32 path.

    A path like ./foo becomes a URL like file:///C:/path/to/foo, and a
    UNC path //HOST/path becomes file://HOST/path.
    Characters which need it are escaped along the way.

    :param path: A local path; it is made absolute first.
    :return: The file:// URL. A drive letter is upper-cased and is not
        passed through escape().
    """
    # The win32-specific helper is used directly so that this can be
    # tested on non-win32 platforms.
    # FIXME: It turns out that on nt, ntpath.abspath uses nt._getfullpathname
    #       which actually strips trailing space characters.
    #       The worst part is that under linux ntpath.abspath has different
    #       semantics, since 'nt' is not an available module.
    win32_path = osutils._win32_abspath(path)
    if not win32_path.startswith('//'):
        # Ordinary path: 'C:' followed by the rest, which is what gets escaped.
        drive_letter = win32_path[0].upper()
        return 'file:///' + drive_letter + ':' + escape(win32_path[2:])
    # UNC path \\HOST\path: the two leading slashes double as the URL's '//'.
    return 'file:' + escape(win32_path)

278

279

280

# Length of the shortest absolute win32 file URL: it must name a drive.
WIN32_MIN_ABS_FILEURL_LENGTH = len('file:///C:/')

# Bind the public names to the implementation matching this platform.
if sys.platform == 'win32':
    local_path_to_url = _win32_local_path_to_url
    local_path_from_url = _win32_local_path_from_url
    MIN_ABS_FILEURL_LENGTH = WIN32_MIN_ABS_FILEURL_LENGTH
else:
    local_path_to_url = _posix_local_path_to_url
    local_path_from_url = _posix_local_path_from_url
    MIN_ABS_FILEURL_LENGTH = len('file:///')


# Splits 'scheme://path'. The scheme has to be at least two characters long
# (presumably so that a win32 drive letter is not taken for a scheme).
_url_scheme_re = re.compile(r'^(?P<scheme>[^:/]{2,})://(?P<path>.*)$')
# Matches a single percent-escape such as '%7E' or '%7e'.
_url_hex_escapes_re = re.compile(r'(%[0-9a-fA-F]{2})')

294

295

296

def _unescape_safe_chars(matchobj):
    """re.sub callback which un-escapes hex-escapes of safe characters.

    e.g. '%7E' will be converted to '~', while an escape for a character
    outside _url_dont_escape_characters is kept, with its hex digits
    upper-cased.

    :param matchobj: A match whose whole text is '%' plus two hex digits.
    :return: The plain character, or the upper-cased escape sequence.
    """
    escape_sequence = matchobj.group(0)
    plain_char = chr(int(escape_sequence[1:], 16))
    if plain_char not in _url_dont_escape_characters:
        return escape_sequence.upper()
    return plain_char

307

308

309

def normalize_url(url):
    """Make sure that a path string is in fully normalized URL form.

    This handles URLs which have unicode characters, spaces,
    special characters, etc.

    It has two basic modes of operation, depending on whether the
    supplied string starts with a url specifier (scheme://) or not.
    If it does not have a specifier it is considered a local path,
    and will be converted into a file:/// url. Non-ascii characters
    will be encoded using utf-8.
    If it does have a url specifier, it will be treated as a "hybrid"
    URL. Basically, a URL that should have URL special characters already
    escaped (like +?&# etc), but may have unicode characters, etc
    which would not be valid in a real URL.

    In both URL modes, hex-escapes of characters which never need escaping
    are decoded, and the remaining hex-escapes are upper-cased.

    :param url: Either a hybrid URL or a local path
    :return: A normalized URL which only includes 7-bit ASCII characters.
    :raises errors.InvalidURL: If url has a scheme, is not a unicode
        string, and contains a character outside _url_safe_characters.
    """
    m = _url_scheme_re.match(url)
    if not m:
        return local_path_to_url(url)
    scheme = m.group('scheme')
    path = m.group('path')
    if not isinstance(url, unicode):
        # A plain string must already be a valid URL: refuse anything that
        # would have needed escaping rather than guess at its encoding.
        for c in url:
            if c not in _url_safe_characters:
                raise errors.InvalidURL(url, 'URLs can only contain specific'
                                    ' safe characters (not %r)' % c)
    else:
        # We have a unicode (hybrid) url: percent-encode the utf-8 bytes of
        # every character of the path that is not safe as-is.
        path_chars = []
        for char in path:
            if char in _url_safe_characters:
                path_chars.append(char)
            else:
                path_chars.append(''.join(
                    ['%%%02X' % ord(c) for c in char.encode('utf-8')]))
        path = ''.join(path_chars)
    path = _url_hex_escapes_re.sub(_unescape_safe_chars, path)
    return str(scheme + '://' + path)

352

353

354

def relative_url(base, other):
    """Return a path to other from base.

    If other is unrelated to base (either one has no path separator, or
    the parts before the separator differ), other is returned unchanged.
    Otherwise the result is a relative path, or '.' when both name the
    same location.
    This assumes no symlinks as part of the url.

    :param base: The URL to start from.
    :param other: The URL to reach.
    :return: other, or a '/'-joined relative path from base to other.
    """
    _unused, base_slash = _find_scheme_and_separator(base)
    if base_slash is None:
        return other

    _unused, other_slash = _find_scheme_and_separator(other)
    if other_slash is None:
        return other

    # Everything before the first path slash has to agree; this takes care
    # of differing schemes or hosts.
    if base[:base_slash] != other[:other_slash]:
        return other

    base_path = base[base_slash + 1:]
    if base_path.endswith('/'):
        base_path = base_path[:-1]
    other_path = other[other_slash + 1:]

    # Splitting an empty path would give [''], i.e. one bogus empty section.
    if base_path:
        base_sections = base_path.split('/')
    else:
        base_sections = []
    if other_path:
        other_sections = other_path.split('/')
    else:
        other_sections = []

    # Count how many leading sections the two paths share.
    match_len = 0
    for base_part, other_part in zip(base_sections, other_sections):
        if base_part != other_part:
            break
        match_len += 1

    # Climb out of what is left of base, then descend into the rest of other.
    relative_sections = ['..'] * (len(base_sections) - match_len)
    relative_sections += other_sections[match_len:]

    return "/".join(relative_sections) or "."

399

400

401

def _win32_extract_drive_letter(url_base, path):
    """On win32 the drive letter needs to be added to the url base.

    :param url_base: The URL up to, but excluding, the path: e.g. 'file://'
    :param path: The path part of the URL, which has to look like '/C:/foo'
        (the drive may be followed by '|' instead of ':').
    :return: (url_base, path) with the leading '/C:' moved from the path
        onto the base, e.g. ('file:///C:', '/foo').
    :raises errors.InvalidURL: If path does not start with a slash, a
        character, ':' or '|', and another slash.
    """
    # Strip off the drive letter
    # path is currently /C:/foo
    # The shortest acceptable path is '/C:/', four characters. The length
    # is checked first so that '/C:' is rejected instead of path[3]
    # raising IndexError.
    if len(path) < 4 or path[2] not in ':|' or path[3] != '/':
        raise errors.InvalidURL(url_base + path,
            'win32 file:/// paths need a drive letter')
    url_base += path[0:3] # file:// + /C:
    path = path[3:] # /foo
    return url_base, path

411

412

413

def split(url, exclude_trailing_slash=True):
    """Split a URL into its parent directory and a child directory.

    :param url: A relative or absolute URL
    :param exclude_trailing_slash: Strip off a final '/' if it is part
        of the path (but not if it is part of the protocol specification)

    :return: (parent_url, child_dir).  child_dir may be the empty string
        if we're at the root.
    """
    scheme_loc, first_path_slash = _find_scheme_and_separator(url)

    if first_path_slash is not None:
        # We have a fully defined path
        url_base = url[:first_path_slash] # http://host, file://
        path = url[first_path_slash:] # /file/foo

        if sys.platform == 'win32' and url.startswith('file:///'):
            # Move the drive letter over to the base:
            # 'file://' + '/C:/foo' becomes 'file:///C:' + '/foo'
            url_base, path = _win32_extract_drive_letter(url_base, path)

        # A path of just '/' is the root, so that slash has to stay.
        if exclude_trailing_slash and len(path) > 1 and path.endswith('/'):
            path = path[:-1]
        parent_path, child = _posix_split(path)
        return url_base + parent_path, child

    if scheme_loc is not None:
        # Scheme with no path
        return url, ''

    # Relative path
    if exclude_trailing_slash and url.endswith('/'):
        url = url[:-1]
    return _posix_split(url)

451

452

453

def _win32_strip_local_trailing_slash(url):
    """Strip slashes after the drive letter

    The last character of url is dropped, unless url is no longer than
    'file:///C:/'. Whether that character is a slash is not checked here.

    :param url: A win32 file:// URL.
    :return: url, possibly without its last character.
    """
    if len(url) <= WIN32_MIN_ABS_FILEURL_LENGTH:
        return url
    return url[:-1]

459

460

461

def strip_trailing_slash(url):
    """Strip trailing slash, except for root paths.

    The definition of 'root path' is platform-dependent.
    This assumes that all URLs are valid netloc urls, such that they
    form:
    scheme://host/path
    The slash which separates the host from the path is never removed.
    Relative paths are handled too.
    Examples:
        path/to/foo       => path/to/foo
        path/to/foo/      => path/to/foo
        http://host/path/ => http://host/path
        http://host/path  => http://host/path
        http://host/      => http://host/
        file:///          => file:///
        file:///foo/      => file:///foo
        # On win32, file:// urls are the only ones treated differently:
        # they are only shortened when longer than 'file:///C:/'.
        file:///C:/       => file:///C:/
        file:///C:/foo/   => file:///C:/foo

    :param url: A relative or absolute URL
    :return: url without its trailing slash, or url itself
    """
    if not url.endswith('/'):
        # Nothing to do
        return url
    if sys.platform == 'win32' and url.startswith('file://'):
        return _win32_strip_local_trailing_slash(url)

    scheme_loc, first_path_slash = _find_scheme_and_separator(url)
    if scheme_loc is not None:
        last_index = len(url) - 1
        if first_path_slash is None or first_path_slash == last_index:
            # The only slash is the one separating the path: keep it
            return url

    # Either a relative path (no scheme), or a path with more in it than
    # the root: chop off the last character
    return url[:-1]

500

501

502

def unescape(url):

503

"""Unescape relpath from url format.

504

505

This returns a Unicode path from a URL

506

"""

507

# jam 20060427 URLs are supposed to be ASCII only strings

508

# If they are passed in as unicode, urllib.unquote

509

# will return a UNICODE string, which actually contains

510

# utf-8 bytes. So we have to ensure that they are

511

# plain ASCII strings, or the final .decode will

512

# try to encode the UNICODE => ASCII, and then decode

513

# it into utf-8.

514

try:

515

url = str(url)

516

except UnicodeError, e:

517

raise errors.InvalidURL(url, 'URL was not a plain ASCII url: %s' % (e,))

518

519

unquoted = urllib.unquote(url)

520

try:

521

unicode_path = unquoted.decode('utf-8')

522

except UnicodeError, e:

523

raise errors.InvalidURL(url, 'Unable to encode the URL as utf-8: %s' % (e,))

524

return unicode_path

525

526

527

# Characters whose hex-escapes have to be left alone when displaying a URL
_no_decode_chars = ';/?:@&=+$,#'
_no_decode_ords = [ord(c) for c in _no_decode_chars]
# Their two-digit hex codes: first all in lower case, then all in upper case
_no_decode_hex = ['%02x' % o for o in _no_decode_ords]
_no_decode_hex.extend(['%02X' % o for o in _no_decode_ords])

# Maps two hex digits (all lower case or all upper case, never mixed) to the
# text which should be displayed for that escape.
_hex_display_map = {}
for _byte in range(256):
    _hex_display_map['%02x' % _byte] = chr(_byte)
    _hex_display_map['%02X' % _byte] = chr(_byte)
# The reserved characters are displayed as the escape they came from
for _hex_pair in _no_decode_hex:
    _hex_display_map[_hex_pair] = '%' + _hex_pair
del _byte, _hex_pair

# These characters shouldn't be percent-encoded, and it's always safe to
# unencode them if they are.
_url_dont_escape_characters = set(
    "abcdefghijklmnopqrstuvwxyz"    # Lowercase alpha
    "ABCDEFGHIJKLMNOPQRSTUVWXYZ"    # Uppercase alpha
    "0123456789"                    # Numbers
    "-._~"                          # Unreserved characters
)

# These characters may appear in a URL as they are
_url_safe_characters = set(
    "abcdefghijklmnopqrstuvwxyz"    # Lowercase alpha
    "ABCDEFGHIJKLMNOPQRSTUVWXYZ"    # Uppercase alpha
    "0123456789"                    # Numbers
    "_.-!~*'()"                     # Unreserved characters
    "/;?:@&=+$,"                    # Reserved characters
    "%#"                            # Extra reserved characters
)

555

556

def unescape_for_display(url, encoding):
    """Decode what you can for a URL, so that we get a nice looking path.

    This will turn file:// urls into local paths, and try to decode
    any portions of a http:// style url that it can.

    Any sections of the URL which can't be represented in the encoding or
    need to stay as escapes are left alone.

    :param url: A 7-bit ASCII URL
    :param encoding: The final output encoding

    :return: A unicode string which can be safely encoded into the
        specified encoding.
    """
    assert encoding is not None, 'you cannot specify None for the display encoding.'
    if url.startswith('file://'):
        try:
            local_path = local_path_from_url(url)
            # Only a check that the path is representable: the encoded
            # form itself is thrown away.
            local_path.encode(encoding)
        except UnicodeError:
            return url
        return local_path

    # Work on one '/'-separated section at a time. The text before the
    # first slash is never touched.
    sections = url.split('/')
    for index in xrange(1, len(sections)):
        pieces = sections[index].split('%')
        # The first piece is the text before any '%'; every other piece
        # starts with the two hex digits of an escape.
        rebuilt = pieces[:1]
        for piece in pieces[1:]:
            hex_pair = piece[:2]
            remainder = piece[2:]
            try:
                rebuilt.append(_hex_display_map[hex_pair] + remainder)
            except KeyError:
                # Not an escape we know of: put back the percent symbol
                rebuilt.append('%' + piece)
            except UnicodeDecodeError:
                rebuilt.append(unichr(int(hex_pair, 16)) + remainder)
        unescaped = ''.join(rebuilt)
        try:
            decoded = unescaped.decode('utf-8')
        except UnicodeDecodeError:
            # If this path segment cannot be properly utf-8 decoded
            # after doing unescaping we will just leave it alone
            continue
        try:
            decoded.encode(encoding)
        except UnicodeEncodeError:
            # If this chunk cannot be encoded in the local
            # encoding, then we should leave it alone
            continue
        # Otherwise take the url decoded one
        sections[index] = decoded
    return u'/'.join(sections)

Older »