~bzr-pqm/bzr/bzr.dev

Committer: John Arbash Meinel
Date: 2007-03-15 22:35:35 UTC
mto: This revision was merged to the branch mainline in revision 2363.
Revision ID: john@arbash-meinel.com-20070315223535-d3d4964oe1hc8zhg

Add an overzealous test for Unicode support of _iter_changes,
for both knowns and unknowns.
And include a basic, if suboptimal, fix.
I would rather defer the decoding until we've determined that we are going to return the tuple.
There is still something broken with added files, but I'll get to that.

files added:
BRANCH.TODO

COPYING.txt

HACKING

INSTALL

Makefile

NEWS.developers

bzr.ico

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/benchmarks

bzrlib/benchmarks/__init__.py

bzrlib/benchmarks/bench_add.py

bzrlib/benchmarks/bench_bench.py

bzrlib/benchmarks/bench_bundle.py

bzrlib/benchmarks/bench_cache_utf8.py

bzrlib/benchmarks/bench_checkout.py

bzrlib/benchmarks/bench_commit.py

bzrlib/benchmarks/bench_info.py

bzrlib/benchmarks/bench_inventory.py

bzrlib/benchmarks/bench_log.py

bzrlib/benchmarks/bench_osutils.py

bzrlib/benchmarks/bench_rocks.py

bzrlib/benchmarks/bench_sftp.py

bzrlib/benchmarks/bench_startup.py

bzrlib/benchmarks/bench_status.py

bzrlib/benchmarks/bench_transform.py

bzrlib/benchmarks/bench_workingtree.py

bzrlib/benchmarks/bench_xml.py

bzrlib/benchmarks/tree_creator

bzrlib/benchmarks/tree_creator/__init__.py

bzrlib/benchmarks/tree_creator/heavily_merged.py

bzrlib/benchmarks/tree_creator/kernel_like.py

bzrlib/benchmarks/tree_creator/many_commit.py

bzrlib/benchmarks/tree_creator/simple_many_commit.py

bzrlib/builtins.py

bzrlib/bundle

bzrlib/bundle/__init__.py

bzrlib/bundle/apply_bundle.py

bzrlib/bundle/bundle_data.py

bzrlib/bundle/commands.py

bzrlib/bundle/common.py

bzrlib/bundle/old

bzrlib/bundle/old/send_changeset.py

bzrlib/bundle/serializer

bzrlib/bundle/serializer/__init__.py

bzrlib/bundle/serializer/v08.py

bzrlib/bundle/serializer/v09.py

bzrlib/bzrdir.py

bzrlib/cache_utf8.py

bzrlib/cmd_version_info.py

bzrlib/commit.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/debug.py

bzrlib/decorators.py

bzrlib/delta.py

bzrlib/dirstate.py

bzrlib/doc

bzrlib/doc/__init__.py

bzrlib/doc/api

bzrlib/doc/api/__init__.py

bzrlib/doc/api/branch.txt

bzrlib/doc/api/transport.txt

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/generate_ids.py

bzrlib/globbing.py

bzrlib/gpg.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help_topics.py

bzrlib/identitymap.py

bzrlib/ignores.py

bzrlib/inspect_for_copy.py

bzrlib/inter.py

bzrlib/intset.py

bzrlib/iterablefile.py

bzrlib/knit.py

bzrlib/lazy_import.py

bzrlib/lazy_regex.py

bzrlib/lock.py

bzrlib/lockable_files.py

bzrlib/lockdir.py

bzrlib/lsprof.py

bzrlib/memorytree.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_directive.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/mutabletree.py

bzrlib/option.py

bzrlib/patch.py

bzrlib/patches.py

bzrlib/patiencediff.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/launchpad

bzrlib/plugins/launchpad/__init__.py

bzrlib/plugins/launchpad/lp_indirect.py

bzrlib/plugins/launchpad/lp_registration.py

bzrlib/plugins/launchpad/test_lp_indirect.py

bzrlib/plugins/launchpad/test_register.py

bzrlib/progress.py

bzrlib/reconcile.py

bzrlib/registry.py

bzrlib/repofmt

bzrlib/repofmt/__init__.py

bzrlib/repofmt/knitrepo.py

bzrlib/repofmt/weaverepo.py

bzrlib/repository.py

bzrlib/revisionspec.py

bzrlib/revisiontree.py

bzrlib/rio.py

bzrlib/shellcomplete.py

bzrlib/sign_my_commits.py

bzrlib/store

bzrlib/store/revision

bzrlib/store/revision/__init__.py

bzrlib/store/revision/knit.py

bzrlib/store/revision/text.py

bzrlib/store/text.py

bzrlib/store/versioned

bzrlib/store/versioned/__init__.py

bzrlib/symbol_versioning.py

bzrlib/tag.py

bzrlib/testament.py

bzrlib/tests

bzrlib/tests/EncodingAdapter.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/HttpServer.py

bzrlib/tests/TestUtil.py

bzrlib/tests/__init__.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_add.py

bzrlib/tests/blackbox/test_added.py

bzrlib/tests/blackbox/test_aliases.py

bzrlib/tests/blackbox/test_ancestry.py

bzrlib/tests/blackbox/test_annotate.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_branch.py

bzrlib/tests/blackbox/test_break_lock.py

bzrlib/tests/blackbox/test_bundle.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_checkout.py

bzrlib/tests/blackbox/test_command_encoding.py

bzrlib/tests/blackbox/test_commit.py

bzrlib/tests/blackbox/test_conflicts.py

bzrlib/tests/blackbox/test_debug.py

bzrlib/tests/blackbox/test_diff.py

bzrlib/tests/blackbox/test_exceptions.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_find_merge_base.py

bzrlib/tests/blackbox/test_help.py

bzrlib/tests/blackbox/test_ignore.py

bzrlib/tests/blackbox/test_ignored.py

bzrlib/tests/blackbox/test_info.py

bzrlib/tests/blackbox/test_init.py

bzrlib/tests/blackbox/test_inventory.py

bzrlib/tests/blackbox/test_join.py

bzrlib/tests/blackbox/test_locale.py

bzrlib/tests/blackbox/test_log.py

bzrlib/tests/blackbox/test_logformats.py

bzrlib/tests/blackbox/test_ls.py

bzrlib/tests/blackbox/test_merge.py

bzrlib/tests/blackbox/test_merge_directive.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_mv.py

bzrlib/tests/blackbox/test_nick.py

bzrlib/tests/blackbox/test_non_ascii.py

bzrlib/tests/blackbox/test_outside_wt.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_push.py

bzrlib/tests/blackbox/test_re_sign.py

bzrlib/tests/blackbox/test_reconcile.py

bzrlib/tests/blackbox/test_remerge.py

bzrlib/tests/blackbox/test_remove.py

bzrlib/tests/blackbox/test_remove_tree.py

bzrlib/tests/blackbox/test_revert.py

bzrlib/tests/blackbox/test_revision_history.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_selftest.py

bzrlib/tests/blackbox/test_serve.py

bzrlib/tests/blackbox/test_shared_repository.py

bzrlib/tests/blackbox/test_sign_my_commits.py

bzrlib/tests/blackbox/test_split.py

bzrlib/tests/blackbox/test_status.py

bzrlib/tests/blackbox/test_tags.py

bzrlib/tests/blackbox/test_testament.py

bzrlib/tests/blackbox/test_too_much.py

bzrlib/tests/blackbox/test_uncommit.py

bzrlib/tests/blackbox/test_update.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/blackbox/test_version.py

bzrlib/tests/blackbox/test_version_info.py

bzrlib/tests/blackbox/test_versioning.py

bzrlib/tests/blackbox/test_whoami.py

bzrlib/tests/branch_implementations

bzrlib/tests/branch_implementations/__init__.py

bzrlib/tests/branch_implementations/test_bound_sftp.py

bzrlib/tests/branch_implementations/test_branch.py

bzrlib/tests/branch_implementations/test_break_lock.py

bzrlib/tests/branch_implementations/test_commit.py

bzrlib/tests/branch_implementations/test_hooks.py

bzrlib/tests/branch_implementations/test_http.py

bzrlib/tests/branch_implementations/test_last_revision_info.py

bzrlib/tests/branch_implementations/test_locking.py

bzrlib/tests/branch_implementations/test_parent.py

bzrlib/tests/branch_implementations/test_permissions.py

bzrlib/tests/branch_implementations/test_pull.py

bzrlib/tests/branch_implementations/test_push.py

bzrlib/tests/branch_implementations/test_tags.py

bzrlib/tests/branch_implementations/test_uncommit.py

bzrlib/tests/branch_implementations/test_update.py

bzrlib/tests/bzrdir_implementations

bzrlib/tests/bzrdir_implementations/__init__.py

bzrlib/tests/bzrdir_implementations/test_bzrdir.py

bzrlib/tests/interrepository_implementations

bzrlib/tests/interrepository_implementations/__init__.py

bzrlib/tests/interrepository_implementations/test_interrepository.py

bzrlib/tests/intertree_implementations

bzrlib/tests/intertree_implementations/__init__.py

bzrlib/tests/intertree_implementations/test_compare.py

bzrlib/tests/interversionedfile_implementations

bzrlib/tests/interversionedfile_implementations/__init__.py

bzrlib/tests/interversionedfile_implementations/test_join.py

bzrlib/tests/lock_helpers.py

bzrlib/tests/per_lock

bzrlib/tests/per_lock/__init__.py

bzrlib/tests/per_lock/test_lock.py

bzrlib/tests/repository_implementations

bzrlib/tests/repository_implementations/__init__.py

bzrlib/tests/repository_implementations/test_break_lock.py

bzrlib/tests/repository_implementations/test_commit_builder.py

bzrlib/tests/repository_implementations/test_fileid_involved.py

bzrlib/tests/repository_implementations/test_iter_reverse_revision_history.py

bzrlib/tests/repository_implementations/test_reconcile.py

bzrlib/tests/repository_implementations/test_repository.py

bzrlib/tests/repository_implementations/test_revision.py

bzrlib/tests/repository_implementations/test_statistics.py

bzrlib/tests/revisionstore_implementations

bzrlib/tests/revisionstore_implementations/__init__.py

bzrlib/tests/revisionstore_implementations/test_all.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_atomicfile.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_bundle.py

bzrlib/tests/test_bzrdir.py

bzrlib/tests/test_cache_utf8.py

bzrlib/tests/test_commands.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_decorators.py

bzrlib/tests/test_delta.py

bzrlib/tests/test_diff.py

bzrlib/tests/test_dirstate.py

bzrlib/tests/test_doc_generate.py

bzrlib/tests/test_errors.py

bzrlib/tests/test_escaped_store.py

bzrlib/tests/test_extract.py

bzrlib/tests/test_fetch.py

bzrlib/tests/test_ftp_transport.py

bzrlib/tests/test_generate_docs.py

bzrlib/tests/test_generate_ids.py

bzrlib/tests/test_globbing.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_graph.py

bzrlib/tests/test_hashcache.py

bzrlib/tests/test_http.py

bzrlib/tests/test_http_response.py

bzrlib/tests/test_https_ca_bundle.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_ignores.py

bzrlib/tests/test_inv.py

bzrlib/tests/test_knit.py

bzrlib/tests/test_lazy_import.py

bzrlib/tests/test_lazy_regex.py

bzrlib/tests/test_lockable_files.py

bzrlib/tests/test_lockdir.py

bzrlib/tests/test_log.py

bzrlib/tests/test_memorytree.py

bzrlib/tests/test_merge.py

bzrlib/tests/test_merge3.py

bzrlib/tests/test_merge_core.py

bzrlib/tests/test_merge_directive.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_osutils_encodings.py

bzrlib/tests/test_patch.py

bzrlib/tests/test_patches.py

bzrlib/tests/test_patches_data

bzrlib/tests/test_patches_data/diff

bzrlib/tests/test_patches_data/diff-2

bzrlib/tests/test_patches_data/diff-3

bzrlib/tests/test_patches_data/diff-4

bzrlib/tests/test_patches_data/diff-5

bzrlib/tests/test_patches_data/diff-6

bzrlib/tests/test_patches_data/insert_top.patch

bzrlib/tests/test_patches_data/mod

bzrlib/tests/test_patches_data/mod-2

bzrlib/tests/test_patches_data/mod-3

bzrlib/tests/test_patches_data/mod-4

bzrlib/tests/test_patches_data/mod-5

bzrlib/tests/test_patches_data/mod-6

bzrlib/tests/test_patches_data/orig

bzrlib/tests/test_patches_data/orig-2

bzrlib/tests/test_patches_data/orig-3

bzrlib/tests/test_patches_data/orig-4

bzrlib/tests/test_patches_data/orig-5

bzrlib/tests/test_patches_data/orig-6

bzrlib/tests/test_patches_data/patchtext.patch

bzrlib/tests/test_permissions.py

bzrlib/tests/test_plugins.py

bzrlib/tests/test_progress.py

bzrlib/tests/test_read_bundle.py

bzrlib/tests/test_reconcile.py

bzrlib/tests/test_registry.py

bzrlib/tests/test_repository.py

bzrlib/tests/test_revert.py

bzrlib/tests/test_revision.py

bzrlib/tests/test_revisionnamespaces.py

bzrlib/tests/test_revisiontree.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_smart_add.py

bzrlib/tests/test_smart_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_ssh_transport.py

bzrlib/tests/test_status.py

bzrlib/tests/test_store.py

bzrlib/tests/test_subsume.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_tag.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_textfile.py

bzrlib/tests/test_textmerge.py

bzrlib/tests/test_timestamp.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transform.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tree.py

bzrlib/tests/test_treebuilder.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_tuned_gzip.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_urlutils.py

bzrlib/tests/test_version.py

bzrlib/tests/test_version_info.py

bzrlib/tests/test_versionedfile.py

bzrlib/tests/test_weave.py

bzrlib/tests/test_whitebox.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/test_workingtree_4.py

bzrlib/tests/test_wsgi.py

bzrlib/tests/test_xml.py

bzrlib/tests/tree_implementations

bzrlib/tests/tree_implementations/__init__.py

bzrlib/tests/tree_implementations/test_get_file_mtime.py

bzrlib/tests/tree_implementations/test_get_symlink_target.py

bzrlib/tests/tree_implementations/test_inv.py

bzrlib/tests/tree_implementations/test_list_files.py

bzrlib/tests/tree_implementations/test_revision_tree.py

bzrlib/tests/tree_implementations/test_test_trees.py

bzrlib/tests/tree_implementations/test_tree.py

bzrlib/tests/tree_implementations/test_walkdirs.py

bzrlib/tests/treeshape.py

bzrlib/tests/workingtree_implementations

bzrlib/tests/workingtree_implementations/__init__.py

bzrlib/tests/workingtree_implementations/test_add.py

bzrlib/tests/workingtree_implementations/test_add_reference.py

bzrlib/tests/workingtree_implementations/test_basis_inventory.py

bzrlib/tests/workingtree_implementations/test_basis_tree.py

bzrlib/tests/workingtree_implementations/test_break_lock.py

bzrlib/tests/workingtree_implementations/test_changes_from.py

bzrlib/tests/workingtree_implementations/test_commit.py

bzrlib/tests/workingtree_implementations/test_executable.py

bzrlib/tests/workingtree_implementations/test_flush.py

bzrlib/tests/workingtree_implementations/test_get_parent_ids.py

bzrlib/tests/workingtree_implementations/test_inv.py

bzrlib/tests/workingtree_implementations/test_is_control_filename.py

bzrlib/tests/workingtree_implementations/test_is_ignored.py

bzrlib/tests/workingtree_implementations/test_locking.py

bzrlib/tests/workingtree_implementations/test_merge_from_branch.py

bzrlib/tests/workingtree_implementations/test_mkdir.py

bzrlib/tests/workingtree_implementations/test_move.py

bzrlib/tests/workingtree_implementations/test_nested_specifics.py

bzrlib/tests/workingtree_implementations/test_parents.py

bzrlib/tests/workingtree_implementations/test_paths2ids.py

bzrlib/tests/workingtree_implementations/test_pull.py

bzrlib/tests/workingtree_implementations/test_put_file.py

bzrlib/tests/workingtree_implementations/test_read_working_inventory.py

bzrlib/tests/workingtree_implementations/test_readonly.py

bzrlib/tests/workingtree_implementations/test_rename_one.py

bzrlib/tests/workingtree_implementations/test_revision_tree.py

bzrlib/tests/workingtree_implementations/test_set_root_id.py

bzrlib/tests/workingtree_implementations/test_smart_add.py

bzrlib/tests/workingtree_implementations/test_unversion.py

bzrlib/tests/workingtree_implementations/test_walkdirs.py

bzrlib/tests/workingtree_implementations/test_workingtree.py

bzrlib/textfile.py

bzrlib/textmerge.py

bzrlib/timestamp.py

bzrlib/transactions.py

bzrlib/transform.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/chroot.py

bzrlib/transport/decorator.py

bzrlib/transport/fakenfs.py

bzrlib/transport/fakevfat.py

bzrlib/transport/ftp.py

bzrlib/transport/http

bzrlib/transport/http/__init__.py

bzrlib/transport/http/_pycurl.py

bzrlib/transport/http/_pycurl_errors.py

bzrlib/transport/http/_urllib.py

bzrlib/transport/http/_urllib2_wrappers.py

bzrlib/transport/http/ca_bundle.py

bzrlib/transport/http/response.py

bzrlib/transport/http/wsgi.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/transport/smart.py

bzrlib/transport/ssh.py

bzrlib/treebuilder.py

bzrlib/tsort.py

bzrlib/tuned_gzip.py

bzrlib/ui

bzrlib/ui/__init__.py

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/upgrade.py

bzrlib/urlutils.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/bencode.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/version.py

bzrlib/version_info_formats

bzrlib/version_info_formats/__init__.py

bzrlib/version_info_formats/format_python.py

bzrlib/version_info_formats/format_rio.py

bzrlib/versionedfile.py

bzrlib/weave.py

bzrlib/weave_commands.py

bzrlib/weavefile.py

bzrlib/win32utils.py

bzrlib/workingtree.py

bzrlib/workingtree_4.py

bzrlib/xml4.py

bzrlib/xml5.py

bzrlib/xml6.py

bzrlib/xml7.py

contrib/bash/bzr

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

doc/README.1st

doc/bazaar-vcs.org.kid

doc/centralized_workflow.txt

doc/configuration.txt

doc/default.css

doc/http_smart_server.txt

doc/index.txt

doc/plugins.txt

doc/server.txt

doc/setting_up_email.txt

doc/specifying_revisions.txt

doc/tutorial.txt

doc/using_aliases.txt

doc/version_info.txt

generate_docs.py

profile_imports.py

tools

tools/__init__.py

tools/biobench.py

tools/capture_tree.py

tools/convertfile.py

tools/convertinv.py

tools/doc_generate

tools/doc_generate/__init__.py

tools/doc_generate/autodoc_bash_completion.py

tools/doc_generate/autodoc_man.py

tools/doc_generate/autodoc_rstx.py

tools/history2revfiles.py

tools/http_client.py

tools/riodemo.py

tools/rst2html.py

tools/rst2prettyhtml.py

tools/trace-revisions

tools/weavebench.py

tools/weavemerge.sh

tools/win32

tools/win32/__init__.py

tools/win32/bazaar.url

tools/win32/bzr-win32-bdist-postinstall.py

tools/win32/bzr.iss.cog

tools/win32/bzr_postinstall.py

tools/win32/file_version.py

tools/win32/info.txt

tools/win32/ostools.py

tools/win32/start_bzr.bat

files removed:
bzrlib/cache.py

bzrlib/mdiff.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/tests.py

doc/Makefile

doc/adoption.txt

doc/bitkeeper.txt

doc/changelogs.txt

doc/cherry-picking.txt

doc/cmdref.txt

doc/common-format.txt

doc/compared-aegis.txt

doc/compared-codeville.txt

doc/compared-cvsnt.txt

doc/compared-opencm.txt

doc/compared-prcs.txt

doc/compared-teamware.txt

doc/compression.txt

doc/config-specs.txt

doc/conflicts.txt

doc/costs.txt

doc/darcs.txt

doc/deadly-sins.txt

doc/default.css

doc/design.txt

doc/extra-commands.txt

doc/formats.txt

doc/hashes.txt

doc/ignore.txt

doc/index.txt

doc/interrupted.txt

doc/intro.txt

doc/inventory.txt

doc/join-branches.txt

doc/kill-version.txt

doc/layers.txt

doc/library-interface.txt

doc/merge.txt

doc/mirroring.txt

doc/monotone.txt

doc/news.txt

doc/optional-edit.txt

doc/partial-commit.txt

doc/pool.txt

doc/purpose.txt

doc/python.txt

doc/quilt.txt

doc/quotes.txt

doc/random.txt

doc/requirements.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/revision-syntax.txt

doc/rollup.txt

doc/scalability.txt

doc/security.txt

doc/shared-branches.txt

doc/short-demo.txt

doc/supportability.txt

doc/svk.txt

doc/switch-in-branch.txt

doc/tagging.txt

doc/taxonomy.txt

doc/thanks.txt

doc/todo-from-arch.txt

doc/unchanged.txt

doc/unrelated-merge.txt

doc/usability.txt

doc/use-cases.txt

doc/web-interface.txt

doc/workflow.txt

doc/yaml.txt

notes

notes/new-inventory-sample.xml

notes/performance.txt

testbzr

urlgrabber

urlgrabber/__init__.py

urlgrabber/byterange.py

urlgrabber/grabber.py

urlgrabber/keepalive.py

urlgrabber/mirror.py

urlgrabber/progress.py

files renamed:
bzrlib/store.py => bzrlib/store/__init__.py

elementtree/ => bzrlib/util/elementtree/

bzrlib/xml.py => bzrlib/xml_serializer.py

contrib/bash/bzr => contrib/bash/bzr.simple

bzrlib/newinventory.py => contrib/newinventory.py

files modified:
.bzrignore

.rsyncexclude

NEWS

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/help.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/log.py

bzrlib/osutils.py

bzrlib/revision.py

bzrlib/status.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/util/elementtree/ElementTree.py

contrib/add-bzr-to-baz

contrib/zsh/_bzr

setup.py

Show diffs side-by-side

added added

removed removed

bzrlib/osutils.py

# Bazaar-NG -- distributed version control

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

import os, types, re, time, errno

from stat import S_ISREG, S_ISDIR, S_ISLNK, ST_MODE, ST_SIZE

from errors import bailout, BzrError

from trace import mutter

from cStringIO import StringIO

import os

import re

import stat

from stat import (S_ISREG, S_ISDIR, S_ISLNK, ST_MODE, ST_SIZE,

S_ISCHR, S_ISBLK, S_ISFIFO, S_ISSOCK)

import sys

import time

from bzrlib.lazy_import import lazy_import

lazy_import(globals(), """

import codecs

from datetime import datetime

import errno

from ntpath import (abspath as _nt_abspath,

join as _nt_join,

normpath as _nt_normpath,

realpath as _nt_realpath,

splitdrive as _nt_splitdrive,

)

import posixpath

import sha

import shutil

from shutil import (

rmtree,

)

import tempfile

from tempfile import (

mkdtemp,

)

import unicodedata

from bzrlib import (

cache_utf8,

errors,

win32utils,

)

""")

import bzrlib

from bzrlib import symbol_versioning

from bzrlib.symbol_versioning import (

deprecated_function,

zero_nine,

)

from bzrlib.trace import mutter

# On win32, O_BINARY is used to indicate the file should

# be opened in binary mode, rather than text mode.

# On other platforms, O_BINARY doesn't exist, because

# they always open in binary mode, so it is okay to

# OR with 0 on those platforms

O_BINARY = getattr(os, 'O_BINARY', 0)

def make_readonly(filename):

"""Make a filename read-only."""

# TODO: probably needs to be fixed for windows

mod = os.stat(filename).st_mode

mod = mod & 0777555

os.chmod(filename, mod)

_QUOTE_RE = re.compile(r'([^a-zA-Z0-9.,:/_~-])')

_QUOTE_RE = None

def quotefn(f):

"""Return shell-quoted filename"""

## We could be a bit more terse by using double-quotes etc

f = _QUOTE_RE.sub(r'\\\1', f)

if f[0] == '~':

f[0:1] = r'\~'

return f

def file_kind(f):

mode = os.lstat(f)[ST_MODE]

if S_ISREG(mode):

return 'file'

elif S_ISDIR(mode):

return 'directory'

elif S_ISLNK(mode):

return 'symlink'

else:

raise BzrError("can't handle file kind with mode %o of %r" % (mode, f))

"""Return a quoted filename filename

This previously used backslash quoting, but that works poorly on

Windows."""

# TODO: I'm not really sure this is the best format either.

global _QUOTE_RE

if _QUOTE_RE is None:

_QUOTE_RE = re.compile(r'([^a-zA-Z0-9.,:/\\_~-])')

if _QUOTE_RE.search(f):

100

return '"' + f + '"'

101

else:

102

return f

103

104

105

_directory_kind = 'directory'

106

107

_formats = {

108

stat.S_IFDIR:_directory_kind,

109

stat.S_IFCHR:'chardev',

110

stat.S_IFBLK:'block',

111

stat.S_IFREG:'file',

112

stat.S_IFIFO:'fifo',

113

stat.S_IFLNK:'symlink',

114

stat.S_IFSOCK:'socket',

115

}

116

117

118

def file_kind_from_stat_mode(stat_mode, _formats=_formats, _unknown='unknown'):

119

"""Generate a file kind from a stat mode. This is used in walkdirs.

120

121

Its performance is critical: Do not mutate without careful benchmarking.

122

"""

123

try:

124

return _formats[stat_mode & 0170000]

125

except KeyError:

126

return _unknown

127

128

129

def file_kind(f, _lstat=os.lstat, _mapper=file_kind_from_stat_mode):

130

try:

131

return _mapper(_lstat(f).st_mode)

132

except OSError, e:

133

if getattr(e, 'errno', None) == errno.ENOENT:

134

raise errors.NoSuchFile(f)

135

raise

136

137

138

def get_umask():

139

"""Return the current umask"""

140

# Assume that people aren't messing with the umask while running

141

# XXX: This is not thread safe, but there is no way to get the

142

# umask without setting it

143

umask = os.umask(0)

144

os.umask(umask)

145

return umask

146

147

148

_kind_marker_map = {

149

"file": "",

150

_directory_kind: "/",

151

"symlink": "@",

152

'tree-reference': '+',

153

}

154

155

156

def kind_marker(kind):

157

try:

158

return _kind_marker_map[kind]

159

except KeyError:

160

raise errors.BzrError('invalid file kind %r' % kind)

161

162

163

lexists = getattr(os.path, 'lexists', None)

164

if lexists is None:

165

def lexists(f):

166

try:

167

stat = getattr(os, 'lstat', os.stat)

168

stat(f)

169

return True

170

except OSError, e:

171

if e.errno == errno.ENOENT:

172

return False;

173

else:

174

raise errors.BzrError("lstat/stat of (%r): %r" % (f, e))

175

176

177

def fancy_rename(old, new, rename_func, unlink_func):

178

"""A fancy rename, when you don't have atomic rename.

179

180

:param old: The old path, to rename from

181

:param new: The new path, to rename to

182

:param rename_func: The potentially non-atomic rename function

183

:param unlink_func: A way to delete the target file if the full rename succeeds

184

"""

185

186

# sftp rename doesn't allow overwriting, so play tricks:

187

import random

188

base = os.path.basename(new)

189

dirname = os.path.dirname(new)

190

tmp_name = u'tmp.%s.%.9f.%d.%s' % (base, time.time(), os.getpid(), rand_chars(10))

191

tmp_name = pathjoin(dirname, tmp_name)

192

193

# Rename the file out of the way, but keep track if it didn't exist

194

# We don't want to grab just any exception

195

# something like EACCES should prevent us from continuing

196

# The downside is that the rename_func has to throw an exception

197

# with an errno = ENOENT, or NoSuchFile

198

file_existed = False

199

try:

200

rename_func(new, tmp_name)

201

except (errors.NoSuchFile,), e:

202

pass

203

except IOError, e:

204

# RBC 20060103 abstraction leakage: the paramiko SFTP client's rename

205

# function raises an IOError whose errno is None when a rename fails.

206

# This then gets caught here.

207

if e.errno not in (None, errno.ENOENT, errno.ENOTDIR):

208

raise

209

except Exception, e:

210

if (getattr(e, 'errno', None) is None

211

or e.errno not in (errno.ENOENT, errno.ENOTDIR)):

212

raise

213

else:

214

file_existed = True

215

216

success = False

217

try:

218

# This may throw an exception, in which case success will

219

# not be set.

220

rename_func(old, new)

221

success = True

222

finally:

223

if file_existed:

224

# If the file used to exist, rename it back into place

225

# otherwise just delete it from the tmp location

226

if success:

227

unlink_func(tmp_name)

228

else:

229

rename_func(tmp_name, new)

230

231

232

# In Python 2.4.2 and older, os.path.abspath and os.path.realpath

233

# choke on a Unicode string containing a relative path if

234

# os.getcwd() returns a non-sys.getdefaultencoding()-encoded

235

# string.

236

_fs_enc = sys.getfilesystemencoding() or 'utf-8'

237

def _posix_abspath(path):

238

# jam 20060426 rather than encoding to fsencoding

239

# copy posixpath.abspath, but use os.getcwdu instead

240

if not posixpath.isabs(path):

241

path = posixpath.join(getcwd(), path)

242

return posixpath.normpath(path)

243

244

245

def _posix_realpath(path):

246

return posixpath.realpath(path.encode(_fs_enc)).decode(_fs_enc)

247

248

249

def _win32_fixdrive(path):

250

"""Force drive letters to be consistent.

251

252

win32 is inconsistent whether it returns lower or upper case

253

and even if it was consistent the user might type the other

254

so we force it to uppercase

255

running python.exe under cmd.exe returns capital C:\\

256

running win32 python inside a cygwin shell returns lowercase c:\\

257

"""

258

drive, path = _nt_splitdrive(path)

259

return drive.upper() + path

260

261

262

def _win32_abspath(path):

263

# Real _nt_abspath doesn't have a problem with a unicode cwd

264

return _win32_fixdrive(_nt_abspath(unicode(path)).replace('\\', '/'))

265

266

267

def _win98_abspath(path):

268

"""Return the absolute version of a path.

269

Windows 98 safe implementation (python reimplementation

270

of Win32 API function GetFullPathNameW)

271

"""

272

# Corner cases:

273

# C:\path => C:/path

274

# C:/path => C:/path

275

# \\HOST\path => //HOST/path

276

# //HOST/path => //HOST/path

277

# path => C:/cwd/path

278

# /path => C:/path

279

path = unicode(path)

280

# check for absolute path

281

drive = _nt_splitdrive(path)[0]

282

if drive == '' and path[:2] not in('//','\\\\'):

283

cwd = os.getcwdu()

284

# we cannot simply os.path.join cwd and path

285

# because os.path.join('C:','/path') produces '/path'

286

# and this is incorrect

287

if path[:1] in ('/','\\'):

288

cwd = _nt_splitdrive(cwd)[0]

289

path = path[1:]

290

path = cwd + '\\' + path

291

return _win32_fixdrive(_nt_normpath(path).replace('\\', '/'))

292

293

if win32utils.winver == 'Windows 98':

294

_win32_abspath = _win98_abspath

295

296

297

def _win32_realpath(path):

298

# Real _nt_realpath doesn't have a problem with a unicode cwd

299

return _win32_fixdrive(_nt_realpath(unicode(path)).replace('\\', '/'))

300

301

302

def _win32_pathjoin(*args):

303

return _nt_join(*args).replace('\\', '/')

304

305

306

def _win32_normpath(path):

307

return _win32_fixdrive(_nt_normpath(unicode(path)).replace('\\', '/'))

308

309

310

def _win32_getcwd():

311

return _win32_fixdrive(os.getcwdu().replace('\\', '/'))

312

313

314

def _win32_mkdtemp(*args, **kwargs):

315

return _win32_fixdrive(tempfile.mkdtemp(*args, **kwargs).replace('\\', '/'))

316

317

318

def _win32_rename(old, new):

319

"""We expect to be able to atomically replace 'new' with old.

320

321

On win32, if new exists, it must be moved out of the way first,

322

and then deleted.

323

"""

324

try:

325

fancy_rename(old, new, rename_func=os.rename, unlink_func=os.unlink)

326

except OSError, e:

327

if e.errno in (errno.EPERM, errno.EACCES, errno.EBUSY, errno.EINVAL):

328

# If we try to rename a non-existent file onto cwd, we get

329

# EPERM or EACCES instead of ENOENT, this will raise ENOENT

330

# if the old path doesn't exist, sometimes we get EACCES

331

# On Linux, we seem to get EBUSY, on Mac we get EINVAL

332

os.lstat(old)

333

raise

334

335

336

def _mac_getcwd():
    """Return the unicode current directory, NFKC-normalized."""
    cwd = os.getcwdu()
    return unicodedata.normalize('NFKC', cwd)

338

339

340

# Default is to just use the python builtins, but these can be rebound on

341

# particular platforms.

342

abspath = _posix_abspath

343

realpath = _posix_realpath

344

pathjoin = os.path.join

345

normpath = os.path.normpath

346

getcwd = os.getcwdu

347

rename = os.rename

348

dirname = os.path.dirname

349

basename = os.path.basename

350

split = os.path.split

351

splitext = os.path.splitext

352

# These were already imported into local scope

353

# mkdtemp = tempfile.mkdtemp

354

# rmtree = shutil.rmtree

355

356

MIN_ABS_PATHLENGTH = 1

357

358

359

if sys.platform == 'win32':
    # Rebind the generic names to the win32-specific implementations.
    abspath = _win32_abspath
    realpath = _win32_realpath
    pathjoin = _win32_pathjoin
    normpath = _win32_normpath
    getcwd = _win32_getcwd
    mkdtemp = _win32_mkdtemp
    rename = _win32_rename

    MIN_ABS_PATHLENGTH = 3

    def _win32_delete_readonly(function, path, excinfo):
        """Error handler for shutil.rmtree function [for win32]

        Helps to remove files and dirs marked as read-only: when os.remove
        or os.rmdir failed with EACCES, the path is made writable and the
        operation retried.  Any other failure is re-raised.
        """
        exception = excinfo[1]
        retryable = (function in (os.remove, os.rmdir)
                     and isinstance(exception, OSError)
                     and exception.errno == errno.EACCES)
        if not retryable:
            raise
        make_writable(path)
        function(path)

    def rmtree(path, ignore_errors=False, onerror=_win32_delete_readonly):
        """Replacer for shutil.rmtree: could remove readonly dirs/files"""
        return shutil.rmtree(path, ignore_errors, onerror)

elif sys.platform == 'darwin':
    getcwd = _mac_getcwd

388

389

390

def get_terminal_encoding():
    """Find the best encoding for printing to the screen.

    sys.stdout.encoding is preferred, then sys.stdin.encoding, and finally
    bzrlib.user_encoding.  The Windows pseudo-encoding 'cp0' and any
    encoding unknown to the codecs module are replaced by
    bzrlib.user_encoding (the latter with a warning on stderr).

    The problem is that on Windows, locale.getpreferredencoding()
    is not the same encoding as that used by the console:
    http://mail.python.org/pipermail/python-list/2003-May/162357.html

    On my standard US Windows XP, the preferred encoding is
    cp1252, but the console is cp437
    """
    encoding = getattr(sys.stdout, 'encoding', None)
    if encoding:
        mutter('encoding stdout as sys.stdout encoding %r', encoding)
    else:
        encoding = getattr(sys.stdin, 'encoding', None)
        if encoding:
            mutter('encoding stdout as sys.stdin encoding %r', encoding)
        else:
            encoding = bzrlib.user_encoding
            mutter('encoding stdout as bzrlib.user_encoding %r', encoding)

    if encoding == 'cp0':
        # invalid encoding (cp0 means 'no codepage' on Windows)
        encoding = bzrlib.user_encoding
        mutter('cp0 is invalid encoding.'
               ' encoding stdout as bzrlib.user_encoding %r', encoding)

    # Make sure Python actually knows the codec before handing it back.
    try:
        codecs.lookup(encoding)
    except LookupError:
        sys.stderr.write('bzr: warning:'
                         ' unknown terminal encoding %s.\n'
                         ' Using encoding %s instead.\n'
                         % (encoding, bzrlib.user_encoding)
                        )
        encoding = bzrlib.user_encoding

    return encoding

431

432

433

def normalizepath(f):
    """Resolve the directory part of ``f`` but keep its final component.

    realpath is used when os.path provides one, abspath otherwise.  When the
    final component is empty, '.' or '..', the whole path is resolved.
    """
    if getattr(os.path, 'realpath', None) is None:
        resolve = abspath
    else:
        resolve = realpath
    parent, leaf = os.path.split(f)
    if leaf in ("", ".", ".."):
        return resolve(f)
    return pathjoin(resolve(parent), leaf)

443

444

445

def backup_file(fn):
    """Copy a file to a backup.

    Backups are named in GNU-style, with a ~ suffix.

    If the file is already a backup, it's not copied.  A symlink is backed
    up as a new symlink with the same target rather than by copying content.
    """
    if fn[-1] == '~':
        return
    backup_name = fn + '~'

    if has_symlinks() and os.path.islink(fn):
        os.symlink(os.readlink(fn), backup_name)
        return

    source = file(fn, 'rb')
    try:
        data = source.read()
    finally:
        source.close()

    dest = file(backup_name, 'wb')
    try:
        dest.write(data)
    finally:
        dest.close()

471

472

473

def isdir(f):

478

return False

479

480

481

def isfile(f):

482

"""True if f is a regular file."""

483

try:

485

except OSError:

486

return False

487

488

def islink(f):
    """True if f is a symlink.

    Returns False when f cannot be lstat'ed (OSError).
    """
    try:
        mode = os.lstat(f)[ST_MODE]
    except OSError:
        return False
    return S_ISLNK(mode)

494

495

def is_inside(dir, fname):
    """True if fname is inside dir.

    The parameters should typically be passed to osutils.normpath first, so
    that . and .. and repeated slashes are eliminated, and the separators
    are canonical for the platform.

    A path is considered inside itself.  The empty string as a dir name is
    taken as top-of-tree and matches everything.
    """
    # XXX: Most callers of this can actually do something smarter by
    # looking at the inventory
    if dir == fname or dir == '':
        return True

    # Compare against "dir/" so that 'src' does not match 'srccontrol'.
    if dir.endswith('/'):
        prefix = dir
    else:
        prefix = dir + '/'
    return fname.startswith(prefix)

517

518

519

def is_inside_any(dir_list, fname):
    """True if fname is inside any of given dirs."""
    for candidate in dir_list:
        if not is_inside(candidate, fname):
            continue
        return True
    return False

525

526

527

def is_inside_or_parent_of_any(dir_list, fname):
    """True if fname is a child or a parent of any of the given files."""
    for candidate in dir_list:
        if is_inside(candidate, fname):
            return True
        if is_inside(fname, candidate):
            return True
    return False

533

534

535

def pumpfile(fromfile, tofile):
    """Copy contents of one file to another.

    The data is moved in chunks of BUFSIZE bytes, so the whole source is
    never held in memory at once.

    :param fromfile: object with a read(size) method
    :param tofile: object with a write(data) method
    """
    BUFSIZE = 32768
    while True:
        b = fromfile.read(BUFSIZE)
        if not b:
            break
        tofile.write(b)


def uuid():
    """Return a new UUID

    Read from /proc/sys/kernel/random/uuid when available; otherwise the
    output of the 'uuidgen' command is used.
    """
    try:
        return file('/proc/sys/kernel/random/uuid').readline().rstrip('\n')
    except IOError:
        return chomp(os.popen('uuidgen').readline())

543

544

545

def file_iterator(input_file, readsize=32768):
    """Yield successive chunks of at most ``readsize`` from ``input_file``.

    Iteration stops at the first empty read.
    """
    chunk = input_file.read(readsize)
    while len(chunk) != 0:
        yield chunk
        chunk = input_file.read(readsize)

551

552

553

def sha_file(f):

import sha

if hasattr(f, 'tell'):

554

if getattr(f, 'tell', None) is not None:

555

assert f.tell() == 0

556

s = sha.new()

557

BUFSIZE = 128<<10

104

563

return s.hexdigest()

105

564

106

565

566

567

def sha_strings(strings):
    """Return the sha-1 of concatenation of strings"""
    digest = sha.new()
    for chunk in strings:
        digest.update(chunk)
    return digest.hexdigest()

572

573

107

574

def sha_string(f):
    """Return the hex sha-1 digest of the string ``f``."""
    import sha
    return sha.new(f).hexdigest()

112

578

113

579

114

115

580

def fingerprint_file(f):

116

import sha

117

581

s = sha.new()

118

582

b = f.read()

119

583

s.update(b)

122

586

'sha1': s.hexdigest()}

123

587

124

588

125

def config_dir():
    """Return per-user configuration directory.

    By default this is ~/.bzr.conf/ with '~' expanded for the current user.

    TODO: Global option --config-dir to override this.
    """
    location = "~/.bzr.conf"
    return os.path.expanduser(location)

133

134

135

def _auto_user_id():
    """Calculate automatic user identification.

    Returns (realname, email).

    Only used when none is set in the environment or the id file.

    The real name is the part of the passwd GECOS field before the first
    comma, falling back to the login name.  Where the pwd module is not
    available, getpass.getuser() supplies both.

    This previously used the FQDN as the default domain, but that can
    be very slow on machines where DNS is broken.  So now we simply
    use the hostname.
    """
    import socket

    # XXX: Any good way to get real user name on win32?

    try:
        import pwd
        entry = pwd.getpwuid(os.getuid())
        gecos = entry.pw_gecos.decode(bzrlib.user_encoding)
        login = entry.pw_name.decode(bzrlib.user_encoding)
        realname = gecos.split(',', 1)[0] or login
    except ImportError:
        import getpass
        realname = login = getpass.getuser().decode(bzrlib.user_encoding)

    return realname, (login + '@' + socket.gethostname())

169

170

171

def _get_user_id():
    """Return the full user id from a file or environment variable.

    Sources are tried in this order: the BZREMAIL environment variable, the
    "email" file inside config_dir(), and the EMAIL environment variable.
    Values are decoded with bzrlib.user_encoding.

    :return: the decoded user id, or None when no source provides one.
    :raises IOError: when the email file cannot be read for any reason
        other than not existing.

    TODO: Allow taking this from a file in the branch directory too
    for per-branch ids."""
    v = os.environ.get('BZREMAIL')
    if v:
        return v.decode(bzrlib.user_encoding)

    try:
        email_file = open(os.path.join(config_dir(), "email"))
        try:
            content = email_file.read()
        finally:
            # Close explicitly instead of relying on garbage collection.
            email_file.close()
        return content.decode(bzrlib.user_encoding).rstrip("\r\n")
    except IOError:
        # A missing file just means "not configured"; a bare raise keeps
        # the original traceback for everything else.
        if sys.exc_info()[1].errno != errno.ENOENT:
            raise

    v = os.environ.get('EMAIL')
    if v:
        return v.decode(bzrlib.user_encoding)
    else:
        return None

194

195

196

def username():
    """Return email-style username.

    Something similar to 'Martin Pool <mbp@sourcefrog.net>'

    An explicitly configured id from _get_user_id() wins; otherwise one is
    built from _auto_user_id().

    TODO: Check it's reasonably well-formed.
    """
    configured = _get_user_id()
    if configured:
        return configured

    name, email = _auto_user_id()
    if not name:
        return email
    return '%s <%s>' % (name, email)

212

213

214

_EMAIL_RE = re.compile(r'[\w+.-]+@[\w+.-]+')


def user_email():
    """Return just the email component of a username.

    Without a configured user id, the automatically derived address from
    _auto_user_id() is returned.  A configured id with nothing that looks
    like an address is reported through bailout().
    """
    user_id = _get_user_id()
    if not user_id:
        return _auto_user_id()[1]

    match = _EMAIL_RE.search(user_id)
    if not match:
        bailout("%r doesn't seem to contain a reasonable email address" % user_id)
    return match.group(0)

225

226

227

228

589

def compare_files(a, b):

229

590

"""Returns true if equal in contents"""

230

591

BUFSIZE = 4096

237

598

return True

238

599

239

600

240

241

601

def local_time_offset(t=None):
    """Return offset of local zone from GMT, either at present or at time t.

    :param t: seconds since the epoch; defaults to the current time.
    :return: the offset in whole seconds (local time minus UTC).
    """
    if t is None:
        t = time.time()
    # Take the difference between the local and UTC renderings of the same
    # instant, instead of reading the process-wide time.timezone/altzone.
    offset = datetime.fromtimestamp(t) - datetime.utcfromtimestamp(t)
    return offset.days * 86400 + offset.seconds

251

607

252

608

253

def format_date(t, offset=0, timezone='original'):

609

def format_date(t, offset=0, timezone='original', date_fmt=None,

610

show_offset=True):

254

611

## TODO: Perhaps a global option to use either universal or local time?

255

612

## Or perhaps just let people set $TZ?

256

613

assert isinstance(t, float)

259

616

tt = time.gmtime(t)

260

617

offset = 0

261

618

elif timezone == 'original':

262

if offset == None:

619

if offset is None:

263

620

offset = 0

264

621

tt = time.gmtime(t + offset)

265

622

elif timezone == 'local':

266

623

tt = time.localtime(t)

267

624

offset = local_time_offset(t)

268

625

else:

269

bailout("unsupported timezone format %r",

270

['options are "utc", "original", "local"'])

271

272

return (time.strftime("%a %Y-%m-%d %H:%M:%S", tt)

273

+ ' %+03d%02d' % (offset / 3600, (offset / 60) % 60))

626

raise errors.BzrError("unsupported timezone format %r" % timezone,

627

['options are "utc", "original", "local"'])

628

if date_fmt is None:

629

date_fmt = "%a %Y-%m-%d %H:%M:%S"

630

if show_offset:

631

offset_str = ' %+03d%02d' % (offset / 3600, (offset / 60) % 60)

632

else:

633

offset_str = ''

634

return (time.strftime(date_fmt, tt) + offset_str)

274

635

275

636

276

637

def compact_date(when):
    """Format the timestamp ``when`` in UTC as YYYYMMDDHHMMSS."""
    utc = time.gmtime(when)
    return time.strftime('%Y%m%d%H%M%S', utc)

278

639

279

640

641

def format_delta(delta):
    """Get a nice looking string for a time delta.

    Under 90 seconds only seconds are shown, under 90 minutes minutes and
    seconds, and beyond that hours and minutes.

    :param delta: The time difference in seconds, can be positive or negative.
        positive indicates time in the past, negative indicates time in the
        future. (usually time.time() - stored_time)
    :return: String formatted to show approximate resolution
    """
    delta = int(delta)
    direction = 'ago'
    if delta < 0:
        direction = 'in the future'
        delta = -delta

    if delta < 90:  # print seconds up to 90 seconds
        if delta == 1:
            return '%d second %s' % (delta, direction,)
        return '%d seconds %s' % (delta, direction)

    minutes, seconds = divmod(delta, 60)
    plural_seconds = 's'
    if seconds == 1:
        plural_seconds = ''
    if minutes < 90:  # print minutes, seconds up to 90 minutes
        if minutes == 1:
            template = '%d minute, %d second%s %s'
        else:
            template = '%d minutes, %d second%s %s'
        return template % (minutes, seconds, plural_seconds, direction)

    hours, minutes = divmod(minutes, 60)
    plural_minutes = 's'
    if minutes == 1:
        plural_minutes = ''

    if hours == 1:
        template = '%d hour, %d minute%s %s'
    else:
        template = '%d hours, %d minute%s %s'
    return template % (hours, minutes, plural_minutes, direction)

280

689

281

690

def filesize(f):
    """Return size of given open file."""
    info = os.fstat(f.fileno())
    return info[ST_SIZE]

284

693

285

694

286

# Define rand_bytes based on platform.
# rand_bytes(n) returns a string of n random bytes.
try:
    # Python 2.4 and later have os.urandom,
    # but it doesn't work on some arches
    os.urandom(1)
    rand_bytes = os.urandom
except (NotImplementedError, AttributeError):
    # If python doesn't have os.urandom, or it doesn't work,
    # then try to first pull random data from /dev/urandom
    try:
        rand_bytes = file('/dev/urandom', 'rb').read
    # Otherwise, use this hack as a last resort
    except (IOError, OSError):
        # not well seeded, but better than nothing
        def rand_bytes(n):
            """Return n pseudo-random bytes from the random module."""
            import random
            # range() yields nothing for n <= 0, so a negative count
            # cannot loop forever.
            return ''.join([chr(random.randint(0, 255)) for _ in range(n)])

716

717

718

ALNUM = '0123456789abcdefghijklmnopqrstuvwxyz'


def rand_chars(num):
    """Return a random string of num alphanumeric characters

    Each byte from rand_bytes() is mapped onto ALNUM.  The result only
    contains lowercase chars because it may be used on case-insensitive
    filesystems.
    """
    picked = [ALNUM[ord(raw_byte) % 36] for raw_byte in rand_bytes(num)]
    return ''.join(picked)

292

729

293

730

294

731

## TODO: We could later have path objects that remember their list

295

732

## decomposition (might be too tricksy though.)

296

733

297

734

def splitpath(p):

298

"""Turn string into list of parts.

299

300

>>> splitpath('a')

301

['a']

302

>>> splitpath('a/b')

303

['a', 'b']

304

>>> splitpath('a/./b')

305

['a', 'b']

306

>>> splitpath('a/.b')

307

['a', '.b']

308

>>> splitpath('a/../b')

309

Traceback (most recent call last):

310

...

311

BzrError: ("sorry, '..' not allowed in path", [])

312

"""

313

assert isinstance(p, types.StringTypes)

735

"""Turn string into list of parts."""

736

assert isinstance(p, basestring)

314

737

315

738

# split on either delimiter because people might use either on

316

739

# Windows

319

742

rps = []

320

743

for f in ps:

321

744

if f == '..':

322

bailout("sorry, %r not allowed in path" % f)

745

raise errors.BzrError("sorry, %r not allowed in path" % f)

323

746

elif (f == '.') or (f == ''):

324

747

pass

325

748

else:

327

750

return rps

328

751

329

752

def joinpath(p):
    """Join a sequence of path components with pathjoin.

    :param p: a list or tuple of path components.
    :raises errors.BzrError: if any component is '..', None or ''.
    """
    assert isinstance(p, (list, tuple))
    # Validate every component before joining anything.
    for f in p:
        if (f == '..') or (f is None) or (f == ''):
            raise errors.BzrError("sorry, %r not allowed in path" % f)
    return pathjoin(*p)

758

759

760

@deprecated_function(zero_nine)
def appendpath(p1, p2):
    """Return p2 appended to p1 with pathjoin; an empty p1 yields p2 alone."""
    if p1 == '':
        return p2
    else:
        return pathjoin(p1, p2)


def extern_command(cmd, ignore_errors = False):
    """Run cmd through os.system, logging it with mutter first.

    A non-zero exit status is reported through bailout() unless
    ignore_errors is true.
    """
    mutter('external command: %s' % repr(cmd))
    if os.system(cmd):
        if not ignore_errors:
            bailout('command failed')

766

767

768

def split_lines(s):
    """Split s into lines, but without removing the newline characters.

    Only '\\n' is treated as a line terminator.  A trailing fragment without
    a newline is kept as the last element.
    """
    pieces = s.split('\n')
    remainder = pieces.pop()
    result = [piece + '\n' for piece in pieces]
    if remainder:
        result.append(remainder)
    return result

775

776

777

def hardlinks_good():
    """Return False on win32, cygwin and darwin, True on any other platform."""
    excluded = ('win32', 'cygwin', 'darwin')
    return sys.platform not in excluded

779

780

781

def link_or_copy(src, dest):
    """Hardlink a file, or copy it if it can't be hardlinked.

    A copy is made when hardlinks_good() is false, or when linking fails
    with EXDEV.  Any other link error is re-raised.
    """
    if hardlinks_good():
        try:
            os.link(src, dest)
            return
        except (OSError, IOError):
            if sys.exc_info()[1].errno != errno.EXDEV:
                raise
    shutil.copyfile(src, dest)

792

793

def delete_any(full_path):
    """Delete a file or directory.

    unlink is tried first; if it fails with EISDIR, EACCES or EPERM the
    path is removed with rmdir instead.  Other errors propagate.
    """
    try:
        os.unlink(full_path)
    except OSError:
        err = sys.exc_info()[1]
        # We may be renaming a dangling inventory id
        if err.errno not in (errno.EISDIR, errno.EACCES, errno.EPERM):
            raise
        os.rmdir(full_path)

802

803

804

def has_symlinks():
    """Return True if the os module provides a symlink function."""
    return getattr(os, 'symlink', None) is not None

809

810

811

def contains_whitespace(s):
    """True if there are any whitespace characters in s."""
    # string.whitespace is deliberately not used: in some locales it
    # includes '\xa0' (the ISO-8859-1 non-breaking space), which
    #  1) isn't a breaking whitespace,
    #  2) isn't one of the ' \t\r\n' characters we sometimes use as
    #     separators, and
    #  3) isn't unicode safe since it is >128.
    #
    # The characters below are a plain (non-unicode) literal on purpose:
    # being ascii they can be up-cast when s is unicode, whereas a unicode
    # literal would force an up-cast of s, which may be utf-8.
    for ch in ' \t\n\r\v\f':
        if ch in s:
            return True
    return False

829

830

831

def contains_linebreaks(s):
    """True if there is any vertical whitespace in s.

    Form feed, newline and carriage return count as vertical whitespace.
    """
    for ch in '\f\n\r':
        if ch in s:
            return True
    return False

838

839

840

def relpath(base, path):
    """Return path relative to base, or raise exception.

    The path may be either an absolute path or a path relative to the
    current working directory.

    Components are peeled off the absolute path one at a time until what
    remains equals base; errors.PathNotChild is raised if that never
    happens.  An empty string is returned when path is base itself.

    os.path.commonprefix (python2.4) has a bad bug that it works just
    on string prefixes, assuming that '/u' is a prefix of '/u2'.  This
    avoids that problem.
    """

    assert len(base) >= MIN_ABS_PATHLENGTH, ('Length of base must be equal or'
        ' exceed the platform minimum length (which is %d)' %
        MIN_ABS_PATHLENGTH)

    rp = abspath(path)

    # Components are collected innermost-first and reversed at the end.
    parts = []
    head = rp
    while len(head) >= len(base):
        if head == base:
            break
        head, tail = os.path.split(head)
        if tail:
            parts.append(tail)
    else:
        raise errors.PathNotChild(rp, base)

    if not parts:
        return ''
    parts.reverse()
    return pathjoin(*parts)

872

873

874

def safe_unicode(unicode_or_utf8_string):
    """Coerce unicode_or_utf8_string into unicode.

    If it is unicode, it is returned.
    Otherwise it is decoded from utf-8.  If the decoding fails, the
    exception is wrapped as a BzrBadParameterNotUnicode exception.
    """
    if not isinstance(unicode_or_utf8_string, unicode):
        try:
            return unicode_or_utf8_string.decode('utf8')
        except UnicodeDecodeError:
            raise errors.BzrBadParameterNotUnicode(unicode_or_utf8_string)
    return unicode_or_utf8_string

888

889

890

def safe_utf8(unicode_or_utf8_string):
    """Coerce unicode_or_utf8_string to a utf8 string.

    If it is a str, it is checked to be valid utf-8 and returned as is;
    invalid input raises BzrBadParameterNotUnicode.
    If it is Unicode, it is encoded into a utf-8 string.
    """
    if not isinstance(unicode_or_utf8_string, str):
        return unicode_or_utf8_string.encode('utf-8')

    # TODO: jam 20070209 This is overkill, and probably has an impact on
    #       performance if we are dealing with lots of apis that want a
    #       utf-8 revision id
    try:
        # Make sure it is a valid utf-8 string
        unicode_or_utf8_string.decode('utf-8')
    except UnicodeDecodeError:
        raise errors.BzrBadParameterNotUnicode(unicode_or_utf8_string)
    return unicode_or_utf8_string

907

908

909

_revision_id_warning = ('Unicode revision ids were deprecated in bzr 0.15.'
                        ' Revision id generators should be creating utf8'
                        ' revision ids.')


def safe_revision_id(unicode_or_utf8_string, warn=True):
    """Revision ids should now be utf8, but at one point they were unicode.

    None and exact str instances are returned untouched; anything else is
    encoded through cache_utf8, optionally after a DeprecationWarning.

    :param unicode_or_utf8_string: A possibly Unicode revision_id. (can also be
        utf8 or None).
    :param warn: Functions that are sanitizing user data can set warn=False
    :return: None or a utf8 revision id.
    """
    needs_encoding = (unicode_or_utf8_string is not None
                      and unicode_or_utf8_string.__class__ != str)
    if not needs_encoding:
        return unicode_or_utf8_string
    if warn:
        symbol_versioning.warn(_revision_id_warning, DeprecationWarning,
                               stacklevel=2)
    return cache_utf8.encode(unicode_or_utf8_string)

929

930

931

_file_id_warning = ('Unicode file ids were deprecated in bzr 0.15. File id'
                    ' generators should be creating utf8 file ids.')


def safe_file_id(unicode_or_utf8_string, warn=True):
    """File ids should now be utf8, but at one point they were unicode.

    This is the same as safe_utf8, except it uses the cached encode functions
    to save a little bit of performance.  None and exact str instances are
    returned untouched.

    :param unicode_or_utf8_string: A possibly Unicode file_id. (can also be
        utf8 or None).
    :param warn: Functions that are sanitizing user data can set warn=False
    :return: None or a utf8 file id.
    """
    needs_encoding = (unicode_or_utf8_string is not None
                      and unicode_or_utf8_string.__class__ != str)
    if not needs_encoding:
        return unicode_or_utf8_string
    if warn:
        symbol_versioning.warn(_file_id_warning, DeprecationWarning,
                               stacklevel=2)
    return cache_utf8.encode(unicode_or_utf8_string)

953

954

955

# Only darwin is treated as a platform that normalizes filenames.
_platform_normalizes_filenames = (sys.platform == 'darwin')


def normalizes_filenames():
    """Return True if this platform normalizes unicode filenames.

    Mac OSX does, Windows/Linux do not.
    """
    return _platform_normalizes_filenames

966

967

968

def _accessible_normalized_filename(path):

969

"""Get the unicode normalized path, and if you can access the file.

970

971

On platforms where the system normalizes filenames (Mac OSX),

972

you can access a file by any path which will normalize correctly.

973

On platforms where the system does not normalize filenames

974

(Windows, Linux), you have to access a file by its exact path.

975

976

Internally, bzr only supports NFC/NFKC normalization, since that is

977

the standard for XML documents.

978

979

So return the normalized path, and a flag indicating if the file

980

can be accessed by that path.

981

"""

982

983

return unicodedata.normalize('NFKC', unicode(path)), True

984

985

986

def _inaccessible_normalized_filename(path):

987

__doc__ = _accessible_normalized_filename.__doc__

988

989

normalized = unicodedata.normalize('NFKC', unicode(path))

990

return normalized, normalized == path

991

992

993

if _platform_normalizes_filenames:

994

normalized_filename = _accessible_normalized_filename

995

else:

996

normalized_filename = _inaccessible_normalized_filename

997

998

999

def terminal_width():
    """Return estimated terminal width.

    On win32 the console size from win32utils is used.  Elsewhere the
    TIOCGWINSZ ioctl on file descriptor 1 is tried first, then the COLUMNS
    environment variable, and finally a default of 80.
    """
    if sys.platform == 'win32':
        return win32utils.get_console_size()[0]
    width = 0
    try:
        import struct, fcntl, termios
        s = struct.pack('HHHH', 0, 0, 0, 0)
        x = fcntl.ioctl(1, termios.TIOCGWINSZ, s)
        width = struct.unpack('HHHH', x)[1]
    except IOError:
        pass
    if width <= 0:
        try:
            width = int(os.environ['COLUMNS'])
        except (KeyError, ValueError):
            # COLUMNS unset or not a number.  Only these are swallowed, so
            # KeyboardInterrupt and real bugs still propagate.
            pass
    if width <= 0:
        width = 80

    return width

1020

1021

1022

def supports_executable():
    """Return True on every platform except win32."""
    on_windows = (sys.platform == "win32")
    return not on_windows

1024

1025

1026

def supports_posix_readonly():
    """Return True if 'readonly' has POSIX semantics, False otherwise.

    Notably, a win32 readonly file cannot be deleted, unlike POSIX where the
    directory controls creation/deletion, etc.

    And under win32, readonly means that the directory itself cannot be
    deleted.  The contents of a readonly directory can be changed, unlike POSIX
    where files in readonly directories cannot be added, deleted or renamed.
    """
    on_windows = (sys.platform == "win32")
    return not on_windows

1037

1038

1039

def set_or_unset_env(env_variable, value):
    """Modify the environment, setting or removing the env_variable.

    :param env_variable: The environment variable in question
    :param value: The value to set the environment to. If None, then
        the variable will be removed.  Unicode values are encoded with
        bzrlib.user_encoding first.
    :return: The original value of the environment variable.
    """
    orig_val = os.environ.get(env_variable)
    if value is not None:
        if isinstance(value, unicode):
            value = value.encode(bzrlib.user_encoding)
        os.environ[env_variable] = value
    elif orig_val is not None:
        del os.environ[env_variable]
    return orig_val

1056

1057

1058

_validWin32PathRE = re.compile(r'^([A-Za-z]:[/\\])?[^:<>*"?\|]*$')


def check_legal_path(path):
    """Check whether the supplied path is legal.

    This is only required on Windows, so we don't test on other platforms
    right now.  On win32, errors.IllegalPath is raised for a path that does
    not match _validWin32PathRE.
    """
    if sys.platform == "win32" and _validWin32PathRE.match(path) is None:
        raise errors.IllegalPath(path)

1070

1071

1072

def walkdirs(top, prefix=""):
    """Yield data about all the directories in a tree.

    This yields all the data about the contents of a directory at a time.
    After each directory has been yielded, if the caller has mutated the list
    to exclude some directories, they are then not descended into.

    The data yielded is of the form:
    ((directory-relpath, directory-path-from-top),
    [(relpath, basename, kind, lstat, path-from-top), ...]),
     - directory-relpath is the relative path of the directory being returned
       with respect to top. prefix is prepended to this.
     - directory-path-from-top is the path including top for this directory.
       It is suitable for use with os functions.
     - relpath is the relative path within the subtree being walked.
     - basename is the basename of the path
     - kind is the kind of the file now, looked up from the lstat mode, or
       'unknown' when the mode is not recognised.
     - lstat is the lstat result for the entry.

    Entries within a directory are sorted by name.  top and prefix are
    coerced with safe_unicode.

    :param prefix: Prefix the relpaths that are yielded with 'prefix'. This
        allows one to walk a subtree but get paths that are relative to a tree
        rooted higher up.
    :return: an iterator over the dirs.
    """
    #TODO there is a bit of a smell where the results of the directory-
    # summary in this, and the path from the root, may not agree
    # depending on top and prefix - i.e. ./foo and foo as a pair leads to
    # potentially confusing output. We should make this more robust - but
    # not at a speed cost. RBC 20060731
    lstat = os.lstat
    listdir = os.listdir
    kind_for_mode = _formats.get
    directory = _directory_kind
    # Stack entries: 0 - relpath, 1- basename, 2- kind, 3- stat, 4-toppath
    stack = [(safe_unicode(prefix), "", directory, None, safe_unicode(top))]
    while stack:
        relroot, _, _, _, top = stack.pop()
        relprefix = ''
        if relroot:
            relprefix = relroot + u'/'
        top_slash = top + u'/'

        dirblock = []
        add_entry = dirblock.append
        for name in sorted(listdir(top)):
            path = top_slash + name
            st = lstat(path)
            # 0xF000 is 0170000 octal: the file-type bits of st_mode.
            kind = kind_for_mode(st.st_mode & 0xF000, 'unknown')
            add_entry((relprefix + name, name, kind, st, path))
        yield (relroot, top), dirblock

        # Read dirblock only after the yield, so caller edits are honoured.
        # Pushing in reverse makes directories pop in sorted order.
        subdirs = [d for d in dirblock if d[2] == directory]
        subdirs.reverse()
        stack.extend(subdirs)

1130

1131

1132

def _walkdirs_utf8(top, prefix=""):
    """Yield data about all the directories in a tree.

    This yields the same information as walkdirs() only each entry is yielded
    in utf-8. On platforms which have a filesystem encoding of utf8 the paths
    are returned as exact byte-strings.

    The work is delegated to _walkdirs_fs_utf8 when not on win32 and the
    filesystem encoding is UTF-8 or ascii, and to _walkdirs_unicode_to_utf8
    otherwise.

    :return: yields a tuple of (dir_info, [file_info])
        dir_info is (utf8_relpath, path-from-top)
        file_info is (utf8_relpath, utf8_name, kind, lstat, path-from-top)
        if top is an absolute path, path-from-top is also an absolute path.
        path-from-top might be unicode or utf8, but it is the correct path to
        pass to os functions to affect the file in question. (such as os.lstat)
    """
    fs_encoding = sys.getfilesystemencoding()
    byte_safe_encodings = ('UTF-8', 'US-ASCII', 'ANSI_X3.4-1968')  # ascii
    if sys.platform != 'win32' and fs_encoding in byte_safe_encodings:
        return _walkdirs_fs_utf8(top, prefix=prefix)
    return _walkdirs_unicode_to_utf8(top, prefix=prefix)

1152

1153

1154

def _walkdirs_fs_utf8(top, prefix=""):
    """See _walkdirs_utf8.

    This sub-function is called when we know the filesystem is already in utf8
    encoding. So we don't need to transcode filenames: top and prefix are
    coerced with safe_utf8 and names from os.listdir are used as they come.
    """
    lstat = os.lstat
    listdir = os.listdir
    kind_for_mode = _formats.get
    directory = _directory_kind

    # Stack entries: 0 - relpath, 1- basename, 2- kind, 3- stat, 4-toppath
    # But we don't actually use 1-3 in the first entry, so set them to None
    stack = [(safe_utf8(prefix), None, None, None, safe_utf8(top))]
    while stack:
        relroot, _, _, _, top = stack.pop()
        relprefix = ''
        if relroot:
            relprefix = relroot + '/'
        top_slash = top + '/'

        dirblock = []
        add_entry = dirblock.append
        for name in sorted(listdir(top)):
            path = top_slash + name
            st = lstat(path)
            # 0xF000 is 0170000 octal: the file-type bits of st_mode.
            kind = kind_for_mode(st.st_mode & 0xF000, 'unknown')
            add_entry((relprefix + name, name, kind, st, path))
        yield (relroot, top), dirblock

        # Read dirblock only after the yield, so caller edits are honoured.
        # Pushing in reverse makes directories pop in sorted order.
        subdirs = [d for d in dirblock if d[2] == directory]
        subdirs.reverse()
        stack.extend(subdirs)

1187

1188

1189

def _walkdirs_unicode_to_utf8(top, prefix=""):
    """See _walkdirs_utf8

    The directory tree is walked using Unicode paths, and every name is
    encoded to utf8 for the relpath and basename fields. Because Win32 has
    a Unicode api, all of the 'path-from-top' entries will be Unicode paths.

    This is also the fallback code path when the filesystem encoding is not
    UTF-8. An alternative implementation may be needed to safely handle
    paths that are not properly decodable in the current encoding.

    :param top: The directory to start walking from.
    :param prefix: The relative path to report for top itself.
    :return: yields ((relroot, top), dirblock) once per directory, where
        dirblock is a name-sorted list of
        (utf8_relpath, utf8_name, kind, lstat, unicode path-from-top) tuples.
    """
    encode_utf8 = codecs.getencoder('utf8')
    lstat = os.lstat
    listdir = os.listdir
    kind_for_mode = _formats.get
    directory_kind = _directory_kind

    # Same tuple layout as the dirblock entries; only the relpath (0) and the
    # path-from-top (4) are read back when an entry is popped.
    todo = [(safe_utf8(prefix), None, None, None, safe_unicode(top))]
    while todo:
        relroot, _, _, _, top = todo.pop()
        relprefix = ''
        if relroot:
            relprefix = relroot + '/'
        top_slash = top + u'/'

        dirblock = []
        for name in sorted(listdir(top)):
            # The encoder returns (encoded_string, length_consumed).
            name_utf8 = encode_utf8(name)[0]
            abspath = top_slash + name
            statvalue = lstat(abspath)
            # 0xF000 keeps only the file-type bits of st_mode (it is the
            # same value as the octal literal 0170000).
            kind = kind_for_mode(statvalue.st_mode & 0xF000, 'unknown')
            dirblock.append((relprefix + name_utf8, name_utf8, kind,
                             statvalue, abspath))
        yield (relroot, top), dirblock

        # Directories are queued only after the consumer has been handed
        # dirblock, so whatever it left in the list decides what is walked.
        # They are pushed in reverse so that pop() visits them in sorted
        # order.
        for entry in reversed(dirblock):
            if entry[2] == directory_kind:
                todo.append(entry)

1226

1227

1228

def copy_tree(from_path, to_path, handlers=None):
    """Copy all of the entries in from_path into to_path.

    :param from_path: The base directory to copy.
    :param to_path: The target directory. If it does not exist, it will
        be created.
    :param handlers: An optional dictionary of functions, each of which
        takes a source and a destination path for files, directories, etc.
        It is keyed on the file kind, such as 'file', 'directory', or
        'symlink'.
        'file', 'directory', and 'symlink' should always exist.
        If they are missing, they will be replaced with 'shutil.copy2()',
        'os.mkdir()', and 'os.readlink() + os.symlink()', respectively.
        An entry whose kind has no handler at all raises KeyError.
    """
    # Now, just copy the existing cached tree to the new location
    # We use a cheap trick here.
    # Absolute paths are prefixed with the first parameter
    # relative paths are prefixed with the second.
    # So we can get both the source and target returned
    # without any extra work.

    def copy_dir(source, dest):
        """Create the destination directory (source is not consulted)."""
        os.mkdir(dest)

    def copy_link(source, dest):
        """Copy the contents of a symlink"""
        link_to = os.readlink(source)
        os.symlink(link_to, dest)

    real_handlers = {'file': shutil.copy2,
                     'symlink': copy_link,
                     'directory': copy_dir,
                     }
    # None (rather than a shared {} default) stands for "no overrides".
    if handlers is not None:
        real_handlers.update(handlers)

    if not os.path.exists(to_path):
        real_handlers['directory'](from_path, to_path)

    for dir_info, entries in walkdirs(from_path, prefix=to_path):
        for relpath, name, kind, st, abspath in entries:
            # abspath is the source entry, relpath is the matching target.
            real_handlers[kind](abspath, relpath)

1268

1269

1270

def path_prefix_key(path):
    """Build the prefix-order sort key for path.

    The key is the tuple (dirname(path), path). Sorting paths by this key
    orders them in the same way that walkdirs does.
    """
    parent = dirname(path)
    return (parent, path)

1276

1277

1278

def compare_paths_prefix_order(path_a, path_b):
    """Order path_a against path_b the same way walkdirs orders paths.

    :return: the cmp() result of the two paths' prefix-order keys.
    """
    return cmp(path_prefix_key(path_a), path_prefix_key(path_b))

1283

1284

1285

# Result of the last cached get_user_encoding() call; None until then.
_cached_user_encoding = None


def get_user_encoding(use_cache=True):
    """Work out the user's preferred text encoding.

    This is generally the encoding that is used for command line parameters
    and file contents. It may differ from both the terminal encoding and
    the filesystem encoding.

    If the locale cannot be determined, or it names an encoding that Python
    has no codec for, a warning is written to stderr and 'ascii' is used.

    :param use_cache: Enable cache for detected encoding.
        (This parameter is turned on by default,
        and required only for selftesting)

    :return: A string defining the preferred user encoding
    """
    global _cached_user_encoding
    if use_cache and _cached_user_encoding is not None:
        return _cached_user_encoding

    if sys.platform != 'darwin':
        import locale
    else:
        # work around egregious python 2.4 bug: import locale while
        # sys.platform temporarily reads 'posix', then put it back.
        sys.platform = 'posix'
        try:
            import locale
        finally:
            sys.platform = 'darwin'

    try:
        encoding = locale.getpreferredencoding()
    except locale.Error:
        # Fetch the exception via sys.exc_info() so the handler does not
        # depend on version-specific "except ..., name" syntax.
        err = sys.exc_info()[1]
        sys.stderr.write('bzr: warning: %s\n'
                         ' Could not determine what text encoding to use.\n'
                         ' This error usually means your Python interpreter\n'
                         ' doesn\'t support the locale set by $LANG (%s)\n'
                         " Continuing with ascii encoding.\n"
                         % (err, os.environ.get('LANG')))
        encoding = 'ascii'

    if encoding in (None, 'cp0'):
        # Windows returns 'cp0' to indicate there is no code page. So we'll
        # just treat that as ASCII, and not support printing unicode
        # characters to the console.
        encoding = 'ascii'
    else:
        # Make sure Python actually has a codec by this name.
        try:
            codecs.lookup(encoding)
        except LookupError:
            message = ('bzr: warning:'
                       ' unknown encoding %s.'
                       ' Continuing with ascii encoding.\n'
                       % encoding)
            sys.stderr.write(message)
            encoding = 'ascii'

    if use_cache:
        _cached_user_encoding = encoding

    return encoding

1347

1348

1349

def recv_all(socket, bytes):
    """Receive an exact number of bytes.

    A plain socket.recv() may return less than the requested number of
    bytes, depending on what's in the OS buffer. MSG_WAITALL is not
    available on all platforms, so recv() is simply called repeatedly until
    enough data has arrived. Less than the requested amount is returned if
    the remote end closes first.

    This isn't optimized and is intended mostly for use in testing.

    :param socket: An object providing recv(count).
    :param bytes: The number of bytes wanted.
    :return: The data received, at most ``bytes`` long.
    """
    received = ''
    remaining = bytes - len(received)
    while remaining > 0:
        chunk = socket.recv(remaining)
        if chunk == '':
            # eof: the other side has closed the connection
            break
        received += chunk
        remaining = bytes - len(received)
    return received

1366

1367

def dereference_path(path):
    """Find the real path that leads to a file.

    Every parent element of path is dereferenced, but the final element
    (the file itself) is left as it is.

    :param path: The original path. May be absolute or relative.
    :return: the real path *to* the file
    """
    parent, base = os.path.split(path)
    # Joining onto '.' first is a workaround for Python bug #1213894
    # (initial path components aren't dereferenced).
    real_parent = realpath(pathjoin('.', parent))
    return pathjoin(real_parent, base)

Older »