~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to notes/performance.txt

Committer: mbp at sourcefrog
Date: 2005-03-28 02:24:18 UTC
Revision ID: mbp@sourcefrog.net-20050328022418-9d37f56361aa18e9

doc: more on ignore patterns

files added:
bzrlib/tests.py

doc/faq.txt

doc/quickref.txt

doc/roadmap.txt

doc/testing.txt

doc/work-order.txt

files removed:
.rsyncexclude

HACKING

Makefile

TODO

bzr-man.py

bzrlib/atomicfile.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/intset.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/mdiff.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/meta_store.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/newinventory.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/selftest

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/plugins.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testdiff.py

bzrlib/selftest/testfetch.py

bzrlib/selftest/testgraph.py

bzrlib/selftest/testhashcache.py

bzrlib/selftest/testinv.py

bzrlib/selftest/testlog.py

bzrlib/selftest/testmerge.py

bzrlib/selftest/testmerge3.py

bzrlib/selftest/testrevision.py

bzrlib/selftest/testrevisionnamespaces.py

bzrlib/selftest/teststatus.py

bzrlib/selftest/teststore.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/textinv.py

bzrlib/ui.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/workingtree.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/quotes.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/split-join-files.txt

doc/switch-in-branch.txt

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/revfile.txt

notes/schemas.xml

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

testbzr

testsweet.py

tools

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/history2weaves.py

tools/http_client.py

tools/testweave.py

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files renamed:
bzrlib/util/elementtree/ => elementtree/

files modified:
.bzrignore

NEWS

README

build-api

bzrlib/__init__.py

bzrlib/add.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/osutils.py

bzrlib/revision.py

bzrlib/store.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/xml.py

doc/Makefile

doc/bitkeeper.txt

doc/formats.txt

doc/index.txt

doc/interrupted.txt

doc/merge.txt

doc/python.txt

doc/random.txt

doc/svk.txt

doc/tagging.txt

doc/todo-from-arch.txt

elementtree/ElementTree.py

notes/performance.txt

setup.py

Show diffs side-by-side

added added

removed removed

notes/performance.txt

269

2969 files changed, 372168 insertions(+), 153284 deletions(-)

270

271

I wonder why it is not exactly the same? Maybe because the python

272

diff algorithm is a bit different to GNU diff.

273

274

----

275

276

2005-03-29

277

278

full check, retrieving all file texts once for the 2.4 kernel branch

279

takes 10m elapsed, 1m cpu time. lots of random IO and seeking.

280

281

----

282

283

284

mbp@hope% time python =bzr deleted --show-ids

285

README README-fa1d8447b4fd0140-adbf4342752f0fc3

286

python =bzr deleted --show-ids 1.55s user 0.09s system 96% cpu 1.701 total

287

mbp@hope% time python -O =bzr deleted --show-ids

288

README README-fa1d8447b4fd0140-adbf4342752f0fc3

289

python -O =bzr deleted --show-ids 1.47s user 0.10s system 101% cpu 1.547 total

290

mbp@hope% time python -O =bzr deleted --show-ids

291

README README-fa1d8447b4fd0140-adbf4342752f0fc3

292

python -O =bzr deleted --show-ids 1.49s user 0.07s system 99% cpu 1.565 total

293

mbp@hope% time python =bzr deleted --show-ids

294

README README-fa1d8447b4fd0140-adbf4342752f0fc3

295

python =bzr deleted --show-ids 1.55s user 0.08s system 99% cpu 1.637 total

296

297

small but significant improvement from Python -O

298

299

----

300

301

Loading a large inventory through cElementTree is pretty quick; only

302

about 0.117s. By contrast reading the inventory into our data

303

structure takes about 0.7s.

304

305

So I think the problem must be in converting everything to

306

InventoryEntries and back again every time.

307

308

Thought about that way, it seems pretty inefficient: why create all

309

those objects when most of them aren't called on most invocations?

310

Instead perhaps the Inventory object should hold the ElementTree and

311

pull things out of it only as necessary? We can even have an index

312

pointing into the ElementTree by id, path, etc.

313

314

315

as of r148

316

317

bzr deleted 1.46s user 0.08s system 98% cpu 1.561 total

318

319

320

Alternatively maybe keep an id2path and path2id cache? Keeping it

321

coherent may be hard...

272

diff algorithm is a bit different to GNU diff.

\ No newline at end of file

Older »