~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/merge.py

Committer: Martin Pool
Date: 2005-09-30 05:15:03 UTC
mto: (1185.14.2)
mto: This revision was merged to the branch mainline in revision 1396.
Revision ID: mbp@sourcefrog.net-20050930051503-9c049325215ddd1c

- fix up Branch.open_downlevel for Transport

files added:
HACKING

Makefile

NEWS.developers

bzr-man.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/clone.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/intset.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/meta_store.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/progress.py

bzrlib/revisionspec.py

bzrlib/selftest

bzrlib/selftest/HTTPTestUtil.py

bzrlib/selftest/TestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/plugins.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_bad_files.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_commit_merge.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_revision_info.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_weave.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testdiff.py

bzrlib/selftest/testfetch.py

bzrlib/selftest/testgraph.py

bzrlib/selftest/testhashcache.py

bzrlib/selftest/testinv.py

bzrlib/selftest/testlog.py

bzrlib/selftest/testmerge.py

bzrlib/selftest/testmerge3.py

bzrlib/selftest/testrevision.py

bzrlib/selftest/testrevisionnamespaces.py

bzrlib/selftest/teststatus.py

bzrlib/selftest/teststore.py

bzrlib/selftest/testtransport.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store

bzrlib/store/compressed_text.py

bzrlib/store/text.py

bzrlib/store/weave.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/ui.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/add-bzr-to-baz

contrib/bash/bzr

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

doc/revfile-annotation.txt

doc/split-join-files.txt

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/revfile.txt

notes/schemas.xml

patches

patches/cache-remote-revisions.diff

patches/cache_weave_inclusions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/symlink-support.patch

tools

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/http_client.py

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files removed:
bzrlib/remotebranch.py

bzrlib/tests.py

doc/faq.txt

doc/quickref.txt

test.sh

files renamed:
bzrlib/store.py => bzrlib/store/__init__.py

elementtree/ => bzrlib/util/elementtree/

urlgrabber/ => bzrlib/util/urlgrabber/

contrib/bash/bzr => contrib/bash/bzr.simple

bzrlib/newinventory.py => contrib/newinventory.py

files modified:
.bzrignore

.rsyncexclude

NEWS

README

TODO

build-api

bzrlib/__init__.py

bzrlib/add.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/mdiff.py

bzrlib/osutils.py

bzrlib/revfile.py

bzrlib/revision.py

bzrlib/textinv.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/xml.py

contrib/zsh/_bzr

doc/formats.txt

doc/index.txt

doc/revfile.txt

doc/tagging.txt

doc/todo-from-arch.txt

setup.py

testbzr

Show diffs side-by-side

added added

removed removed

bzrlib/merge.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

import os

import tempfile

import shutil

import errno

import bzrlib.osutils

import bzrlib.revision

from bzrlib.merge_core import merge_flex, ApplyMerge3, BackupBeforeChange

from bzrlib.changeset import generate_changeset, ExceptionConflictHandler

from bzrlib.changeset import Inventory, Diff3Merge

from bzrlib.branch import Branch

from bzrlib.errors import BzrCommandError, UnrelatedBranches, NoCommonAncestor

from bzrlib.errors import NoCommits

from bzrlib.delta import compare_trees

from bzrlib.trace import mutter, warning

from bzrlib.fetch import greedy_fetch, fetch

from bzrlib.revision import is_ancestor

from bzrlib.osutils import rename

from bzrlib.revision import common_ancestor, MultipleRevisionSources

from bzrlib.errors import NoSuchRevision

# TODO: build_working_dir can be built on something simpler than merge()

# FIXME: merge() parameters seem oriented towards the command line

# comments from abentley on irc: merge happens in two stages, each

# of which generates a changeset object

# stage 1: generate OLD->OTHER,

# stage 2: use MINE and OLD->OTHER to generate MINE -> RESULT

class MergeConflictHandler(ExceptionConflictHandler):

"""Handle conflicts encountered while merging.

This subclasses ExceptionConflictHandler, so that any types of

conflict that are not explicitly handled cause an exception and

terminate the merge.

"""

def __init__(self, ignore_zero=False):

ExceptionConflictHandler.__init__(self)

self.conflicts = 0

self.ignore_zero = ignore_zero

def copy(self, source, dest):

"""Copy the text and mode of a file

:param source: The path of the file to copy

:param dest: The distination file to create

"""

s_file = file(source, "rb")

d_file = file(dest, "wb")

for line in s_file:

d_file.write(line)

os.chmod(dest, 0777 & os.stat(source).st_mode)

def dump(self, lines, dest):

"""Copy the text and mode of a file

:param source: The path of the file to copy

:param dest: The distination file to create

"""

d_file = file(dest, "wb")

for line in lines:

d_file.write(line)

def add_suffix(self, name, suffix, last_new_name=None):

"""Rename a file to append a suffix. If the new name exists, the

suffix is added repeatedly until a non-existant name is found

:param name: The path of the file

:param suffix: The suffix to append

:param last_new_name: (used for recursive calls) the last name tried

"""

if last_new_name is None:

last_new_name = name

new_name = last_new_name+suffix

try:

rename(name, new_name)

return new_name

except OSError, e:

if e.errno != errno.EEXIST and e.errno != errno.ENOTEMPTY:

raise

return self.add_suffix(name, suffix, last_new_name=new_name)

100

def conflict(self, text):

101

warning(text)

102

self.conflicts += 1

103

104

105

def merge_conflict(self, new_file, this_path, base_lines, other_lines):

106

"""

107

Handle diff3 conflicts by producing a .THIS, .BASE and .OTHER. The

108

main file will be a version with diff3 conflicts.

109

:param new_file: Path to the output file with diff3 markers

110

:param this_path: Path to the file text for the THIS tree

111

:param base_path: Path to the file text for the BASE tree

112

:param other_path: Path to the file text for the OTHER tree

113

"""

114

self.add_suffix(this_path, ".THIS")

115

self.dump(base_lines, this_path+".BASE")

116

self.dump(other_lines, this_path+".OTHER")

117

rename(new_file, this_path)

118

self.conflict("Diff3 conflict encountered in %s" % this_path)

119

120

def new_contents_conflict(self, filename, other_contents):

121

"""Conflicting contents for newly added file."""

122

self.copy(other_contents, filename + ".OTHER")

123

self.conflict("Conflict in newly added file %s" % filename)

124

125

126

def target_exists(self, entry, target, old_path):

127

"""Handle the case when the target file or dir exists"""

128

moved_path = self.add_suffix(target, ".moved")

129

self.conflict("Moved existing %s to %s" % (target, moved_path))

130

131

def rmdir_non_empty(self, filename):

132

"""Handle the case where the dir to be removed still has contents"""

133

self.conflict("Directory %s not removed because it is not empty"\

134

% filename)

135

return "skip"

136

137

def finalize(self):

138

if not self.ignore_zero:

139

print "%d conflicts encountered.\n" % self.conflicts

140

141

def get_tree(treespec, temp_root, label, local_branch=None):
    """Open the branch named by treespec and wrap the requested tree.

    :param treespec: A (location, revno) pair.  A revno of None selects
        the working tree, -1 the branch's last revision, and any other
        value is looked up with branch.get_rev_id()
    :param temp_root: Directory under which the tree's scratch dir is made
    :param label: Name of the scratch dir inside temp_root
    :param local_branch: Passed through to get_revid_tree()
    :return: A (branch, MergeTree) pair
    """
    location, revno = treespec
    branch = Branch.open_containing(location)
    revision_id = None
    if revno is not None:
        if revno == -1:
            revision_id = branch.last_revision()
        else:
            revision_id = branch.get_rev_id(revno)
    wrapped = get_revid_tree(branch, revision_id, temp_root, label,
                             local_branch)
    return branch, wrapped

152

153

def get_revid_tree(branch, revision, temp_root, label, local_branch):
    """Build a MergeTree for one revision (or the working tree) of a branch.

    :param branch: The branch that owns the revision
    :param revision: A revision id, or None for branch's working tree
    :param temp_root: Directory in which a scratch dir named label is made
    :param label: Name of the scratch dir
    :param local_branch: If not None, the revision is first fetched into
        this branch with greedy_fetch() and the tree is read from it
    :return: A MergeTree wrapping the selected tree
    """
    if revision is None:
        selected = branch.working_tree()
    elif local_branch is None:
        selected = branch.revision_tree(revision)
    else:
        greedy_fetch(local_branch, branch, revision)
        selected = local_branch.revision_tree(revision)
    scratch = os.path.join(temp_root, label)
    os.mkdir(scratch)
    return MergeTree(selected, scratch)

165

166

167

def file_exists(tree, file_id):
    """Return tree.has_filename() for the path that tree maps file_id to."""
    path = tree.id2path(file_id)
    return tree.has_filename(path)

169

170

171

class MergeTree(object):
    """Wrap a tree for merging and hand out filesystem paths for its files.

    Most methods simply delegate to the wrapped tree.  readonly_path()
    returns the tree's own path when the tree has a basedir; otherwise it
    writes the file text into <tempdir>/texts and returns that copy.
    """

    def __init__(self, tree, tempdir):
        """
        :param tree: The tree to wrap
        :param tempdir: An existing scratch directory; a "texts"
            subdirectory is created inside it
        """
        object.__init__(self)
        # root stays None for trees that have no basedir attribute.
        self.root = getattr(tree, "basedir", None)
        self.tree = tree
        self.tempdir = tempdir
        os.mkdir(os.path.join(self.tempdir, "texts"))
        # file id -> path of the copy already written under tempdir/texts
        self.cached = {}

    def __iter__(self):
        return self.tree.__iter__()

    def __contains__(self, file_id):
        return file_id in self.tree

    def get_file(self, file_id):
        return self.tree.get_file(file_id)

    def get_file_sha1(self, id):
        return self.tree.get_file_sha1(id)

    def id2path(self, file_id):
        return self.tree.id2path(file_id)

    def has_id(self, file_id):
        return self.tree.has_id(file_id)

    def has_or_had_id(self, file_id):
        """Return True for the inventory root id or any id in the inventory."""
        if file_id == self.tree.inventory.root.file_id:
            return True
        return self.tree.inventory.has_id(file_id)

    def readonly_path(self, id):
        """Return a filesystem path holding the content of file id.

        :param id: The file id to look up
        :return: None if id is not in the tree.  If the tree has a basedir,
            the tree's own absolute path for the file.  Otherwise the
            scratch directory itself for directories, or the path of a
            copy of the file text written (once) under tempdir/texts.
        """
        if id not in self.tree:
            return None
        if self.root is not None:
            return self.tree.abspath(self.tree.id2path(id))
        if self.tree.inventory[id].kind in ("directory", "root_directory"):
            return self.tempdir
        if id not in self.cached:
            path = os.path.join(self.tempdir, "texts", id)
            outfile = open(path, "wb")
            try:
                outfile.write(self.tree.get_file(id).read())
            finally:
                # Close before handing out the path so the text is fully
                # on disk when the caller reads it.
                outfile.close()
            self.cached[id] = path
        return self.cached[id]

226

227

228

def build_working_dir(to_dir):
    """Populate the working files of a branch that has none yet.

    to_dir must hold branch metadata but no working files, which is
    typically what cloning an existing branch leaves behind.

    This is implemented as a special case of merge(): the branch's last
    revision (revno -1) is merged against revno 0 of the same branch,
    with the clean-tree check disabled and the zero-conflict message
    suppressed.  It could eventually be replaced by lower-level code
    that builds the tree directly (e.g. by constructing a changeset).
    """
    newest = (to_dir, -1)
    origin = (to_dir, 0)
    merge(newest, origin, this_dir=to_dir,
          check_clean=False, ignore_zero=True)

240

241

242

def merge(other_revision, base_revision,
          check_clean=True, ignore_zero=False,
          this_dir=None, backup_files=False, merge_type=ApplyMerge3,
          file_list=None):
    """Merge changes into a tree.

    base_revision
        (path, revision) pair: base for three-way merge.  A pair of
        (None, None) -- given as a list or a tuple -- means "use the
        common ancestor of this branch and other_revision".
    other_revision
        (path, revision) pair: other revision for three-way merge.
        A revision of -1 means the branch's last revision; None means
        its working tree.
    this_dir
        Directory to merge changes into; '.' by default.
    check_clean
        If true, this_dir must have no uncommitted changes before the
        merge begins.
    ignore_zero - If true, suppress the "zero conflicts" message when
        there are no conflicts; should be set when doing something we expect
        to complete perfectly.
    backup_files
        Passed to merge_inner(); if true each contents change is wrapped
        in BackupBeforeChange.
    merge_type
        Callable invoked as merge_type(file_id, base, other) to build the
        contents change for a file.
    file_list
        If not None, only files with these names (looked up in the this,
        base and other trees) are merged.

    All available ancestors of other_revision and base_revision are
    automatically pulled into the branch.

    Raises BzrCommandError if this branch has no commits, if check_clean
    finds uncommitted changes, or if a name in file_list is in none of
    the trees; NoCommits if the other branch has no commits;
    UnrelatedBranches if no common ancestor can be found.
    """
    tempdir = tempfile.mkdtemp(prefix="bzr-")
    try:
        if this_dir is None:
            this_dir = '.'
        this_branch = Branch.open_containing(this_dir)
        this_rev_id = this_branch.last_revision()
        if this_rev_id is None:
            raise BzrCommandError("This branch has no commits")
        if check_clean:
            changes = compare_trees(this_branch.working_tree(),
                                    this_branch.basis_tree(), False)
            if changes.has_changed():
                raise BzrCommandError("Working tree has uncommitted changes.")
        other_branch, other_tree = get_tree(other_revision, tempdir, "other",
                                            this_branch)
        # other_rev_id is the revision recorded as a pending merge (None
        # when merging a working tree); other_basis is the revision used
        # to look for a common ancestor.
        if other_revision[1] == -1:
            other_rev_id = other_branch.last_revision()
            if other_rev_id is None:
                raise NoCommits(other_branch)
            other_basis = other_rev_id
        elif other_revision[1] is not None:
            other_rev_id = other_branch.get_rev_id(other_revision[1])
            other_basis = other_rev_id
        else:
            other_rev_id = None
            other_basis = other_branch.last_revision()
            if other_basis is None:
                raise NoCommits(other_branch)
        # Compare as a list so that both [None, None] and (None, None)
        # select the automatic base; a tuple never equals a list.
        if list(base_revision) == [None, None]:
            try:
                base_rev_id = common_ancestor(this_rev_id, other_basis,
                                              this_branch)
            except NoCommonAncestor:
                raise UnrelatedBranches()
            base_tree = get_revid_tree(this_branch, base_rev_id, tempdir,
                                       "base", None)
            base_is_ancestor = True
        else:
            base_branch, base_tree = get_tree(base_revision, tempdir, "base")
            if base_revision[1] == -1:
                base_rev_id = base_branch.last_revision()
            elif base_revision[1] is None:
                base_rev_id = None
            else:
                base_rev_id = base_branch.get_rev_id(base_revision[1])
            fetch(from_branch=base_branch, to_branch=this_branch)
            base_is_ancestor = is_ancestor(this_rev_id, base_rev_id,
                                           this_branch)
        if file_list is None:
            interesting_ids = None
        else:
            interesting_ids = set()
            this_tree = this_branch.working_tree()
            for fname in file_list:
                path = this_branch.relpath(fname)
                found_id = False
                # A path may map to different ids in different trees;
                # collect every one of them.
                for tree in (this_tree, base_tree.tree, other_tree.tree):
                    file_id = tree.inventory.path2id(path)
                    if file_id is not None:
                        interesting_ids.add(file_id)
                        found_id = True
                if not found_id:
                    raise BzrCommandError("%s is not a source file in any"
                                          " tree." % fname)
        merge_inner(this_branch, other_tree, base_tree, tempdir,
                    ignore_zero=ignore_zero, backup_files=backup_files,
                    merge_type=merge_type, interesting_ids=interesting_ids)
        # Record the merge only when the base is an ancestor of this
        # branch and the other revision is not already in its history.
        if (base_is_ancestor and other_rev_id is not None
                and other_rev_id not in this_branch.revision_history()):
            this_branch.add_pending_merge(other_rev_id)
    finally:
        shutil.rmtree(tempdir)

336

337

338

def set_interesting(inventory_a, inventory_b, interesting_ids):
    """Set the interesting flag on every entry of both inventories.

    An entry's flag is True when its id is in interesting_ids and False
    otherwise.
    """
    for inv in (inventory_a, inventory_b):
        for _path, entry in inv.iteritems():
            if entry.id in interesting_ids:
                entry.interesting = True
            else:
                entry.interesting = False

344

345

346

def generate_cset_optimized(tree_a, tree_b, interesting_ids=None):
    """Build a changeset between two trees with metadata changes removed.

    interesting_ids is handed straight to generate_changeset(); when it is
    supplied, only changes to those files will be shown.  Every entry of
    the resulting changeset has its metadata_change reset to None.
    """
    changeset = generate_changeset(tree_a, tree_b, interesting_ids)
    for cset_entry in changeset.entries.itervalues():
        cset_entry.metadata_change = None
    return changeset

354

355

356

def merge_inner(this_branch, other_tree, base_tree, tempdir,
                ignore_zero=False, merge_type=ApplyMerge3, backup_files=False,
                interesting_ids=None):
    """Run merge_flex() on this_branch's working tree and update its inventory.

    :param this_branch: Branch whose working tree receives the changes
    :param other_tree: MergeTree for the OTHER side
    :param base_tree: MergeTree for the BASE side
    :param tempdir: Scratch directory; a "this" subdirectory is created in it
    :param ignore_zero: Passed to MergeConflictHandler
    :param merge_type: Called as merge_type(file_id, base, other) to build
        each contents change
    :param backup_files: If true, each contents change is wrapped in
        BackupBeforeChange
    :param interesting_ids: Passed through to merge_flex()
    """
    def _make_contents_change(file_id, base, other):
        change = merge_type(file_id, base, other)
        if not backup_files:
            return change
        return BackupBeforeChange(change)

    this_tree = get_tree((this_branch.base, None), tempdir, "this")[1]

    def _inventory_of(merge_tree):
        return merge_tree.tree.inventory

    conflict_handler = MergeConflictHandler(ignore_zero=ignore_zero)
    inv_changes = merge_flex(this_tree, base_tree, other_tree,
                             generate_cset_optimized, _inventory_of,
                             conflict_handler,
                             merge_factory=_make_contents_change,
                             interesting_ids=interesting_ids)

    # merge_flex reports paths as '.' or './<path>'; regen_inventory wants
    # them without that prefix.  A path of None is passed on unchanged.
    pending = []
    for file_id, path in inv_changes.iteritems():
        if path is not None:
            if path == '.':
                path = ''
            else:
                assert path.startswith('.' + os.sep), "path is %s" % path
                path = path[2:]
        pending.append((path, file_id))
    if pending:
        updated = regen_inventory(this_branch, this_tree.root, pending)
        this_branch.set_inventory(updated)

389

390

391

def regen_inventory(this_branch, root, new_entries):
    """Compute the working inventory that results from applying new_entries.

    :param this_branch: Branch whose read_working_inventory() supplies the
        existing entries
    :param root: Directory that the new paths are joined to when asking
        bzrlib.osutils.file_kind() for their kind
    :param new_entries: Sequence of (path, file_id) pairs; a path of None
        removes file_id from the inventory
    :return: A sorted list of (path, file_id, parent_id, kind) tuples
    """
    old_entries = this_branch.read_working_inventory()
    new_inventory = {}
    by_path = {}
    # file_id -> new path, for every entry that is not a deletion
    new_entries_map = {}
    for path, file_id in new_entries:
        if path is None:
            continue
        new_entries_map[file_id] = path

    def id2path(file_id):
        # A path given in new_entries wins; otherwise rebuild the path from
        # the old entry's name and its parent's (possibly changed) path.
        path = new_entries_map.get(file_id)
        if path is not None:
            return path
        entry = old_entries[file_id]
        if entry.parent_id is None:
            return entry.name
        return os.path.join(id2path(entry.parent_id), entry.name)

    # Start from every existing entry, at its recomputed path.
    for file_id in old_entries:
        entry = old_entries[file_id]
        path = id2path(file_id)
        new_inventory[file_id] = (path, file_id, entry.parent_id, entry.kind)
        by_path[path] = file_id

    deletions = 0
    insertions = 0
    new_path_list = []
    for path, file_id in new_entries:
        if path is None:
            del new_inventory[file_id]
            deletions += 1
        else:
            new_path_list.append((path, file_id))
            if file_id not in old_entries:
                insertions += 1
    # Ensure no file is added before its parent
    new_path_list.sort()
    for path, file_id in new_path_list:
        if path == '':
            parent = None
        else:
            # The parent directory must already be known, either from the
            # old inventory or from an earlier (shorter) path in this loop.
            parent = by_path[os.path.dirname(path)]
        kind = bzrlib.osutils.file_kind(os.path.join(root, path))
        new_inventory[file_id] = (path, file_id, parent, kind)
        by_path[path] = file_id

    # Flatten to a list; it is sorted below, after the sanity check
    new_inventory_list = new_inventory.values()
    mutter ("""Inventory regeneration:
old length: %i insertions: %i deletions: %i new_length: %i"""\
        % (len(old_entries), insertions, deletions, len(new_inventory_list)))
    assert len(new_inventory_list) == len(old_entries) + insertions - deletions
    new_inventory_list.sort()
    return new_inventory_list

446

447

# Available merge implementations, keyed by name.  Each value is a
# (merge class, human-readable description) pair.
merge_types = { "merge3": (ApplyMerge3, "Native diff3-style merge"),
                "diff3": (Diff3Merge, "Merge using external diff3")
              }

450

Older »