~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/osutils.py

Committer: mbp at sourcefrog
Date: 2005-03-22 00:02:45 UTC
Revision ID: mbp@sourcefrog.net-20050322000245-a4bf0592e9f6c6c1

suggestions from robert about the inventory format

files added:
bzrlib/tests.py

doc/faq.txt

doc/quickref.txt

doc/roadmap.txt

doc/testing.txt

doc/work-order.txt

files removed:
.rsyncexclude

HACKING

Makefile

NEWS

TODO

bzr-man.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/changeset.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/mdiff.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/meta_store.py

bzrlib/missing.py

bzrlib/newinventory.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/plugins

bzrlib/plugins/__init__.py

bzrlib/plugins/checkperms

bzrlib/progress.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/selftest

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/plugins.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testdiff.py

bzrlib/selftest/testhashcache.py

bzrlib/selftest/testinv.py

bzrlib/selftest/testlog.py

bzrlib/selftest/testmerge3.py

bzrlib/selftest/testrevision.py

bzrlib/selftest/testrevisionnamespaces.py

bzrlib/selftest/teststatus.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/textinv.py

bzrlib/upgrade.py

bzrlib/util

bzrlib/util/__init__.py

bzrlib/util/effbot

bzrlib/util/effbot/__init__.py

bzrlib/util/effbot/org

bzrlib/util/effbot/org/__init__.py

bzrlib/util/effbot/org/gzip_consumer.py

bzrlib/util/effbot/org/http_client.py

bzrlib/util/effbot/org/http_manager.py

bzrlib/util/elementtree

bzrlib/util/elementtree/ElementTree.py

bzrlib/util/elementtree/__init__.py

bzrlib/util/urlgrabber

bzrlib/util/urlgrabber/__init__.py

bzrlib/util/urlgrabber/byterange.py

bzrlib/util/urlgrabber/grabber.py

bzrlib/util/urlgrabber/keepalive.py

bzrlib/util/urlgrabber/mirror.py

bzrlib/util/urlgrabber/progress.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/workingtree.py

contrib

contrib/add-bzr-to-baz

contrib/bash

contrib/bash/bzr

contrib/bash/bzr.simple

contrib/create_bzr_rollup.py

contrib/emacs

contrib/emacs/bzr-mode.el

contrib/fortune

contrib/pwclient.full

contrib/pwk

contrib/upload-bzr.dev

contrib/zsh

contrib/zsh/_bzr

doc/ignore.txt

doc/quotes.txt

doc/revfile-annotation.txt

doc/revfile.txt

doc/split-join-files.txt

doc/switch-in-branch.txt

notes/inventory-v2-sample.xml

notes/inventory-v2.rnc

notes/new-inventory-sample.xml

notes/revfile.txt

notes/schemas.xml

patches

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

testbzr

testsweet.py

tools

tools/convertfile.py

tools/convertinv.py

tools/history2revfiles.py

tools/history2weaves.py

tools/http_client.py

tools/testweave.py

tools/weavebench.py

tools/weavemerge.sh

tutorial.txt

files modified:
.bzrignore

README

build-api

bzrlib/__init__.py

bzrlib/branch.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/inventory.py

bzrlib/osutils.py

bzrlib/revision.py

bzrlib/store.py

bzrlib/textui.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/xml.py

doc/Makefile

doc/bitkeeper.txt

doc/darcs.txt

doc/formats.txt

doc/index.txt

doc/interrupted.txt

doc/merge.txt

doc/python.txt

doc/random.txt

doc/svk.txt

doc/tagging.txt

doc/todo-from-arch.txt

notes/performance.txt

setup.py

Show diffs side-by-side

added added

removed removed

bzrlib/osutils.py

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

import os, types, re, time, errno, sys

import os, types, re, time, types

from stat import S_ISREG, S_ISDIR, S_ISLNK, ST_MODE, ST_SIZE

from bzrlib.errors import BzrError

from bzrlib.trace import mutter

import bzrlib

from errors import bailout

def make_readonly(filename):

"""Make a filename read-only."""

os.chmod(filename, mod)

_QUOTE_RE = None

_QUOTE_RE = re.compile(r'([^a-zA-Z0-9.,:/_~-])')

def quotefn(f):

"""Return a quoted filename filename

This previously used backslash quoting, but that works poorly on

Windows."""

# TODO: I'm not really sure this is the best format either.

global _QUOTE_RE

if _QUOTE_RE == None:

_QUOTE_RE = re.compile(r'([^a-zA-Z0-9.,:/_~-])')

if _QUOTE_RE.search(f):

return '"' + f + '"'

else:

return f

"""Return shell-quoted filename"""

## We could be a bit more terse by using double-quotes etc

f = _QUOTE_RE.sub(r'\\\1', f)

if f[0] == '~':

f[0:1] = r'\~'

return f

def file_kind(f):

elif S_ISLNK(mode):

return 'symlink'

else:

raise BzrError("can't handle file kind with mode %o of %r" % (mode, f))

def kind_marker(kind):
    """Return the marker string for a file kind.

    'file' maps to the empty string, 'directory' to '/', and 'symlink'
    to '@'.  Any other kind raises BzrError.
    """
    if kind == 'file':
        return ''
    if kind == 'directory':
        return '/'
    if kind == 'symlink':
        return '@'
    raise BzrError('invalid file kind %r' % kind)

def backup_file(fn):
    """Copy a file to a backup.

    Backups are named in GNU-style, with a ~ suffix.

    If the file is already a backup (its name ends in ~), it's not
    copied and the function returns without doing anything.  The whole
    file is read into memory and then written to the backup name,
    replacing whatever was there.

    fn
        Path of the file to back up.

    Raises IOError if fn cannot be opened for reading or the backup
    cannot be opened for writing.
    """
    # endswith() rather than fn[-1]: an empty name then falls through to
    # open() and fails with an ordinary IOError instead of an IndexError.
    if fn.endswith('~'):
        return

    bfn = fn + '~'

    inf = open(fn, 'rb')
    try:
        content = inf.read()
    finally:
        inf.close()

    outf = open(bfn, 'wb')
    try:
        outf.write(content)
    finally:
        outf.close()

106

107

def rename(path_from, path_to):
    """Basically the same as os.rename() just special for win32.

    On win32 the destination is removed first, so that an existing
    path_to does not stop the rename; a destination that does not exist
    is not an error.  On every other platform this is a plain
    os.rename().

    path_from
        Existing path to rename.
    path_to
        New name; replaced if it already exists.

    Raises OSError if removing the old destination fails for any reason
    other than it being absent, or if os.rename() itself fails.
    """
    if sys.platform == 'win32':
        try:
            os.remove(path_to)
        except OSError:
            # ENOENT is a constant of the errno module, not an attribute
            # of the exception.  sys.exc_info() is used to fetch the
            # exception so the handler needs no version-specific syntax.
            if sys.exc_info()[1].errno != errno.ENOENT:
                raise
    os.rename(path_from, path_to)

116

117

bailout("can't handle file kind with mode %o of %r" % (mode, f))

118

119

120

135

return False

136

137

138

def is_inside(dir, fname):
    """Tell whether the path fname lies within the directory dir.

    Both arguments should normally have been run through
    os.path.normpath beforehand, so that '.', '..' and doubled slashes
    are gone and the separators are the platform's own.

    A path counts as being inside itself, and the empty string as dir
    stands for top-of-tree, which contains everything.

    >>> is_inside('src', 'src/foo.c')
    True
    >>> is_inside('src', 'srccontrol')
    False
    >>> is_inside('src', 'src/a/a/a/foo.c')
    True
    >>> is_inside('foo.c', 'foo.c')
    True
    >>> is_inside('foo.c', '')
    False
    >>> is_inside('', 'foo.c')
    True
    """
    # XXX: Most callers of this can actually do something smarter by
    # looking at the inventory
    if dir == '' or dir == fname:
        return True

    # Compare against dir with exactly one trailing separator so that
    # 'src' does not match 'srccontrol'.
    prefix = dir
    if not prefix.endswith(os.sep):
        prefix = prefix + os.sep
    return fname.startswith(prefix)

173

174

175

def is_inside_any(dir_list, fname):
    """Report whether fname is inside at least one of the given dirs.

    Each entry of dir_list is checked with is_inside(); the first match
    gives True, and False is returned when none match (including when
    dir_list is empty).
    """
    for candidate in dir_list:
        if is_inside(candidate, fname):
            return True
    return False

182

183

184

def pumpfile(fromfile, tofile):
    """Copy contents of one file to another.

    Data is moved in fixed-size chunks, from fromfile's current position
    to end-of-file, so that a large file is never held in memory all at
    once.  Neither object is closed.

    fromfile
        Object with a read(size) method.
    tofile
        Object with a write(data) method.
    """
    BUFSIZE = 32768
    while True:
        chunk = fromfile.read(BUFSIZE)
        if not chunk:
            break
        tofile.write(chunk)

188

189

def uuid():

190

"""Return a new UUID"""

191

try:

192

return file('/proc/sys/kernel/random/uuid').readline().rstrip('\n')

193

except IOError:

194

return chomp(os.popen('uuidgen').readline())

## XXX: Could alternatively read /proc/sys/kernel/random/uuid on

## Linux, but we need something portable for other systems;

## preferably an implementation in Python.

bailout('uuids not allowed!')

return chomp(os.popen('uuidgen').readline())

def chomp(s):
    """Return s without its final newline, if it ends in one.

    At most one trailing '\\n' is removed.  Empty (or otherwise false)
    values and strings without a trailing newline come back unchanged.
    """
    if not s or s[-1] != '\n':
        return s
    return s[:-1]

195

196

197

def sha_file(f):

198

100

import sha

101

## TODO: Maybe read in chunks to handle big files

199

102

if hasattr(f, 'tell'):

200

103

assert f.tell() == 0

201

104

s = sha.new()

202

BUFSIZE = 128<<10

203

while True:

204

b = f.read(BUFSIZE)

205

if not b:

206

break

207

s.update(b)

105

s.update(f.read())

208

106

return s.hexdigest()

209

107

210

108

216

114

217

115

218

116

219

def fingerprint_file(f):
    """Return the size and SHA-1 digest of what can be read from f.

    f is read in chunks from its current position to end-of-file, so
    large files are not loaded into memory in one piece.  f is not
    closed.

    f
        Object with a read(size) method.

    Returns a dict with two keys: 'size', the number of bytes read, and
    'sha1', their SHA-1 digest as a hex string.
    """
    try:
        from hashlib import sha1 as new_sha
    except ImportError:
        # Older Pythons have no hashlib; fall back to the sha module.
        from sha import new as new_sha

    s = new_sha()
    size = 0
    BUFSIZE = 128<<10
    while True:
        b = f.read(BUFSIZE)
        if not b:
            break
        s.update(b)
        size += len(b)
    return {'size': size,
            'sha1': s.hexdigest()}

227

228

229

def config_dir():
    """Return the per-user configuration directory.

    This is ~/.bzr.conf with the ~ expanded by os.path.expanduser.

    TODO: Global option --config-dir to override this.
    """
    location = "~/.bzr.conf"
    return os.path.expanduser(location)

237

238

239

def _auto_user_id():

240

"""Calculate automatic user identification.

241

242

Returns (realname, email).

243

244

Only used when none is set in the environment or the id file.

245

246

This previously used the FQDN as the default domain, but that can

247

be very slow on machines where DNS is broken. So now we simply

248

use the hostname.

249

"""

117

def username():

118

"""Return email-style username.

119

120

Something similar to 'Martin Pool <mbp@sourcefrog.net>'

121

122

:todo: Check it's reasonably well-formed.

123

124

:todo: Allow taking it from a dotfile to help people on windows

125

who can't easily set variables.

126

127

:todo: Cope without pwd module, which is only on unix.

128

"""

129

e = os.environ.get('BZREMAIL') or os.environ.get('EMAIL')

130

if e: return e

131

250

132

import socket

251

252

# XXX: Any good way to get real user name on win32?

253

133

254

134

try:

255

135

import pwd

256

136

uid = os.getuid()

257

137

w = pwd.getpwuid(uid)

258

gecos = w.pw_gecos.decode(bzrlib.user_encoding)

259

username = w.pw_name.decode(bzrlib.user_encoding)

138

gecos = w.pw_gecos

260

139

comma = gecos.find(',')

261

140

if comma == -1:

262

141

realname = gecos

263

142

else:

264

143

realname = gecos[:comma]

265

if not realname:

266

realname = username

267

144

return '%s <%s@%s>' % (realname, w.pw_name, socket.getfqdn())

268

145

except ImportError:

269

import getpass

270

realname = username = getpass.getuser().decode(bzrlib.user_encoding)

271

272

return realname, (username + '@' + socket.gethostname())

273

274

275

def _get_user_id(branch):
    """Return the full user id from a file or environment variable.

    e.g. "John Hacker <jhacker@foo.org>"

    branch
        A branch to use for a per-branch configuration, or None.

    The following are searched in order:

    1. $BZREMAIL
    2. .bzr/email for this branch.
    3. ~/.bzr.conf/email
    4. $EMAIL

    Values are decoded with bzrlib.user_encoding; values read from files
    have trailing CR/LF characters stripped.  Returns None if none of
    the sources supplies a value.

    Raises IOError if one of the files exists but cannot be read.
    """
    v = os.environ.get('BZREMAIL')
    if v:
        return v.decode(bzrlib.user_encoding)

    if branch:
        try:
            return (branch.controlfile("email", "r")
                    .read()
                    .decode(bzrlib.user_encoding)
                    .rstrip("\r\n"))
        except IOError:
            # A missing per-branch file just means "not configured
            # here"; anything else is a real error.
            if sys.exc_info()[1].errno != errno.ENOENT:
                raise
        except BzrError:
            # NOTE(review): presumably raised by controlfile() when the
            # branch cannot supply this file -- confirm; treated as
            # "not configured" and the search continues.
            pass

    try:
        f = open(os.path.join(config_dir(), "email"))
        try:
            return (f.read()
                    .decode(bzrlib.user_encoding)
                    .rstrip("\r\n"))
        finally:
            # Close explicitly rather than relying on garbage collection.
            f.close()
    except IOError:
        if sys.exc_info()[1].errno != errno.ENOENT:
            # Bare raise keeps the original traceback.
            raise

    v = os.environ.get('EMAIL')
    if v:
        return v.decode(bzrlib.user_encoding)
    else:
        return None

320

321

322

def username(branch):
    """Return an email-style username for the given branch.

    The result looks something like 'Martin Pool <mbp@sourcefrog.net>'.
    A value found by _get_user_id(branch) is returned as is; otherwise
    the name and address from _auto_user_id() are combined, or just the
    address is returned when no name is available.

    TODO: Check it's reasonably well-formed.
    """
    configured = _get_user_id(branch)
    if configured:
        return configured

    realname, address = _auto_user_id()
    if not realname:
        return address
    return '%s <%s>' % (realname, address)

338

339

340

def user_email(branch):

146

pass

147

148

import getpass, socket

149

return '<%s@%s>' % (getpass.getuser(), socket.getfqdn())

150

151

152

def user_email():

341

153

"""Return just the email component of a username."""

342

e = _get_user_id(branch)

154

e = os.environ.get('BZREMAIL') or os.environ.get('EMAIL')

343

155

if e:

156

import re

344

157

m = re.search(r'[\w+.-]+@[\w+.-]+', e)

345

158

if not m:

346

raise BzrError("%r doesn't seem to contain a reasonable email address" % e)

159

bailout('%r is not a reasonable email address' % e)

347

160

return m.group(0)

348

161

349

return _auto_user_id()[1]

162

163

import getpass, socket

164

return '%s@%s' % (getpass.getuser(), socket.getfqdn())

165

350

166

351

167

352

168

353

169

def compare_files(a, b):

354

170

"""Returns true if equal in contents"""

355

BUFSIZE = 4096

356

while True:

357

ai = a.read(BUFSIZE)

358

bi = b.read(BUFSIZE)

359

if ai != bi:

360

return False

361

if ai == '':

362

return True

171

# TODO: don't read the whole thing in one go.

172

result = a.read() == b.read()

173

return result

363

174

364

175

365

176

366

177

def local_time_offset(t=None):

367

178

"""Return offset of local zone from GMT, either at present or at time t."""

368

# python2.3 localtime() can't take None

369

if t == None:

370

t = time.time()

371

372

179

if time.localtime(t).tm_isdst and time.daylight:

373

180

return -time.altzone

374

181

else:

378

185

def format_date(t, offset=0, timezone='original'):

379

186

## TODO: Perhaps a global option to use either universal or local time?

380

187

## Or perhaps just let people set $TZ?

188

import time

189

381

190

assert isinstance(t, float)

382

191

383

192

if timezone == 'utc':

391

200

tt = time.localtime(t)

392

201

offset = local_time_offset(t)

393

202

else:

394

raise BzrError("unsupported timezone format %r" % timezone,

395

['options are "utc", "original", "local"'])

203

bailout("unsupported timezone format %r",

204

['options are "utc", "original", "local"'])

396

205

397

206

return (time.strftime("%a %Y-%m-%d %H:%M:%S", tt)

398

207

+ ' %+03d%02d' % (offset / 3600, (offset / 60) % 60))

410

219

411

220

if hasattr(os, 'urandom'): # python 2.4 and later

412

221

rand_bytes = os.urandom

413

elif sys.platform == 'linux2':

414

rand_bytes = file('/dev/urandom', 'rb').read

415

222

else:

416

# not well seeded, but better than nothing

417

def rand_bytes(n):

418

import random

419

s = ''

420

while n:

421

s += chr(random.randint(0, 255))

422

n -= 1

423

return s

223

# FIXME: No good on non-Linux

224

_rand_file = file('/dev/urandom', 'rb')

225

rand_bytes = _rand_file.read

424

226

425

227

426

228

## TODO: We could later have path objects that remember their list

440

242

>>> splitpath('a/../b')

441

243

Traceback (most recent call last):

442

244

...

443

BzrError: sorry, '..' not allowed in path

245

BzrError: ("sorry, '..' not allowed in path", [])

444

246

"""

445

247

assert isinstance(p, types.StringTypes)

446

447

# split on either delimiter because people might use either on

448

# Windows

449

ps = re.split(r'[\\/]', p)

450

451

rps = []

248

ps = [f for f in p.split('/') if f != '.']

452

249

for f in ps:

453

250

if f == '..':

454

raise BzrError("sorry, %r not allowed in path" % f)

455

elif (f == '.') or (f == ''):

456

pass

457

else:

458

rps.append(f)

459

return rps

251

bailout("sorry, %r not allowed in path" % f)

252

return ps

460

253

461

254

def joinpath(p):

462

255

assert isinstance(p, list)

463

256

for f in p:

464

if (f == '..') or (f == None) or (f == ''):

465

raise BzrError("sorry, %r not allowed in path" % f)

466

return os.path.join(*p)

257

if (f == '..') or (f is None) or (f == ''):

258

bailout("sorry, %r not allowed in path" % f)

259

return '/'.join(p)

467

260

468

261

469

262

def appendpath(p1, p2):

470

263

if p1 == '':

471

264

return p2

472

265

else:

473

return os.path.join(p1, p2)

266

return p1 + '/' + p2

474

267

475

268

476

269

def extern_command(cmd, ignore_errors = False):
    """Run an external command with os.system(), logging it first.

    cmd
        Command line handed to os.system().
    ignore_errors
        If true, a non-zero result from os.system() is ignored.

    Raises BzrError('command failed') when os.system() returns a
    non-zero value and ignore_errors is false.
    """
    # repr() is the spelled-out form of the old backquote syntax.
    mutter('external command: %s' % repr(cmd))
    # NOTE(review): os.system() passes cmd to the shell, so callers must
    # not build cmd from untrusted text.
    if os.system(cmd) and not ignore_errors:
        raise BzrError('command failed')

481

482

483

def _read_config_value(name):
    """Read a config value from the file ~/.bzr.conf/<name>

    The contents are decoded with bzrlib.user_encoding and trailing
    CR/LF characters are stripped.

    Return None if the file does not exist.  Any other IOError from
    opening the file is re-raised.
    """
    try:
        f = open(os.path.join(config_dir(), name), "r")
    except IOError:
        if sys.exc_info()[1].errno == errno.ENOENT:
            return None
        raise
    try:
        return f.read().decode(bzrlib.user_encoding).rstrip("\r\n")
    finally:
        # Close explicitly rather than relying on garbage collection.
        f.close()

493

494

495

def _get_editor():
    """Yield possible editor binaries for the current platform.

    Candidates are produced in order of preference:

    1. The value of the "editor" config file, if
       _read_config_value("editor") returns one.
    2. A platform default: "notepad.exe" on Windows; on posix the value
       of $EDITOR, or "/usr/bin/vi" when $EDITOR is not set.

    On any other platform only the configured value (if any) is yielded.
    """
    e = _read_config_value("editor")
    if e is not None:
        yield e

    # os.name is "nt" on Windows; it never has the value "windows".
    if os.name == "nt":
        yield "notepad.exe"
    elif os.name == "posix":
        try:
            yield os.environ["EDITOR"]
        except KeyError:
            yield "/usr/bin/vi"

508

509

510

def _run_editor(filename):
    """Try to execute an editor to edit the commit message.

    Each candidate from _get_editor() is started in turn with filename
    as its only argument, and waited for.

    filename
        Path of the file the editor should open.

    Returns True as soon as an editor exits with status 0.  This
    function never returns False: if no editor succeeds it raises
    BzrError instead.
    """
    for e in _get_editor():
        # NOTE(review): os.spawnvp is documented as unavailable on
        # Windows -- confirm how this is meant to work there.
        x = os.spawnvp(os.P_WAIT, e, (e, filename))
        if x == 0:
            return True
        elif x == 127:
            # presumably "could not be executed": try the next candidate
            continue
        else:
            # The editor ran but reported failure; stop searching.
            break
    raise BzrError("Could not start any editor. Please specify $EDITOR or use ~/.bzr.conf/editor")

523

524

525

def get_text_message(infotext, ignoreline = "default"):
    """Let the user write a text message in an editor and return it.

    A temporary file is created, optionally pre-filled with a separator
    line followed by infotext, and handed to _run_editor().  The file is
    always deleted afterwards.

    infotext
        Extra text shown to the user below the separator line.  If it is
        None or empty, nothing is written and no separator is looked for
        when reading the message back.
    ignoreline
        The separator line; "default" selects
        "-- This line and the following will be ignored --".

    Returns the message with leading and trailing blank lines removed
    and ending in a newline, or None if _run_editor() returns a false
    value or the message is empty.
    """
    import tempfile

    if ignoreline == "default":
        ignoreline = "-- This line and the following will be ignored --"

    # Create the file before entering the try block: if mkstemp() fails
    # there is nothing to clean up, and the finally clause below must
    # never see an unbound msgfilename.
    tmp_fileno, msgfilename = tempfile.mkstemp()
    try:
        os.close(tmp_fileno)
        if infotext is not None and infotext != "":
            hasinfo = True
            msgfile = open(msgfilename, "w")
            try:
                msgfile.write("\n\n%s\n\n%s" % (ignoreline, infotext))
            finally:
                msgfile.close()
        else:
            hasinfo = False

        if not _run_editor(msgfilename):
            return None

        started = False
        msg = []
        lastline, nlines = 0, 0
        msgfile = open(msgfilename, "r")
        try:
            for line in msgfile:
                stripped_line = line.strip()
                # strip empty line before the log message starts
                if not started:
                    if stripped_line != "":
                        started = True
                    else:
                        continue
                # check for the ignore line only if there
                # is additional information at the end
                if hasinfo and stripped_line == ignoreline:
                    break
                nlines += 1
                # keep track of the last line that had some content
                if stripped_line != "":
                    lastline = nlines
                msg.append(line)
        finally:
            msgfile.close()

        if not msg:
            return None
        # delete empty lines at the end
        del msg[lastline:]
        # add a newline at the end, if needed
        if not msg[-1].endswith("\n"):
            return "%s%s" % ("".join(msg), "\n")
        else:
            return "".join(msg)
    finally:
        # delete the msg file in any case; os.unlink() reports failure
        # with OSError, not IOError
        try:
            os.unlink(msgfilename)
        except OSError:
            pass

273

bailout('command failed')

274

Older »