~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/transport/http.py

Committer: Martin Pool
Date: 2005-10-13 03:23:22 UTC
mto: (1185.41.1 bzr.sftp) (1464.1.1) (1534.1.1 integration) (1495.1.4) (1505.1.16 bzr-bound-branch) (1508.1.15) (1526.1.3 run_tests_twice_for_i18n) (1540.1.3 bzr.dev (Main development branch)) (1685.1.1 bzr-encoding) (1553.5.1 bzr.dev (Main development branch)) (1608.2.1 bzr.mbp.escape-stores)
mto: This revision was merged to the branch mainline in revision 1454.
Revision ID: mbp@sourcefrog.net-20051013032322-dc469f4b81f8e7f9

Tags: bzr-0.1

- testament symlink support

- more testament tests

files added:
bzrlib/mdiff.py

bzrlib/revfile.py

bzrlib/store/compressed_text.py

patches/cache-remote-revisions.diff

patches/cache_weave_inclusions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

testbzr

files removed:
BRANCH.TODO

INSTALL

bzrlib/config.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/gpg.py

bzrlib/lsprof.py

bzrlib/option.py

bzrlib/rio.py

bzrlib/symbol_versioning.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/blackbox/test_upgrade.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_basis_inventory.py

bzrlib/tests/test_branch.py

bzrlib/tests/test_command.py

bzrlib/tests/test_config.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_http.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_remove.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_reweave.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transport_implementations.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/transport/ftp.py

bzrlib/transport/memory.py

bzrlib/transport/readonly.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/win32console.py

tools/biobench.py

tools/riodemo.py

tools/trace-revisions

files renamed:
bzr_man.py => bzr-man.py

bzrlib/conflicts.py => bzrlib/plugins/conflicts.py

bzrlib/tests/ => bzrlib/selftest/

bzrlib/tests/blackbox/test_too_much.py => bzrlib/selftest/blackbox.py

bzrlib/tests/test_plugins.py => bzrlib/selftest/plugins.py

bzrlib/tests/blackbox/test_revision_info.py => bzrlib/selftest/test_revision_info.py

bzrlib/tests/test_branch_implementations.py => bzrlib/selftest/testbranch.py

bzrlib/tests/test_diff.py => bzrlib/selftest/testdiff.py

bzrlib/tests/test_fetch.py => bzrlib/selftest/testfetch.py

bzrlib/tests/test_graph.py => bzrlib/selftest/testgraph.py

bzrlib/tests/test_hashcache.py => bzrlib/selftest/testhashcache.py

bzrlib/tests/test_identitymap.py => bzrlib/selftest/testidentitymap.py

bzrlib/tests/test_inv.py => bzrlib/selftest/testinv.py

bzrlib/tests/test_log.py => bzrlib/selftest/testlog.py

bzrlib/tests/test_merge.py => bzrlib/selftest/testmerge.py

bzrlib/tests/test_merge3.py => bzrlib/selftest/testmerge3.py

bzrlib/tests/test_revision.py => bzrlib/selftest/testrevision.py

bzrlib/tests/test_revisionnamespaces.py => bzrlib/selftest/testrevisionnamespaces.py

bzrlib/tests/test_sampler.py => bzrlib/selftest/testsampler.py

bzrlib/tests/test_status.py => bzrlib/selftest/teststatus.py

bzrlib/tests/test_store.py => bzrlib/selftest/teststore.py

bzrlib/tests/test_testament.py => bzrlib/selftest/testtestament.py

bzrlib/tests/test_transactions.py => bzrlib/selftest/testtransactions.py

bzrlib/tests/test_transport.py => bzrlib/selftest/testtransport.py

bzrlib/tests/test_workingtree.py => bzrlib/selftest/testworkingtree.py

bzrlib/tests/blackbox/test_versioning.py => bzrlib/selftest/versioning.py

bzrlib/tests/test_whitebox.py => bzrlib/selftest/whitebox.py

bzrlib/ui/__init__.py => bzrlib/ui.py

files modified:
.bzrignore

.rsyncexclude

HACKING

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/clone.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py *

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/selftest/HTTPTestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_bad_files.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_commit_merge.py

bzrlib/selftest/test_conflicts.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_upgrade.py

bzrlib/selftest/test_weave.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/treeshape.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/weave.py

bzrlib/testament.py

bzrlib/trace.py

bzrlib/transport/__init__.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/tree.py

bzrlib/upgrade.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/zsh/_bzr

doc/random.txt

setup.py *

tutorial.txt

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http.py

"""Implementation of Transport over http.

"""

from bzrlib.transport import Transport, register_transport

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

NonRelativePath, TransportError)

import os, errno

from cStringIO import StringIO

import urllib, urllib2

import urllib2

import urlparse

from warnings import warn

from bzrlib.transport import Transport, Server

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError)

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.branch import Branch

from bzrlib.trace import mutter

def extract_auth(url, password_manager):

"""

Extract auth parameters from an HTTP/HTTPS url and add them to the given

password manager. Return the url, minus those auth parameters (which

confuse urllib2).

"""

assert url.startswith('http://') or url.startswith('https://')

scheme, host = url.split('//', 1)

if '/' in host:

host, path = host.split('/', 1)

path = '/' + path

else:

path = ''

port = ''

if '@' in host:

auth, host = host.split('@', 1)

if ':' in auth:

username, password = auth.split(':', 1)

else:

username, password = auth, None

if ':' in host:

host, port = host.split(':', 1)

port = ':' + port

# FIXME: if password isn't given, should we ask for it?

if password is not None:

username = urllib.unquote(username)

password = urllib.unquote(password)

password_manager.add_password(None, host, username, password)

url = scheme + '//' + host + port + path

return url

# velocitynet.com.au transparently proxies connections and thereby

# breaks keep-alive -- sucks!

def get_url(url):

import urllib2

mutter("get_url %s" % url)

manager = urllib2.HTTPPasswordMgrWithDefaultRealm()

url = extract_auth(url, manager)

auth_handler = urllib2.HTTPBasicAuthHandler(manager)

opener = urllib2.build_opener(auth_handler)

url_f = opener.open(url)

url_f = urllib2.urlopen(url)

return url_f

class HttpTransportError(TransportError):

pass

class HttpTransport(Transport):

"""This is the transport agent for http:// access.

def __init__(self, base):

"""Set the base path where files will be stored."""

assert base.startswith('http://') or base.startswith('https://')

if base[-1] != '/':

base = base + '/'

super(HttpTransport, self).__init__(base)

# In the future we might actually connect to the remote host

# rather than using get_url

109

"""Return the full url to the given relative path.

110

This can be supplied with a string or a list

111

"""

112

assert isinstance(relpath, basestring)

113

if isinstance(relpath, basestring):

114

relpath_parts = relpath.split('/')

115

else:

116

# TODO: Don't call this with an array - no magic interfaces

117

relpath_parts = relpath[:]

118

if len(relpath_parts) > 1:

119

if relpath_parts[0] == '':

120

raise ValueError("path %r within branch %r seems to be absolute"

121

% (relpath, self._path))

122

if relpath_parts[-1] == '':

123

raise ValueError("path %r within branch %r seems to be a directory"

124

% (relpath, self._path))

relpath = [relpath]

125

basepath = self._path.split('/')

126

if len(basepath) > 0 and basepath[-1] == '':

127

basepath = basepath[:-1]

128

for p in relpath_parts:

for p in relpath:

129

if p == '..':

130

if len(basepath) == 0:

if len(basepath) < 0:

131

# In most filesystems, a request for the parent

132

# of root, just returns root.

133

continue

134

basepath.pop()

135

elif p == '.' or p == '':

if len(basepath) > 0:

basepath.pop()

elif p == '.':

136

continue # No-op

137

else:

138

basepath.append(p)

139

# Possibly, we could use urlparse.urljoin() here, but

140

100

# I'm concerned about when it chooses to strip the last

141

101

# portion of the path, and when it doesn't.

143

103

return urlparse.urlunparse((self._proto,

144

104

self._host, path, '', '', ''))

145

105

106

def relpath(self, abspath):

107

if not abspath.startswith(self.base):

108

raise NonRelativePath('path %r is not under base URL %r'

109

% (abspath, self.base))

110

pl = len(self.base)

111

return abspath[pl:].lstrip('/')

112

146

113

def has(self, relpath):

147

114

"""Does the target location exist?

148

115

154

121

cleaner if we just do an http HEAD request, and parse

155

122

the return code.

156

123

"""

157

path = relpath

158

124

try:

159

path = self.abspath(relpath)

160

f = get_url(path)

125

f = get_url(self.abspath(relpath))

161

126

# Without the read and then close()

162

127

# we tend to have busy sockets.

163

128

f.read()

164

129

f.close()

165

130

return True

166

except urllib2.URLError, e:

167

mutter('url error code: %s for has url: %r', e.code, path)

168

if e.code == 404:

169

return False

170

raise

131

except BzrError:

132

return False

133

except urllib2.URLError:

134

return False

171

135

except IOError, e:

172

mutter('io error: %s %s for has url: %r',

173

e.errno, errno.errorcode.get(e.errno), path)

174

136

if e.errno == errno.ENOENT:

175

137

return False

176

raise TransportError(orig_error=e)

138

raise HttpTransportError(orig_error=e)

177

139

178

140

def get(self, relpath, decode=False):

179

141

"""Get the file at the given relative path.

180

142

181

143

:param relpath: The relative path to the file

182

144

"""

183

path = relpath

184

145

try:

185

path = self.abspath(relpath)

186

return get_url(path)

187

except urllib2.HTTPError, e:

188

mutter('url error code: %s for has url: %r', e.code, path)

189

if e.code == 404:

190

raise NoSuchFile(path, extra=e)

191

raise

192

except (BzrError, IOError), e:

193

if hasattr(e, 'errno'):

194

mutter('io error: %s %s for has url: %r',

195

e.errno, errno.errorcode.get(e.errno), path)

196

if e.errno == errno.ENOENT:

197

raise NoSuchFile(path, extra=e)

198

raise ConnectionError(msg = "Error retrieving %s: %s"

146

return get_url(self.abspath(relpath))

147

except (BzrError, urllib2.URLError, IOError), e:

148

raise NoSuchFile(msg = "Error retrieving %s: %s"

199

149

% (self.abspath(relpath), str(e)),

200

150

orig_error=e)

201

151

202

def put(self, relpath, f, mode=None):

152

def get_partial(self, relpath, start, length=None):

153

"""Get just part of a file.

154

155

:param relpath: Path to the file, relative to base

156

:param start: The starting position to read from

157

:param length: The length to read. A length of None indicates

158

read to the end of the file.

159

:return: A file-like object containing at least the specified bytes.

160

Some implementations may return objects which can be read

161

past this length, but this is not guaranteed.

162

"""

163

# TODO: You can make specialized http requests for just

164

# a portion of the file. Figure out how to do that.

165

# For now, urllib2 returns files that cannot seek() so

166

# we just read bytes off the beginning, until we

167

# get to the point that we care about.

168

f = self.get(relpath)

169

# TODO: read in smaller chunks, in case things are

170

# buffered internally.

171

f.read(start)

172

return f

173

174

def put(self, relpath, f):

203

175

"""Copy the file-like or string object into the location.

204

176

205

177

:param relpath: Location to put the contents, relative to base.

207

179

"""

208

180

raise TransportNotPossible('http PUT not supported')

209

181

210

def mkdir(self, relpath, mode=None):

182

def mkdir(self, relpath):

211

183

"""Create a directory at the given path."""

212

184

raise TransportNotPossible('http does not support mkdir()')

213

185

214

def rmdir(self, relpath):

215

"""See Transport.rmdir."""

216

raise TransportNotPossible('http does not support rmdir()')

217

218

186

def append(self, relpath, f):

219

187

"""Append the text in the file-like object into the final

220

188

location.

225

193

"""Copy the item at rel_from to the location at rel_to"""

226

194

raise TransportNotPossible('http does not support copy()')

227

195

228

def copy_to(self, relpaths, other, mode=None, pb=None):

196

def copy_to(self, relpaths, other, pb=None):

229

197

"""Copy a set of entries from self into another Transport.

230

198

231

199

:param relpaths: A list/generator of entries to be copied.

239

207

if isinstance(other, HttpTransport):

240

208

raise TransportNotPossible('http cannot be the target of copy_to()')

241

209

else:

242

return super(HttpTransport, self).copy_to(relpaths, other, mode=mode, pb=pb)

210

return super(HttpTransport, self).copy_to(relpaths, other, pb=pb)

243

211

244

212

def move(self, rel_from, rel_to):

245

213

"""Move the item at rel_from to the location at rel_to"""

249

217

"""Delete the item at relpath"""

250

218

raise TransportNotPossible('http does not support delete()')

251

219

252

def is_readonly(self):

253

"""See Transport.is_readonly."""

254

return True

255

256

220

def listable(self):

257

221

"""See Transport.listable."""

258

222

return False

283

247

"""

284

248

raise TransportNotPossible('http does not support lock_write()')

285

249

286

287

#---------------- test server facilities ----------------

288

import BaseHTTPServer, SimpleHTTPServer, socket, time

289

import threading

290

291

292

class WebserverNotAvailable(Exception):

293

pass

294

295

296

class BadWebserverPath(ValueError):

297

def __str__(self):

298

return 'path %s is not in %s' % self.args

299

300

301

class TestingHTTPRequestHandler(SimpleHTTPServer.SimpleHTTPRequestHandler):

302

303

def log_message(self, format, *args):

304

self.server.test_case.log("webserver - %s - - [%s] %s",

305

self.address_string(),

306

self.log_date_time_string(),

307

format%args)

308

309

def handle_one_request(self):

310

"""Handle a single HTTP request.

311

312

You normally don't need to override this method; see the class

313

__doc__ string for information on how to handle specific HTTP

314

commands such as GET and POST.

315

316

"""

317

for i in xrange(1,11): # Don't try more than 10 times

318

try:

319

self.raw_requestline = self.rfile.readline()

320

except socket.error, e:

321

if e.args[0] in (errno.EAGAIN, errno.EWOULDBLOCK):

322

# omitted for now because some tests look at the log of

323

# the server and expect to see no errors. see recent

324

# email thread. -- mbp 20051021.

325

## self.log_message('EAGAIN (%d) while reading from raw_requestline' % i)

326

time.sleep(0.01)

327

continue

328

raise

329

else:

330

break

331

if not self.raw_requestline:

332

self.close_connection = 1

333

return

334

if not self.parse_request(): # An error code has been sent, just exit

335

return

336

mname = 'do_' + self.command

337

if not hasattr(self, mname):

338

self.send_error(501, "Unsupported method (%r)" % self.command)

339

return

340

method = getattr(self, mname)

341

method()

342

343

class TestingHTTPServer(BaseHTTPServer.HTTPServer):

344

def __init__(self, server_address, RequestHandlerClass, test_case):

345

BaseHTTPServer.HTTPServer.__init__(self, server_address,

346

RequestHandlerClass)

347

self.test_case = test_case

348

349

350

class HttpServer(Server):

351

"""A test server for http transports."""

352

353

_HTTP_PORTS = range(13000, 0x8000)

354

355

def _http_start(self):

356

httpd = None

357

for port in self._HTTP_PORTS:

358

try:

359

httpd = TestingHTTPServer(('localhost', port),

360

TestingHTTPRequestHandler,

361

self)

362

except socket.error, e:

363

if e.args[0] == errno.EADDRINUSE:

364

continue

365

print >>sys.stderr, "Cannot run webserver :-("

366

raise

367

else:

368

break

369

370

if httpd is None:

371

raise WebserverNotAvailable("Cannot run webserver :-( "

372

"no free ports in range %s..%s" %

373

(_HTTP_PORTS[0], _HTTP_PORTS[-1]))

374

375

self._http_base_url = 'http://localhost:%s/' % port

376

self._http_starting.release()

377

httpd.socket.settimeout(0.1)

378

379

while self._http_running:

380

try:

381

httpd.handle_request()

382

except socket.timeout:

383

pass

384

385

def _get_remote_url(self, path):

386

path_parts = path.split(os.path.sep)

387

if os.path.isabs(path):

388

if path_parts[:len(self._local_path_parts)] != \

389

self._local_path_parts:

390

raise BadWebserverPath(path, self.test_dir)

391

remote_path = '/'.join(path_parts[len(self._local_path_parts):])

392

else:

393

remote_path = '/'.join(path_parts)

394

395

self._http_starting.acquire()

396

self._http_starting.release()

397

return self._http_base_url + remote_path

398

399

def log(self, *args, **kwargs):

400

"""Capture Server log output."""

401

self.logs.append(args[3])

402

403

def setUp(self):

404

"""See bzrlib.transport.Server.setUp."""

405

self._home_dir = os.getcwdu()

406

self._local_path_parts = self._home_dir.split(os.path.sep)

407

self._http_starting = threading.Lock()

408

self._http_starting.acquire()

409

self._http_running = True

410

self._http_base_url = None

411

self._http_thread = threading.Thread(target=self._http_start)

412

self._http_thread.setDaemon(True)

413

self._http_thread.start()

414

self._http_proxy = os.environ.get("http_proxy")

415

if self._http_proxy is not None:

416

del os.environ["http_proxy"]

417

self.logs = []

418

419

def tearDown(self):

420

"""See bzrlib.transport.Server.tearDown."""

421

self._http_running = False

422

self._http_thread.join()

423

if self._http_proxy is not None:

424

import os

425

os.environ["http_proxy"] = self._http_proxy

426

427

def get_url(self):

428

"""See bzrlib.transport.Server.get_url."""

429

return self._get_remote_url(self._home_dir)

430

431

def get_bogus_url(self):

432

"""See bzrlib.transport.Server.get_bogus_url."""

433

return 'http://jasldkjsalkdjalksjdkljasd'

434

435

436

def get_test_permutations():

437

"""Return the permutations to be used in testing."""

438

warn("There are no HTTPS transport provider tests yet.")

439

return [(HttpTransport, HttpServer),

440

]

250

register_transport('http://', HttpTransport)

251

register_transport('https://', HttpTransport)

Older »