~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/transport/http.py

Committer: Robert Collins
Date: 2005-10-06 22:15:52 UTC
mfrom: (1185.13.2)
mto: This revision was merged to the branch mainline in revision 1420.
Revision ID: robertc@robertcollins.net-20051006221552-9b15c96fa504e0ad

merge from upstream

files added:
bzrlib/mdiff.py

bzrlib/revfile.py

bzrlib/store/compressed_text.py

patches/cache-remote-revisions.diff

patches/cache_weave_inclusions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

testbzr

files removed:
BRANCH.TODO

INSTALL

bzrlib/config.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/gpg.py

bzrlib/identitymap.py

bzrlib/lsprof.py

bzrlib/option.py

bzrlib/rio.py

bzrlib/testament.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_bound_branches.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_basis_inventory.py

bzrlib/tests/test_bound_sftp.py

bzrlib/tests/test_command.py

bzrlib/tests/test_config.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_remove.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_reweave.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/transactions.py

bzrlib/transport/ftp.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/win32console.py

tools/biobench.py

tools/riodemo.py

tools/trace-revisions

files renamed:
bzr_man.py => bzr-man.py

bzrlib/conflicts.py => bzrlib/plugins/conflicts.py

bzrlib/tests/ => bzrlib/selftest/

bzrlib/tests/blackbox/test_too_much.py => bzrlib/selftest/blackbox.py

bzrlib/tests/test_plugins.py => bzrlib/selftest/plugins.py

bzrlib/tests/blackbox/test_revision_info.py => bzrlib/selftest/test_revision_info.py

bzrlib/tests/test_branch.py => bzrlib/selftest/testbranch.py

bzrlib/tests/test_diff.py => bzrlib/selftest/testdiff.py

bzrlib/tests/test_fetch.py => bzrlib/selftest/testfetch.py

bzrlib/tests/test_graph.py => bzrlib/selftest/testgraph.py

bzrlib/tests/test_hashcache.py => bzrlib/selftest/testhashcache.py

bzrlib/tests/test_inv.py => bzrlib/selftest/testinv.py

bzrlib/tests/test_log.py => bzrlib/selftest/testlog.py

bzrlib/tests/test_merge.py => bzrlib/selftest/testmerge.py

bzrlib/tests/test_merge3.py => bzrlib/selftest/testmerge3.py

bzrlib/tests/test_revision.py => bzrlib/selftest/testrevision.py

bzrlib/tests/test_revisionnamespaces.py => bzrlib/selftest/testrevisionnamespaces.py

bzrlib/tests/test_sampler.py => bzrlib/selftest/testsampler.py

bzrlib/tests/test_status.py => bzrlib/selftest/teststatus.py

bzrlib/tests/test_store.py => bzrlib/selftest/teststore.py

bzrlib/tests/test_transport.py => bzrlib/selftest/testtransport.py

bzrlib/tests/test_workingtree.py => bzrlib/selftest/testworkingtree.py

bzrlib/tests/blackbox/test_versioning.py => bzrlib/selftest/versioning.py

bzrlib/tests/test_whitebox.py => bzrlib/selftest/whitebox.py

bzrlib/ui/__init__.py => bzrlib/ui.py

files modified:
.bzrignore

.rsyncexclude

HACKING

Makefile

NEWS

NEWS.developers

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/annotate.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/clone.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py *

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/revisionspec.py

bzrlib/selftest/HTTPTestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_bad_files.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_commit_merge.py

bzrlib/selftest/test_conflicts.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_upgrade.py

bzrlib/selftest/test_weave.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/treeshape.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/text.py

bzrlib/store/weave.py

bzrlib/trace.py

bzrlib/transport/__init__.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/tree.py

bzrlib/upgrade.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml.py

bzrlib/xml4.py

bzrlib/xml5.py

contrib/zsh/_bzr

doc/random.txt

setup.py *

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http.py

from bzrlib.transport import Transport, register_transport

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError)

NonRelativePath, TransportError)

import os, errno

from cStringIO import StringIO

import urllib, urllib2

import urllib2

import urlparse

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.branch import Branch

from bzrlib.trace import mutter

def extract_auth(url, password_manager):
    """Strip the credentials from an HTTP/HTTPS url and register them.

    A ``user[:password]@`` prefix in the host part of ``url`` is removed,
    because urllib2 is confused by it.  When a password is present, the
    URL-unquoted username and password are passed to
    ``password_manager.add_password(None, host, username, password)``,
    where ``host`` is the host name without the port.  A username given
    without a password is dropped from the url and nothing is registered.

    :param url: A url starting with 'http://' or 'https://'.
    :param password_manager: Object providing
        ``add_password(realm, uri, user, passwd)``.  It is only used when
        the url carries a password.
    :return: The url with the credentials removed.
    """
    assert url.startswith('http://') or url.startswith('https://')
    scheme, host = url.split('//', 1)
    # Separate the path first so that an '@' or ':' appearing in the path
    # is never mistaken for part of the credentials or the port.
    if '/' in host:
        host, path = host.split('/', 1)
        path = '/' + path
    else:
        path = ''
    port = ''
    if '@' in host:
        # A host name cannot contain '@', so the LAST '@' is the one that
        # ends the credentials.  Splitting on the first one would leave
        # part of an unescaped login such as 'joe@corp' in the host.
        at = host.rfind('@')
        auth, host = host[:at], host[at + 1:]
        if ':' in auth:
            username, password = auth.split(':', 1)
        else:
            username, password = auth, None
        if ':' in host:
            host, port = host.split(':', 1)
            port = ':' + port
        # FIXME: if password isn't given, should we ask for it?
        if password is not None:
            username = urllib.unquote(username)
            password = urllib.unquote(password)
            password_manager.add_password(None, host, username, password)
    url = scheme + '//' + host + port + path
    return url

# velocitynet.com.au transparently proxies connections and thereby

# breaks keep-alive -- sucks!

def get_url(url):

import urllib2

mutter("get_url %s" % url)

manager = urllib2.HTTPPasswordMgrWithDefaultRealm()

url = extract_auth(url, manager)

auth_handler = urllib2.HTTPBasicAuthHandler(manager)

opener = urllib2.build_opener(auth_handler)

url_f = opener.open(url)

url_f = urllib2.urlopen(url)

return url_f

class HttpTransportError(TransportError):

pass

class HttpTransport(Transport):

"""This is the transport agent for http:// access.

106

"""Return the full url to the given relative path.

107

This can be supplied with a string or a list

108

"""

109

assert isinstance(relpath, basestring)

110

if isinstance(relpath, basestring):

111

relpath_parts = relpath.split('/')

112

else:

113

# TODO: Don't call this with an array - no magic interfaces

114

relpath_parts = relpath[:]

115

if len(relpath_parts) > 1:

116

if relpath_parts[0] == '':

117

raise ValueError("path %r within branch %r seems to be absolute"

118

% (relpath, self._path))

119

if relpath_parts[-1] == '':

120

raise ValueError("path %r within branch %r seems to be a directory"

121

% (relpath, self._path))

relpath = [relpath]

122

basepath = self._path.split('/')

123

if len(basepath) > 0 and basepath[-1] == '':

124

basepath = basepath[:-1]

125

for p in relpath_parts:

for p in relpath:

126

if p == '..':

127

if len(basepath) == 0:

if len(basepath) < 0:

128

# In most filesystems, a request for the parent

129

# of root, just returns root.

130

continue

131

basepath.pop()

132

elif p == '.' or p == '':

elif p == '.':

133

continue # No-op

134

else:

135

basepath.append(p)

136

# Possibly, we could use urlparse.urljoin() here, but

137

# I'm concerned about when it chooses to strip the last

138

100

# portion of the path, and when it doesn't.

140

102

return urlparse.urlunparse((self._proto,

141

103

self._host, path, '', '', ''))

142

104

105

def relpath(self, abspath):

106

if not abspath.startswith(self.base):

107

raise NonRelativePath('path %r is not under base URL %r'

108

% (abspath, self.base))

109

pl = len(self.base)

110

return abspath[pl:].lstrip('/')

111

143

112

def has(self, relpath):

144

113

"""Does the target location exist?

145

114

151

120

cleaner if we just do an http HEAD request, and parse

152

121

the return code.

153

122

"""

154

path = relpath

155

123

try:

156

path = self.abspath(relpath)

157

f = get_url(path)

124

f = get_url(self.abspath(relpath))

158

125

# Without the read and then close()

159

126

# we tend to have busy sockets.

160

127

f.read()

161

128

f.close()

162

129

return True

163

except urllib2.URLError, e:

164

mutter('url error code: %s for has url: %r', e.code, path)

165

if e.code == 404:

166

return False

167

raise

130

except BzrError:

131

return False

132

except urllib2.URLError:

133

return False

168

134

except IOError, e:

169

mutter('io error: %s %s for has url: %r',

170

e.errno, errno.errorcode.get(e.errno), path)

171

135

if e.errno == errno.ENOENT:

172

136

return False

173

raise TransportError(orig_error=e)

137

raise HttpTransportError(orig_error=e)

174

138

175

139

def get(self, relpath, decode=False):

176

140

"""Get the file at the given relative path.

177

141

178

142

:param relpath: The relative path to the file

179

143

"""

180

path = relpath

181

144

try:

182

path = self.abspath(relpath)

183

return get_url(path)

184

except urllib2.HTTPError, e:

185

mutter('url error code: %s for has url: %r', e.code, path)

186

if e.code == 404:

187

raise NoSuchFile(path, extra=e)

188

raise

189

except (BzrError, IOError), e:

190

if hasattr(e, 'errno'):

191

mutter('io error: %s %s for has url: %r',

192

e.errno, errno.errorcode.get(e.errno), path)

193

if e.errno == errno.ENOENT:

194

raise NoSuchFile(path, extra=e)

195

raise ConnectionError(msg = "Error retrieving %s: %s"

196

% (self.abspath(relpath), str(e)),

197

orig_error=e)

198

199

def put(self, relpath, f, mode=None):

145

return get_url(self.abspath(relpath))

146

except (BzrError, urllib2.URLError, IOError), e:

147

raise NoSuchFile(orig_error=e)

148

except Exception,e:

149

raise HttpTransportError(orig_error=e)

150

151

def get_partial(self, relpath, start, length=None):

152

"""Get just part of a file.

153

154

:param relpath: Path to the file, relative to base

155

:param start: The starting position to read from

156

:param length: The length to read. A length of None indicates

157

read to the end of the file.

158

:return: A file-like object containing at least the specified bytes.

159

Some implementations may return objects which can be read

160

past this length, but this is not guaranteed.

161

"""

162

# TODO: You can make specialized http requests for just

163

# a portion of the file. Figure out how to do that.

164

# For now, urllib2 returns files that cannot seek() so

165

# we just read bytes off the beginning, until we

166

# get to the point that we care about.

167

f = self.get(relpath)

168

# TODO: read in smaller chunks, in case things are

169

# buffered internally.

170

f.read(start)

171

return f

172

173

def put(self, relpath, f):

200

174

"""Copy the file-like or string object into the location.

201

175

202

176

:param relpath: Location to put the contents, relative to base.

204

178

"""

205

179

raise TransportNotPossible('http PUT not supported')

206

180

207

def mkdir(self, relpath, mode=None):

181

def mkdir(self, relpath):

208

182

"""Create a directory at the given path."""

209

183

raise TransportNotPossible('http does not support mkdir()')

210

184

218

192

"""Copy the item at rel_from to the location at rel_to"""

219

193

raise TransportNotPossible('http does not support copy()')

220

194

221

def copy_to(self, relpaths, other, mode=None, pb=None):

195

def copy_to(self, relpaths, other, pb=None):

222

196

"""Copy a set of entries from self into another Transport.

223

197

224

198

:param relpaths: A list/generator of entries to be copied.

232

206

if isinstance(other, HttpTransport):

233

207

raise TransportNotPossible('http cannot be the target of copy_to()')

234

208

else:

235

return super(HttpTransport, self).copy_to(relpaths, other, mode=mode, pb=pb)

209

return super(HttpTransport, self).copy_to(relpaths, other, pb=pb)

236

210

237

211

def move(self, rel_from, rel_to):

238

212

"""Move the item at rel_from to the location at rel_to"""

271

245

:return: A lock object, which should be passed to Transport.unlock()

272

246

"""

273

247

raise TransportNotPossible('http does not support lock_write()')

248

249

register_transport('http://', HttpTransport)

250

register_transport('https://', HttpTransport)

Older »