~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/transport/http.py

Committer: Robert Collins
Date: 2005-09-14 09:03:27 UTC
mto: (1185.41.1 bzr.sftp) (1393.2.1) (1092.3.4) (1417.1.4) (1464.1.1) (1534.1.1 integration) (1495.1.4) (1505.1.16 bzr-bound-branch) (1508.1.15) (1526.1.3 run_tests_twice_for_i18n) (1540.1.3 bzr.dev (Main development branch)) (1685.1.1 bzr-encoding) (1553.5.1 bzr.dev (Main development branch)) (1608.2.1 bzr.mbp.escape-stores)
mto: This revision was merged to the branch mainline in revision 1390.
Revision ID: robertc@robertcollins.net-20050914090327-46efe0697fa7c84d

and the tutorial patch came back, the very next day

files added:
bzrlib/mdiff.py

bzrlib/meta_store.py

bzrlib/remotebranch.py

bzrlib/revfile.py

bzrlib/upgrade.py

patches/annotate3.patch

patches/annotate4.patch

patches/cache-remote-revisions.diff

patches/find-touching-from-seq.diff

patches/meta-data-in-inventory.patch

patches/ndiff.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

testbzr

testsweet.py

files removed:
BRANCH.TODO

INSTALL

NEWS.developers

bzrlib/annotate.py

bzrlib/clone.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/export

bzrlib/export/__init__.py

bzrlib/export/dir_exporter.py

bzrlib/export/tar_exporter.py

bzrlib/export/zip_exporter.py

bzrlib/gpg.py

bzrlib/identitymap.py

bzrlib/lsprof.py

bzrlib/option.py

bzrlib/revisionspec.py

bzrlib/rio.py

bzrlib/store

bzrlib/store/text.py

bzrlib/store/weave.py

bzrlib/symbol_versioning.py

bzrlib/testament.py

bzrlib/tests/HTTPTestUtil.py

bzrlib/tests/blackbox

bzrlib/tests/blackbox/__init__.py

bzrlib/tests/blackbox/test_cat.py

bzrlib/tests/blackbox/test_export.py

bzrlib/tests/blackbox/test_missing.py

bzrlib/tests/blackbox/test_pull.py

bzrlib/tests/blackbox/test_revision_info.py

bzrlib/tests/blackbox/test_revno.py

bzrlib/tests/stub_sftp.py

bzrlib/tests/test_ancestry.py

bzrlib/tests/test_annotate.py

bzrlib/tests/test_api.py

bzrlib/tests/test_bad_files.py

bzrlib/tests/test_basis_inventory.py

bzrlib/tests/test_command.py

bzrlib/tests/test_commit.py

bzrlib/tests/test_commit_merge.py

bzrlib/tests/test_config.py

bzrlib/tests/test_conflicts.py

bzrlib/tests/test_gpg.py

bzrlib/tests/test_http.py

bzrlib/tests/test_identitymap.py

bzrlib/tests/test_missing.py

bzrlib/tests/test_msgeditor.py

bzrlib/tests/test_nonascii.py

bzrlib/tests/test_options.py

bzrlib/tests/test_osutils.py

bzrlib/tests/test_permissions.py

bzrlib/tests/test_remove.py

bzrlib/tests/test_revprops.py

bzrlib/tests/test_reweave.py

bzrlib/tests/test_rio.py

bzrlib/tests/test_sampler.py

bzrlib/tests/test_selftest.py

bzrlib/tests/test_setup.py

bzrlib/tests/test_sftp_transport.py

bzrlib/tests/test_source.py

bzrlib/tests/test_symbol_versioning.py

bzrlib/tests/test_testament.py

bzrlib/tests/test_trace.py

bzrlib/tests/test_transactions.py

bzrlib/tests/test_transport.py

bzrlib/tests/test_tsort.py

bzrlib/tests/test_ui.py

bzrlib/tests/test_uncommit.py

bzrlib/tests/test_upgrade.py

bzrlib/tests/test_workingtree.py

bzrlib/tests/treeshape.py

bzrlib/transactions.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/ftp.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/ui

bzrlib/ui/text.py

bzrlib/uncommit.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/win32console.py

bzrlib/xml4.py

bzrlib/xml5.py

tools/biobench.py

tools/capture_tree.py

tools/riodemo.py

tools/trace-revisions

files renamed:
bzr_man.py => bzr-man.py

contrib/newinventory.py => bzrlib/newinventory.py

bzrlib/tests/ => bzrlib/selftest/

bzrlib/tests/blackbox/test_too_much.py => bzrlib/selftest/blackbox.py

bzrlib/tests/test_plugins.py => bzrlib/selftest/plugins.py

bzrlib/tests/test_branch.py => bzrlib/selftest/testbranch.py

bzrlib/tests/test_diff.py => bzrlib/selftest/testdiff.py

bzrlib/tests/test_fetch.py => bzrlib/selftest/testfetch.py

bzrlib/tests/test_graph.py => bzrlib/selftest/testgraph.py

bzrlib/tests/test_hashcache.py => bzrlib/selftest/testhashcache.py

bzrlib/tests/test_inv.py => bzrlib/selftest/testinv.py

bzrlib/tests/test_log.py => bzrlib/selftest/testlog.py

bzrlib/tests/test_merge.py => bzrlib/selftest/testmerge.py

bzrlib/tests/test_merge3.py => bzrlib/selftest/testmerge3.py

bzrlib/tests/test_revision.py => bzrlib/selftest/testrevision.py

bzrlib/tests/test_revisionnamespaces.py => bzrlib/selftest/testrevisionnamespaces.py

bzrlib/tests/test_status.py => bzrlib/selftest/teststatus.py

bzrlib/tests/test_store.py => bzrlib/selftest/teststore.py

bzrlib/tests/blackbox/test_versioning.py => bzrlib/selftest/versioning.py

bzrlib/tests/test_whitebox.py => bzrlib/selftest/whitebox.py

bzrlib/store/__init__.py => bzrlib/store.py

bzrlib/ui/__init__.py => bzrlib/ui.py

bzrlib/upgrade.py => tools/history2weaves.py

bzrlib/tests/test_weave.py => tools/testweave.py

files modified:
.bzrignore

.rsyncexclude

HACKING

Makefile

NEWS

README

TODO

build-api

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/intset.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/merge.py *

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revision.py

bzrlib/selftest/__init__.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_xml.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/textinv.py

bzrlib/trace.py

bzrlib/tree.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml.py

contrib/zsh/_bzr

doc/random.txt

setup.py *

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Implementation of Transport over http.

"""

from bzrlib.transport import Transport, register_transport

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

TransportError, ConnectionError)

import os, errno

from cStringIO import StringIO

import urllib, urllib2

import urlparse

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.branch import Branch

from bzrlib.trace import mutter

def extract_auth(url, password_manager):
    """Strip embedded credentials out of an HTTP/HTTPS url.

    If the url carries both a user name and a password
    ('scheme://user:password@host...'), both are url-unquoted and handed
    to password_manager.add_password() with a realm of None and the bare
    host name (without any port).  A user name given without a password
    is removed from the url but not registered anywhere.

    :param url: A url starting with 'http://' or 'https://'.
    :param password_manager: Object whose add_password(realm, uri, user,
        passwd) method receives the extracted credentials.
    :return: The url minus the auth parameters (which confuse urllib2).
    """
    assert url.startswith('http://') or url.startswith('https://')
    scheme, netloc = url.split('//', 1)

    # Separate the network location from the (optional) path.
    path = ''
    if '/' in netloc:
        netloc, remainder = netloc.split('/', 1)
        path = '/' + remainder

    if '@' not in netloc:
        # No credentials present; any ':port' suffix stays on the host.
        return scheme + '//' + netloc + path

    auth, host = netloc.split('@', 1)
    username, password = auth, None
    if ':' in auth:
        username, password = auth.split(':', 1)

    port = ''
    if ':' in host:
        host, port_number = host.split(':', 1)
        port = ':' + port_number

    # FIXME: if password isn't given, should we ask for it?
    if password is not None:
        username = urllib.unquote(username)
        password = urllib.unquote(password)
        password_manager.add_password(None, host, username, password)

    return scheme + '//' + host + port + path

def get_url(url):
    """Open url through urllib2 and return the file-like response.

    Credentials embedded in the url are moved into a password manager by
    extract_auth() and offered via an HTTP basic-auth handler, so the url
    that is actually opened no longer contains the auth portion.

    :param url: The http:// or https:// url to fetch.
    :return: The object returned by the urllib2 opener's open().
    """
    import urllib2
    mutter("get_url %s" % url)
    password_manager = urllib2.HTTPPasswordMgrWithDefaultRealm()
    bare_url = extract_auth(url, password_manager)
    opener = urllib2.build_opener(
        urllib2.HTTPBasicAuthHandler(password_manager))
    return opener.open(bare_url)

class HttpTransport(Transport):

"""This is the transport agent for http:// access.

TODO: Implement pipelined versions of all of the *_multi() functions.

"""

def __init__(self, base):

"""Set the base path where files will be stored."""

assert base.startswith('http://') or base.startswith('https://')

super(HttpTransport, self).__init__(base)

# In the future we might actually connect to the remote host

# rather than using get_url

# self._connection = None

(self._proto, self._host,

self._path, self._parameters,

self._query, self._fragment) = urlparse.urlparse(self.base)

def should_cache(self):

"""Return True if the data pulled across should be cached locally.

"""

return True

def clone(self, offset=None):

"""Return a new HttpTransport with root at self.base + offset

For now HttpTransport does not actually connect, so just return

a new HttpTransport object.

"""

100

if offset is None:

101

return HttpTransport(self.base)

102

else:

103

return HttpTransport(self.abspath(offset))

104

105

def abspath(self, relpath):

106

"""Return the full url to the given relative path.

107

This can be supplied with a string or a list

108

"""

109

assert isinstance(relpath, basestring)

110

if isinstance(relpath, basestring):

111

relpath_parts = relpath.split('/')

112

else:

113

# TODO: Don't call this with an array - no magic interfaces

114

relpath_parts = relpath[:]

115

if len(relpath_parts) > 1:

116

if relpath_parts[0] == '':

117

raise ValueError("path %r within branch %r seems to be absolute"

118

% (relpath, self._path))

119

if relpath_parts[-1] == '':

120

raise ValueError("path %r within branch %r seems to be a directory"

121

% (relpath, self._path))

122

basepath = self._path.split('/')

123

if len(basepath) > 0 and basepath[-1] == '':

124

basepath = basepath[:-1]

125

for p in relpath_parts:

126

if p == '..':

127

if len(basepath) == 0:

128

# In most filesystems, a request for the parent

129

# of root, just returns root.

130

continue

131

basepath.pop()

132

elif p == '.' or p == '':

133

continue # No-op

134

else:

135

basepath.append(p)

136

# Possibly, we could use urlparse.urljoin() here, but

137

# I'm concerned about when it chooses to strip the last

138

# portion of the path, and when it doesn't.

139

path = '/'.join(basepath)

140

return urlparse.urlunparse((self._proto,

141

self._host, path, '', '', ''))

142

143

def has(self, relpath):

144

"""Does the target location exist?

145

146

TODO: HttpTransport.has() should use a HEAD request,

147

not a full GET request.

148

149

TODO: This should be changed so that we don't use

150

urllib2 and get an exception, the code path would be

151

cleaner if we just do an http HEAD request, and parse

152

the return code.

153

"""

154

path = relpath

155

try:

156

path = self.abspath(relpath)

157

f = get_url(path)

158

# Without the read and then close()

159

# we tend to have busy sockets.

160

f.read()

161

f.close()

162

return True

163

except urllib2.URLError, e:

164

mutter('url error code: %s for has url: %r', e.code, path)

165

if e.code == 404:

166

return False

167

raise

168

except IOError, e:

169

mutter('io error: %s %s for has url: %r',

170

e.errno, errno.errorcode.get(e.errno), path)

171

if e.errno == errno.ENOENT:

172

return False

173

raise TransportError(orig_error=e)

174

175

def get(self, relpath, decode=False):

176

"""Get the file at the given relative path.

177

178

:param relpath: The relative path to the file

179

"""

180

path = relpath

181

try:

182

path = self.abspath(relpath)

183

return get_url(path)

184

except urllib2.HTTPError, e:

185

mutter('url error code: %s for has url: %r', e.code, path)

186

if e.code == 404:

187

raise NoSuchFile(path, extra=e)

188

raise

189

except (BzrError, IOError), e:

190

if hasattr(e, 'errno'):

191

mutter('io error: %s %s for has url: %r',

192

e.errno, errno.errorcode.get(e.errno), path)

193

if e.errno == errno.ENOENT:

194

raise NoSuchFile(path, extra=e)

195

raise ConnectionError(msg = "Error retrieving %s: %s"

196

% (self.abspath(relpath), str(e)),

197

orig_error=e)

198

199

def put(self, relpath, f, mode=None):

200

"""Copy the file-like or string object into the location.

201

202

:param relpath: Location to put the contents, relative to base.

203

:param f: File-like or string object.

204

"""

205

raise TransportNotPossible('http PUT not supported')

206

207

def mkdir(self, relpath, mode=None):

208

"""Create a directory at the given path."""

209

raise TransportNotPossible('http does not support mkdir()')

210

211

def append(self, relpath, f):

212

"""Append the text in the file-like object into the final

213

location.

214

"""

215

raise TransportNotPossible('http does not support append()')

216

217

def copy(self, rel_from, rel_to):

218

"""Copy the item at rel_from to the location at rel_to"""

219

raise TransportNotPossible('http does not support copy()')

220

221

def copy_to(self, relpaths, other, mode=None, pb=None):

222

"""Copy a set of entries from self into another Transport.

223

224

:param relpaths: A list/generator of entries to be copied.

225

226

TODO: if other is LocalTransport, is it possible to

227

do better than put(get())?

228

"""

229

# At this point HttpTransport might be able to check and see if

230

# the remote location is the same, and rather than download, and

231

# then upload, it could just issue a remote copy_this command.

232

if isinstance(other, HttpTransport):

233

raise TransportNotPossible('http cannot be the target of copy_to()')

234

else:

235

return super(HttpTransport, self).copy_to(relpaths, other, mode=mode, pb=pb)

236

237

def move(self, rel_from, rel_to):

238

"""Move the item at rel_from to the location at rel_to"""

239

raise TransportNotPossible('http does not support move()')

240

241

def delete(self, relpath):

242

"""Delete the item at relpath"""

243

raise TransportNotPossible('http does not support delete()')

244

245

def listable(self):

246

"""See Transport.listable."""

247

return False

248

249

def stat(self, relpath):

250

"""Return the stat information for a file.

251

"""

252

raise TransportNotPossible('http does not support stat()')

253

254

def lock_read(self, relpath):

255

"""Lock the given file for shared (read) access.

256

:return: A lock object, which should be passed to Transport.unlock()

257

"""

258

# The old RemoteBranch ignore lock for reading, so we will

259

# continue that tradition and return a bogus lock object.

260

class BogusLock(object):

261

def __init__(self, path):

262

self.path = path

263

def unlock(self):

264

pass

265

return BogusLock(relpath)

266

267

def lock_write(self, relpath):

268

"""Lock the given file for exclusive (write) access.

269

WARNING: many transports do not support this, so trying avoid using it

270

271

:return: A lock object, which should be passed to Transport.unlock()

272

"""

273

raise TransportNotPossible('http does not support lock_write()')

Older »