~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/transport/http.py

Committer: John Arbash Meinel
Date: 2005-11-08 18:36:26 UTC
mto: This revision was merged to the branch mainline in revision 1727.
Revision ID: john@arbash-meinel.com-20051108183626-71f8414338043265

Updating unified_diff to take a factory, using the new diff algorithm in the code.

files added:
INSTALL

NEWS.developers

bzrlib/annotate.py

bzrlib/cdvdifflib.py

bzrlib/clone.py

bzrlib/config.py

bzrlib/conflicts.py

bzrlib/gpg.py

bzrlib/identitymap.py

bzrlib/nofrillsprecisemerge.py

bzrlib/option.py

bzrlib/revisionspec.py

bzrlib/selftest/stub_sftp.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_bad_files.py

bzrlib/selftest/test_command.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_commit_merge.py

bzrlib/selftest/test_conflicts.py

bzrlib/selftest/test_revision_info.py

bzrlib/selftest/test_upgrade.py

bzrlib/selftest/testannotate.py

bzrlib/selftest/testapi.py

bzrlib/selftest/testconfig.py

bzrlib/selftest/testgpg.py

bzrlib/selftest/testhttp.py

bzrlib/selftest/testidentitymap.py

bzrlib/selftest/testnonascii.py

bzrlib/selftest/testoptions.py

bzrlib/selftest/testrevprops.py

bzrlib/selftest/testreweave.py

bzrlib/selftest/testsampler.py

bzrlib/selftest/testsftp.py

bzrlib/selftest/testtestament.py

bzrlib/selftest/testtransactions.py

bzrlib/selftest/testtsort.py

bzrlib/selftest/testworkingtree.py

bzrlib/selftest/treeshape.py

bzrlib/store/text.py

bzrlib/store/weave.py

bzrlib/testament.py

bzrlib/transactions.py

bzrlib/transport/memory.py

bzrlib/transport/sftp.py

bzrlib/tsort.py

bzrlib/util/configobj

bzrlib/util/configobj/__init__.py

bzrlib/util/configobj/configobj.py

bzrlib/util/configobj/docs

bzrlib/util/configobj/docs/BSD-LICENSE.txt

bzrlib/util/configobj/docs/configobj.txt

bzrlib/util/configobj/docs/validate.txt

bzrlib/util/configobj/validate.py

bzrlib/win32console.py

bzrlib/xml4.py

bzrlib/xml5.py

patches/cache_weave_inclusions.diff

tools/capture_tree.py

files removed:
bzrlib/meta_store.py

bzrlib/remotebranch.py

bzrlib/selftest/testremotebranch.py

bzrlib/upgrade.py

patches/annotate3.patch

patches/annotate4.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

testsweet.py

files renamed:
bzr-man.py => bzr_man.py

tools/testweave.py => bzrlib/selftest/test_weave.py

bzrlib/selftest/plugins.py => bzrlib/selftest/testplugins.py

tools/history2weaves.py => bzrlib/upgrade.py

bzrlib/newinventory.py => contrib/newinventory.py

files modified:
.bzrignore

.rsyncexclude

HACKING

Makefile

NEWS

README

TODO

bzr *

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/mdiff.py

bzrlib/merge.py

bzrlib/merge3.py

bzrlib/merge_core.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/plugin.py

bzrlib/progress.py

bzrlib/revfile.py

bzrlib/revision.py

bzrlib/selftest/HTTPTestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testdiff.py

bzrlib/selftest/testfetch.py

bzrlib/selftest/testgraph.py

bzrlib/selftest/testhashcache.py

bzrlib/selftest/testinv.py

bzrlib/selftest/testlog.py

bzrlib/selftest/testmerge.py

bzrlib/selftest/testmerge3.py

bzrlib/selftest/testrevision.py

bzrlib/selftest/testrevisionnamespaces.py

bzrlib/selftest/teststatus.py

bzrlib/selftest/teststore.py

bzrlib/selftest/testtransport.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/shellcomplete.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/compressed_text.py

bzrlib/textinv.py

bzrlib/trace.py

bzrlib/transport/__init__.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/tree.py

bzrlib/weave.py *

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml.py

contrib/zsh/_bzr

setup.py *

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http.py

#!/usr/bin/env python

"""\

An implementation of the Transport object for http access.

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Implementation of Transport over http.

"""

from bzrlib.transport import Transport, register_transport, \

TransportNotPossible, NoSuchFile, NonRelativePath, \

TransportError

from bzrlib.transport import Transport, register_transport

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

NonRelativePath, TransportError)

import os, errno

from cStringIO import StringIO

import urllib2

import urlparse

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.branch import Branch, BZR_BRANCH_FORMAT

from bzrlib.branch import Branch

from bzrlib.trace import mutter

# velocitynet.com.au transparently proxies connections and thereby

# breaks keep-alive -- sucks!

ENABLE_URLGRABBER = False

if ENABLE_URLGRABBER:

import urlgrabber

import urlgrabber.keepalive

import urlgrabber.grabber

urlgrabber.keepalive.DEBUG = 0

def get_url(path, compressed=False):

try:

url = path

if compressed:

url += '.gz'

mutter("grab url %s" % url)

url_f = urlgrabber.urlopen(url, keepalive=1, close_connection=0)

if not compressed:

return url_f

else:

return gzip.GzipFile(fileobj=StringIO(url_f.read()))

except urllib2.URLError, e:

raise BzrError("remote fetch failed: %r: %s" % (url, e))

except urlgrabber.grabber.URLGrabError, e:

raise BzrError("remote fetch failed: %r: %s" % (url, e))

else:

def get_url(url, compressed=False):

import urllib2

if compressed:

url += '.gz'

mutter("get_url %s" % url)

url_f = urllib2.urlopen(url)

if compressed:

return gzip.GzipFile(fileobj=StringIO(url_f.read()))

else:

return url_f

def _find_remote_root(url):

"""Return the prefix URL that corresponds to the branch root."""

orig_url = url

while True:

try:

ff = get_url(url + '/.bzr/branch-format')

fmt = ff.read()

ff.close()

fmt = fmt.rstrip('\r\n')

if fmt != BZR_BRANCH_FORMAT.rstrip('\r\n'):

raise BzrError("sorry, branch format %r not supported at url %s"

% (fmt, url))

return url

except urllib2.URLError:

pass

try:

idx = url.rindex('/')

except ValueError:

raise BzrError('no branch root found for URL %s' % orig_url)

url = url[:idx]

def get_url(url):

import urllib2

mutter("get_url %s" % url)

url_f = urllib2.urlopen(url)

return url_f

class HttpTransportError(TransportError):

pass

# In the future we might actually connect to the remote host

# rather than using get_url

# self._connection = None

(self._proto, self._host,

self._path, self._parameters,

self._query, self._fragment) = urlparse.urlparse(self.base)

def should_cache(self):

100

"""Return True if the data pulled across should be cached locally.

115

"""Return the full url to the given relative path.

116

This can be supplied with a string or a list

117

"""

assert isinstance(relpath, basestring)

118

if isinstance(relpath, basestring):

119

relpath = [relpath]

120

baseurl = self.base.rstrip('/')

121

return '/'.join([baseurl] + relpath)

122

123

def relpath(self, abspath):

124

if not abspath.startswith(self.base):

125

raise NonRelativePath('path %r is not under base URL %r'

126

% (abspath, self.base))

127

pl = len(self.base)

128

return abspath[pl:].lstrip('/')

relpath_parts = relpath.split('/')

else:

# TODO: Don't call this with an array - no magic interfaces

relpath_parts = relpath[:]

if len(relpath_parts) > 1:

if relpath_parts[0] == '':

raise ValueError("path %r within branch %r seems to be absolute"

% (relpath, self._path))

if relpath_parts[-1] == '':

raise ValueError("path %r within branch %r seems to be a directory"

% (relpath, self._path))

basepath = self._path.split('/')

if len(basepath) > 0 and basepath[-1] == '':

basepath = basepath[:-1]

for p in relpath_parts:

if p == '..':

if len(basepath) == 0:

# In most filesystems, a request for the parent

# of root, just returns root.

continue

basepath.pop()

100

elif p == '.' or p == '':

101

continue # No-op

102

else:

103

basepath.append(p)

104

# Possibly, we could use urlparse.urljoin() here, but

105

# I'm concerned about when it chooses to strip the last

106

# portion of the path, and when it doesn't.

107

path = '/'.join(basepath)

108

return urlparse.urlunparse((self._proto,

109

self._host, path, '', '', ''))

129

110

130

111

def has(self, relpath):

131

112

"""Does the target location exist?

132

113

133

114

TODO: HttpTransport.has() should use a HEAD request,

134

115

not a full GET request.

116

117

TODO: This should be changed so that we don't use

118

urllib2 and get an exception, the code path would be

119

cleaner if we just do an http HEAD request, and parse

120

the return code.

135

121

"""

136

122

try:

137

123

f = get_url(self.abspath(relpath))

124

# Without the read and then close()

125

# we tend to have busy sockets.

126

f.read()

127

f.close()

138

128

return True

139

except BzrError:

140

return False

141

except urllib2.URLError:

142

return False

129

except urllib2.URLError, e:

130

if e.code == 404:

131

return False

132

raise

143

133

except IOError, e:

144

134

if e.errno == errno.ENOENT:

145

135

return False

152

142

"""

153

143

try:

154

144

return get_url(self.abspath(relpath))

155

except BzrError, e:

156

raise NoSuchFile(orig_error=e)

157

145

except urllib2.URLError, e:

158

raise NoSuchFile(orig_error=e)

159

except IOError, e:

160

raise NoSuchFile(orig_error=e)

161

except Exception,e:

162

raise HttpTransportError(orig_error=e)

146

if e.code == 404:

147

raise NoSuchFile(msg = "Error retrieving %s: %s"

148

% (self.abspath(relpath), str(e)),

149

orig_error=e)

150

raise

151

except (BzrError, IOError), e:

152

raise NoSuchFile(msg = "Error retrieving %s: %s"

153

% (self.abspath(relpath), str(e)),

154

orig_error=e)

163

155

164

156

def put(self, relpath, f):

165

157

"""Copy the file-like or string object into the location.

207

199

"""Delete the item at relpath"""

208

200

raise TransportNotPossible('http does not support delete()')

209

201

210

def async_get(self, relpath):

211

"""Make a request for a file at the given location, but

212

don't worry about actually getting it yet.

213

214

:rtype: AsyncFile

215

"""

216

raise NotImplementedError

217

218

def list_dir(self, relpath):

219

"""Return a list of all files at the given location.

220

WARNING: many transports do not support this, so try to avoid using

221

it if at all possible.

222

"""

223

raise TransportNotPossible('http does not support list_dir()')

202

def listable(self):

203

"""See Transport.listable."""

204

return False

224

205

225

206

def stat(self, relpath):

226

207

"""Return the stat information for a file.

247

228

:return: A lock object, which should be passed to Transport.unlock()

248

229

"""

249

230

raise TransportNotPossible('http does not support lock_write()')

250

251

register_transport('http://', HttpTransport)

252

register_transport('https://', HttpTransport)

253

Older »