~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/transport/http.py

Committer: John Arbash Meinel
Date: 2005-09-15 21:35:53 UTC
mfrom: (907.1.57)
mto: (1393.2.1)
mto: This revision was merged to the branch mainline in revision 1396.
Revision ID: john@arbash-meinel.com-20050915213552-a6c83a5ef1e20897

(broken) Transport work is merged in. Tests do not pass yet.

files added:
bzrlib/meta_store.py

bzrlib/remotebranch.py

bzrlib/selftest/testremotebranch.py

bzrlib/upgrade.py

patches/annotate3.patch

patches/annotate4.patch

patches/pending-merge.patch

patches/plugins-no-plugins.patch

patches/progress.diff

patches/symlink-support.patch

testsweet.py

files removed:
NEWS.developers

bzrlib/annotate.py

bzrlib/clone.py

bzrlib/revisionspec.py

bzrlib/selftest/test_ancestry.py

bzrlib/selftest/test_bad_files.py

bzrlib/selftest/test_commit.py

bzrlib/selftest/test_commit_merge.py

bzrlib/selftest/test_revision_info.py

bzrlib/selftest/test_upgrade.py

bzrlib/selftest/testworkingtree.py

bzrlib/selftest/treeshape.py

bzrlib/store/text.py

bzrlib/store/weave.py

bzrlib/xml4.py

bzrlib/xml5.py

patches/cache_weave_inclusions.diff

tools/capture_tree.py

files renamed:
contrib/newinventory.py => bzrlib/newinventory.py

bzrlib/upgrade.py => tools/history2weaves.py

bzrlib/selftest/test_weave.py => tools/testweave.py

files modified:
.bzrignore

HACKING

NEWS

TODO

bzr-man.py

bzrlib/__init__.py

bzrlib/add.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/check.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/delta.py

bzrlib/diff.py

bzrlib/errors.py

bzrlib/externalcommand.py

bzrlib/fetch.py

bzrlib/graph.py

bzrlib/hashcache.py

bzrlib/help.py

bzrlib/info.py

bzrlib/inventory.py

bzrlib/lock.py

bzrlib/log.py

bzrlib/mdiff.py

bzrlib/merge.py

bzrlib/merge_core.py

bzrlib/missing.py

bzrlib/msgeditor.py

bzrlib/osutils.py

bzrlib/patch.py

bzrlib/progress.py

bzrlib/revfile.py

bzrlib/revision.py

bzrlib/selftest/HTTPTestUtil.py

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_smart_add.py

bzrlib/selftest/test_xml.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testfetch.py

bzrlib/selftest/testgraph.py

bzrlib/selftest/testhashcache.py

bzrlib/selftest/testinv.py

bzrlib/selftest/testlog.py

bzrlib/selftest/testmerge.py

bzrlib/selftest/testrevision.py

bzrlib/selftest/testrevisionnamespaces.py

bzrlib/selftest/teststatus.py

bzrlib/selftest/teststore.py

bzrlib/selftest/testtransport.py

bzrlib/selftest/versioning.py

bzrlib/selftest/whitebox.py

bzrlib/status.py

bzrlib/store/__init__.py

bzrlib/store/compressed_text.py

bzrlib/textinv.py

bzrlib/trace.py

bzrlib/transport/__init__.py

bzrlib/transport/http.py

bzrlib/transport/local.py

bzrlib/tree.py

bzrlib/weave.py

bzrlib/weavefile.py

bzrlib/workingtree.py

bzrlib/xml.py

setup.py

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Implementation of Transport over http.

#!/usr/bin/env python

"""\

An implementation of the Transport object for http access.

"""

from bzrlib.transport import Transport, register_transport

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

NonRelativePath, TransportError)

from bzrlib.transport import Transport, register_transport, \

TransportNotPossible, NoSuchFile, NonRelativePath, \

TransportError

import os, errno

from cStringIO import StringIO

import urllib2

import urlparse

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.branch import Branch

from bzrlib.branch import Branch, BZR_BRANCH_FORMAT

from bzrlib.trace import mutter

# velocitynet.com.au transparently proxies connections and thereby

# breaks keep-alive -- sucks!

def get_url(url):
    """Open ``url`` through urllib2 and hand back the response object.

    The URL is logged with mutter() before the request is issued.

    :param url: The URL to open.
    :return: Whatever urllib2.urlopen() returns for ``url``.
    """
    import urllib2
    mutter("get_url %s" % url)
    return urllib2.urlopen(url)

ENABLE_URLGRABBER = False

if ENABLE_URLGRABBER:

import urlgrabber

import urlgrabber.keepalive

import urlgrabber.grabber

urlgrabber.keepalive.DEBUG = 0

def get_url(path, compressed=False):

try:

url = path

if compressed:

url += '.gz'

mutter("grab url %s" % url)

url_f = urlgrabber.urlopen(url, keepalive=1, close_connection=0)

if not compressed:

return url_f

else:

return gzip.GzipFile(fileobj=StringIO(url_f.read()))

except urllib2.URLError, e:

raise BzrError("remote fetch failed: %r: %s" % (url, e))

except urlgrabber.grabber.URLGrabError, e:

raise BzrError("remote fetch failed: %r: %s" % (url, e))

else:

def get_url(url, compressed=False):

import urllib2

if compressed:

url += '.gz'

mutter("get_url %s" % url)

url_f = urllib2.urlopen(url)

if compressed:

return gzip.GzipFile(fileobj=StringIO(url_f.read()))

else:

return url_f

def _find_remote_root(url):
    """Locate the branch root at or above ``url``.

    Starting from ``url`` itself, '/.bzr/branch-format' is requested;
    each time the request fails with urllib2.URLError the last
    '/'-separated component is dropped and the fetch is retried.

    :param url: URL somewhere inside (or at the top of) a branch.
    :return: The first prefix of ``url`` whose branch-format file could
        be fetched and matches BZR_BRANCH_FORMAT.
    :raises BzrError: if a branch-format file is found but holds an
        unsupported format, or if no prefix of ``url`` yields one.
    """
    requested = url
    candidate = url
    while True:
        try:
            handle = get_url(candidate + '/.bzr/branch-format')
            found = handle.read()
            handle.close()
        except urllib2.URLError:
            # Nothing here; fall through and try the parent location.
            pass
        else:
            # Line endings are ignored on both sides of the comparison.
            found = found.rstrip('\r\n')
            if found != BZR_BRANCH_FORMAT.rstrip('\r\n'):
                raise BzrError("sorry, branch format %r not supported at url %s"
                               % (found, candidate))
            return candidate

        cut = candidate.rfind('/')
        if cut < 0:
            # No separator left to strip: the search is exhausted.
            raise BzrError('no branch root found for URL %s' % requested)
        candidate = candidate[:cut]

class HttpTransportError(TransportError):
    """TransportError subclass raised by the http transport code."""

# In the future we might actually connect to the remote host

# rather than using get_url

# self._connection = None

(self._proto, self._host,

self._path, self._parameters,

self._query, self._fragment) = urlparse.urlparse(self.base)

def should_cache(self):

100

"""Return True if the data pulled across should be cached locally.

117

"""

118

if isinstance(relpath, basestring):

119

relpath = [relpath]

basepath = self._path.split('/')

if len(basepath) > 0 and basepath[-1] == '':

basepath = basepath[:-1]

for p in relpath:

if p == '..':

if len(basepath) < 0:

# In most filesystems, a request for the parent

# of root, just returns root.

continue

basepath.pop()

elif p == '.':

continue # No-op

else:

basepath.append(p)

# Possibly, we could use urlparse.urljoin() here, but

# I'm concerned about when it chooses to strip the last

100

# portion of the path, and when it doesn't.

101

path = '/'.join(basepath)

102

return urlparse.urlunparse((self._proto,

103

self._host, path, '', '', ''))

120

baseurl = self.base.rstrip('/')

121

return '/'.join([baseurl] + relpath)

104

122

105

123

def relpath(self, abspath):

106

124

if not abspath.startswith(self.base):

114

132

115

133

TODO: HttpTransport.has() should use a HEAD request,

116

134

not a full GET request.

117

118

TODO: This should be changed so that we don't use

119

urllib2 and get an exception, the code path would be

120

cleaner if we just do an http HEAD request, and parse

121

the return code.

122

135

"""

123

136

try:

124

137

f = get_url(self.abspath(relpath))

125

# Without the read and then close()

126

# we tend to have busy sockets.

127

f.read()

128

f.close()

129

138

return True

130

139

except BzrError:

131

140

return False

143

152

"""

144

153

try:

145

154

return get_url(self.abspath(relpath))

146

except (BzrError, urllib2.URLError, IOError), e:

155

except BzrError, e:

156

raise NoSuchFile(orig_error=e)

157

except urllib2.URLError, e:

158

raise NoSuchFile(orig_error=e)

159

except IOError, e:

147

160

raise NoSuchFile(orig_error=e)

148

161

except Exception,e:

149

162

raise HttpTransportError(orig_error=e)

150

163

151

def get_partial(self, relpath, start, length=None):
    """Get just part of a file.

    :param relpath: Path to the file, relative to base
    :param start: The starting position to read from.  Values of zero
        or less leave the stream positioned at its beginning.
    :param length: The length to read. A length of None indicates
        read to the end of the file.  It is not enforced here: the
        returned object can be read past this length.
    :return: A file-like object containing at least the specified bytes.
        Some implementations may return objects which can be read
        past this length, but this is not guaranteed.
    """
    # TODO: You can make specialized http requests for just
    #       a portion of the file. Figure out how to do that.
    #       For now, the object returned by get() is not assumed to
    #       support seek(), so bytes are read off the beginning until
    #       the requested offset is reached.
    f = self.get(relpath)
    # Skip in bounded chunks so a large offset never requires holding
    # the whole discarded prefix in memory at once.
    chunk_size = 64 * 1024
    remaining = start
    while remaining > 0:
        skipped = f.read(min(remaining, chunk_size))
        if not skipped:
            # The file is shorter than ``start``; nothing left to skip.
            break
        remaining -= len(skipped)
    return f

172

173

164

def put(self, relpath, f):

174

165

"""Copy the file-like or string object into the location.

175

166

216

207

"""Delete the item at relpath"""

217

208

raise TransportNotPossible('http does not support delete()')

218

209

219

def listable(self):
    """Always False for this transport; see Transport.listable."""
    return False

210

def async_get(self, relpath):
    """Make a request for a file at the given location, but
    don't worry about actually getting it yet.

    Not implemented here: calling it always raises NotImplementedError.

    :rtype: AsyncFile
    """
    raise NotImplementedError()

217

218

def list_dir(self, relpath):
    """Return a list of all files at the given location.

    WARNING: many transports do not support this, so try to avoid
    using it if at all possible.  This one does not: the call always
    raises TransportNotPossible.
    """
    message = 'http does not support list_dir()'
    raise TransportNotPossible(message)

222

224

223

225

def stat(self, relpath):

224

226

"""Return the stat information for a file.

248

250

249

251

# Associate the 'http://' URL prefix with HttpTransport.
register_transport('http://', HttpTransport)

250

252

# Associate the 'https://' URL prefix with HttpTransport.
register_transport('https://', HttpTransport)

253

Older »