~bzr-pqm/bzr/bzr.dev

« back to all changes in this revision

Viewing changes to bzrlib/transport/http.py

Committer: Robert Collins
Date: 2005-10-02 21:51:29 UTC
mfrom: (1396)
mto: This revision was merged to the branch mainline in revision 1397.
Revision ID: robertc@robertcollins.net-20051002215128-5686c7d24bf9bdb9

merge from martins newformat branch - brings in transport abstraction

files added:
bzrlib/clone.py

bzrlib/selftest/testtransport.py

bzrlib/store

bzrlib/store/compressed_text.py

bzrlib/store/text.py

bzrlib/transport

bzrlib/transport/__init__.py

bzrlib/transport/http.py

bzrlib/transport/local.py

files removed:
bzrlib/remotebranch.py

bzrlib/selftest/testremotebranch.py

testsweet.py

files renamed:
bzrlib/store.py => bzrlib/store/__init__.py

bzrlib/weavestore.py => bzrlib/store/weave.py

files modified:
NEWS

NEWS.developers

bzrlib/__init__.py

bzrlib/atomicfile.py

bzrlib/branch.py

bzrlib/builtins.py

bzrlib/changeset.py

bzrlib/commands.py

bzrlib/commit.py

bzrlib/errors.py

bzrlib/fetch.py

bzrlib/merge.py

bzrlib/merge_core.py

bzrlib/missing.py

bzrlib/selftest/__init__.py

bzrlib/selftest/blackbox.py

bzrlib/selftest/test_merge_core.py

bzrlib/selftest/test_parent.py

bzrlib/selftest/test_weave.py

bzrlib/selftest/testbranch.py

bzrlib/selftest/testrevisionnamespaces.py

bzrlib/selftest/teststore.py

bzrlib/upgrade.py

bzrlib/weave.py

Show diffs side-by-side

added added

removed removed

bzrlib/transport/http.py

# This program is free software; you can redistribute it and/or modify

# it under the terms of the GNU General Public License as published by

# the Free Software Foundation; either version 2 of the License, or

# (at your option) any later version.

# This program is distributed in the hope that it will be useful,

# but WITHOUT ANY WARRANTY; without even the implied warranty of

# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the

# GNU General Public License for more details.

# You should have received a copy of the GNU General Public License

# along with this program; if not, write to the Free Software

# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA

"""Implementation of Transport over http.

"""

from bzrlib.transport import Transport, register_transport

from bzrlib.errors import (TransportNotPossible, NoSuchFile,

NonRelativePath, TransportError)

import os, errno

from cStringIO import StringIO

import urllib2

import urlparse

from bzrlib.errors import BzrError, BzrCheckError

from bzrlib.branch import Branch

from bzrlib.trace import mutter

# velocitynet.com.au transparently proxies connections and thereby

# breaks keep-alive -- sucks!

def get_url(url):
    """Open url with urllib2 and hand back the response object.

    The request is noted in the trace log via mutter() before it is made.

    :param url: The URL to open.
    :return: Whatever urllib2.urlopen() returns for url.
    """
    mutter("get_url %s" % url)
    return urllib2.urlopen(url)

class HttpTransportError(TransportError):
    """Transport-level failure raised by the HTTP transport."""

class HttpTransport(Transport):
    """This is the transport agent for http:// access.

    Only reading is implemented: put, mkdir, append, copy, move, delete,
    list_dir, stat and lock_write all raise TransportNotPossible.

    TODO: Implement pipelined versions of all of the *_multi() functions.
    """

    def __init__(self, base):
        """Set the base path where files will be stored.

        :param base: Base URL; must start with 'http://' or 'https://'.
        """
        assert base.startswith('http://') or base.startswith('https://')
        super(HttpTransport, self).__init__(base)
        # In the future we might actually connect to the remote host
        # rather than using get_url
        # self._connection = None
        # NOTE(review): self.base is presumably set by Transport.__init__
        # -- confirm against the base class.
        (self._proto, self._host,
         self._path, self._parameters,
         self._query, self._fragment) = urlparse.urlparse(self.base)

    def should_cache(self):
        """Return True if the data pulled across should be cached locally.

        This transport always answers True.
        """
        return True

    def clone(self, offset=None):
        """Return a new HttpTransport with root at self.base + offset

        For now HttpTransport does not actually connect, so just return
        a new HttpTransport object.

        :param offset: Relative path (string or list of components) of the
            new root, or None to clone at the same base.
        """
        if offset is None:
            return HttpTransport(self.base)
        else:
            return HttpTransport(self.abspath(offset))

    def abspath(self, relpath):
        """Return the full url to the given relative path.

        This can be supplied with a string or a list of path components.
        A '..' component drops the last component collected so far and a
        '.' component is ignored.  The returned URL is rebuilt from the
        scheme, host and path only; the parameters, query and fragment of
        the base URL are not carried over.

        :param relpath: A string, or a list of path components.
        :return: The absolute URL as a string.
        """
        if isinstance(relpath, basestring):
            relpath = [relpath]
        basepath = self._path.split('/')
        # A trailing '/' on the base path leaves an empty last component.
        if basepath and basepath[-1] == '':
            basepath = basepath[:-1]

        for p in relpath:
            if p == '..':
                if not basepath:
                    # In most filesystems, a request for the parent
                    # of root, just returns root.  (Popping an empty
                    # list would raise IndexError.)
                    continue
                basepath.pop()
            elif p == '.':
                continue  # No-op
            else:
                basepath.append(p)

        # Possibly, we could use urlparse.urljoin() here, but
        # I'm concerned about when it chooses to strip the last
        # portion of the path, and when it doesn't.
        path = '/'.join(basepath)
        return urlparse.urlunparse((self._proto,
                                    self._host, path, '', '', ''))

    def relpath(self, abspath):
        """Return the part of abspath that lies below the base URL.

        :param abspath: An absolute URL that starts with self.base.
        :return: abspath with the base prefix and any leading '/' removed.
        :raises NonRelativePath: if abspath does not start with self.base.
        """
        if not abspath.startswith(self.base):
            raise NonRelativePath('path %r is not under base URL %r'
                                  % (abspath, self.base))
        pl = len(self.base)
        return abspath[pl:].lstrip('/')

    def has(self, relpath):
        """Does the target location exist?

        :return: True when the URL could be fetched; False on BzrError,
            urllib2.URLError, or an IOError whose errno is ENOENT.
        :raises HttpTransportError: on any other IOError.

        TODO: HttpTransport.has() should use a HEAD request,
        not a full GET request.

        TODO: This should be changed so that we don't use
        urllib2 and get an exception, the code path would be
        cleaner if we just do an http HEAD request, and parse
        the return code.
        """
        try:
            f = get_url(self.abspath(relpath))
            try:
                # Without the read and then close()
                # we tend to have busy sockets.
                f.read()
            finally:
                # Close even when the read fails so the response
                # object is not leaked.
                f.close()
            return True
        except BzrError:
            return False
        except urllib2.URLError:
            return False
        except IOError as e:
            if e.errno == errno.ENOENT:
                return False
            raise HttpTransportError(orig_error=e)

    def get(self, relpath, decode=False):
        """Get the file at the given relative path.

        :param relpath: The relative path to the file
        :param decode: Accepted but not used by this implementation.
        :return: The file-like object returned by get_url().
        :raises NoSuchFile: on BzrError, urllib2.URLError or IOError.
        :raises HttpTransportError: on any other Exception.
        """
        try:
            return get_url(self.abspath(relpath))
        except (BzrError, urllib2.URLError, IOError) as e:
            raise NoSuchFile(orig_error=e)
        except Exception as e:
            raise HttpTransportError(orig_error=e)

    def get_partial(self, relpath, start, length=None):
        """Get just part of a file.

        :param relpath: Path to the file, relative to base
        :param start: The starting position to read from
        :param length: The length to read. A length of None indicates
                       read to the end of the file.  This implementation
                       does not use it: the returned object can be read
                       through to the end of the file.
        :return: A file-like object containing at least the specified bytes.
                 Some implementations may return objects which can be read
                 past this length, but this is not guaranteed.
        """
        # TODO: You can make specialized http requests for just
        # a portion of the file. Figure out how to do that.
        # For now, urllib2 returns files that cannot seek() so
        # we just read bytes off the beginning, until we
        # get to the point that we care about.
        f = self.get(relpath)
        # TODO: read in smaller chunks, in case things are
        #       buffered internally.
        f.read(start)
        return f

    def put(self, relpath, f):
        """Copy the file-like or string object into the location.

        Not supported over http; always raises TransportNotPossible.

        :param relpath: Location to put the contents, relative to base.
        :param f:       File-like or string object.
        """
        raise TransportNotPossible('http PUT not supported')

    def mkdir(self, relpath):
        """Create a directory at the given path.

        Not supported over http; always raises TransportNotPossible.
        """
        raise TransportNotPossible('http does not support mkdir()')

    def append(self, relpath, f):
        """Append the text in the file-like object into the final
        location.

        Not supported over http; always raises TransportNotPossible.
        """
        raise TransportNotPossible('http does not support append()')

    def copy(self, rel_from, rel_to):
        """Copy the item at rel_from to the location at rel_to

        Not supported over http; always raises TransportNotPossible.
        """
        raise TransportNotPossible('http does not support copy()')

    def copy_to(self, relpaths, other, pb=None):
        """Copy a set of entries from self into another Transport.

        :param relpaths: A list/generator of entries to be copied.
        :param other: The destination transport.
        :param pb: Passed through unchanged to the base class copy_to().
        :raises TransportNotPossible: if other is an HttpTransport.

        TODO: if other is LocalTransport, is it possible to
              do better than put(get())?
        """
        # At this point HttpTransport might be able to check and see if
        # the remote location is the same, and rather than download, and
        # then upload, it could just issue a remote copy_this command.
        if isinstance(other, HttpTransport):
            raise TransportNotPossible('http cannot be the target of copy_to()')
        else:
            return super(HttpTransport, self).copy_to(relpaths, other, pb=pb)

    def move(self, rel_from, rel_to):
        """Move the item at rel_from to the location at rel_to

        Not supported over http; always raises TransportNotPossible.
        """
        raise TransportNotPossible('http does not support move()')

    def delete(self, relpath):
        """Delete the item at relpath

        Not supported over http; always raises TransportNotPossible.
        """
        raise TransportNotPossible('http does not support delete()')

    def list_dir(self, relpath):
        """Return a list of all files at the given location.

        WARNING: many transports do not support this, so try to avoid
        using it if at all possible.

        Not supported over http; always raises TransportNotPossible.
        """
        raise TransportNotPossible('http does not support list_dir()')

    def stat(self, relpath):
        """Return the stat information for a file.

        Not supported over http; always raises TransportNotPossible.
        """
        raise TransportNotPossible('http does not support stat()')

    def lock_read(self, relpath):
        """Lock the given file for shared (read) access.

        No real lock is taken; the returned object's unlock() does nothing.

        :return: A lock object, which should be passed to Transport.unlock()
        """
        # The old RemoteBranch ignore lock for reading, so we will
        # continue that tradition and return a bogus lock object.
        class BogusLock(object):
            def __init__(self, path):
                self.path = path

            def unlock(self):
                pass
        return BogusLock(relpath)

    def lock_write(self, relpath):
        """Lock the given file for exclusive (write) access.

        WARNING: many transports do not support this, so try to avoid
        using it.

        Not supported over http; always raises TransportNotPossible.

        :return: A lock object, which should be passed to Transport.unlock()
        """
        raise TransportNotPossible('http does not support lock_write()')

251

252

# Serve both plain and TLS URLs with the same transport class.
for _scheme in ('http://', 'https://'):
    register_transport(_scheme, HttpTransport)
del _scheme

Older »