Implementation.id doesn't have to be path or digest
[zeroinstall/solver.git] / zeroinstall / injector / fetch.py
blobb6013b93c4c904ec75b863520cf046aed2dbab0e
1 """
2 Downloads feeds, keys, packages and icons.
3 """
5 # Copyright (C) 2009, Thomas Leonard
6 # See the README file for details, or visit http://0install.net.
8 from zeroinstall import _
9 import os
10 from logging import info, debug, warn
12 from zeroinstall.support import tasks, basedir
13 from zeroinstall.injector.namespaces import XMLNS_IFACE, config_site
14 from zeroinstall.injector.model import DownloadSource, Recipe, SafeException, escape
15 from zeroinstall.injector.iface_cache import PendingFeed, ReplayAttack
16 from zeroinstall.injector.handler import NoTrustedKeys
17 from zeroinstall.injector import download
# Default base URL of the key information server. Fetcher.__init__ uses it as
# the initial value of the key_info_server attribute.
DEFAULT_KEY_LOOKUP_SERVER = 'https://keylookup.appspot.com'
21 def _escape_slashes(path):
22 return path.replace('/', '%23')
def _get_feed_dir(feed):
    """The algorithm from 0mirror: map a feed URL to its directory on a mirror.

    The result has the form C{feeds/SCHEME/DOMAIN/ESCAPED-PATH}. It is always
    joined with '/' (never the platform's path separator), because the caller
    embeds it in a URL.
    @param feed: the URL of the feed
    @type feed: str
    @return: the relative location of the feed's directory on the mirror
    @rtype: str
    @raise SafeException: if the URL contains '#', has no '://' separator,
    has no '/' after the domain, or has a scheme, domain or path that is
    empty or starts with ','"""
    if '#' in feed:
        raise SafeException(_("Invalid URL '%s'") % feed)

    # partition() leaves the missing parts empty when a separator is absent,
    # so a malformed URL is rejected by the check below with a SafeException
    # rather than failing with a ValueError while unpacking.
    scheme, _sep, rest = feed.partition('://')
    domain, _sep, rest = rest.partition('/')

    # NOTE(review): the ',' prefix test is kept exactly as it was; confirm
    # against 0mirror whether rejecting a leading '.' was intended instead.
    for x in (scheme, domain, rest):
        if not x or x.startswith(','):
            raise SafeException(_("Invalid URL '%s'") % feed)

    return '/'.join(['feeds', scheme, domain, _escape_slashes(rest)])
35 class KeyInfoFetcher:
36 """Fetches information about a GPG key from a key-info server.
37 See L{Fetcher.fetch_key_info} for details.
38 @since: 0.42
40 Example:
42 >>> kf = KeyInfoFetcher('https://server', fingerprint)
43 >>> while True:
44 print kf.info
45 if kf.blocker is None: break
46 print kf.status
47 yield kf.blocker
48 """
49 def __init__(self, server, fingerprint):
50 self.fingerprint = fingerprint
51 self.info = []
52 self.blocker = None
54 if server is None: return
56 self.status = _('Fetching key information from %s...') % server
58 dl = download.Download(server + '/key/' + fingerprint)
59 dl.start()
61 from xml.dom import minidom
63 @tasks.async
64 def fetch_key_info():
65 try:
66 tempfile = dl.tempfile
67 yield dl.downloaded
68 self.blocker = None
69 tasks.check(dl.downloaded)
70 tempfile.seek(0)
71 doc = minidom.parse(tempfile)
72 if doc.documentElement.localName != 'key-lookup':
73 raise SafeException(_('Expected <key-lookup>, not <%s>') % doc.documentElement.localName)
74 self.info += doc.documentElement.childNodes
75 except Exception, ex:
76 doc = minidom.parseString('<item vote="bad"/>')
77 root = doc.documentElement
78 root.appendChild(doc.createTextNode(_('Error getting key information: %s') % ex))
79 self.info.append(root)
81 self.blocker = fetch_key_info()
83 class Fetcher(object):
84 """Downloads and stores various things.
85 @ivar handler: handler to use for user-interaction
86 @type handler: L{handler.Handler}
87 @ivar key_info: caches information about GPG keys
88 @type key_info: {str: L{KeyInfoFetcher}}
89 @ivar key_info_server: the base URL of a key information server
90 @type key_info_server: str
91 @ivar feed_mirror: the base URL of a mirror site for keys and feeds
92 @type feed_mirror: str
93 """
94 __slots__ = ['handler', 'feed_mirror', 'key_info_server', 'key_info']
96 def __init__(self, handler):
97 self.handler = handler
98 self.feed_mirror = "http://roscidus.com/0mirror"
99 self.key_info_server = DEFAULT_KEY_LOOKUP_SERVER
100 self.key_info = {}
102 @tasks.async
103 def cook(self, required_digest, recipe, stores, force = False, impl_hint = None):
104 """Follow a Recipe.
105 @param impl_hint: the Implementation this is for (if any) as a hint for the GUI
106 @see: L{download_impl} uses this method when appropriate"""
107 # Maybe we're taking this metaphor too far?
109 # Start downloading all the ingredients.
110 downloads = {} # Downloads that are not yet successful
111 streams = {} # Streams collected from successful downloads
113 # Start a download for each ingredient
114 blockers = []
115 for step in recipe.steps:
116 blocker, stream = self.download_archive(step, force = force, impl_hint = impl_hint)
117 assert stream
118 blockers.append(blocker)
119 streams[step] = stream
121 while blockers:
122 yield blockers
123 tasks.check(blockers)
124 blockers = [b for b in blockers if not b.happened]
126 from zeroinstall.zerostore import unpack
128 # Create an empty directory for the new implementation
129 store = stores.stores[0]
130 tmpdir = store.get_tmp_dir_for(required_digest)
131 try:
132 # Unpack each of the downloaded archives into it in turn
133 for step in recipe.steps:
134 stream = streams[step]
135 stream.seek(0)
136 unpack.unpack_archive_over(step.url, stream, tmpdir, step.extract)
137 # Check that the result is correct and store it in the cache
138 store.check_manifest_and_rename(required_digest, tmpdir)
139 tmpdir = None
140 finally:
141 # If unpacking fails, remove the temporary directory
142 if tmpdir is not None:
143 from zeroinstall import support
144 support.ro_rmtree(tmpdir)
146 def get_feed_mirror(self, url):
147 """Return the URL of a mirror for this feed."""
148 import urlparse
149 if urlparse.urlparse(url).hostname == 'localhost':
150 return None
151 return '%s/%s/latest.xml' % (self.feed_mirror, _get_feed_dir(url))
153 def download_and_import_feed(self, feed_url, iface_cache, force = False):
154 """Download the feed, download any required keys, confirm trust if needed and import.
155 @param feed_url: the feed to be downloaded
156 @type feed_url: str
157 @param iface_cache: cache in which to store the feed
158 @type iface_cache: L{iface_cache.IfaceCache}
159 @param force: whether to abort and restart an existing download"""
160 from download import DownloadAborted
162 debug(_("download_and_import_feed %(url)s (force = %(force)d)"), {'url': feed_url, 'force': force})
163 assert not feed_url.startswith('/')
165 primary = self._download_and_import_feed(feed_url, iface_cache, force, use_mirror = False)
167 @tasks.named_async("monitor feed downloads for " + feed_url)
168 def wait_for_downloads(primary):
169 # Download just the upstream feed, unless it takes too long...
170 timeout = tasks.TimeoutBlocker(5, 'Mirror timeout') # 5 seconds
172 yield primary, timeout
173 tasks.check(timeout)
175 try:
176 tasks.check(primary)
177 if primary.happened:
178 return # OK, primary succeeded!
179 # OK, maybe it's just being slow...
180 info("Feed download from %s is taking a long time. Trying mirror too...", feed_url)
181 primary_ex = None
182 except NoTrustedKeys, ex:
183 raise # Don't bother trying the mirror if we have a trust problem
184 except ReplayAttack, ex:
185 raise # Don't bother trying the mirror if we have a replay attack
186 except DownloadAborted, ex:
187 raise # Don't bother trying the mirror if the user cancelled
188 except SafeException, ex:
189 # Primary failed
190 primary = None
191 primary_ex = ex
192 warn(_("Trying mirror, as feed download from %(url)s failed: %(exception)s"), {'url': feed_url, 'exception': ex})
194 # Start downloading from mirror...
195 mirror = self._download_and_import_feed(feed_url, iface_cache, force, use_mirror = True)
197 # Wait until both mirror and primary tasks are complete...
198 while True:
199 blockers = filter(None, [primary, mirror])
200 if not blockers:
201 break
202 yield blockers
204 if primary:
205 try:
206 tasks.check(primary)
207 if primary.happened:
208 primary = None
209 # No point carrying on with the mirror once the primary has succeeded
210 if mirror:
211 info(_("Primary feed download succeeded; aborting mirror download for %s") % feed_url)
212 mirror.dl.abort()
213 except SafeException, ex:
214 primary = None
215 primary_ex = ex
216 info(_("Feed download from %(url)s failed; still trying mirror: %(exception)s"), {'url': feed_url, 'exception': ex})
218 if mirror:
219 try:
220 tasks.check(mirror)
221 if mirror.happened:
222 mirror = None
223 if primary_ex:
224 # We already warned; no need to raise an exception too,
225 # as the mirror download succeeded.
226 primary_ex = None
227 except ReplayAttack, ex:
228 info(_("Version from mirror is older than cached version; ignoring it: %s"), ex)
229 mirror = None
230 primary_ex = None
231 except SafeException, ex:
232 info(_("Mirror download failed: %s"), ex)
233 mirror = None
235 if primary_ex:
236 raise primary_ex
238 return wait_for_downloads(primary)
240 def _download_and_import_feed(self, feed_url, iface_cache, force, use_mirror):
241 """Download and import a feed.
242 @param use_mirror: False to use primary location; True to use mirror."""
243 if use_mirror:
244 url = self.get_feed_mirror(feed_url)
245 if url is None: return None
246 else:
247 url = feed_url
249 dl = self.handler.get_download(url, force = force, hint = feed_url)
250 stream = dl.tempfile
252 @tasks.named_async("fetch_feed " + url)
253 def fetch_feed():
254 yield dl.downloaded
255 tasks.check(dl.downloaded)
257 pending = PendingFeed(feed_url, stream)
259 if use_mirror:
260 # If we got the feed from a mirror, get the key from there too
261 key_mirror = self.feed_mirror + '/keys/'
262 else:
263 key_mirror = None
265 keys_downloaded = tasks.Task(pending.download_keys(self.handler, feed_hint = feed_url, key_mirror = key_mirror), _("download keys for %s") % feed_url)
266 yield keys_downloaded.finished
267 tasks.check(keys_downloaded.finished)
269 iface = iface_cache.get_interface(pending.url)
270 if not iface_cache.update_interface_if_trusted(iface, pending.sigs, pending.new_xml):
271 blocker = self.handler.confirm_keys(pending, self.fetch_key_info)
272 if blocker:
273 yield blocker
274 tasks.check(blocker)
275 if not iface_cache.update_interface_if_trusted(iface, pending.sigs, pending.new_xml):
276 raise NoTrustedKeys(_("No signing keys trusted; not importing"))
278 task = fetch_feed()
279 task.dl = dl
280 return task
282 def fetch_key_info(self, fingerprint):
283 try:
284 return self.key_info[fingerprint]
285 except KeyError:
286 self.key_info[fingerprint] = info = KeyInfoFetcher(self.key_info_server, fingerprint)
287 return info
289 def download_impl(self, impl, retrieval_method, stores, force = False):
290 """Download an implementation.
291 @param impl: the selected implementation
292 @type impl: L{model.ZeroInstallImplementation}
293 @param retrieval_method: a way of getting the implementation (e.g. an Archive or a Recipe)
294 @type retrieval_method: L{model.RetrievalMethod}
295 @param stores: where to store the downloaded implementation
296 @type stores: L{zerostore.Stores}
297 @param force: whether to abort and restart an existing download
298 @rtype: L{tasks.Blocker}"""
299 assert impl
300 assert retrieval_method
302 from zeroinstall.zerostore import manifest
303 for required_digest in impl.digests:
304 alg = required_digest.split('=', 1)[0]
305 if alg in manifest.algorithms:
306 break
307 else:
308 if not impl.digests:
309 raise SafeException(_("No <manifest-digest> given for '%(implementation)s' version %(version)s") %
310 {'implementation': impl.feed.get_name(), 'version': impl.get_version()})
311 raise SafeException(_("Unknown digest algorithms '%(algorithms)s' for '%(implementation)s' version %(version)s") %
312 {'algorithms': impl.digests, 'implementation': impl.feed.get_name(), 'version': impl.get_version()})
314 @tasks.async
315 def download_impl():
316 if isinstance(retrieval_method, DownloadSource):
317 blocker, stream = self.download_archive(retrieval_method, force = force, impl_hint = impl)
318 yield blocker
319 tasks.check(blocker)
321 stream.seek(0)
322 self._add_to_cache(required_digest, stores, retrieval_method, stream)
323 elif isinstance(retrieval_method, Recipe):
324 blocker = self.cook(required_digest, retrieval_method, stores, force, impl_hint = impl)
325 yield blocker
326 tasks.check(blocker)
327 else:
328 raise Exception(_("Unknown download type for '%s'") % retrieval_method)
330 self.handler.impl_added_to_store(impl)
331 return download_impl()
333 def _add_to_cache(self, required_digest, stores, retrieval_method, stream):
334 assert isinstance(retrieval_method, DownloadSource)
335 url = retrieval_method.url
336 stores.add_archive_to_cache(required_digest, stream, retrieval_method.url, retrieval_method.extract,
337 type = retrieval_method.type, start_offset = retrieval_method.start_offset or 0)
339 def download_archive(self, download_source, force = False, impl_hint = None):
340 """Fetch an archive. You should normally call L{download_impl}
341 instead, since it handles other kinds of retrieval method too."""
342 from zeroinstall.zerostore import unpack
344 url = download_source.url
345 if not (url.startswith('http:') or url.startswith('https:') or url.startswith('ftp:')):
346 raise SafeException(_("Unknown scheme in download URL '%s'") % url)
348 mime_type = download_source.type
349 if not mime_type:
350 mime_type = unpack.type_from_url(download_source.url)
351 if not mime_type:
352 raise SafeException(_("No 'type' attribute on archive, and I can't guess from the name (%s)") % download_source.url)
353 unpack.check_type_ok(mime_type)
354 dl = self.handler.get_download(download_source.url, force = force, hint = impl_hint)
355 dl.expected_size = download_source.size + (download_source.start_offset or 0)
356 return (dl.downloaded, dl.tempfile)
358 def download_icon(self, interface, force = False, modification_time = None):
359 """Download an icon for this interface and add it to the
360 icon cache. If the interface has no icon or we are offline, do nothing.
361 @return: the task doing the import, or None
362 @rtype: L{tasks.Task}"""
363 debug(_("download_icon %(interface)s (force = %(force)d)"), {'interface': interface, 'force': force})
365 # Find a suitable icon to download
366 for icon in interface.get_metadata(XMLNS_IFACE, 'icon'):
367 type = icon.getAttribute('type')
368 if type != 'image/png':
369 debug(_('Skipping non-PNG icon'))
370 continue
371 source = icon.getAttribute('href')
372 if source:
373 break
374 warn(_('Missing "href" attribute on <icon> in %s'), interface)
375 else:
376 info(_('No PNG icons found in %s'), interface)
377 return
379 try:
380 dl = self.handler.monitored_downloads[source]
381 if dl and force:
382 dl.abort()
383 raise KeyError
384 except KeyError:
385 dl = download.Download(source, hint = interface, modification_time = modification_time)
386 self.handler.monitor_download(dl)
388 @tasks.async
389 def download_and_add_icon():
390 stream = dl.tempfile
391 yield dl.downloaded
392 try:
393 tasks.check(dl.downloaded)
394 if dl.unmodified: return
395 stream.seek(0)
397 import shutil
398 icons_cache = basedir.save_cache_path(config_site, 'interface_icons')
399 icon_file = file(os.path.join(icons_cache, escape(interface.uri)), 'w')
400 shutil.copyfileobj(stream, icon_file)
401 except Exception, ex:
402 self.handler.report_error(ex)
404 return download_and_add_icon()
406 def download_impls(self, implementations, stores):
407 """Download the given implementations, choosing a suitable retrieval method for each."""
408 blockers = []
410 to_download = []
411 for impl in implementations:
412 debug(_("start_downloading_impls: for %(feed)s get %(implementation)s"), {'feed': impl.feed, 'implementation': impl})
413 source = self.get_best_source(impl)
414 if not source:
415 raise SafeException(_("Implementation %(implementation_id)s of interface %(interface)s"
416 " cannot be downloaded (no download locations given in "
417 "interface!)") % {'implementation_id': impl.id, 'interface': impl.feed.get_name()})
418 to_download.append((impl, source))
420 for impl, source in to_download:
421 blockers.append(self.download_impl(impl, source, stores))
423 if not blockers:
424 return None
426 @tasks.async
427 def download_impls(blockers):
428 # Record the first error log the rest
429 error = []
430 def dl_error(ex, tb = None):
431 if error:
432 self.handler.report_error(ex)
433 else:
434 error.append(ex)
435 while blockers:
436 yield blockers
437 tasks.check(blockers, dl_error)
439 blockers = [b for b in blockers if not b.happened]
440 if error:
441 raise error[0]
443 return download_impls(blockers)
445 def get_best_source(self, impl):
446 """Return the best download source for this implementation.
447 @rtype: L{model.RetrievalMethod}"""
448 if impl.download_sources:
449 return impl.download_sources[0]
450 return None