diff --git a/swh/vault/backend.py b/swh/vault/backend.py
index fb8f244..80412d3 100644
--- a/swh/vault/backend.py
+++ b/swh/vault/backend.py
@@ -1,224 +1,224 @@
 # Copyright (C) 2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import textwrap
 import smtplib
 import celery
 import psycopg2
 import psycopg2.extras
 
 from functools import wraps
 from email.mime.text import MIMEText
 
 from swh.model import hashutil
 from swh.scheduler.utils import get_task
 from swh.vault.cache import VaultCache
 from swh.vault.cookers import COOKER_TYPES
 from swh.vault.cooking_tasks import SWHCookingTask  # noqa
 
 cooking_task_name = 'swh.vault.cooking_tasks.SWHCookingTask'
 
 
 # TODO: Imported from swh.scheduler.backend. Factorization needed.
 def autocommit(fn):
     @wraps(fn)
     def wrapped(self, *args, **kwargs):
         autocommit = False
         # TODO: I don't like using None, it's confusing for the user. how about
         # a NEW_CURSOR object()?
         if 'cursor' not in kwargs or not kwargs['cursor']:
             autocommit = True
             kwargs['cursor'] = self.cursor()
 
         try:
             ret = fn(self, *args, **kwargs)
         except:
             if autocommit:
                 self.rollback()
             raise
 
         if autocommit:
             self.commit()
 
         return ret
 
     return wrapped
 
 
 # TODO: This has to be factorized with other database base classes and helpers
 # (swh.scheduler.backend.SchedulerBackend, swh.storage.db.BaseDb, ...)
 # The three first methods are imported from swh.scheduler.backend.
 class VaultBackend:
     """
     Backend for the Software Heritage vault.
     """
     def __init__(self, config):
         self.config = config
         self.cache = VaultCache(**self.config['cache'])
         self.db = None
         self.reconnect()
         self.smtp_server = smtplib.SMTP('localhost')
 
     def reconnect(self):
         if not self.db or self.db.closed:
             self.db = psycopg2.connect(
                 dsn=self.config['vault_db'],
                 cursor_factory=psycopg2.extras.RealDictCursor,
             )
 
     def cursor(self):
         """Return a fresh cursor on the database, with auto-reconnection in case
         of failure"""
         cur = None
 
         # Get a fresh cursor and reconnect at most three times
         tries = 0
         while True:
             tries += 1
             try:
                 cur = self.db.cursor()
                 cur.execute('select 1')
                 break
             except psycopg2.OperationalError:
                 if tries < 3:
                     self.reconnect()
                 else:
                     raise
         return cur
 
     def commit(self):
         """Commit a transaction"""
         self.db.commit()
 
     def rollback(self):
         """Rollback a transaction"""
         self.db.rollback()
 
     @autocommit
     def task_info(self, obj_type, obj_id, cursor=None):
         obj_id = hashutil.hash_to_bytes(obj_id)
         cursor.execute('''
             SELECT id, type, object_id, task_uuid, task_status,
                    ts_created, ts_done
             FROM vault_bundle
             WHERE type = %s AND object_id = %s''', (obj_type, obj_id))
         return cursor.fetchone()
 
     @autocommit
     def create_task(self, obj_type, obj_id, cursor=None):
         obj_id = hashutil.hash_to_bytes(obj_id)
         assert obj_type in COOKER_TYPES
 
         task_uuid = celery.uuid()
         cursor.execute('''
             INSERT INTO vault_bundle (type, object_id, task_uuid)
             VALUES (%s, %s, %s)''', (obj_type, obj_id, task_uuid))
 
         args = [self.config, obj_type, obj_id]
         task = get_task(cooking_task_name)
         self.commit()
         task.apply_async(args, task_id=task_uuid)
 
     @autocommit
     def add_notif_email(self, obj_type, obj_id, email, cursor=None):
         obj_id = hashutil.hash_to_bytes(obj_id)
         cursor.execute('''
             INSERT INTO vault_notif_email (email, bundle_id)
             VALUES (%s, (SELECT id FROM vault_bundle
                          WHERE type = %s AND object_id = %s))''',
                        (email, obj_type, obj_id))
 
     @autocommit
     def cook_request(self, obj_type, obj_id, email=None, cursor=None):
         info = self.task_info(obj_type, obj_id)
         if info is None:
             self.create_task(obj_type, obj_id)
         if email is not None:
             if info is not None and info['task_status'] == 'done':
                 self.send_notification(None, email, obj_type, obj_id)
             else:
                 self.add_notif_email(obj_type, obj_id, email)
 
     @autocommit
     def is_available(self, obj_type, obj_id, cursor=None):
         info = self.task_info(obj_type, obj_id, cursor=cursor)
         return (info is not None
                 and info['task_status'] == 'done'
                 and self.cache.is_cached(obj_type, obj_id))
 
     @autocommit
     def fetch(self, obj_type, obj_id, cursor=None):
         if not self.is_available(obj_type, obj_id, cursor=cursor):
             return None
         self.update_access_ts(obj_type, obj_id, cursor=cursor)
         return self.cache.get(obj_type, obj_id)
 
     @autocommit
     def update_access_ts(self, obj_type, obj_id, cursor=None):
         obj_id = hashutil.hash_to_bytes(obj_id)
         cursor.execute('''
             UPDATE vault_bundle
             SET ts_last_access = NOW()
             WHERE type = %s AND object_id = %s''',
                        (obj_type, obj_id))
 
     @autocommit
     def set_status(self, obj_type, obj_id, status, cursor=None):
         obj_id = hashutil.hash_to_bytes(obj_id)
         req = ('''
                UPDATE vault_bundle
                SET task_status = %s '''
                + (''', ts_done = NOW() ''' if status == 'done' else '')
                + '''WHERE type = %s AND object_id = %s''')
         cursor.execute(req, (status, obj_type, obj_id))
 
     @autocommit
     def set_progress(self, obj_type, obj_id, progress, cursor=None):
         obj_id = hashutil.hash_to_bytes(obj_id)
         cursor.execute('''
             UPDATE vault_bundle
-            SET progress = %s
+            SET progress_msg = %s
             WHERE type = %s AND object_id = %s''',
                        (progress, obj_type, obj_id))
 
     @autocommit
     def send_all_notifications(self, obj_type, obj_id, cursor=None):
         obj_id = hashutil.hash_to_bytes(obj_id)
         cursor.execute('''
             SELECT vault_notif_email.id AS id, email
             FROM vault_notif_email
             RIGHT JOIN vault_bundle ON bundle_id = vault_bundle.id
             WHERE vault_bundle.type = %s AND vault_bundle.object_id = %s''',
                        (obj_type, obj_id))
         for d in cursor:
             self.send_notification(d['id'], d['email'], obj_type, obj_id)
 
     @autocommit
     def send_notification(self, n_id, email, obj_type, obj_id, cursor=None):
         hex_id = hashutil.hash_to_hex(obj_id)
         text = (
             "You have requested a bundle of type `{obj_type}` for the object "
             "`{hex_id}` from the Software Heritage Archive.\n\n"
             "The bundle you requested is now available for download at the "
             "following address:\n\n"
             "{url}\n\n"
             "Please keep in mind that this link might expire at some point, "
             "in which case you will need to request the bundle again.")
 
         text = text.format(obj_type=obj_type, hex_id=hex_id, url='URL_TODO')
         text = textwrap.dedent(text)
         text = '\n'.join(textwrap.wrap(text, 72, replace_whitespace=False))
         msg = MIMEText(text)
         msg['Subject'] = ("The `{obj_type}` bundle of `{hex_id}` is ready"
                           .format(obj_type=obj_type, hex_id=hex_id))
         msg['From'] = '"Software Heritage Vault" <vault@softwareheritage.org>'
         msg['To'] = email
 
         self.smtp_server.send_message(msg)
 
         if n_id is not None:
             cursor.execute('''
                 DELETE FROM vault_notif_email
                 WHERE id = %s''', (n_id,))
diff --git a/swh/vault/cookers/base.py b/swh/vault/cookers/base.py
index 6cb9660..36fb20c 100644
--- a/swh/vault/cookers/base.py
+++ b/swh/vault/cookers/base.py
@@ -1,221 +1,223 @@
 # Copyright (C) 2016-2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import abc
 import io
 import itertools
 import logging
 import os
 import tarfile
 import tempfile
 
 from pathlib import Path
 
 from swh.model import hashutil
 from swh.storage import get_storage
 
 
 def get_tar_bytes(path, arcname=None):
     path = Path(path)
     if not arcname:
         arcname = path.name
     tar_buffer = io.BytesIO()
     tar = tarfile.open(fileobj=tar_buffer, mode='w')
     tar.add(str(path), arcname=arcname)
     return tar_buffer.getbuffer()
 
 
 SKIPPED_MESSAGE = (b'This content have not been retrieved in '
                    b'Software Heritage archive due to its size')
 
 
 HIDDEN_MESSAGE = (b'This content is hidden')
 
 
 class BaseVaultCooker(metaclass=abc.ABCMeta):
     """Abstract base class for the vault's bundle creators
 
     This class describes a common API for the cookers.
 
     To define a new cooker, inherit from this class and override:
     - CACHE_TYPE_KEY: key to use for the bundle to reference in cache
     - def cook(): cook the object into a bundle
     """
     CACHE_TYPE_KEY = None
 
     def __init__(self, config, obj_type, obj_id):
         """Initialize the cooker.
 
         The type of the object represented by the id depends on the
         concrete class. Very likely, each type of bundle will have its
         own cooker class.
 
         Args:
             storage: the storage object
             cache: the cache where to store the bundle
             obj_id: id of the object to be cooked into a bundle.
         """
         # Imported here to avoid circular dependency
         from swh.vault.backend import VaultBackend
 
         self.storage = get_storage(**config['storage'])
         self.backend = VaultBackend(config)
         self.obj_type = obj_type
         self.obj_id = hashutil.hash_to_bytes(obj_id)
 
     @abc.abstractmethod
     def prepare_bundle(self):
         """Implementation of the cooker. Yields chunks of the bundle bytes.
 
         Override this with the cooker implementation.
         """
         raise NotImplemented
 
     def cook(self):
         """Cook the requested object into a bundle
         """
         self.backend.set_status(self.obj_type, self.obj_id, 'pending')
+        self.backend.set_progress(self.obj_type, self.obj_id, 'Initializing.')
         content_iter = self.prepare_bundle()
 
         self.update_cache(content_iter)
         self.backend.set_status(self.obj_type, self.obj_id, 'done')
+        self.backend.set_progress(self.obj_type, self.obj_id, 'Done.')
 
         self.notify_bundle_ready()
 
     def update_cache(self, content_iter):
         """Update the cache with id and bundle_content.
 
         """
         self.backend.cache.add_stream(self.CACHE_TYPE_KEY,
                                       self.obj_id, content_iter)
 
     def notify_bundle_ready(self):
         self.backend.send_all_notifications(self.obj_type, self.obj_id)
 
 
 class DirectoryBuilder:
     """Creates a cooked directory from its sha1_git in the db.
 
     Warning: This is NOT a directly accessible cooker, but a low-level
     one that executes the manipulations.
 
     """
     def __init__(self, storage):
         self.storage = storage
 
     def get_directory_bytes(self, dir_id):
         # Create temporary folder to retrieve the files into.
         root = bytes(tempfile.mkdtemp(prefix='directory.',
                                       suffix='.cook'), 'utf8')
         self.build_directory(dir_id, root)
         # Use the created directory to make a bundle with the data as
         # a compressed directory.
         bundle_content = self._create_bundle_content(
             root,
             hashutil.hash_to_hex(dir_id))
         return bundle_content
 
     def build_directory(self, dir_id, root):
         # Retrieve data from the database.
         data = self.storage.directory_ls(dir_id, recursive=True)
 
         # Split into files and directory data.
         # TODO(seirl): also handle revision data.
         data1, data2 = itertools.tee(data, 2)
         dir_data = (entry['name'] for entry in data1 if entry['type'] == 'dir')
         file_data = (entry for entry in data2 if entry['type'] == 'file')
 
         # Recreate the directory's subtree and then the files into it.
         self._create_tree(root, dir_data)
         self._create_files(root, file_data)
 
     def _create_tree(self, root, directory_paths):
         """Create a directory tree from the given paths
 
         The tree is created from `root` and each given path in
         `directory_paths` will be created.
 
         """
         # Directories are sorted by depth so they are created in the
         # right order
         bsep = bytes(os.path.sep, 'utf8')
         dir_names = sorted(
             directory_paths,
             key=lambda x: len(x.split(bsep)))
         for dir_name in dir_names:
             os.makedirs(os.path.join(root, dir_name))
 
     def _create_files(self, root, file_datas):
         """Create the files according to their status.
 
         """
         # Then create the files
         for file_data in file_datas:
             path = os.path.join(root, file_data['name'])
             status = file_data['status']
             perms = file_data['perms']
             if status == 'absent':
                 self._create_file_absent(path)
             elif status == 'hidden':
                 self._create_file_hidden(path)
             else:
                 content = self._get_file_content(file_data['sha1'])
                 self._create_file(path, content, perms)
 
     def _create_file(self, path, content, perms=0o100644):
         """Create the given file and fill it with content.
 
         """
         if perms not in (0o100644, 0o100755, 0o120000):
             logging.warning('File {} has invalid permission {}, '
                             'defaulting to 644.'.format(path, perms))
             perms = 0o100644
 
         if perms == 0o120000:  # Symbolic link
             os.symlink(content, path)
         else:
             with open(path, 'wb') as f:
                 f.write(content)
             os.chmod(path, perms & 0o777)
 
     def _get_file_content(self, obj_id):
         """Get the content of the given file.
 
         """
         content = list(self.storage.content_get([obj_id]))[0]['data']
         return content
 
     def _create_file_absent(self, path):
         """Create a file that indicates a skipped content
 
         Create the given file but fill it with a specific content to
         indicate that the content have not been retrieved by the
         software heritage archive due to its size.
 
         """
         self._create_file(self, SKIPPED_MESSAGE)
 
     def _create_file_hidden(self, path):
         """Create a file that indicates an hidden content
 
         Create the given file but fill it with a specific content to
         indicate that the content could not be retrieved due to
         privacy policy.
 
         """
         self._create_file(self, HIDDEN_MESSAGE)
 
     def _create_bundle_content(self, path, hex_dir_id):
         """Create a bundle from the given directory
 
         Args:
             path: location of the directory to package.
             hex_dir_id: hex representation of the directory id
 
         Returns:
             bytes that represent the compressed directory as a bundle.
 
         """
         return get_tar_bytes(path.decode(), hex_dir_id)
diff --git a/swh/vault/cookers/revision_gitfast.py b/swh/vault/cookers/revision_gitfast.py
index 2fb35ad..d55a368 100644
--- a/swh/vault/cookers/revision_gitfast.py
+++ b/swh/vault/cookers/revision_gitfast.py
@@ -1,206 +1,216 @@
 # Copyright (C) 2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import collections
 import fastimport.commands
 import functools
-import logging
 import os
+import time
 
 from .base import BaseVaultCooker
 
 
 class RevisionGitfastCooker(BaseVaultCooker):
     """Cooker to create a git fast-import bundle """
     CACHE_TYPE_KEY = 'revision_gitfast'
 
     def prepare_bundle(self):
         log = self.storage.revision_log([self.obj_id])
         commands = self.fastexport(log)
 
         for command in commands:
             yield bytes(command)
 
     def fastexport(self, log):
         """Generate all the git fast-import commands from a given log.
         """
         self.rev_by_id = {r['id']: r for r in log}
         self.rev_sorted = list(self._toposort(self.rev_by_id))
         self.obj_done = set()
         self.obj_to_mark = {}
         self.next_available_mark = 1
 
+        last_progress_report = None
+
         # We want a single transaction for the whole export, so we store a
         # cursor and use it during the process.
         with self.storage.db.transaction() as self.cursor:
             for i, rev in enumerate(self.rev_sorted, 1):
-                logging.info('Computing revision %d/%d', i,
-                             len(self.rev_sorted))
+                # Update progress if needed
+                ct = time.time()
+                if (last_progress_report is None
+                        or last_progress_report + 2 <= ct):
+                    last_progress_report = ct
+                    pg = ('Computing revision {}/{}'
+                          .format(i, len(self.rev_sorted)))
+                    self.backend.set_progress(self.obj_type, self.obj_id, pg)
+
+                # Compute the current commit
                 yield from self._compute_commit_command(rev)
 
     def _toposort(self, rev_by_id):
         """Perform a topological sort on the revision graph.
         """
         children = collections.defaultdict(list)  # rev -> children
         in_degree = {}  # rev -> numbers of parents left to compute
 
         # Compute the in_degrees and the parents of all the revisions.
         # Add the roots to the processing queue.
         queue = collections.deque()
         for rev_id, rev in rev_by_id.items():
             in_degree[rev_id] = len(rev['parents'])
             if not rev['parents']:
                 queue.append(rev_id)
             for parent in rev['parents']:
                 children[parent].append(rev_id)
 
         # Topological sort: yield the 'ready' nodes, decrease the in degree of
         # their children and add the 'ready' ones to the queue.
         while queue:
             rev_id = queue.popleft()
             yield rev_by_id[rev_id]
             for child in children[rev_id]:
                 in_degree[child] -= 1
                 if in_degree[child] == 0:
                     queue.append(child)
 
     def mark(self, obj_id):
         """Get the mark ID as bytes of a git object.
 
         If the object has not yet been marked, assign a new ID and add it to
         the mark dictionary.
         """
         if obj_id not in self.obj_to_mark:
             self.obj_to_mark[obj_id] = self.next_available_mark
             self.next_available_mark += 1
         return str(self.obj_to_mark[obj_id]).encode()
 
     def _compute_blob_command_content(self, file_data):
         """Compute the blob command of a file entry if it has not been
         computed yet.
         """
         obj_id = file_data['sha1']
         if obj_id in self.obj_done:
             return
         content = list(self.storage.content_get([obj_id]))[0]['data']
         yield fastimport.commands.BlobCommand(
             mark=self.mark(obj_id),
             data=content,
         )
         self.obj_done.add(obj_id)
 
     def _compute_commit_command(self, rev):
         """Compute a commit command from a specific revision.
         """
         if 'parents' in rev and rev['parents']:
             from_ = b':' + self.mark(rev['parents'][0])
             merges = [b':' + self.mark(r) for r in rev['parents'][1:]]
             parent = self.rev_by_id[rev['parents'][0]]
         else:
             # We issue a reset command before all the new roots so that they
             # are not automatically added as children of the current branch.
             yield fastimport.commands.ResetCommand(b'refs/heads/master', None)
             from_ = None
             merges = None
             parent = None
 
         # Retrieve the file commands while yielding new blob commands if
         # needed.
         files = yield from self._compute_file_commands(rev, parent)
 
         # Construct and yield the commit command
         author = (rev['author']['name'],
                   rev['author']['email'],
                   rev['date']['timestamp']['seconds'],
                   rev['date']['offset'] * 60)
         committer = (rev['committer']['name'],
                      rev['committer']['email'],
                      rev['committer_date']['timestamp']['seconds'],
                      rev['committer_date']['offset'] * 60)
         yield fastimport.commands.CommitCommand(
             ref=b'refs/heads/master',
             mark=self.mark(rev['id']),
             author=author,
             committer=committer,
             message=rev['message'],
             from_=from_,
             merges=merges,
             file_iter=files,
         )
 
     @functools.lru_cache(maxsize=4096)
     def _get_dir_ents(self, dir_id=None):
         """Get the entities of a directory as a dictionary (name -> entity).
 
         This function has a cache to avoid doing multiple requests to retrieve
         the same entities, as doing a directory_ls() is expensive.
         """
         data = (self.storage.directory_ls(dir_id, cur=self.cursor)
                 if dir_id is not None else [])
         return {f['name']: f for f in data}
 
     def _compute_file_commands(self, rev, parent=None):
         """Compute all the file commands of a revision.
 
         Generate a diff of the files between the revision and its main parent
         to find the necessary file commands to apply.
         """
         commands = []
 
         # Initialize the stack with the root of the tree.
         cur_dir = rev['directory']
         parent_dir = parent['directory'] if parent else None
         stack = [(b'', cur_dir, parent_dir)]
 
         while stack:
             # Retrieve the current directory and the directory of the parent
             # commit in order to compute the diff of the trees.
             root, cur_dir_id, prev_dir_id = stack.pop()
             cur_dir = self._get_dir_ents(cur_dir_id)
             prev_dir = self._get_dir_ents(prev_dir_id)
 
             # Find subtrees to delete:
             #  - Subtrees that are not in the new tree (file or directory
             #    deleted).
             #  - Subtrees that do not have the same type in the new tree
             #    (file -> directory or directory -> file)
             # After this step, every node remaining in the previous directory
             # has the same type than the one in the current directory.
             for fname, f in prev_dir.items():
                 if ((fname not in cur_dir
                      or f['type'] != cur_dir[fname]['type'])):
                     commands.append(fastimport.commands.FileDeleteCommand(
                         path=os.path.join(root, fname)
                     ))
 
             # Find subtrees to modify:
             #  - Leaves (files) will be added or modified using `filemodify`
             #  - Other subtrees (directories) will be added to the stack and
             #    processed in the next iteration.
             for fname, f in cur_dir.items():
                 # A file is added or modified if it was not in the tree, if its
                 # permissions changed or if its content changed.
                 if (f['type'] == 'file'
                     and (fname not in prev_dir
                          or f['sha1'] != prev_dir[fname]['sha1']
                          or f['perms'] != prev_dir[fname]['perms'])):
                     # Issue a blob command for the new blobs if needed.
                     yield from self._compute_blob_command_content(f)
                     commands.append(fastimport.commands.FileModifyCommand(
                         path=os.path.join(root, fname),
                         mode=f['perms'],
                         dataref=(b':' + self.mark(f['sha1'])),
                         data=None,
                     ))
                 # A directory is added or modified if it was not in the tree or
                 # if its target changed.
                 elif f['type'] == 'dir':
                     f_prev_target = None
                     if fname in prev_dir and prev_dir[fname]['type'] == 'dir':
                         f_prev_target = prev_dir[fname]['target']
                     if f_prev_target is None or f['target'] != f_prev_target:
                         stack.append((os.path.join(root, fname),
                                       f['target'], f_prev_target))
         return commands