diff --git a/PKG-INFO b/PKG-INFO
index 4fe384d..a697cb4 100644
--- a/PKG-INFO
+++ b/PKG-INFO
@@ -1,10 +1,10 @@
 Metadata-Version: 1.0
 Name: swh.vault
-Version: 0.0.8
+Version: 0.0.9
 Summary: Software Heritage vault
 Home-page: https://forge.softwareheritage.org/diffusion/DVAU/
 Author: Software Heritage developers
 Author-email: swh-devel@inria.fr
 License: UNKNOWN
 Description: UNKNOWN
 Platform: UNKNOWN
diff --git a/swh.vault.egg-info/PKG-INFO b/swh.vault.egg-info/PKG-INFO
index 4fe384d..a697cb4 100644
--- a/swh.vault.egg-info/PKG-INFO
+++ b/swh.vault.egg-info/PKG-INFO
@@ -1,10 +1,10 @@
 Metadata-Version: 1.0
 Name: swh.vault
-Version: 0.0.8
+Version: 0.0.9
 Summary: Software Heritage vault
 Home-page: https://forge.softwareheritage.org/diffusion/DVAU/
 Author: Software Heritage developers
 Author-email: swh-devel@inria.fr
 License: UNKNOWN
 Description: UNKNOWN
 Platform: UNKNOWN
diff --git a/swh/vault/cookers/revision_gitfast.py b/swh/vault/cookers/revision_gitfast.py
index a5f74ac..916b000 100644
--- a/swh/vault/cookers/revision_gitfast.py
+++ b/swh/vault/cookers/revision_gitfast.py
@@ -1,207 +1,208 @@
 # Copyright (C) 2017 The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information

 import functools
 import os
 import time
 import zlib

 from fastimport.commands import (CommitCommand, ResetCommand, BlobCommand,
                                  FileDeleteCommand, FileModifyCommand)

 from swh.model import hashutil
 from swh.model.toposort import toposort
 from swh.model.from_disk import mode_to_perms
 from swh.vault.cookers.base import BaseVaultCooker
-from swh.vault.to_disk import get_filtered_file_content
+from swh.vault.to_disk import get_filtered_files_content


 class RevisionGitfastCooker(BaseVaultCooker):
     """Cooker to create a git fast-import bundle """
     CACHE_TYPE_KEY = 'revision_gitfast'

     def check_exists(self):
         return not list(self.storage.revision_missing([self.obj_id]))

     def prepare_bundle(self):
         self.log = list(toposort(self.storage.revision_log([self.obj_id])))
         self.gzobj = zlib.compressobj(9, zlib.DEFLATED, zlib.MAX_WBITS | 16)
         self.fastexport()
         self.write(self.gzobj.flush())

     def write_cmd(self, cmd):
         chunk = bytes(cmd) + b'\n'
         super().write(self.gzobj.compress(chunk))

     def fastexport(self):
         """Generate all the git fast-import commands from a given log.
         """
         self.rev_by_id = {r['id']: r for r in self.log}
         self.obj_done = set()
         self.obj_to_mark = {}
         self.next_available_mark = 1
         last_progress_report = None

         for i, rev in enumerate(self.log, 1):
             # Update progress if needed
             ct = time.time()
             if (last_progress_report is None
                     or last_progress_report + 2 <= ct):
                 last_progress_report = ct
                 pg = ('Computing revision {}/{}'.format(i, len(self.log)))
                 self.backend.set_progress(self.obj_type, self.obj_id, pg)

             # Compute the current commit
             self._compute_commit_command(rev)

     def mark(self, obj_id):
         """Get the mark ID as bytes of a git object.

         If the object has not yet been marked, assign a new ID and add it to
         the mark dictionary.
         """
         if obj_id not in self.obj_to_mark:
             self.obj_to_mark[obj_id] = self.next_available_mark
             self.next_available_mark += 1
         return str(self.obj_to_mark[obj_id]).encode()

     def _compute_blob_command_content(self, file_data):
         """Compute the blob command of a file entry if it has not been
         computed yet.
""" obj_id = file_data['sha1'] if obj_id in self.obj_done: return - content = get_filtered_file_content(self.storage, file_data) + contents = list(get_filtered_files_content(self.storage, [file_data])) + content = contents[0]['content'] self.write_cmd(BlobCommand(mark=self.mark(obj_id), data=content)) self.obj_done.add(obj_id) def _author_tuple_format(self, author, date): # We never want to have None values here so we replace null entries # by ''. if author is not None: author_tuple = (author.get('name') or b'', author.get('email') or b'') else: author_tuple = (b'', b'') if date is not None: date_tuple = (date.get('timestamp', {}).get('seconds') or 0, (date.get('offset') or 0) * 60) else: date_tuple = (0, 0) return author_tuple + date_tuple def _compute_commit_command(self, rev): """Compute a commit command from a specific revision. """ if 'parents' in rev and rev['parents']: from_ = b':' + self.mark(rev['parents'][0]) merges = [b':' + self.mark(r) for r in rev['parents'][1:]] parent = self.rev_by_id[rev['parents'][0]] else: # We issue a reset command before all the new roots so that they # are not automatically added as children of the current branch. self.write_cmd(ResetCommand(b'refs/heads/master', None)) from_ = None merges = None parent = None # Retrieve the file commands while yielding new blob commands if # needed. files = list(self._compute_file_commands(rev, parent)) # Construct and write the commit command author = self._author_tuple_format(rev['author'], rev['date']) committer = self._author_tuple_format(rev['committer'], rev['committer_date']) self.write_cmd(CommitCommand( ref=b'refs/heads/master', mark=self.mark(rev['id']), author=author, committer=committer, message=rev['message'] or b'', from_=from_, merges=merges, file_iter=files)) @functools.lru_cache(maxsize=4096) def _get_dir_ents(self, dir_id=None): """Get the entities of a directory as a dictionary (name -> entity). This function has a cache to avoid doing multiple requests to retrieve the same entities, as doing a directory_ls() is expensive. """ data = (self.storage.directory_ls(dir_id) if dir_id is not None else []) return {f['name']: f for f in data} def _compute_file_commands(self, rev, parent=None): """Compute all the file commands of a revision. Generate a diff of the files between the revision and its main parent to find the necessary file commands to apply. """ # Initialize the stack with the root of the tree. cur_dir = rev['directory'] parent_dir = parent['directory'] if parent else None stack = [(b'', cur_dir, parent_dir)] while stack: # Retrieve the current directory and the directory of the parent # commit in order to compute the diff of the trees. root, cur_dir_id, prev_dir_id = stack.pop() cur_dir = self._get_dir_ents(cur_dir_id) prev_dir = self._get_dir_ents(prev_dir_id) # Find subtrees to delete: # - Subtrees that are not in the new tree (file or directory # deleted). # - Subtrees that do not have the same type in the new tree # (file -> directory or directory -> file) # After this step, every node remaining in the previous directory # has the same type than the one in the current directory. for fname, f in prev_dir.items(): if ((fname not in cur_dir or f['type'] != cur_dir[fname]['type'])): yield FileDeleteCommand(path=os.path.join(root, fname)) # Find subtrees to modify: # - Leaves (files) will be added or modified using `filemodify` # - Other subtrees (directories) will be added to the stack and # processed in the next iteration. 
             for fname, f in cur_dir.items():
                 # A file is added or modified if it was not in the tree, if
                 # its permissions changed or if its content changed.
                 if (f['type'] == 'file'
                         and (fname not in prev_dir
                              or f['sha1'] != prev_dir[fname]['sha1']
                              or f['perms'] != prev_dir[fname]['perms'])):
                     # Issue a blob command for the new blobs if needed.
                     self._compute_blob_command_content(f)
                     yield FileModifyCommand(
                         path=os.path.join(root, fname),
                         mode=mode_to_perms(f['perms']).value,
                         dataref=(b':' + self.mark(f['sha1'])),
                         data=None)
                 # A revision is added or modified if it was not in the tree
                 # or if its target changed.
                 elif (f['type'] == 'rev'
                         and (fname not in prev_dir
                              or f['target'] != prev_dir[fname]['target'])):
                     yield FileModifyCommand(
                         path=os.path.join(root, fname),
                         mode=0o160000,
                         dataref=hashutil.hash_to_hex(f['target']).encode(),
                         data=None)
                 # A directory is added or modified if it was not in the tree
                 # or if its target changed.
                 elif f['type'] == 'dir':
                     f_prev_target = None
                     if fname in prev_dir and prev_dir[fname]['type'] == 'dir':
                         f_prev_target = prev_dir[fname]['target']
                     if f_prev_target is None or f['target'] != f_prev_target:
                         stack.append((os.path.join(root, fname),
                                       f['target'], f_prev_target))
diff --git a/swh/vault/to_disk.py b/swh/vault/to_disk.py
index 6c6fc68..dae1ffb 100644
--- a/swh/vault/to_disk.py
+++ b/swh/vault/to_disk.py
@@ -1,113 +1,127 @@
 # Copyright (C) 2016-2018 The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information

-import itertools
+import functools
+import collections
 import os

 from swh.model import hashutil
 from swh.model.from_disk import mode_to_perms, DentryPerms

 SKIPPED_MESSAGE = (b'This content has not been retrieved in the '
                    b'Software Heritage archive due to its size.')

 HIDDEN_MESSAGE = (b'This content is hidden.')


-def get_filtered_file_content(storage, file_data):
-    """Retrieve the file specified by file_data and apply filters for skipped
+def get_filtered_files_content(storage, files_data):
+    """Retrieve the files specified by files_data and apply filters for skipped
     and missing contents.

     Args:
-        storage: the storage from which to retrieve the object
-        file_data: file entry descriptor as returned by directory_ls()
-
-    Returns:
-        Bytes containing the specified content. The content will be replaced by
-        a specific message to indicate that the content could not be retrieved
-        (either due to privacy policy or because its size was too big for us to
-        archive it).
+        storage: the storage from which to retrieve the objects
+        files_data: list of file entries as returned by directory_ls()
+
+    Yields:
+        The entries given in files_data with a new 'content' key that points
+        to the file content in bytes.
+
+        The contents can be replaced by a specific message to indicate that
+        they could not be retrieved (either due to privacy policy or because
+        their sizes were too big for us to archive them).
""" - assert file_data['type'] == 'file' + contents_to_fetch = [f['sha1'] for f in files_data + if f['status'] == 'visible'] + contents_fetched = storage.content_get(contents_to_fetch) + contents = {c['sha1']: c['data'] for c in contents_fetched} + + for file_data in files_data: + if file_data['status'] == 'visible': + content = contents[file_data['sha1']] + elif file_data['status'] == 'absent': + content = SKIPPED_MESSAGE + elif file_data['status'] == 'hidden': + content = HIDDEN_MESSAGE + + yield {'content': content, **file_data} + - if file_data['status'] == 'absent': - return SKIPPED_MESSAGE - elif file_data['status'] == 'hidden': - return HIDDEN_MESSAGE - else: - return list(storage.content_get([file_data['sha1']]))[0]['data'] +def apply_chunked(func, input_list, chunk_size): + """Apply func on input_list divided in chunks of size chunk_size""" + for i in range(0, len(input_list), chunk_size): + yield from func(input_list[i:i + chunk_size]) class DirectoryBuilder: """Reconstructs the on-disk representation of a directory in the storage. """ def __init__(self, storage, root, dir_id): """Initialize the directory builder. Args: storage: the storage object root: the path where the directory should be reconstructed dir_id: the identifier of the directory in the storage """ self.storage = storage self.root = root self.dir_id = dir_id def build(self): """Perform the reconstruction of the directory in the given root.""" # Retrieve data from the database. data = self.storage.directory_ls(self.dir_id, recursive=True) - # Split into files and directory data. - data1, data2 = itertools.tee(data, 2) - dir_data = (entry['name'] for entry in data1 if entry['type'] == 'dir') - file_data = (entry for entry in data2 if entry['type'] != 'dir') + # Split into files, revisions and directory data. + entries = collections.defaultdict(list) + for entry in data: + entries[entry['type']].append(entry) # Recreate the directory's subtree and then the files into it. - self._create_tree(dir_data) - self._create_files(file_data) + self._create_tree(entries['dir']) + self._create_files(entries['file']) + self._create_revisions(entries['rev']) - def _create_tree(self, directory_paths): + def _create_tree(self, directories): """Create a directory tree from the given paths - The tree is created from `root` and each given path in - `directory_paths` will be created. - + The tree is created from `root` and each given directory in + `directories` will be created. 
""" # Directories are sorted by depth so they are created in the # right order - bsep = bytes(os.path.sep, 'utf8') - dir_names = sorted( - directory_paths, - key=lambda x: len(x.split(bsep))) - for dir_name in dir_names: - os.makedirs(os.path.join(self.root, dir_name)) - - def _create_files(self, file_datas): - """Create the files according to their status.""" - for file_data in file_datas: + bsep = os.path.sep.encode() + directories = sorted(directories, + key=lambda x: len(x['name'].split(bsep))) + for dir in directories: + os.makedirs(os.path.join(self.root, dir['name'])) + + def _create_files(self, files_data): + """Create the files in the tree and fetch their contents.""" + f = functools.partial(get_filtered_files_content, self.storage) + files_data = apply_chunked(f, files_data, 1000) + + for file_data in files_data: + path = os.path.join(self.root, file_data['name']) + self._create_file(path, file_data['content'], file_data['perms']) + + def _create_revisions(self, revs_data): + """Create the revisions in the tree as broken symlinks to the target + identifier.""" + for file_data in revs_data: path = os.path.join(self.root, file_data['name']) - if file_data['type'] == 'file': - content = get_filtered_file_content(self.storage, file_data) - self._create_file(path, content, file_data['perms']) - elif file_data['type'] == 'rev': - self._create_file(path, - hashutil.hash_to_hex(file_data['target']), - 0o120000) + self._create_file(path, hashutil.hash_to_hex(file_data['target']), + mode=0o120000) def _create_file(self, path, content, mode=0o100644): """Create the given file and fill it with content.""" perms = mode_to_perms(mode) if perms == DentryPerms.symlink: os.symlink(content, path) else: with open(path, 'wb') as f: f.write(content) os.chmod(path, perms.value) - - def _get_file_content(self, obj_id): - """Get the content of the given file.""" - content = list(self.storage.content_get([obj_id]))[0]['data'] - return content diff --git a/version.txt b/version.txt index 5f5ea89..d63e418 100644 --- a/version.txt +++ b/version.txt @@ -1 +1 @@ -v0.0.8-0-g971485c \ No newline at end of file +v0.0.9-0-gbca6619 \ No newline at end of file