diff --git a/swh/indexer/__init__.py b/swh/indexer/__init__.py
index 7a7e0d3..b558a81 100644
--- a/swh/indexer/__init__.py
+++ b/swh/indexer/__init__.py
@@ -1,56 +1,55 @@
 # Copyright (C) 2016-2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 
 INDEXER_CLASSES = {
     'mimetype': 'swh.indexer.mimetype.ContentMimetypeIndexer',
     'language': 'swh.indexer.language.ContentLanguageIndexer',
     'ctags': 'swh.indexer.ctags.CtagsIndexer',
     'fossology_license':
     'swh.indexer.fossology_license.ContentFossologyLicenseIndexer',
 }
 
 
 TASK_NAMES = {
     'orchestrator_all': 'swh.indexer.tasks.SWHOrchestratorAllContentsTask',
     'orchestrator_text': 'swh.indexer.tasks.SWHOrchestratorTextContentsTask',
     'mimetype': 'swh.indexer.tasks.SWHContentMimetypeTask',
     'language': 'swh.indexer.tasks.SWHContentLanguageTask',
     'ctags': 'swh.indexer.tasks.SWHCtagsTask',
     'fossology_license': 'swh.indexer.tasks.SWHContentFossologyLicenseTask',
     'rehash': 'swh.indexer.tasks.SWHRecomputeChecksumsTask',
 }
 
 
 __all__ = [
     'INDEXER_CLASSES', 'TASK_NAMES',
 ]
 
 
-def get_storage(cls, args):
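+def get_indexer_storage(cls, args):
-    """Get an indexer storage object of class `storage_class` with
-    arguments `storage_args`.
+    """Get an indexer storage object of class `cls`, instantiated with
+    the keyword arguments `args`.
 
     Args:
-        storage (dict): dictionary with keys:
-        - cls (str): storage's class, either 'local' or 'remote'
-        - args (dict): dictionary with keys
+        cls (str): indexer storage's class, either 'local' or 'remote'
+        args (dict): keyword arguments passed to that class's
+          constructor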
 
     Returns:
         an instance of swh.indexer's storage (either local or remote)
 
     Raises:
         ValueError if passed an unknown storage class.
 
     """
-
     if cls == 'remote':
         from .storage.api.client import RemoteStorage as IndexerStorage
     elif cls == 'local':
         from .storage import IndexerStorage
     else:
-        raise ValueError('Unknown storage class `%s`' % cls)
+        raise ValueError('Unknown indexer storage class `%s`' % cls)
 
     return IndexerStorage(**args)
diff --git a/swh/indexer/ctags.py b/swh/indexer/ctags.py
index ec395f2..dde3740 100644
--- a/swh/indexer/ctags.py
+++ b/swh/indexer/ctags.py
@@ -1,161 +1,161 @@
 # Copyright (C) 2015-2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import click
 import subprocess
 import json
 
 from swh.model import hashutil
 
 from .language import compute_language
 from .indexer import ContentIndexer, DiskIndexer
 
 
 # Options used to compute tags
 __FLAGS = [
     '--fields=+lnz',  # +l: language
                       # +n: line number of tag definition
                       # +z: include the symbol's kind (function, variable, ...)
-    '--sort=no',      # sort output on tag name
+    '--sort=no',      # do not sort the output by tag name
     '--links=no',     # do not follow symlinks
     '--output-format=json',  # outputs in json
 ]
 
 
 def run_ctags(path, lang=None, ctags_command='ctags'):
     """Run ctags on file path with optional language.
 
     Args:
         path: path to the file
         lang: language for that path (optional)
 
-    Returns:
-        ctags' output
+    Yields:
+        dict with keys 'name', 'kind', 'line', 'lang' for each symbol
 
     """
     optional = []
     if lang:
         optional = ['--language-force=%s' % lang]
 
     cmd = [ctags_command] + __FLAGS + optional + [path]
     output = subprocess.check_output(cmd, universal_newlines=True)
 
     for symbol in output.split('\n'):
         if not symbol:
             continue
         js_symbol = json.loads(symbol)
         yield {
             'name': js_symbol['name'],
             'kind': js_symbol['kind'],
             'line': js_symbol['line'],
             'lang': js_symbol['language'],
         }
 
 
 class CtagsIndexer(ContentIndexer, DiskIndexer):
     CONFIG_BASE_FILENAME = 'indexer/ctags'
 
     ADDITIONAL_CONFIG = {
         'workdir': ('str', '/tmp/swh/indexer.ctags'),
         'tools': ('dict', {
             'name': 'universal-ctags',
             'version': '~git7859817b',
             'configuration': {
                 'command_line': '''ctags --fields=+lnz --sort=no --links=no '''
                                 '''--output-format=json <filepath>'''
             },
         }),
         'languages': ('dict', {
             'ada': 'Ada',
             'adl': None,
             'agda': None,
             # ...
         })
     }
 
     def prepare(self):
         super().prepare()
         self.working_directory = self.config['workdir']
         self.language_map = self.config['languages']
         self.tool = self.tools[0]
 
     def filter(self, ids):
         """Filter out known sha1s and return only missing ones.
 
         """
-        yield from self.storage.content_ctags_missing((
+        yield from self.idx_storage.content_ctags_missing((
             {
                 'id': sha1,
                 'indexer_configuration_id': self.tool['id'],
             } for sha1 in ids
         ))
 
     def index(self, id, data):
         """Index sha1s' content and store result.
 
         Args:
             id (bytes): content's identifier
             data (bytes): raw content in bytes
 
         Returns:
-            A dict, representing a content_mimetype, with keys:
+            A dict, representing a content_ctags, with keys:
               - id (bytes): content's identifier (sha1)
               - ctags ([dict]): ctags list of symbols
 
         """
         lang = compute_language(data, log=self.log)['lang']
 
         if not lang:
             return None
 
         ctags_lang = self.language_map.get(lang)
 
         if not ctags_lang:
             return None
 
         ctags = {
             'id': id,
         }
 
         filename = hashutil.hash_to_hex(id)
         content_path = self.write_to_temp(
             filename=filename,
             data=data)
 
-        result = run_ctags(content_path, lang=ctags_lang)
-        ctags.update({
-            'ctags': list(result),
-            'indexer_configuration_id': self.tool['id'],
-        })
-
-        self.cleanup(content_path)
+        try:
+            ctags.update({
+                'ctags': list(run_ctags(content_path, lang=ctags_lang)),
+                'indexer_configuration_id': self.tool['id'],
+            })
+        finally:
+            self.cleanup(content_path)
 
         return ctags
 
     def persist_index_computations(self, results, policy_update):
         """Persist the results in storage.
 
         Args:
             results ([dict]): list of content_mimetype, dict with the
             following keys:
               - id (bytes): content's identifier (sha1)
               - ctags ([dict]): ctags list of symbols
             policy_update ([str]): either 'update-dups' or 'ignore-dups' to
             respectively update duplicates or ignore them
 
         """
-        self.storage.content_ctags_add(
+        self.idx_storage.content_ctags_add(
             results, conflict_update=(policy_update == 'update-dups'))
 
 
 @click.command()
 @click.option('--path', help="Path to execute index on")
 def main(path):
     r = list(run_ctags(path))
     print(r)
 
 
 if __name__ == '__main__':
     main()
diff --git a/swh/indexer/fossology_license.py b/swh/indexer/fossology_license.py
index d1f9db6..3d46407 100644
--- a/swh/indexer/fossology_license.py
+++ b/swh/indexer/fossology_license.py
@@ -1,141 +1,141 @@
 # Copyright (C) 2016-2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import click
 import subprocess
 
 from swh.model import hashutil
 
 from .indexer import ContentIndexer, DiskIndexer
 
 
 def compute_license(path, log=None):
     """Determine license from file at path.
 
     Args:
         path: filepath to determine the license
 
     Returns:
         A dict with the following keys:
         - licenses ([str]): associated detected licenses to path
+          (empty when detection fails or nothing is detected)
         - path (bytes): content filepath
-        - tool (str): tool used to compute the output
 
     """
+    # Default to "no license found" so that every code path returns a dict.
+    licenses = []
     try:
         properties = subprocess.check_output(['nomossa', path],
                                              universal_newlines=True)
-        if properties:
-            res = properties.rstrip().split(' contains license(s) ')
-            licenses = res[1].split(',')
-
-            return {
-                'licenses': licenses,
-                'path': path,
-            }
+        # The parsing below expects '<file> contains license(s) <l1>,<l2>';
+        # empty output or output without that separator yields no licenses.
+        res = properties.rstrip().split(' contains license(s) ')
+        if len(res) > 1:
+            licenses = res[1].split(',')
     except subprocess.CalledProcessError:
         if log:
             from os import path as __path
             log.exception('Problem during license detection for sha1 %s' %
                           __path.basename(path))
-        return {
-            'licenses': [],
-            'path': path,
-        }
+
+    return {
+        'licenses': licenses,
+        'path': path,
+    }
 
 
 class ContentFossologyLicenseIndexer(ContentIndexer, DiskIndexer):
     """Indexer in charge of:
     - filtering out content already indexed
     - reading content from objstorage per the content's id (sha1)
     - computing {license, encoding} from that content
     - store result in storage
 
     """
     ADDITIONAL_CONFIG = {
         'workdir': ('str', '/tmp/swh/indexer.fossology.license'),
         'tools': ('dict', {
             'name': 'nomos',
             'version': '3.1.0rc2-31-ga2cbb8c',
             'configuration': {
                 'command_line': 'nomossa <filepath>',
             },
         }),
     }
 
     CONFIG_BASE_FILENAME = 'indexer/fossology_license'
 
     def prepare(self):
         super().prepare()
         self.working_directory = self.config['workdir']
         self.tool = self.tools[0]
 
     def filter(self, ids):
         """Filter out known sha1s and return only missing ones.
 
         """
-        yield from self.storage.content_fossology_license_missing((
+        yield from self.idx_storage.content_fossology_license_missing((
             {
                 'id': sha1,
                 'indexer_configuration_id': self.tool['id'],
             } for sha1 in ids
         ))
 
     def index(self, id, data):
         """Index sha1s' content and store result.
 
         Args:
-            sha1 (bytes): content's identifier
-            raw_content (bytes): raw content in bytes
+            id (bytes): content's identifier
+            data (bytes): raw content in bytes
 
         Returns:
             A dict, representing a content_license, with keys:
               - id (bytes): content's identifier (sha1)
               - license (bytes): license in bytes
               - path (bytes): path
 
         """
         filename = hashutil.hash_to_hex(id)
         content_path = self.write_to_temp(
             filename=filename,
             data=data)
 
         try:
             properties = compute_license(path=content_path, log=self.log)
             properties.update({
                 'id': id,
                 'indexer_configuration_id': self.tool['id'],
             })
         finally:
             self.cleanup(content_path)
 
         return properties
 
     def persist_index_computations(self, results, policy_update):
         """Persist the results in storage.
 
         Args:
             results ([dict]): list of content_license, dict with the
             following keys:
               - id (bytes): content's identifier (sha1)
               - license (bytes): license in bytes
               - path (bytes): path
             policy_update ([str]): either 'update-dups' or 'ignore-dups' to
             respectively update duplicates or ignore them
 
         """
-        self.storage.content_fossology_license_add(
+        self.idx_storage.content_fossology_license_add(
             results, conflict_update=(policy_update == 'update-dups'))
 
 
 @click.command(help='Compute license for path using tool')
 @click.option('--tool', default='nomossa', help="Path to tool")
 @click.option('--path', required=1, help="Path to execute index on")
 def main(tool, path):
-    print(compute_license(tool, path))
+    print(compute_license(path))  # --tool is accepted but currently unused
 
 
 if __name__ == '__main__':
     main()
diff --git a/swh/indexer/indexer.py b/swh/indexer/indexer.py
index 2cd850d..07cd85c 100644
--- a/swh/indexer/indexer.py
+++ b/swh/indexer/indexer.py
@@ -1,419 +1,418 @@
 # Copyright (C) 2016-2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import abc
 import os
 import logging
 import shutil
 import tempfile
 
 from swh.core.config import SWHConfig
 from swh.objstorage import get_objstorage
 from swh.objstorage.exc import ObjNotFoundError
 from swh.model import hashutil
-from swh.storage import get_storage
 from swh.scheduler.utils import get_task
+from swh.indexer import get_indexer_storage
 
 
 class DiskIndexer:
     """Mixin intended to be used with other SomethingIndexer classes.
 
        Indexers inheriting from this class are a category of indexers
        which needs the disk for their computations.
 
        Note:
            This expects `self.working_directory` variable defined at
            runtime.
 
     """
     def write_to_temp(self, filename, data):
         """Write the sha1's content in a temporary file.
 
         Args:
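-            sha1 (str): the sha1 name
-            filename (str): one of sha1's many filenames
-            data (bytes): the sha1's content to write in temporary
-            file
+            filename (str): name of the file to create, inside a new
+              temporary directory under `self.working_directory`
+            data (bytes): the content to write in the temporary
+              file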
 
         Returns:
             The path to the temporary file created. That file is
             filled in with the raw content's data.
 
         """
         os.makedirs(self.working_directory, exist_ok=True)
         temp_dir = tempfile.mkdtemp(dir=self.working_directory)
         content_path = os.path.join(temp_dir, filename)
 
         with open(content_path, 'wb') as f:
             f.write(data)
 
         return content_path
 
     def cleanup(self, content_path):
         """Remove content_path from working directory.
 
         Args:
             content_path (str): the file to remove
 
         """
         temp_dir = os.path.dirname(content_path)
         shutil.rmtree(temp_dir)
 
 
 class BaseIndexer(SWHConfig,
                   metaclass=abc.ABCMeta):
     """Base class for indexers to inherit from.
 
     The main entry point is the :func:`run` function which is in
     charge of triggering the computations on the batch dict/ids
     received.
 
     Indexers can:
 
     - filter out ids whose data has already been indexed.
     - retrieve ids data from storage or objstorage
     - index this data depending on the object and store the result in
       storage.
 
     To implement a new object type indexer, inherit from the
     BaseIndexer and implement the process of indexation:
 
     :func:`run`:
       object_ids are different depending on object. For example: sha1 for
       content, sha1_git for revision, directory, release, and id for origin
 
     To implement a new concrete indexer, inherit from the object level
     classes: :class:`ContentIndexer`, :class:`RevisionIndexer` (later
     on :class:`OriginIndexer` will also be available)
 
     Then you need to implement the following functions:
 
     :func:`filter`:
       filter out data already indexed (in storage). This function is used by
       the orchestrator and not directly by the indexer
       (cf. swh.indexer.orchestrator.BaseOrchestratorIndexer).
 
-    :func:`index_object`:
+    :func:`index`:
       compute index on id with data (retrieved from the storage or the
       objstorage by the id key) and return the resulting index computation.
 
     :func:`persist_index_computations`:
       persist the results of multiple index computations in the storage.
 
     The new indexer implementation can also override the following functions:
 
     :func:`prepare`:
       Configuration preparation for the indexer.  When overriding, this must
       call the `super().prepare()` instruction.
 
     :func:`check`:
       Configuration check for the indexer.  When overriding, this must call the
       `super().check()` instruction.
 
     :func:`register_tools`:
       This should return a dict of the tool(s) to use when indexing or
       filtering.
 
     """
     CONFIG = 'indexer/base'
 
     DEFAULT_CONFIG = {
-        'storage': ('dict', {
-            'host': 'uffizi',
+        'indexer_storage': ('dict', {
             'cls': 'remote',
-            'args': {'root': '/tmp/softwareheritage/objects',
-                     'slicing': '0:2/2:4/4:6'}
+            'args': {
+                'db': 'service=swh-indexer-dev'
+            }
         }),
+
         # queue to reschedule if problem (none for no rescheduling,
         # the default)
         'rescheduling_task': ('str', None),
         'objstorage': ('dict', {
             'cls': 'multiplexer',
             'args': {
                 'objstorages': [{
                     'cls': 'filtered',
                     'args': {
                         'storage_conf': {
                             'cls': 'azure-storage',
                             'args': {
                                 'account_name': '0euwestswh',
                                 'api_secret_key': 'secret',
                                 'container_name': 'contents'
                             }
                         },
                         'filters_conf': [
                             {'type': 'readonly'},
                             {'type': 'prefix', 'prefix': '0'}
                         ]
                     }
                 }, {
                     'cls': 'filtered',
                     'args': {
                         'storage_conf': {
                             'cls': 'azure-storage',
                             'args': {
                                 'account_name': '1euwestswh',
                                 'api_secret_key': 'secret',
                                 'container_name': 'contents'
                             }
                         },
                         'filters_conf': [
                             {'type': 'readonly'},
                             {'type': 'prefix', 'prefix': '1'}
                         ]
                     }
                 }]
             },
         }),
     }
 
     ADDITIONAL_CONFIG = {}
 
     def __init__(self):
         """Prepare and check that the indexer is ready to run.
 
         """
         super().__init__()
         self.prepare()
         self.check()
 
     def prepare(self):
         """Prepare the indexer's needed runtime configuration.
            Without this step, the indexer cannot possibly run.
 
         """
         self.config = self.parse_config_file(
             additional_configs=[self.ADDITIONAL_CONFIG])
         objstorage = self.config['objstorage']
         self.objstorage = get_objstorage(objstorage['cls'], objstorage['args'])
-        storage = self.config['storage']
-        self.storage = get_storage(storage['cls'], storage['args'])
+        idx_storage = self.config['indexer_storage']
+        self.idx_storage = get_indexer_storage(**idx_storage)
         rescheduling_task = self.config['rescheduling_task']
         if rescheduling_task:
             self.rescheduling_task = get_task(rescheduling_task)
         else:
             self.rescheduling_task = None
 
         l = logging.getLogger('requests.packages.urllib3.connectionpool')
         l.setLevel(logging.WARN)
         self.log = logging.getLogger('swh.indexer')
         self.tools = list(self.register_tools(self.config['tools']))
 
     def check(self):
         """Check the indexer's configuration is ok before proceeding.
            If ok, does nothing. If not raise error.
 
         """
         if not self.tools:
             raise ValueError('Tools %s is unknown, cannot continue' %
                              self.tools)
 
     def _prepare_tool(self, tool):
         """Prepare the tool dict to be compliant with the storage api.
 
         """
         return {'tool_%s' % key: value for key, value in tool.items()}
 
     def register_tools(self, tools):
-        """Permit to register tools to the storage.
+        """Permit to register tools to the indexer storage.
 
            Add a sensible default which can be overridden if not
            sufficient.  (For now, all indexers use only one tool)
 
-           Expects the self.config['tools'] property to be set with
-           one or more tools.
+           The visible callers pass self.config['tools'], holding one
+           or more tools.
 
         Args:
             tools (dict/[dict]): Either a dict or a list of dict.
 
         Returns:
             List of dict with additional id key.
 
         Raises:
             ValueError if not a list nor a dict.
 
         """
-        tools = self.config['tools']
+        # Normalize `tools` into an iterable of storage-compliant dicts.
         if isinstance(tools, list):
             tools = map(self._prepare_tool, tools)
         elif isinstance(tools, dict):
             tools = [self._prepare_tool(tools)]
         else:
             raise ValueError('Configuration tool(s) must be a dict or list!')
 
-        registered_tools = self.storage.indexer_configuration_add(tools)
-        return registered_tools
+        return self.idx_storage.indexer_configuration_add(tools)
 
     @abc.abstractmethod
     def filter(self, ids):
         """Filter missing ids for that particular indexer.
 
         Args:
             ids ([bytes]): list of ids
 
         Yields:
             iterator of missing ids
 
         """
         pass
 
     @abc.abstractmethod
     def index(self, id, data):
         """Index computation for the id and associated raw data.
 
         Args:
             id (bytes): identifier
             data (bytes): id's data from storage or objstorage depending on
                              object type
 
         Returns:
             a dict that makes sense for the persist_index_computations
         function.
 
         """
         pass
 
     @abc.abstractmethod
     def persist_index_computations(self, results, policy_update):
         """Persist the computation resulting from the index.
 
         Args:
 
             results ([result]): List of results. One result is the
                                 result of the index function.
             policy_update ([str]): either 'update-dups' or 'ignore-dups' to
                                    respectively update duplicates or ignore
                                    them
 
         Returns:
             None
 
         """
         pass
 
     def next_step(self, results):
         """Do something else with computations results (e.g. send to another
         queue, ...).
 
         (This is not an abstractmethod since it is optional).
 
         Args:
             results ([result]): List of results (dict) as returned
                                 by index function.
 
         Returns:
             None
 
         """
         pass
 
     @abc.abstractmethod
     def run(self, ids, policy_update):
         """Given a list of ids:
 
         - retrieves the data from the storage
         - executes the indexing computations
         - stores the results (according to policy_update)
 
         Args:
             ids ([bytes]): id's identifier list
             policy_update ([str]): either 'update-dups' or 'ignore-dups' to
             respectively update duplicates or ignore them
 
         """
         pass
 
 
 class ContentIndexer(BaseIndexer):
     """An object type indexer, inherits from the :class:`BaseIndexer` and
     implements the process of indexation for Contents using the run
     method
 
     Note: the :class:`ContentIndexer` is not an instantiable
     object. To use it in another context, one should inherit from this
     class and override the methods mentioned in the
     :class:`BaseIndexer` class.
 
     """
 
     def run(self, ids, policy_update):
         """Given a list of ids:
 
         - retrieve the content from the storage
         - execute the indexing computations
         - store the results (according to policy_update)
 
         Args:
             ids ([bytes]): sha1's identifier list
             policy_update ([str]): either 'update-dups' or 'ignore-dups' to
                                    respectively update duplicates or ignore
                                    them
 
         """
         results = []
         try:
             for sha1 in ids:
                 try:
                     raw_content = self.objstorage.get(sha1)
                 except ObjNotFoundError:
                     self.log.warn('Content %s not found in objstorage' %
                                   hashutil.hash_to_hex(sha1))
                     continue
                 res = self.index(sha1, raw_content)
                 if res:  # If no results, skip it
                     results.append(res)
 
             self.persist_index_computations(results, policy_update)
             self.next_step(results)
         except Exception:
             self.log.exception(
                 'Problem when reading contents metadata.')
             if self.rescheduling_task:
                 self.log.warn('Rescheduling batch')
                 self.rescheduling_task.delay(ids, policy_update)
 
 
 class RevisionIndexer(BaseIndexer):
     """An object type indexer, inherits from the :class:`BaseIndexer` and
     implements the process of indexation for Revisions using the run
     method
 
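-    Note: the :class:`RevisionIndexer` is not an instantiable object.
-    To use it in another context one should inherit from this class
-    and override the methods mentioned in the :class:`BaseIndexer`
-    class.
+    Note: the :class:`RevisionIndexer` is not an instantiable object:
+    inherit from it and override the methods mentioned in the
+    :class:`BaseIndexer` class. :func:`run` reads `self.storage`, which
+    :func:`BaseIndexer.prepare` does not set; subclasses must set it.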
 
     """
-
     def run(self, ids, policy_update):
         """Given a list of sha1_gits:
 
         - retrieve revisions from storage
         - execute the indexing computations
         - store the results (according to policy_update)
 
         Args:
             ids ([bytes]): sha1_git's identifier list
             policy_update ([str]): either 'update-dups' or 'ignore-dups' to
                                    respectively update duplicates or ignore
                                    them
 
         """
         results = []
         revs = self.storage.revision_get(ids)
 
         for rev in revs:
             if not rev:
                 self.log.warn('Revisions %s not found in storage' %
                               list(map(hashutil.hash_to_hex, ids)))
                 continue
             try:
                 res = self.index(rev)
                 if res:  # If no results, skip it
                     results.append(res)
             except Exception:
                 self.log.exception(
                         'Problem when processing revision')
         self.persist_index_computations(results, policy_update)
diff --git a/swh/indexer/language.py b/swh/indexer/language.py
index 78d6b62..6433977 100644
--- a/swh/indexer/language.py
+++ b/swh/indexer/language.py
@@ -1,208 +1,208 @@
 # Copyright (C) 2016-2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 
 import io
 
 from pygments.lexers import guess_lexer
 from pygments.util import ClassNotFound
 from chardet.universaldetector import UniversalDetector
 
 from .indexer import ContentIndexer
 
 
 def _cleanup_classname(classname):
     """Determine the language from the pygments' lexer names.
 
     """
     return classname.lower().replace(' ', '-')
 
 
 def _read_raw(raw_content, size=2048):
     """Read raw content in chunk.
 
     """
     bs = io.BytesIO(raw_content)
     while True:
         chunk = bs.read(size)
         if not chunk:
             break
         yield chunk
 
 
 def _detect_encoding(raw_content):
     """Given a raw content, try and detect its encoding.
 
     """
     detector = UniversalDetector()
     for chunk in _read_raw(raw_content):
         detector.feed(chunk)
         if detector.done:
             break
     detector.close()
     return detector.result['encoding']
 
 
 def compute_language_from_chunk(encoding, length, raw_content, max_size,
                                 log=None):
     """Determine the raw content's language.
 
     Args:
         encoding (str): Encoding to use to decode the content
         length (int): raw_content's length
         raw_content (bytes): raw content to work with
         max_size (int): max size to split the raw content at
 
     Returns:
         Dict with keys:
         - lang: None if nothing found or the possible language
 
     """
     try:
         if max_size <= length:
             raw_content = raw_content[0:max_size]
 
         content = raw_content.decode(encoding)
         lang = _cleanup_classname(
             guess_lexer(content).name)
     except ClassNotFound:
         lang = None
     except UnicodeDecodeError:
         raise
     except Exception:
         if log:
             log.exception('Problem during language detection, skipping')
         lang = None
     return {
         'lang': lang
     }
 
 
 def compute_language(raw_content, encoding=None, log=None):
     """Determine the raw content's language.
 
     Args:
         raw_content (bytes): raw content to work with
+        encoding (str): raw_content's encoding, detected when not given
 
     Returns:
-        Dict with keys:
-        - lang: None if nothing found or the possible language
+        Dict with key lang: None if nothing found or the possible language
 
     """
     try:
-        encoding = _detect_encoding(raw_content)
+        encoding = encoding or _detect_encoding(raw_content)
         content = raw_content.decode(encoding)
         lang = _cleanup_classname(
             guess_lexer(content).name)
     except ClassNotFound:
         lang = None
     except Exception:
         if log:
             log.exception('Problem during language detection, skipping')
         lang = None
     return {
         'lang': lang
     }
 
 
 class ContentLanguageIndexer(ContentIndexer):
     """Indexer in charge of:
 
     - filtering out content already indexed
     - reading content from objstorage per the content's id (sha1)
-    - computing {mimetype, encoding} from that content
+    - computing the language of that content
     - store result in storage
 
     """
     CONFIG_BASE_FILENAME = 'indexer/language'
 
     ADDITIONAL_CONFIG = {
         'tools': ('dict', {
             'name': 'pygments',
             'version': '2.0.1+dfsg-1.1+deb8u1',
             'configuration': {
                 'type': 'library',
                 'debian-package': 'python3-pygments',
                 'max_content_size': 10240,
             },
         }),
     }
 
     def prepare(self):
         super().prepare()
         c = self.config
         self.max_content_size = c['tools']['configuration']['max_content_size']
         self.tool = self.tools[0]
 
     def filter(self, ids):
         """Filter out known sha1s and return only missing ones.
 
         """
-        yield from self.storage.content_language_missing((
+        yield from self.idx_storage.content_language_missing((
             {
                 'id': sha1,
                 'indexer_configuration_id': self.tool['id']
             } for sha1 in ids
         ))
 
     def index(self, id, data):
         """Index sha1s' content and store result.
 
         Args:
             id (bytes): content's identifier
             data (bytes): raw content in bytes
 
         Returns:
             A dict, representing a content_mimetype, with keys:
               - id (bytes): content's identifier (sha1)
               - lang (bytes): detected language
 
         """
         result = {
             'id': id,
             'indexer_configuration_id': self.tool['id'],
             'lang': None,
         }
 
         encoding = _detect_encoding(data)
 
         if not encoding:
             return result
 
         l = len(data)
         for i in range(0, 9):
             max_size = self.max_content_size + i
 
             try:
                 result = compute_language_from_chunk(
                     encoding, l, data, max_size, log=self.log)
             except UnicodeDecodeError:
                 self.log.warn('Decoding failed on wrong byte chunk at [0-%s]'
                               ', trying again at next ending byte.' % max_size)
                 continue
 
             # we found something, so we return it
             result.update({
                 'id': id,
                 'indexer_configuration_id': self.tool['id'],
             })
             break
 
         return result
 
     def persist_index_computations(self, results, policy_update):
         """Persist the results in storage.
 
         Args:
             results ([dict]): list of content_mimetype, dict with the
             following keys:
               - id (bytes): content's identifier (sha1)
               - lang (bytes): detected language
             policy_update ([str]): either 'update-dups' or 'ignore-dups' to
             respectively update duplicates or ignore them
 
         """
-        self.storage.content_language_add(
+        self.idx_storage.content_language_add(
             results, conflict_update=(policy_update == 'update-dups'))
diff --git a/swh/indexer/metadata.py b/swh/indexer/metadata.py
index f40c0e4..9bded05 100644
--- a/swh/indexer/metadata.py
+++ b/swh/indexer/metadata.py
@@ -1,293 +1,299 @@
 # Copyright (C) 2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 import click
 import logging
 
 from swh.indexer.indexer import ContentIndexer, RevisionIndexer
 from swh.indexer.metadata_dictionary import compute_metadata
 from swh.indexer.metadata_detector import detect_metadata
 from swh.indexer.metadata_detector import extract_minimal_metadata_dict
 
 from swh.model import hashutil
 
 
 class ContentMetadataIndexer(ContentIndexer):
     """Content-level indexer
 
     This indexer is in charge of:
 
     - filtering out content already indexed in content_metadata
     - reading content from objstorage with the content's id sha1
     - computing translated_metadata by given context
     - using the metadata_dictionary as the 'swh-metadata-translator' tool
     - store result in content_metadata table
 
     """
     CONFIG_BASE_FILENAME = 'indexer/metadata'
 
     def __init__(self, tool, config):
         """Build the indexer from an already-resolved configuration.
 
         Args:
             tool (dict): tool description, stored under the 'tools' key
               of `config`
             config (dict): configuration to use; it is kept by reference
               and mutated (its 'tools' entry is overwritten)
 
         """
         # twisted way to use the exact same config of RevisionMetadataIndexer
         # object that uses internally ContentMetadataIndexer
         self.config = config
         self.config['tools'] = tool
         super().__init__()
 
     def prepare(self):
         """Set up storages, logging and the tool from `self.config`.
 
         The storages are taken as ready-made objects from the
         configuration instead of being instantiated here.
 
         """
         self.results = []
-        if self.config['storage']:
-            self.storage = self.config['storage']
+        if self.config['indexer_storage']:
+            self.idx_storage = self.config['indexer_storage']
         if self.config['objstorage']:
             self.objstorage = self.config['objstorage']
         # raise the connection pool logger's threshold to WARN
         urllib3_log = logging.getLogger(
             'requests.packages.urllib3.connectionpool')
         urllib3_log.setLevel(logging.WARN)
         self.log = logging.getLogger('swh.indexer')
         self.tools = self.register_tools(self.config['tools'])
         # NOTE: only one tool so far, change when no longer true
         self.tool = self.tools[0]
 
     def filter(self, ids):
         """Filter out known sha1s and return only missing ones.
         """
-        yield from self.storage.content_metadata_missing((
+        yield from self.idx_storage.content_metadata_missing((
             {
                 'id': sha1,
                 'indexer_configuration_id': self.tool['id'],
             } for sha1 in ids
         ))
 
     def index(self, id, data):
         """Index sha1s' content and store result.
 
         Args:
             id (bytes): content's identifier
             data (bytes): raw content in bytes
 
         Returns:
             dict: dictionary representing a content_metadata. If the
             translation wasn't successful the translated_metadata keys will
             be returned as None
 
         """
         result = {
             'id': id,
             'indexer_configuration_id': self.tool['id'],
             'translated_metadata': None
         }
         try:
             context = self.tool['tool_configuration']['context']
             result['translated_metadata'] = compute_metadata(context, data)
             # a twisted way to keep result with indexer object for get_results
             self.results.append(result)
         except Exception:
             # Only swallow regular errors: a bare `except:` would also hide
             # KeyboardInterrupt and SystemExit.
             self.log.exception(
                 "Problem during tool retrieval of metadata translation")
         return result
 
     def persist_index_computations(self, results, policy_update):
         """Persist the results in storage.
 
         Args:
             results ([dict]): list of content_metadata, dict with the
             following keys:
               - id (bytes): content's identifier (sha1)
               - translated_metadata (jsonb): detected metadata
             policy_update ([str]): either 'update-dups' or 'ignore-dups' to
             respectively update duplicates or ignore them
 
         """
-        self.storage.content_metadata_add(
+        self.idx_storage.content_metadata_add(
             results, conflict_update=(policy_update == 'update-dups'))
 
     def get_results(self):
         """can be called only if run method was called before
 
         Returns:
             list: list of content_metadata entries calculated by
                   current indexer
 
         """
         return self.results
 
 
 class RevisionMetadataIndexer(RevisionIndexer):
     """Revision-level indexer
 
     This indexer is in charge of:
 
     - filtering revisions already indexed in revision_metadata table with
       defined computation tool
     - retrieve all entry_files in root directory
     - use metadata_detector for file_names containing metadata
     - compute metadata translation if necessary and possible (depends on tool)
     - send sha1s to content indexing if possible
     - store the results for revision
 
     """
     CONFIG_BASE_FILENAME = 'indexer/metadata'
 
     ADDITIONAL_CONFIG = {
+        'storage': ('dict', {
+            'cls': 'remote',
+            'args': {
+                'url': 'http://localhost:5002/',
+            }
+        }),
         'tools': ('dict', {
             'name': 'swh-metadata-detector',
             'version': '0.0.1',
             'configuration': {
                 'type': 'local',
                 'context': ['npm', 'codemeta']
             },
         }),
     }
 
     def prepare(self):
         """Run the parent preparation, then select the first tool."""
         super().prepare()
         self.tool = self.tools[0]
 
     def filter(self, sha1_gits):
         """Filter out known sha1s and return only missing ones.
 
         """
-        yield from self.storage.revision_metadata_missing((
+        yield from self.idx_storage.revision_metadata_missing((
             {
                 'id': sha1_git,
                 'indexer_configuration_id': self.tool['id'],
             } for sha1_git in sha1_gits
         ))
 
     def index(self, rev):
         """Index rev by processing it and organizing result.
 
         use metadata_detector to iterate on filenames
 
         - if one filename detected -> sends file to content indexer
         - if multiple file detected -> translation needed at revision level
 
         Args:
           rev (dict): revision artifact from storage; its 'id' and
             'directory' keys are read
 
         Returns:
             dict: dictionary representing a revision_metadata, with keys:
 
                 - id (bytes): rev's identifier (sha1_git)
                 - indexer_configuration_id (bytes): tool used
                 - translated_metadata (bytes): dict of retrieved metadata,
                   None when the translation failed
 
         """
         # Built before the `try` so that `result` is always bound when the
         # error path below falls through to the final `return`.
         result = {
             'id': rev['id'],
             'indexer_configuration_id': self.tool['id'],
             'translated_metadata': None
         }
         try:
             root_dir = rev['directory']
             dir_ls = self.storage.directory_ls(root_dir, recursive=False)
             files = (entry for entry in dir_ls if entry['type'] == 'file')
             detected_files = detect_metadata(files)
             result['translated_metadata'] = self.translate_revision_metadata(
                 detected_files)
         except Exception:
             self.log.exception(
                 'Problem when indexing rev')
         return result
 
     def persist_index_computations(self, results, policy_update):
         """Persist the results in storage.
 
         Args:
             results ([dict]): list of revision_metadata, dict with the
             following keys:
               - id (bytes): revision's identifier (sha1_git)
               - indexer_configuration_id: id of the tool used
               - translated_metadata: translated metadata (or None)
             policy_update ([str]): either 'update-dups' or 'ignore-dups' to
             respectively update duplicates or ignore them
 
         """
         # TODO: add functions in storage to keep data in revision_metadata
-        self.storage.revision_metadata_add(
+        self.idx_storage.revision_metadata_add(
             results, conflict_update=(policy_update == 'update-dups'))
 
     def translate_revision_metadata(self, detected_files):
         """
         Determine plan of action to translate metadata when containing
         one or multiple detected files:
 
         Args:
             detected_files (dict): dictionary mapping context names (e.g.,
               "npm", "authors") to list of sha1
 
         Returns:
             dict: dict with translated metadata according to the CodeMeta
             vocabulary
 
         """
         translated_metadata = []
         tool = {
             'name': 'swh-metadata-translator',
             'version': '0.0.1',
             'configuration': {
                 'type': 'local',
                 'context': None
             },
         }
         # TODO: iterate on each context, on each file
         # -> get raw_contents
         # -> translate each content
         config = {
-            'storage': self.storage,
+            'indexer_storage': self.idx_storage,
             'objstorage': self.objstorage
         }
         for context in detected_files.keys():
             tool['configuration']['context'] = context
             c_metadata_indexer = ContentMetadataIndexer(tool, config)
             # sha1s that are in content_metadata table
             sha1s_in_storage = []
-            metadata_generator = self.storage.content_metadata_get(
-                                              detected_files[context])
+            metadata_generator = self.idx_storage.content_metadata_get(
+                detected_files[context])
             for c in metadata_generator:
                 # extracting translated_metadata
                 sha1 = c['id']
                 sha1s_in_storage.append(sha1)
                 local_metadata = c['translated_metadata']
                 # local metadata is aggregated
                 if local_metadata:
                     translated_metadata.append(local_metadata)
 
             sha1s_filtered = [item for item in detected_files[context]
                               if item not in sha1s_in_storage]
 
             if sha1s_filtered:
                 # schedule indexation of content
                 try:
                     c_metadata_indexer.run(sha1s_filtered,
                                            policy_update='ignore-dups')
                     # on the fly possibility:
                     results = c_metadata_indexer.get_results()
 
                     for result in results:
                         local_metadata = result['translated_metadata']
                         translated_metadata.append(local_metadata)
 
                 except Exception as e:
                     # The exception needs a %s placeholder: passing it as
                     # a bare extra argument makes logging fail to format
                     # the record.
                     self.log.warning(
                         'Exception while indexing content: %s', e)
 
         # transform translated_metadata into min set with swh-metadata-detector
         min_metadata = extract_minimal_metadata_dict(translated_metadata)
         return min_metadata
 
 
 # Command-line entry point: index the metadata of the given revisions.
 # (Documented with comments on purpose: click would expose a docstring
 # as the command's --help text.)
 @click.command()
 @click.option('--revs', '-i',
               default=['8dbb6aeb036e7fd80664eb8bfd1507881af1ba9f',
                        '026040ea79dec1b49b4e3e7beda9132b6b26b51b',
                        '9699072e21eded4be8d45e3b8d543952533fa190'],
               help='Default sha1_git to lookup', multiple=True)
 def main(revs):
     # hexadecimal identifiers -> bytes, as passed on to the indexer
     revision_ids = [hashutil.hash_to_bytes(rev) for rev in revs]
     RevisionMetadataIndexer().run(revision_ids, 'update-dups')
 
 
 # Script entry point: configure INFO-level logging, then run the click
 # command defined above.
 if __name__ == '__main__':
     logging.basicConfig(level=logging.INFO)
     main()
diff --git a/swh/indexer/mimetype.py b/swh/indexer/mimetype.py
index 8bbbf64..57bcd3a 100644
--- a/swh/indexer/mimetype.py
+++ b/swh/indexer/mimetype.py
@@ -1,158 +1,158 @@
 # Copyright (C) 2016-2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import click
 import magic
 
 from swh.model import hashutil
 from swh.scheduler import utils
 
 from .indexer import ContentIndexer
 
 
 def compute_mimetype_encoding(raw_content):
     """Detect the mimetype and the encoding of some raw content.
 
     Args:
         raw_content (bytes): content's raw data
 
     Returns:
         A dict with the keys 'mimetype' and 'encoding', both values
         being utf-8 encoded bytes.
 
     """
     detected = magic.detect_from_content(raw_content)
     mimetype = detected.mime_type.encode('utf-8')
     encoding = detected.encoding.encode('utf-8')
     return {'mimetype': mimetype, 'encoding': encoding}
 
 
 class ContentMimetypeIndexer(ContentIndexer):
     """Indexer in charge of:
 
     - filtering out content already indexed
     - reading content from objstorage per the content's id (sha1)
     - computing {mimetype, encoding} from that content
     - store result in storage
 
     """
     # 'destination_queue' names the task that next_step() sends text
     # contents to; no task is sent when it is left unset.
     ADDITIONAL_CONFIG = {
         'destination_queue': ('str', None),
         'tools': ('dict', {
             'name': 'file',
             'version': '1:5.30-1+deb9u1',
             'configuration': {
                 "type": "library",
                 "debian-package": "python3-magic"
             },
         }),
     }
 
     CONFIG_BASE_FILENAME = 'indexer/mimetype'
 
     def prepare(self):
         """Run the parent preparation, then resolve the optional
         destination task and select the first tool.
 
         """
         super().prepare()
         destination_queue = self.config.get('destination_queue')
         if destination_queue:
             self.task_destination = utils.get_task(destination_queue)
         else:
             self.task_destination = None
         self.tool = self.tools[0]
 
     def filter(self, ids):
         """Filter out known sha1s and return only missing ones.
 
         """
-        yield from self.storage.content_mimetype_missing((
+        yield from self.idx_storage.content_mimetype_missing((
             {
                 'id': sha1,
                 'indexer_configuration_id': self.tool['id'],
             } for sha1 in ids
         ))
 
     def index(self, id, data):
         """Index sha1s' content and store result.
 
         Args:
             id (bytes): content's identifier
             data (bytes): raw content in bytes
 
         Returns:
             A dict, representing a content_mimetype, with keys:
 
               - id (bytes): content's identifier (sha1)
               - mimetype (bytes): mimetype in bytes
               - encoding (bytes): encoding in bytes
 
             or None when the detection raised a TypeError.
 
         """
         try:
             properties = compute_mimetype_encoding(data)
             properties.update({
                 'id': id,
                 'indexer_configuration_id': self.tool['id'],
                 })
         except TypeError:
             # the failure is logged and signalled to the caller with None
             self.log.error('Detecting mimetype error for id %s' % (
                 hashutil.hash_to_hex(id), ))
             return None
 
         return properties
 
     def persist_index_computations(self, results, policy_update):
         """Persist the results in storage.
 
         Args:
             results ([dict]): list of content_mimetype, dict with the
             following keys:
 
               - id (bytes): content's identifier (sha1)
               - mimetype (bytes): mimetype in bytes
               - encoding (bytes): encoding in bytes
 
             policy_update ([str]): either 'update-dups' or 'ignore-dups' to
             respectively update duplicates or ignore them
 
         """
-        self.storage.content_mimetype_add(
+        self.idx_storage.content_mimetype_add(
             results, conflict_update=(policy_update == 'update-dups'))
 
     def _filter_text(self, results):
         """Filter sha1 whose raw content is text.
 
         Yields the 'id' of every result whose 'encoding' does not contain
         b'binary'.
 
         """
         # NOTE(review): index() may return None; this loop assumes such
         # entries never reach it -- confirm against the base class.
         for result in results:
             if b'binary' in result['encoding']:
                 continue
             yield result['id']
 
     def next_step(self, results):
         """When the computations is done, we'd like to send over only text
         contents to the text content orchestrator.
 
         Args:
             results ([dict]): List of content_mimetype results, dict
             with the following keys:
 
               - id (bytes): content's identifier (sha1)
               - mimetype (bytes): mimetype in bytes
               - encoding (bytes): encoding in bytes
 
         """
         # nothing is sent when no destination task was configured
         if self.task_destination:
             self.task_destination.delay(list(self._filter_text(results)))
 
 
 # Command-line helper: print the mimetype and encoding detected for the
 # file at `path`. (Documented with comments on purpose: click would
 # expose a docstring as the command's --help text.)
 @click.command()
 @click.option('--path', help="Path to execute index on")
 def main(path):
     # read as bytes: the detection works on raw content
     with open(path, 'rb') as content_file:
         detected = compute_mimetype_encoding(content_file.read())
     print(detected)
 
 
 # Script entry point: run the click command defined above.
 if __name__ == '__main__':
     main()
diff --git a/swh/indexer/storage/api/server.py b/swh/indexer/storage/api/server.py
index a126243..5ebacf2 100644
--- a/swh/indexer/storage/api/server.py
+++ b/swh/indexer/storage/api/server.py
@@ -1,197 +1,197 @@
 # Copyright (C) 2015-2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import logging
 import click
 
 from flask import g, request
 
 from swh.core import config
 from swh.core.api import (SWHServerAPIApp, decode_request,
                           error_handler,
                           encode_data_server as encode_data)
-from swh.indexer import get_storage
+from swh.indexer import get_indexer_storage
 
 
 # Defaults passed to config.read() alongside the configuration file path:
 # a 'local' storage on the development indexer database.
 DEFAULT_CONFIG = {
     'storage': ('dict', {
         'cls': 'local',
         'args': {
             'db': 'dbname=softwareheritage-indexer-dev',
         },
     })
 }
 
 
 # Application object on which every route below is registered.
 app = SWHServerAPIApp(__name__)
 
 
 @app.errorhandler(Exception)
 def my_error_handler(exception):
     """Delegate any exception to `error_handler`, using the server-side
     data encoder for the response.
 
     """
     response = error_handler(exception, encode_data)
     return response
 
 
 @app.before_request
 def before_request():
     """Bind a storage, built from the 'storage' entry of the application
     configuration, to `g.storage` before each request.
 
     """
-    g.storage = get_storage(**app.config['storage'])
+    g.storage = get_indexer_storage(**app.config['storage'])
 
 
 @app.route('/')
 def index():
     """Return the plain-text banner identifying this server."""
     banner = 'SWH Indexer Storage API server'
     return banner
 
 
 @app.route('/check_config', methods=['POST'])
 def check_config():
     """Call ``check_config`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.check_config
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content_mimetype/add', methods=['POST'])
 def content_mimetype_add():
     """Call ``content_mimetype_add`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_mimetype_add
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content_mimetype/missing', methods=['POST'])
 def content_mimetype_missing():
     """Call ``content_mimetype_missing`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_mimetype_missing
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content_mimetype', methods=['POST'])
 def content_mimetype_get():
     """Call ``content_mimetype_get`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_mimetype_get
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content_language/add', methods=['POST'])
 def content_language_add():
     """Call ``content_language_add`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_language_add
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content_language/missing', methods=['POST'])
 def content_language_missing():
     """Call ``content_language_missing`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_language_missing
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content_language', methods=['POST'])
 def content_language_get():
     """Call ``content_language_get`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_language_get
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content/ctags/add', methods=['POST'])
 def content_ctags_add():
     """Call ``content_ctags_add`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_ctags_add
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content/ctags/search', methods=['POST'])
 def content_ctags_search():
     """Call ``content_ctags_search`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_ctags_search
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content/ctags/missing', methods=['POST'])
 def content_ctags_missing():
     """Call ``content_ctags_missing`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_ctags_missing
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content/ctags', methods=['POST'])
 def content_ctags_get():
     """Call ``content_ctags_get`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_ctags_get
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content/fossology_license/add', methods=['POST'])
 def content_fossology_license_add():
     """Call ``content_fossology_license_add`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_fossology_license_add
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content/fossology_license', methods=['POST'])
 def content_fossology_license_get():
     """Call ``content_fossology_license_get`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_fossology_license_get
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/indexer_configuration/data', methods=['POST'])
 def indexer_configuration_get():
     """Call ``indexer_configuration_get`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.indexer_configuration_get
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/indexer_configuration/add', methods=['POST'])
 def indexer_configuration_add():
     """Call ``indexer_configuration_add`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.indexer_configuration_add
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content_metadata/add', methods=['POST'])
 def content_metadata_add():
     """Call ``content_metadata_add`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_metadata_add
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content_metadata/missing', methods=['POST'])
 def content_metadata_missing():
     """Call ``content_metadata_missing`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_metadata_missing
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/content_metadata', methods=['POST'])
 def content_metadata_get():
     """Call ``content_metadata_get`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.content_metadata_get
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/revision_metadata/add', methods=['POST'])
 def revision_metadata_add():
     """Call ``revision_metadata_add`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.revision_metadata_add
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/revision_metadata/missing', methods=['POST'])
 def revision_metadata_missing():
     """Call ``revision_metadata_missing`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.revision_metadata_missing
     return encode_data(endpoint(**decode_request(request)))
 
 
 @app.route('/revision_metadata', methods=['POST'])
 def revision_metadata_get():
     """Call ``revision_metadata_get`` on the request's storage."""
     # decoded request arguments in, encoded result out
     endpoint = g.storage.revision_metadata_get
     return encode_data(endpoint(**decode_request(request)))
 
 
 def run_from_webserver(environ, start_response):
     """Run the WSGI app from the webserver, loading the configuration.
 
     Args:
         environ: WSGI environment of the request
         start_response: WSGI callable used to start the response
 
     Returns:
         whatever the application returns for this request
 
     """
 
     config_path = '/etc/softwareheritage/indexer/storage.yml'
 
     app.config.update(config.read(config_path, DEFAULT_CONFIG))
 
     # This function has the WSGI callable signature, so it runs for every
     # request: install the stream handler only once, otherwise handlers
     # pile up on the logger and each record is emitted once per request
     # served so far.
     if not getattr(run_from_webserver, '_log_handler_installed', False):
         handler = logging.StreamHandler()
         app.logger.addHandler(handler)
         run_from_webserver._log_handler_installed = True
 
     return app(environ, start_response)
 
 
 # Command-line entry point: load the configuration file (falling back on
 # DEFAULT_CONFIG) and serve the application on host:port. (Documented
 # with comments on purpose: click would expose a docstring as the
 # command's --help text.)
 @click.command()
 @click.argument('config-path', required=1)
 @click.option('--host', default='0.0.0.0', help="Host to run the server")
 @click.option('--port', default=5007, type=click.INT,
               help="Binding port of the server")
 @click.option('--debug/--nodebug', default=True,
               help="Indicates if the server should run in debug mode")
 def launch(config_path, host, port, debug):
     settings = config.read(config_path, DEFAULT_CONFIG)
     app.config.update(settings)
     app.run(host, port=int(port), debug=bool(debug))
 
 
 # Script entry point: run the click command defined above.
 if __name__ == '__main__':
     launch()
diff --git a/swh/indexer/tests/storage/test_storage.py b/swh/indexer/tests/storage/test_storage.py
index b75b3b5..fad45c6 100644
--- a/swh/indexer/tests/storage/test_storage.py
+++ b/swh/indexer/tests/storage/test_storage.py
@@ -1,1504 +1,1504 @@
 # Copyright (C) 2015-2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import pathlib
 import unittest
 
 from nose.tools import istest
 from nose.plugins.attrib import attr
 from swh.model.hashutil import hash_to_bytes
 
-from swh.indexer import get_storage
+from swh.indexer import get_indexer_storage
 from swh.core.tests.db_testing import DbTestFixture
 
 
 # Location of the test data checkout, relative to this file's directory
 # (it is joined to that directory in StorageTestFixture.setUpClass).
 PATH_TO_STORAGE_TEST_DATA = '../../../../../swh-storage-testdata'
 
 
 class StorageTestFixture:
     """Mix this in a test subject class to get Storage testing support.
 
     This fixture requires to come before DbTestFixture in the inheritance list
     as it uses its methods to setup its own internal database.
 
     Usage example:
 
         class TestStorage(StorageTestFixture, DbTestFixture):
             ...
     """
     # name under which the test database is registered and looked up
     TEST_STORAGE_DB_NAME = 'softwareheritage-test-indexer'
 
     @classmethod
     def setUpClass(cls):
         """Register the indexer database dump, then run the parent setup.
 
         Raises:
             RuntimeError if the class lacks the DB_TEST_FIXTURE_IMPORTED
             attribute.
 
         """
         if not hasattr(cls, 'DB_TEST_FIXTURE_IMPORTED'):
             raise RuntimeError("StorageTestFixture needs to be followed by "
                                "DbTestFixture in the inheritance list.")
 
         test_dir = pathlib.Path(__file__).absolute().parent
         test_data_dir = test_dir / PATH_TO_STORAGE_TEST_DATA
         test_db_dump = (test_data_dir / 'dumps/swh-indexer.dump').absolute()
         cls.add_db(cls.TEST_STORAGE_DB_NAME, str(test_db_dump), 'pg_dump')
         super().setUpClass()
 
     def setUp(self):
         """Create `self.storage`, a local storage using the connection of
         the test database.
 
         """
         super().setUp()
 
         self.storage_config = {
             'cls': 'local',
             'args': {
                 'db': self.test_db[self.TEST_STORAGE_DB_NAME].conn,
             },
         }
-        self.storage = get_storage(**self.storage_config)
+        self.storage = get_indexer_storage(**self.storage_config)
 
     def tearDown(self):
         super().tearDown()
 
     def reset_storage_tables(self):
         """Reset the test database tables, except indexer_configuration,
         then commit.
 
         """
         excluded = {'indexer_configuration'}
         self.reset_db_tables(self.TEST_STORAGE_DB_NAME, excluded=excluded)
 
         db = self.test_db[self.TEST_STORAGE_DB_NAME]
         db.conn.commit()
 
 
 class BaseTestStorage(StorageTestFixture, DbTestFixture):
     """Shared set-up for the storage tests: database handles, sample
     identifiers and a helper listing the registered tools.
 
     """
     def setUp(self):
         super().setUp()
 
         test_db = self.test_db[self.TEST_STORAGE_DB_NAME]
         self.conn, self.cursor = test_db.conn, test_db.cursor
 
         # sample content identifiers
         self.sha1_1 = hash_to_bytes('34973274ccef6ab4dfaaf86599792fa9c3fe4689')
         self.sha1_2 = hash_to_bytes('61c2b3a30496d329e21af70dd2d7e097046d07b7')
         # sample revision identifiers
         self.revision_id_1 = hash_to_bytes(
             '7026b7c1a2af56521e951c01ed20f255fa054238')
         self.revision_id_2 = hash_to_bytes(
             '7026b7c1a2af56521e9587659012345678904321')
 
     def tearDown(self):
         self.reset_storage_tables()
         super().tearDown()
 
     def fetch_tools(self):
         """Return the rows of indexer_configuration as a dict of tools.
 
         Each tool is keyed by its name; when a name is already taken, the
         key is prefixed with '_' until it is unique.
 
         """
         self.cursor.execute('''
             select tool_name, id, tool_version, tool_configuration
             from indexer_configuration
             order by id''')
         tools = {}
         for name, tool_id, version, configuration in self.cursor.fetchall():
             key = name
             while key in tools:
                 key = '_' + key
             tools[key] = {
                 'id': tool_id,
                 'name': name,
                 'version': version,
                 'configuration': configuration,
             }
         return tools
 
 
 @attr('db')
 class CommonTestStorage(BaseTestStorage):
     """Base class for Indexer Storage testing.
 
     """
 
     # check_config must be truthy with check_write=True as well as with
     # check_write=False.
     @istest
     def check_config(self):
         self.assertTrue(self.storage.check_config(check_write=True))
         self.assertTrue(self.storage.check_config(check_write=False))
 
     # Both sample contents are reported missing at first; once a mimetype
     # is added for sha1_2, only sha1_1 is still reported.
     @istest
     def content_mimetype_missing(self):
         # given
         tools = self.fetch_tools()
         tool_id = tools['file']['id']
 
         mimetypes = [
             {
                 'id': self.sha1_1,
                 'indexer_configuration_id': tool_id,
             },
             {
                 'id': self.sha1_2,
                 'indexer_configuration_id': tool_id,
             }]
 
         # when
         actual_missing = self.storage.content_mimetype_missing(mimetypes)
 
         # then
         self.assertEqual(list(actual_missing), [
             self.sha1_1,
             self.sha1_2,
         ])
 
         # given
         self.storage.content_mimetype_add([{
             'id': self.sha1_2,
             'mimetype': b'text/plain',
             'encoding': b'utf-8',
             'indexer_configuration_id': tool_id,
         }])
 
         # when
         actual_missing = self.storage.content_mimetype_missing(mimetypes)
 
         # then
         self.assertEqual(list(actual_missing), [self.sha1_1])
 
     # Adding a second mimetype for the same content and tool, without
     # conflict_update, must leave the first entry untouched.
     @istest
     def content_mimetype_add__drop_duplicate(self):
         # given
         tools = self.fetch_tools()
         tool_id = tools['file']['id']
 
         mimetype_v1 = {
             'id': self.sha1_2,
             'mimetype': b'text/plain',
             'encoding': b'utf-8',
             'indexer_configuration_id': tool_id,
         }
 
         # given
         self.storage.content_mimetype_add([mimetype_v1])
 
         # when
         actual_mimetypes = list(self.storage.content_mimetype_get(
             [self.sha1_2]))
 
         # then
         expected_mimetypes_v1 = [{
             'id': self.sha1_2,
             'mimetype': b'text/plain',
             'encoding': b'utf-8',
             'tool': tools['file'],
         }]
         self.assertEqual(actual_mimetypes, expected_mimetypes_v1)
 
         # given
         mimetype_v2 = mimetype_v1.copy()
         mimetype_v2.update({
             'mimetype': b'text/html',
             'encoding': b'us-ascii',
         })
 
         self.storage.content_mimetype_add([mimetype_v2])
 
         actual_mimetypes = list(self.storage.content_mimetype_get(
             [self.sha1_2]))
 
         # mimetype did not change as the v2 was dropped.
         self.assertEqual(actual_mimetypes, expected_mimetypes_v1)
 
     # Adding a second mimetype for the same content and tool with
     # conflict_update=True must overwrite the first entry.
     @istest
     def content_mimetype_add__update_in_place_duplicate(self):
         # given
         tools = self.fetch_tools()
         tool_id = tools['file']['id']
 
         mimetype_v1 = {
             'id': self.sha1_2,
             'mimetype': b'text/plain',
             'encoding': b'utf-8',
             'indexer_configuration_id': tool_id,
         }
 
         # given
         self.storage.content_mimetype_add([mimetype_v1])
 
         # when
         actual_mimetypes = list(self.storage.content_mimetype_get(
             [self.sha1_2]))
 
         expected_mimetypes_v1 = [{
             'id': self.sha1_2,
             'mimetype': b'text/plain',
             'encoding': b'utf-8',
             'tool': tools['file'],
         }]
 
         # then
         self.assertEqual(actual_mimetypes, expected_mimetypes_v1)
 
         # given
         mimetype_v2 = mimetype_v1.copy()
         mimetype_v2.update({
             'mimetype': b'text/html',
             'encoding': b'us-ascii',
         })
 
         self.storage.content_mimetype_add([mimetype_v2], conflict_update=True)
 
         actual_mimetypes = list(self.storage.content_mimetype_get(
             [self.sha1_2]))
 
         # NOTE(review): the expected tool is spelled out literally here
         # rather than taken from tools['file'] as above -- presumably it
         # mirrors the 'file' row of the database dump; confirm.
         expected_mimetypes_v2 = [{
             'id': self.sha1_2,
             'mimetype': b'text/html',
             'encoding': b'us-ascii',
             'tool': {
                 'id': 2,
                 'name': 'file',
                 'version': '5.22',
                 'configuration': {'command_line': 'file --mime <filepath>'}
             }
         }]
 
         # mimetype did change as the v2 was used to overwrite v1
         self.assertEqual(actual_mimetypes, expected_mimetypes_v2)
 
     # Only the content that has a stored mimetype (sha1_2) is returned
     # when both sample identifiers are requested.
     @istest
     def content_mimetype_get(self):
         # given
         tools = self.fetch_tools()
         tool_id = tools['file']['id']
 
         mimetypes = [self.sha1_2, self.sha1_1]
 
         mimetype1 = {
             'id': self.sha1_2,
             'mimetype': b'text/plain',
             'encoding': b'utf-8',
             'indexer_configuration_id': tool_id,
         }
 
         # when
         self.storage.content_mimetype_add([mimetype1])
 
         # then
         actual_mimetypes = list(self.storage.content_mimetype_get(mimetypes))
 
         # then
         expected_mimetypes = [{
             'id': self.sha1_2,
             'mimetype': b'text/plain',
             'encoding': b'utf-8',
             'tool': tools['file']
         }]
 
         self.assertEqual(actual_mimetypes, expected_mimetypes)
 
     # Both sample contents are reported missing at first; once a language
     # is added for sha1_2, only sha1_1 is still reported.
     @istest
     def content_language_missing(self):
         # given
         tools = self.fetch_tools()
         tool_id = tools['pygments']['id']
 
         languages = [
             {
                 'id': self.sha1_2,
                 'indexer_configuration_id': tool_id,
             },
             {
                 'id': self.sha1_1,
                 'indexer_configuration_id': tool_id,
             }
         ]
 
         # when
         actual_missing = list(self.storage.content_language_missing(languages))
 
         # then
         self.assertEqual(list(actual_missing), [
             self.sha1_2,
             self.sha1_1,
         ])
 
         # given
         self.storage.content_language_add([{
             'id': self.sha1_2,
             'lang': 'haskell',
             'indexer_configuration_id': tool_id,
         }])
 
         # when
         actual_missing = list(self.storage.content_language_missing(languages))
 
         # then
         self.assertEqual(actual_missing, [self.sha1_1])
 
     @istest
     def content_language_get(self):
         # A stored language is returned with its tool description; sha1_1,
         # for which this test stores nothing, yields no entry.
         pygments = self.fetch_tools()['pygments']
 
         # given
         self.storage.content_language_add([{
             'id': self.sha1_2,
             'lang': 'common-lisp',
             'indexer_configuration_id': pygments['id'],
         }])
 
         # when
         found = list(self.storage.content_language_get(
             [self.sha1_2, self.sha1_1]))
 
         # then
         self.assertEqual(found, [{
             'id': self.sha1_2,
             'lang': 'common-lisp',
             'tool': pygments,
         }])
 
     @istest
     def content_language_add__drop_duplicate(self):
         # Without conflict_update, re-adding a language for the same id and
         # tool leaves the stored value untouched.
         pygments = self.fetch_tools()['pygments']
         language_v1 = {
             'id': self.sha1_2,
             'lang': 'emacslisp',
             'indexer_configuration_id': pygments['id'],
         }
         expected_languages_v1 = [{
             'id': self.sha1_2,
             'lang': 'emacslisp',
             'tool': pygments,
         }]
 
         # given: v1 is stored
         self.storage.content_language_add([language_v1])
 
         # then: v1 is read back
         self.assertEqual(
             list(self.storage.content_language_get([self.sha1_2])),
             expected_languages_v1)
 
         # when: a conflicting v2 is added with the default conflict policy
         language_v2 = dict(language_v1, lang='common-lisp')
         self.storage.content_language_add([language_v2])
 
         # then: language did not change as the v2 was dropped
         self.assertEqual(
             list(self.storage.content_language_get([self.sha1_2])),
             expected_languages_v1)
 
     @istest
     def content_language_add__update_in_place_duplicate(self):
         # With conflict_update=True, re-adding a language for the same id
         # and tool overwrites the stored value.
         pygments = self.fetch_tools()['pygments']
         language_v1 = {
             'id': self.sha1_2,
             'lang': 'common-lisp',
             'indexer_configuration_id': pygments['id'],
         }
 
         # given: v1 is stored
         self.storage.content_language_add([language_v1])
 
         # then: v1 is read back
         self.assertEqual(
             list(self.storage.content_language_get([self.sha1_2])),
             [{
                 'id': self.sha1_2,
                 'lang': 'common-lisp',
                 'tool': pygments,
             }])
 
         # when: a conflicting v2 is added, asking for an update
         language_v2 = dict(language_v1, lang='emacslisp')
         self.storage.content_language_add([language_v2], conflict_update=True)
 
         # then: language did change as the v2 was used to overwrite v1
         self.assertEqual(
             list(self.storage.content_language_get([self.sha1_2])),
             [{
                 'id': self.sha1_2,
                 'lang': 'emacslisp',
                 'tool': pygments,
             }])
 
     @istest
     def content_ctags_missing(self):
         # Ids stay "missing" until ctags have been stored for them with the
         # queried tool.
         tool_id = self.fetch_tools()['universal-ctags']['id']
 
         # given: the same tool is queried for both contents
         ctags = [
             {'id': sha1, 'indexer_configuration_id': tool_id}
             for sha1 in (self.sha1_2, self.sha1_1)
         ]
 
         # when: this test has not stored any ctags yet
         missing = list(self.storage.content_ctags_missing(ctags))
 
         # then: both ids are reported, in query order
         self.assertEqual(missing, [self.sha1_2, self.sha1_1])
 
         # given: one symbol is stored for sha1_2 only
         self.storage.content_ctags_add([{
             'id': self.sha1_2,
             'indexer_configuration_id': tool_id,
             'ctags': [{
                 'name': 'done',
                 'kind': 'variable',
                 'line': 119,
                 'lang': 'OCaml',
             }],
         }])
 
         # when
         missing = list(self.storage.content_ctags_missing(ctags))
 
         # then: only sha1_1 is still missing
         self.assertEqual(missing, [self.sha1_1])
 
     @istest
     def content_ctags_get(self):
         # Every stored symbol comes back as its own flat entry carrying the
         # content id and the tool description; sha1_1, for which this test
         # stores nothing, yields no entry.
         tool = self.fetch_tools()['universal-ctags']
 
         # given: two symbols to index for sha1_2
         symbols = [
             {
                 'name': 'done',
                 'kind': 'variable',
                 'line': 100,
                 'lang': 'Python',
             },
             {
                 'name': 'main',
                 'kind': 'function',
                 'line': 119,
                 'lang': 'Python',
             },
         ]
         # expectation is made of copies, taken before the symbols are handed
         # to the storage
         expected_ctags = [
             dict(symbol, id=self.sha1_2, tool=tool) for symbol in symbols
         ]
 
         # when
         self.storage.content_ctags_add([{
             'id': self.sha1_2,
             'indexer_configuration_id': tool['id'],
             'ctags': symbols,
         }])
         actual_ctags = list(self.storage.content_ctags_get(
             [self.sha1_2, self.sha1_1]))
 
         # then
         self.assertEqual(actual_ctags, expected_ctags)
 
     @istest
     def content_ctags_search(self):
         # Exercises symbol search by name: with a limit, resuming after a
         # given content id (last_sha1), without limit, and for a symbol
         # stored for a single content.
         tool = self.fetch_tools()['universal-ctags']
         tool_id = tool['id']
 
         # given: 'hello' is stored for both contents, 'counter' for sha1_1
         ctag1 = {
             'id': self.sha1_1,
             'indexer_configuration_id': tool_id,
             'ctags': [
                 {
                     'name': 'hello',
                     'kind': 'function',
                     'line': 133,
                     'lang': 'Python',
                 },
                 {
                     'name': 'counter',
                     'kind': 'variable',
                     'line': 119,
                     'lang': 'Python',
                 },
             ],
         }
         ctag2 = {
             'id': self.sha1_2,
             'indexer_configuration_id': tool_id,
             'ctags': [
                 {
                     'name': 'hello',
                     'kind': 'variable',
                     'line': 100,
                     'lang': 'C',
                 },
             ],
         }
         self.storage.content_ctags_add([ctag1, ctag2])
 
         # the three search hits the scenarios below can return
         hello_in_ctag1 = {
             'id': ctag1['id'],
             'tool': tool,
             'name': 'hello',
             'kind': 'function',
             'line': 133,
             'lang': 'Python',
         }
         hello_in_ctag2 = {
             'id': ctag2['id'],
             'tool': tool,
             'name': 'hello',
             'kind': 'variable',
             'line': 100,
             'lang': 'C',
         }
         counter_in_ctag1 = {
             'id': ctag1['id'],
             'tool': tool,
             'name': 'counter',
             'kind': 'variable',
             'line': 119,
             'lang': 'Python',
         }
 
         # 1. a limit of one returns the hit from ctag1 only
         first_page = list(self.storage.content_ctags_search(
             'hello', limit=1))
         self.assertEqual(first_page, [hello_in_ctag1])
 
         # 2. resuming after ctag1's id returns the hit from ctag2
         second_page = list(self.storage.content_ctags_search(
             'hello', limit=1, last_sha1=ctag1['id']))
         self.assertEqual(second_page, [hello_in_ctag2])
 
         # 3. without limit, both 'hello' hits are returned
         all_hello = list(self.storage.content_ctags_search('hello'))
         self.assertEqual(all_hello, [hello_in_ctag1, hello_in_ctag2])
 
         # 4. 'counter' is only found in ctag1
         all_counter = list(self.storage.content_ctags_search('counter'))
         self.assertEqual(all_counter, [counter_in_ctag1])
 
     @istest
     def content_ctags_search_no_result(self):
         # Searching for a symbol while this test has stored no ctags must
         # return an empty result.
         actual_ctags = list(self.storage.content_ctags_search('counter'))
 
         self.assertEqual(actual_ctags, [])
 
     @istest
     def content_ctags_add__add_new_ctags_added(self):
         # Without conflict_update, re-adding the same symbol is a no-op and
         # adding a different symbol for the same id and tool appends it.
         tool = self.fetch_tools()['universal-ctags']
 
         ctag_v1 = {
             'id': self.sha1_2,
             'indexer_configuration_id': tool['id'],
             'ctags': [{
                 'name': 'done',
                 'kind': 'variable',
                 'line': 100,
                 'lang': 'Scheme',
             }],
         }
 
         # given: v1 is added twice
         self.storage.content_ctags_add([ctag_v1])
         self.storage.content_ctags_add([ctag_v1])  # conflict does nothing
 
         # then: the symbol is stored once
         done_entry = {
             'id': self.sha1_2,
             'name': 'done',
             'kind': 'variable',
             'line': 100,
             'lang': 'Scheme',
             'tool': tool,
         }
         self.assertEqual(
             list(self.storage.content_ctags_get([self.sha1_2])),
             [done_entry])
 
         # when: v2 only carries a new symbol
         ctag_v2 = dict(ctag_v1, ctags=[{
             'name': 'defn',
             'kind': 'function',
             'line': 120,
             'lang': 'Scheme',
         }])
         self.storage.content_ctags_add([ctag_v2])
 
         # then: the new symbol is listed after the existing one
         defn_entry = {
             'id': self.sha1_2,
             'name': 'defn',
             'kind': 'function',
             'line': 120,
             'lang': 'Scheme',
             'tool': tool,
         }
         self.assertEqual(
             list(self.storage.content_ctags_get([self.sha1_2])),
             [done_entry, defn_entry])
 
     @istest
     def content_ctags_add__update_in_place(self):
         # With conflict_update=True, the symbols passed in v2 are the ones
         # stored afterwards for that id and tool.
         tool = self.fetch_tools()['universal-ctags']
 
         ctag_v1 = {
             'id': self.sha1_2,
             'indexer_configuration_id': tool['id'],
             'ctags': [{
                 'name': 'done',
                 'kind': 'variable',
                 'line': 100,
                 'lang': 'Scheme',
             }],
         }
 
         # given: v1 is stored
         self.storage.content_ctags_add([ctag_v1])
 
         # then: its single symbol is read back
         done_entry = {
             'id': self.sha1_2,
             'name': 'done',
             'kind': 'variable',
             'line': 100,
             'lang': 'Scheme',
             'tool': tool,
         }
         self.assertEqual(
             list(self.storage.content_ctags_get([self.sha1_2])),
             [done_entry])
 
         # when: v2 carries the v1 symbol plus a new one, asking for an update
         ctag_v2 = dict(ctag_v1, ctags=[
             {
                 'name': 'done',
                 'kind': 'variable',
                 'line': 100,
                 'lang': 'Scheme',
             },
             {
                 'name': 'defn',
                 'kind': 'function',
                 'line': 120,
                 'lang': 'Scheme',
             },
         ])
         self.storage.content_ctags_add([ctag_v2], conflict_update=True)
 
         # then: ctag did change as the v2 was used to overwrite v1
         defn_entry = {
             'id': self.sha1_2,
             'name': 'defn',
             'kind': 'function',
             'line': 120,
             'lang': 'Scheme',
             'tool': tool,
         }
         self.assertEqual(
             list(self.storage.content_ctags_get([self.sha1_2])),
             [done_entry, defn_entry])
 
     @istest
     def content_fossology_license_get(self):
         # Licenses stored for sha1_1 are returned with the tool description;
         # sha1_2, for which this test stores nothing, yields no entry.
         tool = self.fetch_tools()['nomos']
 
         # given
         self.storage.content_fossology_license_add([{
             'id': self.sha1_1,
             'licenses': ['GPL-2.0+'],
             'indexer_configuration_id': tool['id'],
         }])
 
         # when
         actual_licenses = list(self.storage.content_fossology_license_get(
             [self.sha1_2, self.sha1_1]))
 
         # then
         self.assertEqual(actual_licenses, [{
             'id': self.sha1_1,
             'licenses': ['GPL-2.0+'],
             'tool': tool,
         }])
 
     @istest
     def content_fossology_license_add__new_license_added(self):
         # Without conflict_update, re-adding the same license is a no-op and
         # a different license for the same id and tool is added to the
         # stored ones.
         tool = self.fetch_tools()['nomos']
 
         license_v1 = {
             'id': self.sha1_1,
             'licenses': ['Apache-2.0'],
             'indexer_configuration_id': tool['id'],
         }
 
         # given: v1 is added twice
         self.storage.content_fossology_license_add([license_v1])
         # conflict does nothing
         self.storage.content_fossology_license_add([license_v1])
 
         # then: the license is stored once
         self.assertEqual(
             list(self.storage.content_fossology_license_get([self.sha1_1])),
             [{
                 'id': self.sha1_1,
                 'licenses': ['Apache-2.0'],
                 'tool': tool,
             }])
 
         # when: v2 carries another license, default conflict policy
         license_v2 = dict(license_v1, licenses=['BSD-2-Clause'])
         self.storage.content_fossology_license_add([license_v2])
 
         # then: the v2 license was added next to the v1 one
         self.assertEqual(
             list(self.storage.content_fossology_license_get([self.sha1_1])),
             [{
                 'id': self.sha1_1,
                 'licenses': ['Apache-2.0', 'BSD-2-Clause'],
                 'tool': tool,
             }])
 
     @istest
     def content_fossology_license_add__update_in_place_duplicate(self):
         # With conflict_update=True, the licenses passed in v2 replace the
         # ones stored for the same id and tool.
         tool = self.fetch_tools()['nomos']
 
         license_v1 = {
             'id': self.sha1_1,
             'licenses': ['CECILL'],
             'indexer_configuration_id': tool['id'],
         }
 
         # given: v1 is added twice
         self.storage.content_fossology_license_add([license_v1])
         # conflict does nothing
         self.storage.content_fossology_license_add([license_v1])
 
         # then: the license is stored once
         self.assertEqual(
             list(self.storage.content_fossology_license_get([self.sha1_1])),
             [{
                 'id': self.sha1_1,
                 'licenses': ['CECILL'],
                 'tool': tool,
             }])
 
         # when: v2 carries another license, asking for an update
         license_v2 = dict(license_v1, licenses=['CECILL-2.0'])
         self.storage.content_fossology_license_add([license_v2],
                                                    conflict_update=True)
 
         # then: license did change as the v2 was used to overwrite v1
         self.assertEqual(
             list(self.storage.content_fossology_license_get([self.sha1_1])),
             [{
                 'id': self.sha1_1,
                 'licenses': ['CECILL-2.0'],
                 'tool': tool,
             }])
 
     @istest
     def content_metadata_missing(self):
         # Ids stay "missing" until metadata has been stored for them with
         # the queried tool.
         tool_id = self.fetch_tools()['swh-metadata-translator']['id']
 
         # given: the same tool is queried for both contents
         metadatas = [
             {'id': sha1, 'indexer_configuration_id': tool_id}
             for sha1 in (self.sha1_2, self.sha1_1)
         ]
 
         # when: this test has not stored any metadata yet
         missing = list(self.storage.content_metadata_missing(metadatas))
 
         # then: both ids are reported, in query order
         self.assertEqual(missing, [self.sha1_2, self.sha1_1])
 
         # given: metadata is stored for sha1_2 only
         translated_metadata = {
             'other': {},
             'codeRepository': {
                 'type': 'git',
                 'url': 'https://github.com/moranegg/metadata_test'
             },
             'description': 'Simple package.json test for indexer',
             'name': 'test_metadata',
             'version': '0.0.1'
         }
         self.storage.content_metadata_add([{
             'id': self.sha1_2,
             'translated_metadata': translated_metadata,
             'indexer_configuration_id': tool_id
         }])
 
         # when
         missing = list(self.storage.content_metadata_missing(metadatas))
 
         # then: only sha1_1 is still missing
         self.assertEqual(missing, [self.sha1_1])
 
     @istest
     def content_metadata_get(self):
         # Stored metadata is returned with its tool description; sha1_1, for
         # which this test stores nothing, yields no entry.
         tool = self.fetch_tools()['swh-metadata-translator']
 
         def package_json_metadata():
             # a fresh dict per call: input and expectation share nothing
             return {
                 'other': {},
                 'codeRepository': {
                     'type': 'git',
                     'url': 'https://github.com/moranegg/metadata_test'
                 },
                 'description': 'Simple package.json test for indexer',
                 'name': 'test_metadata',
                 'version': '0.0.1'
             }
 
         # given
         self.storage.content_metadata_add([{
             'id': self.sha1_2,
             'translated_metadata': package_json_metadata(),
             'indexer_configuration_id': tool['id'],
         }])
 
         # when
         actual_metadatas = list(self.storage.content_metadata_get(
             [self.sha1_2, self.sha1_1]))
 
         # then
         self.assertEqual(actual_metadatas, [{
             'id': self.sha1_2,
             'translated_metadata': package_json_metadata(),
             'tool': tool,
         }])
 
     @istest
     def content_metadata_add_drop_duplicate(self):
         # Without conflict_update, re-adding metadata for the same id and
         # tool leaves the stored value untouched.
         tool = self.fetch_tools()['swh-metadata-translator']
 
         def translation(name):
             # a fresh translated-metadata dict, differing only by its name
             return {
                 'other': {},
                 'name': name,
                 'version': '0.0.1'
             }
 
         metadata_v1 = {
             'id': self.sha1_2,
             'translated_metadata': translation('test_metadata'),
             'indexer_configuration_id': tool['id'],
         }
         expected_metadatas_v1 = [{
             'id': self.sha1_2,
             'translated_metadata': translation('test_metadata'),
             'tool': tool,
         }]
 
         # given: v1 is stored
         self.storage.content_metadata_add([metadata_v1])
 
         # then: v1 is read back
         self.assertEqual(
             list(self.storage.content_metadata_get([self.sha1_2])),
             expected_metadatas_v1)
 
         # when: a conflicting v2 is added with the default conflict policy
         metadata_v2 = dict(
             metadata_v1,
             translated_metadata=translation('test_drop_duplicated_metadata'))
         self.storage.content_metadata_add([metadata_v2])
 
         # then: metadata did not change as the v2 was dropped
         self.assertEqual(
             list(self.storage.content_metadata_get([self.sha1_2])),
             expected_metadatas_v1)
 
     @istest
     def content_metadata_add_update_in_place_duplicate(self):
         # With conflict_update=True, re-adding metadata for the same id and
         # tool overwrites the stored value.
         tool = self.fetch_tools()['swh-metadata-translator']
 
         def translation(name):
             # a fresh translated-metadata dict, differing only by its name
             return {
                 'other': {},
                 'name': name,
                 'version': '0.0.1'
             }
 
         metadata_v1 = {
             'id': self.sha1_2,
             'translated_metadata': translation('test_metadata'),
             'indexer_configuration_id': tool['id'],
         }
 
         # given: v1 is stored
         self.storage.content_metadata_add([metadata_v1])
 
         # then: v1 is read back
         self.assertEqual(
             list(self.storage.content_metadata_get([self.sha1_2])),
             [{
                 'id': self.sha1_2,
                 'translated_metadata': translation('test_metadata'),
                 'tool': tool,
             }])
 
         # when: a conflicting v2 is added, asking for an update
         metadata_v2 = dict(
             metadata_v1,
             translated_metadata=translation(
                 'test_update_duplicated_metadata'))
         self.storage.content_metadata_add([metadata_v2], conflict_update=True)
 
         # then: metadata did change as the v2 was used to overwrite v1
         self.assertEqual(
             list(self.storage.content_metadata_get([self.sha1_2])),
             [{
                 'id': self.sha1_2,
                 'translated_metadata': translation(
                     'test_update_duplicated_metadata'),
                 'tool': tool,
             }])
 
     @istest
     def revision_metadata_missing(self):
         # Revision ids stay "missing" until metadata has been stored for
         # them with the queried tool.
         tool_id = self.fetch_tools()['swh-metadata-detector']['id']
 
         # given: the same tool is queried for both revisions
         metadatas = [
             {'id': revision_id, 'indexer_configuration_id': tool_id}
             for revision_id in (self.revision_id_1, self.revision_id_2)
         ]
 
         # when: this test has not stored any metadata yet
         missing = list(self.storage.revision_metadata_missing(metadatas))
 
         # then: both ids are reported, in query order
         self.assertEqual(missing, [self.revision_id_1, self.revision_id_2])
 
         # given: metadata (every field set to None) is stored for
         # revision_id_1 only
         empty_translation = dict.fromkeys([
             'developmentStatus', 'version', 'operatingSystem', 'description',
             'keywords', 'issueTracker', 'name', 'author', 'relatedLink',
             'url', 'type', 'license', 'maintainer', 'email',
             'softwareRequirements', 'identifier',
         ])
         self.storage.revision_metadata_add([{
             'id': self.revision_id_1,
             'translated_metadata': empty_translation,
             'indexer_configuration_id': tool_id
         }])
 
         # when
         missing = list(self.storage.revision_metadata_missing(metadatas))
 
         # then: only revision_id_2 is still missing
         self.assertEqual(missing, [self.revision_id_2])
 
     @istest
     def revision_metadata_get(self):
         # Stored revision metadata is returned with its tool description;
         # revision_id_1, for which this test stores nothing, yields no entry.
         tool = self.fetch_tools()['swh-metadata-detector']
 
         # given: metadata whose fields are all None
         metadata_rev = {
             'id': self.revision_id_2,
             'translated_metadata': dict.fromkeys([
                 'developmentStatus', 'version', 'operatingSystem',
                 'description', 'keywords', 'issueTracker', 'name', 'author',
                 'relatedLink', 'url', 'type', 'license', 'maintainer',
                 'email', 'softwareRequirements', 'identifier',
             ]),
             'indexer_configuration_id': tool['id']
         }
         self.storage.revision_metadata_add([metadata_rev])
 
         # when
         actual_metadatas = list(self.storage.revision_metadata_get(
             [self.revision_id_2, self.revision_id_1]))
 
         # then
         self.assertEqual(actual_metadatas, [{
             'id': self.revision_id_2,
             'translated_metadata': metadata_rev['translated_metadata'],
             'tool': tool,
         }])
 
     @istest
     def revision_metadata_add_drop_duplicate(self):
         # Without conflict_update, re-adding metadata for the same revision
         # and tool leaves the stored value untouched.
         tool = self.fetch_tools()['swh-metadata-detector']
 
         # v1 has every field set to None
         metadata_v1 = {
             'id': self.revision_id_1,
             'translated_metadata': dict.fromkeys([
                 'developmentStatus', 'version', 'operatingSystem',
                 'description', 'keywords', 'issueTracker', 'name', 'author',
                 'relatedLink', 'url', 'type', 'license', 'maintainer',
                 'email', 'softwareRequirements', 'identifier',
             ]),
             'indexer_configuration_id': tool['id'],
         }
 
         # given: v1 is stored
         self.storage.revision_metadata_add([metadata_v1])
 
         # then: v1 is read back
         expected_metadatas_v1 = [{
             'id': self.revision_id_1,
             'translated_metadata': metadata_v1['translated_metadata'],
             'tool': tool,
         }]
         self.assertEqual(
             list(self.storage.revision_metadata_get([self.revision_id_1])),
             expected_metadatas_v1)
 
         # when: a conflicting v2 is added with the default conflict policy
         metadata_v2 = dict(metadata_v1, translated_metadata={
             'name': 'test_metadata',
             'author': 'MG',
         })
         self.storage.revision_metadata_add([metadata_v2])
 
         # then: metadata did not change as the v2 was dropped
         self.assertEqual(
             list(self.storage.revision_metadata_get([self.revision_id_1])),
             expected_metadatas_v1)
 
     @istest
     def revision_metadata_add_update_in_place_duplicate(self):
         # With conflict_update=True, re-adding metadata for the same
         # revision and tool overwrites the stored value.
         tool = self.fetch_tools()['swh-metadata-detector']
 
         # v1 has every field set to None
         metadata_v1 = {
             'id': self.revision_id_2,
             'translated_metadata': dict.fromkeys([
                 'developmentStatus', 'version', 'operatingSystem',
                 'description', 'keywords', 'issueTracker', 'name', 'author',
                 'relatedLink', 'url', 'type', 'license', 'maintainer',
                 'email', 'softwareRequirements', 'identifier',
             ]),
             'indexer_configuration_id': tool['id'],
         }
 
         # given: v1 is stored
         self.storage.revision_metadata_add([metadata_v1])
 
         # then: v1 is read back
         self.assertEqual(
             list(self.storage.revision_metadata_get([self.revision_id_2])),
             [{
                 'id': self.revision_id_2,
                 'translated_metadata': metadata_v1['translated_metadata'],
                 'tool': tool,
             }])
 
         # when: a conflicting v2 is added, asking for an update
         metadata_v2 = dict(metadata_v1, translated_metadata={
             'name': 'test_update_duplicated_metadata',
             'author': 'MG'
         })
         self.storage.revision_metadata_add([metadata_v2], conflict_update=True)
 
         # then: metadata did change as the v2 was used to overwrite v1
         self.assertEqual(
             list(self.storage.revision_metadata_get([self.revision_id_2])),
             [{
                 'id': self.revision_id_2,
                 'translated_metadata': metadata_v2['translated_metadata'],
                 'tool': tool,
             }])
 
     @istest
     def indexer_configuration_add(self):
         tool = {
             'tool_name': 'some-unknown-tool',
             'tool_version': 'some-version',
             'tool_configuration': {"debian-package": "some-package"},
         }
 
         actual_tool = self.storage.indexer_configuration_get(tool)
         self.assertIsNone(actual_tool)  # does not exist
 
         # add it
         actual_tools = list(self.storage.indexer_configuration_add([tool]))
 
         self.assertEquals(len(actual_tools), 1)
         actual_tool = actual_tools[0]
         self.assertIsNotNone(actual_tool)  # now it exists
         new_id = actual_tool.pop('id')
         self.assertEquals(actual_tool, tool)
 
         actual_tools2 = list(self.storage.indexer_configuration_add([tool]))
         actual_tool2 = actual_tools2[0]
         self.assertIsNotNone(actual_tool2)  # now it exists
         new_id2 = actual_tool2.pop('id')
 
         self.assertEqual(new_id, new_id2)
         self.assertEqual(actual_tool, actual_tool2)
 
     @istest
     def indexer_configuration_add_multiple(self):
         tool = {
             'tool_name': 'some-unknown-tool',
             'tool_version': 'some-version',
             'tool_configuration': {"debian-package": "some-package"},
         }
 
         actual_tools = list(self.storage.indexer_configuration_add([tool]))
         self.assertEqual(len(actual_tools), 1)
 
         new_tools = [tool, {
             'tool_name': 'yet-another-tool',
             'tool_version': 'version',
             'tool_configuration': {},
         }]
 
         actual_tools = list(self.storage.indexer_configuration_add(new_tools))
         self.assertEqual(len(actual_tools), 2)
 
         # order not guaranteed, so we iterate over results to check
         for tool in actual_tools:
             _id = tool.pop('id')
             self.assertIsNotNone(_id)
             self.assertIn(tool, new_tools)
 
     @istest
     def indexer_configuration_get_missing(self):
         tool = {
             'tool_name': 'unknown-tool',
             'tool_version': '3.1.0rc2-31-ga2cbb8c',
             'tool_configuration': {"command_line": "nomossa <filepath>"},
         }
 
         actual_tool = self.storage.indexer_configuration_get(tool)
 
         self.assertIsNone(actual_tool)
 
     @istest
     def indexer_configuration_get(self):
         tool = {
             'tool_name': 'nomos',
             'tool_version': '3.1.0rc2-31-ga2cbb8c',
             'tool_configuration': {"command_line": "nomossa <filepath>"},
         }
 
         actual_tool = self.storage.indexer_configuration_get(tool)
 
         expected_tool = tool.copy()
         expected_tool['id'] = 1
 
         self.assertEqual(expected_tool, actual_tool)
 
     @istest
     def indexer_configuration_metadata_get_missing_context(self):
         tool = {
             'tool_name': 'swh-metadata-translator',
             'tool_version': '0.0.1',
             'tool_configuration': {"context": "unknown-context"},
         }
 
         actual_tool = self.storage.indexer_configuration_get(tool)
 
         self.assertIsNone(actual_tool)
 
     @istest
     def indexer_configuration_metadata_get(self):
         tool = {
             'tool_name': 'swh-metadata-translator',
             'tool_version': '0.0.1',
             'tool_configuration': {"type": "local", "context": "npm"},
         }
 
         actual_tool = self.storage.indexer_configuration_get(tool)
 
         expected_tool = tool.copy()
         expected_tool['id'] = actual_tool['id']
 
         self.assertEqual(expected_tool, actual_tool)
 
 
 class IndexerTestStorage(CommonTestStorage, unittest.TestCase):
     """Running the tests locally.
 
     For the client api tests (remote storage), see
     `class`:swh.indexer.storage.test_api_client:TestRemoteStorage
     class.
 
     """
     pass
diff --git a/swh/indexer/tests/test_language.py b/swh/indexer/tests/test_language.py
index 96a431d..048f309 100644
--- a/swh/indexer/tests/test_language.py
+++ b/swh/indexer/tests/test_language.py
@@ -1,113 +1,113 @@
 # Copyright (C) 2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import unittest
 import logging
 from nose.tools import istest
 from swh.indexer import language
 from swh.indexer.language import ContentLanguageIndexer
 from swh.indexer.tests.test_utils import MockObjStorage
 
 
-class MockStorage():
+class _MockIndexerStorage():
     """Mock storage to simplify reading indexers' outputs.
     """
     def content_language_add(self, languages, conflict_update=None):
         self.state = languages
         self.conflict_update = conflict_update
 
     def indexer_configuration_add(self, tools):
         return [{
             'id': 20,
         }]
 
 
 class TestLanguageIndexer(ContentLanguageIndexer):
     """Specific language whose configuration is enough to satisfy the
        indexing tests.
     """
     def prepare(self):
         self.config = {
             'destination_queue': None,
             'rescheduling_task': None,
             'tools':  {
                 'name': 'pygments',
                 'version': '2.0.1+dfsg-1.1+deb8u1',
                 'configuration': {
                     'type': 'library',
                     'debian-package': 'python3-pygments',
                     'max_content_size': 10240,
                 },
             }
         }
-        self.storage = MockStorage()
+        self.idx_storage = _MockIndexerStorage()
         self.log = logging.getLogger('swh.indexer')
         self.objstorage = MockObjStorage()
         self.task_destination = None
         self.rescheduling_task = self.config['rescheduling_task']
         self.tool_config = self.config['tools']['configuration']
         self.max_content_size = self.tool_config['max_content_size']
         self.tools = self.register_tools(self.config['tools'])
         self.tool = self.tools[0]
 
 
 class Language(unittest.TestCase):
     """
     Tests pygments tool for language detection
     """
     def setUp(self):
         self.maxDiff = None
 
     @istest
     def test_compute_language_none(self):
         # given
         self.content = ""
         self.declared_language = {
             'lang': None
         }
         # when
         result = language.compute_language(self.content)
         # then
         self.assertEqual(self.declared_language, result)
 
     @istest
     def test_index_content_language_python(self):
         # given
         # testing python
         sha1s = ['02fb2c89e14f7fab46701478c83779c7beb7b069']
         lang_indexer = TestLanguageIndexer()
 
         # when
         lang_indexer.run(sha1s, policy_update='ignore-dups')
-        results = lang_indexer.storage.state
+        results = lang_indexer.idx_storage.state
 
         expected_results = [{
             'id': '02fb2c89e14f7fab46701478c83779c7beb7b069',
             'indexer_configuration_id': 20,
             'lang': 'python'
         }]
         # then
         self.assertEqual(expected_results, results)
 
     @istest
     def test_index_content_language_c(self):
         # given
         # testing c
         sha1s = ['103bc087db1d26afc3a0283f38663d081e9b01e6']
         lang_indexer = TestLanguageIndexer()
 
         # when
         lang_indexer.run(sha1s, policy_update='ignore-dups')
-        results = lang_indexer.storage.state
+        results = lang_indexer.idx_storage.state
 
         expected_results = [{
             'id': '103bc087db1d26afc3a0283f38663d081e9b01e6',
             'indexer_configuration_id': 20,
             'lang': 'c'
         }]
 
         # then
         self.assertEqual('c', results[0]['lang'])
         self.assertEqual(expected_results, results)
diff --git a/swh/indexer/tests/test_metadata.py b/swh/indexer/tests/test_metadata.py
index 74b8309..2953bfc 100644
--- a/swh/indexer/tests/test_metadata.py
+++ b/swh/indexer/tests/test_metadata.py
@@ -1,298 +1,305 @@
 # Copyright (C) 2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import unittest
 import logging
 from nose.tools import istest
 
 from swh.indexer.metadata_dictionary import compute_metadata
 from swh.indexer.metadata_detector import detect_metadata
 from swh.indexer.metadata import ContentMetadataIndexer
 from swh.indexer.metadata import RevisionMetadataIndexer
-from swh.indexer.tests.test_utils import MockObjStorage
-from swh.indexer.tests.test_utils import MockStorage
+from swh.indexer.tests.test_utils import MockObjStorage, MockStorage
+from swh.indexer.tests.test_utils import MockIndexerStorage
 
 
 class TestContentMetadataIndexer(ContentMetadataIndexer):
     """Specific Metadata whose configuration is enough to satisfy the
        indexing tests.
     """
     def prepare(self):
         self.config.update({
             'rescheduling_task': None,
         })
-        self.storage = MockStorage()
+        self.idx_storage = MockIndexerStorage()
         self.log = logging.getLogger('swh.indexer')
         self.objstorage = MockObjStorage()
         self.task_destination = None
         self.rescheduling_task = self.config['rescheduling_task']
         self.tools = self.register_tools(self.config['tools'])
         self.tool = self.tools[0]
         self.results = []
 
 
 class TestRevisionMetadataIndexer(RevisionMetadataIndexer):
     """Specific indexer whose configuration is enough to satisfy the
        indexing tests.
     """
     def prepare(self):
         self.config = {
             'rescheduling_task': None,
+            'storage': {
+                'cls': 'remote',
+                'args': {
+                    'url': 'http://localhost:9999',
+                }
+            },
             'tools': {
                 'name': 'swh-metadata-detector',
                 'version': '0.0.1',
                 'configuration': {
                     'type': 'local',
                     'context': 'npm'
                 }
             }
         }
         self.storage = MockStorage()
+        self.idx_storage = MockIndexerStorage()
         self.log = logging.getLogger('swh.indexer')
         self.objstorage = MockObjStorage()
         self.task_destination = None
         self.rescheduling_task = self.config['rescheduling_task']
         self.tools = self.register_tools(self.config['tools'])
         self.tool = self.tools[0]
         self.results = []
 
 
 class Metadata(unittest.TestCase):
     """
     Tests metadata_mock_tool tool for Metadata detection
     """
     def setUp(self):
         """
         shows the entire diff in the results
         """
         self.maxDiff = None
         self.content_tool = {
             'name': 'swh-metadata-translator',
             'version': '0.0.1',
             'configuration': {
                 'type': 'local',
                 'context': 'npm'
             }
         }
 
     @istest
     def test_compute_metadata_none(self):
         """
         testing content empty content is empty
         should return None
         """
         # given
         content = b""
         context = "npm"
 
         # None if no metadata was found or an error occurred
         declared_metadata = None
         # when
         result = compute_metadata(context, content)
         # then
         self.assertEqual(declared_metadata, result)
 
     @istest
     def test_compute_metadata_npm(self):
         """
         testing only computation of metadata with hard_mapping_npm
         """
         # given
         content = b"""
             {
                 "name": "test_metadata",
                 "version": "0.0.1",
                 "description": "Simple package.json test for indexer",
                   "repository": {
                     "type": "git",
                     "url": "https://github.com/moranegg/metadata_test"
                 }
             }
         """
         declared_metadata = {
             'name': 'test_metadata',
             'version': '0.0.1',
             'description': 'Simple package.json test for indexer',
             'codeRepository': {
                 'type': 'git',
                 'url': 'https://github.com/moranegg/metadata_test'
               },
             'other': {}
         }
 
         # when
         result = compute_metadata("npm", content)
         # then
         self.assertEqual(declared_metadata, result)
 
     @istest
     def test_index_content_metadata_npm(self):
         """
         testing NPM with package.json
         - one sha1 uses a file that can't be translated to metadata and
           should return None in the translated metadata
         """
         # given
         sha1s = ['26a9f72a7c87cc9205725cfd879f514ff4f3d8d5',
                  'd4c647f0fc257591cc9ba1722484229780d1c607',
                  '02fb2c89e14f7fab46701478c83779c7beb7b069']
         # this metadata indexer computes only metadata for package.json
         # in npm context with a hard mapping
         metadata_indexer = TestContentMetadataIndexer(
             tool=self.content_tool, config={})
 
         # when
         metadata_indexer.run(sha1s, policy_update='ignore-dups')
-        results = metadata_indexer.storage.state
+        results = metadata_indexer.idx_storage.state
 
         expected_results = [{
             'indexer_configuration_id': 30,
             'translated_metadata': {
                 'other': {},
                 'codeRepository': {
                     'type': 'git',
                     'url': 'https://github.com/moranegg/metadata_test'
                 },
                 'description': 'Simple package.json test for indexer',
                 'name': 'test_metadata',
                 'version': '0.0.1'
             },
             'id': '26a9f72a7c87cc9205725cfd879f514ff4f3d8d5'
             }, {
             'indexer_configuration_id': 30,
             'translated_metadata': {
                 'softwareRequirements': {
                         'JSONStream': '~1.3.1',
                         'abbrev': '~1.1.0',
                         'ansi-regex': '~2.1.1',
                         'ansicolors': '~0.3.2',
                         'ansistyles': '~0.1.3'
                 },
                 'issueTracker': {
                     'url': 'https://github.com/npm/npm/issues'
                 },
                 'author':
                     'Isaac Z. Schlueter <i@izs.me> (http://blog.izs.me)',
                 'codeRepository': {
                     'type': 'git',
                     'url': 'https://github.com/npm/npm'
                 },
                 'description': 'a package manager for JavaScript',
                 'softwareSuggestions': {
                         'tacks': '~1.2.6',
                         'tap': '~10.3.2'
                 },
                 'license': 'Artistic-2.0',
                 'version': '5.0.3',
                 'other': {
                     'preferGlobal': True,
                     'config': {
                         'publishtest': False
                     }
                 },
                 'name': 'npm',
                 'keywords': [
                     'install',
                     'modules',
                     'package manager',
                     'package.json'
                 ],
                 'url': 'https://docs.npmjs.com/'
             },
             'id': 'd4c647f0fc257591cc9ba1722484229780d1c607'
             }, {
             'indexer_configuration_id': 30,
             'translated_metadata': None,
             'id': '02fb2c89e14f7fab46701478c83779c7beb7b069'
         }]
 
         # The assertion bellow returns False sometimes because of nested lists
         self.assertEqual(expected_results, results)
 
     @istest
     def test_detect_metadata_package_json(self):
         # given
         df = [{
                 'sha1_git': b'abc',
                 'name': b'index.js',
                 'target': b'abc',
                 'length': 897,
                 'status': 'visible',
                 'type': 'file',
                 'perms': 33188,
                 'dir_id': b'dir_a',
                 'sha1': b'bcd'
             },
             {
                 'sha1_git': b'aab',
                 'name': b'package.json',
                 'target': b'aab',
                 'length': 712,
                 'status': 'visible',
                 'type': 'file',
                 'perms': 33188,
                 'dir_id': b'dir_a',
                 'sha1': b'cde'
         }]
         # when
         results = detect_metadata(df)
 
         expected_results = {
             'npm': [
                 b'cde'
             ]
         }
         # then
         self.assertEqual(expected_results, results)
 
     @istest
     def test_revision_metadata_indexer(self):
         metadata_indexer = TestRevisionMetadataIndexer()
 
         sha1_gits = [
             b'8dbb6aeb036e7fd80664eb8bfd1507881af1ba9f',
         ]
         metadata_indexer.run(sha1_gits, 'update-dups')
 
-        results = metadata_indexer.storage.state
+        results = metadata_indexer.idx_storage.state
 
         expected_results = [{
             'id': b'8dbb6aeb036e7fd80664eb8bfd1507881af1ba9f',
             'translated_metadata': {
                 'identifier': None,
                 'maintainer': None,
                 'url': [
                     'https://github.com/librariesio/yarn-parser#readme'
                 ],
                 'codeRepository': [{
                     'type': 'git',
                     'url': 'git+https://github.com/librariesio/yarn-parser.git'
                 }],
                 'author': ['Andrew Nesbitt'],
                 'license': ['AGPL-3.0'],
                 'version': ['1.0.0'],
                 'description': [
                     'Tiny web service for parsing yarn.lock files'
                 ],
                 'relatedLink': None,
                 'developmentStatus': None,
                 'operatingSystem': None,
                 'issueTracker': [{
                     'url': 'https://github.com/librariesio/yarn-parser/issues'
                 }],
                 'softwareRequirements': [{
                     'express': '^4.14.0',
                     'yarn': '^0.21.0',
                     'body-parser': '^1.15.2'
                 }],
                 'name': ['yarn-parser'],
                 'keywords': [['yarn', 'parse', 'lock', 'dependencies']],
                 'type': None,
                 'email': None
             },
             'indexer_configuration_id': 7
         }]
         # then
         self.assertEqual(expected_results, results)
diff --git a/swh/indexer/tests/test_mimetype.py b/swh/indexer/tests/test_mimetype.py
index a15b971..63f6044 100644
--- a/swh/indexer/tests/test_mimetype.py
+++ b/swh/indexer/tests/test_mimetype.py
@@ -1,158 +1,158 @@
 # Copyright (C) 2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import unittest
 import logging
 from nose.tools import istest
 
 from swh.indexer.mimetype import ContentMimetypeIndexer
 
 from swh.indexer.tests.test_utils import MockObjStorage
 
 
-class _MockStorage():
+class _MockIndexerStorage():
     """Mock storage to simplify reading indexers' outputs.
 
     """
     def content_mimetype_add(self, mimetypes, conflict_update=None):
         self.state = mimetypes
         self.conflict_update = conflict_update
 
     def indexer_configuration_add(self, tools):
         return [{
             'id': 10,
         }]
 
 
 class TestMimetypeIndexer(ContentMimetypeIndexer):
     """Specific mimetype whose configuration is enough to satisfy the
        indexing tests.
 
     """
     def prepare(self):
         self.config = {
             'destination_queue': None,
             'rescheduling_task': None,
             'tools': {
                 'name': 'file',
                 'version': '1:5.30-1+deb9u1',
                 'configuration': {
                     "type": "library",
                     "debian-package": "python3-magic"
                 },
             },
         }
-        self.storage = _MockStorage()
+        self.idx_storage = _MockIndexerStorage()
         self.log = logging.getLogger('swh.indexer')
         self.objstorage = MockObjStorage()
         self.task_destination = None
         self.rescheduling_task = self.config['rescheduling_task']
         self.destination_queue = self.config['destination_queue']
         self.tools = self.register_tools(self.config['tools'])
         self.tool = self.tools[0]
 
 
 class TestMimetypeIndexerUnknownToolStorage(TestMimetypeIndexer):
     """Specific mimetype whose configuration is not enough to satisfy the
        indexing tests.
 
     """
     def prepare(self):
         super().prepare()
         self.tools = None
 
 
 class TestMimetypeIndexerWithErrors(unittest.TestCase):
     @istest
     def wrong_unknown_configuration_tool(self):
         """Indexer with unknown configuration tool should fail the check"""
         with self.assertRaisesRegex(ValueError, 'Tools None is unknown'):
             TestMimetypeIndexerUnknownToolStorage()
 
 
 class TestMimetypeIndexerTest(unittest.TestCase):
     def setUp(self):
         self.indexer = TestMimetypeIndexer()
 
     @istest
     def test_index_no_update(self):
         # given
         sha1s = [
             '01c9379dfc33803963d07c1ccc748d3fe4c96bb5',
             '688a5ef812c53907562fe379d4b3851e69c7cb15',
         ]
 
         # when
         self.indexer.run(sha1s, policy_update='ignore-dups')
 
         # then
         expected_results = [{
             'id': '01c9379dfc33803963d07c1ccc748d3fe4c96bb5',
             'indexer_configuration_id': 10,
             'mimetype': b'text/plain',
             'encoding': b'us-ascii',
         }, {
             'id': '688a5ef812c53907562fe379d4b3851e69c7cb15',
             'indexer_configuration_id': 10,
             'mimetype': b'text/plain',
             'encoding': b'us-ascii',
         }]
 
-        self.assertFalse(self.indexer.storage.conflict_update)
-        self.assertEquals(expected_results, self.indexer.storage.state)
+        self.assertFalse(self.indexer.idx_storage.conflict_update)
+        self.assertEquals(expected_results, self.indexer.idx_storage.state)
 
     @istest
     def test_index_update(self):
         # given
         sha1s = [
             '01c9379dfc33803963d07c1ccc748d3fe4c96bb5',
             '688a5ef812c53907562fe379d4b3851e69c7cb15',
             'da39a3ee5e6b4b0d3255bfef95601890afd80709',  # empty content
         ]
 
         # when
         self.indexer.run(sha1s, policy_update='update-dups')
 
         # then
         expected_results = [{
             'id': '01c9379dfc33803963d07c1ccc748d3fe4c96bb5',
             'indexer_configuration_id': 10,
             'mimetype': b'text/plain',
             'encoding': b'us-ascii',
         }, {
             'id': '688a5ef812c53907562fe379d4b3851e69c7cb15',
             'indexer_configuration_id': 10,
             'mimetype': b'text/plain',
             'encoding': b'us-ascii',
         }, {
             'id': 'da39a3ee5e6b4b0d3255bfef95601890afd80709',
             'indexer_configuration_id': 10,
             'mimetype': b'application/x-empty',
             'encoding': b'binary',
         }]
 
-        self.assertTrue(self.indexer.storage.conflict_update)
-        self.assertEquals(expected_results, self.indexer.storage.state)
+        self.assertTrue(self.indexer.idx_storage.conflict_update)
+        self.assertEquals(expected_results, self.indexer.idx_storage.state)
 
     @istest
     def test_index_one_unknown_sha1(self):
         # given
         sha1s = ['688a5ef812c53907562fe379d4b3851e69c7cb15',
                  '799a5ef812c53907562fe379d4b3851e69c7cb15',  # unknown
                  '800a5ef812c53907562fe379d4b3851e69c7cb15']  # unknown
 
         # when
         self.indexer.run(sha1s, policy_update='update-dups')
 
         # then
         expected_results = [{
             'id': '688a5ef812c53907562fe379d4b3851e69c7cb15',
             'indexer_configuration_id': 10,
             'mimetype': b'text/plain',
             'encoding': b'us-ascii',
         }]
 
-        self.assertTrue(self.indexer.storage.conflict_update)
-        self.assertEquals(expected_results, self.indexer.storage.state)
+        self.assertTrue(self.indexer.idx_storage.conflict_update)
+        self.assertEquals(expected_results, self.indexer.idx_storage.state)
diff --git a/swh/indexer/tests/test_utils.py b/swh/indexer/tests/test_utils.py
index 328a062..41c9068 100644
--- a/swh/indexer/tests/test_utils.py
+++ b/swh/indexer/tests/test_utils.py
@@ -1,254 +1,261 @@
 # Copyright (C) 2017  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 
 from swh.objstorage.exc import ObjNotFoundError
 
 
 class MockObjStorage:
-    """Mock objstorage with predefined contents.
+    """Mock an swh-objstorage objstorage with predefined contents.
 
     """
     data = {}
 
     def __init__(self):
         self.data = {
             '01c9379dfc33803963d07c1ccc748d3fe4c96bb5': b'this is some text',
             '688a5ef812c53907562fe379d4b3851e69c7cb15': b'another text',
             '8986af901dd2043044ce8f0d8fc039153641cf17': b'yet another text',
             '02fb2c89e14f7fab46701478c83779c7beb7b069': b"""
             import unittest
             import logging
             from nose.tools import istest
             from swh.indexer.mimetype import ContentMimetypeIndexer
             from swh.indexer.tests.test_utils import MockObjStorage
 
             class MockStorage():
                 def content_mimetype_add(self, mimetypes):
                     self.state = mimetypes
                     self.conflict_update = conflict_update
 
                 def indexer_configuration_add(self, tools):
                     return [{
                         'id': 10,
                     }]
             """,
             '103bc087db1d26afc3a0283f38663d081e9b01e6': b"""
                 #ifndef __AVL__
                 #define __AVL__
 
                 typedef struct _avl_tree avl_tree;
 
                 typedef struct _data_t {
                   int content;
                 } data_t;
             """,
             '93666f74f1cf635c8c8ac118879da6ec5623c410': b"""
             (should 'pygments (recognize 'lisp 'easily))
 
             """,
             '26a9f72a7c87cc9205725cfd879f514ff4f3d8d5': b"""
             {
                 "name": "test_metadata",
                 "version": "0.0.1",
                 "description": "Simple package.json test for indexer",
                 "repository": {
                   "type": "git",
                   "url": "https://github.com/moranegg/metadata_test"
               }
             }
             """,
             'd4c647f0fc257591cc9ba1722484229780d1c607': b"""
             {
               "version": "5.0.3",
               "name": "npm",
               "description": "a package manager for JavaScript",
               "keywords": [
                 "install",
                 "modules",
                 "package manager",
                 "package.json"
               ],
               "preferGlobal": true,
               "config": {
                 "publishtest": false
               },
               "homepage": "https://docs.npmjs.com/",
               "author": "Isaac Z. Schlueter <i@izs.me> (http://blog.izs.me)",
               "repository": {
                 "type": "git",
                 "url": "https://github.com/npm/npm"
               },
               "bugs": {
                 "url": "https://github.com/npm/npm/issues"
               },
               "dependencies": {
                 "JSONStream": "~1.3.1",
                 "abbrev": "~1.1.0",
                 "ansi-regex": "~2.1.1",
                 "ansicolors": "~0.3.2",
                 "ansistyles": "~0.1.3"
               },
               "devDependencies": {
                 "tacks": "~1.2.6",
                 "tap": "~10.3.2"
               },
               "license": "Artistic-2.0"
             }
 
             """,
             'a7ab314d8a11d2c93e3dcf528ca294e7b431c449': b"""
             """,
             'da39a3ee5e6b4b0d3255bfef95601890afd80709': b'',
         }
 
     def __iter__(self):
         yield from self.data.keys()
 
     def __contains__(self, sha1):
         return self.data.get(sha1) is not None
 
     def get(self, sha1):
         raw_content = self.data.get(sha1)
         if raw_content is None:
             raise ObjNotFoundError(sha1)
         return raw_content
 
 
-class MockStorage():
-    """Mock storage to simplify reading indexers' outputs.
-    """
-    def content_metadata_missing(self, sha1s):
-        yield from []
-
-    def content_metadata_add(self, metadata, conflict_update=None):
-        self.state = metadata
-        self.conflict_update = conflict_update
-
-    def revision_metadata_add(self, metadata, conflict_update=None):
-        self.state = metadata
-        self.conflict_update = conflict_update
+class MockIndexerStorage():
+    """Mock an swh-indexer storage.
 
+    """
     def indexer_configuration_add(self, tools):
         tool = tools[0]
         if tool['tool_name'] == 'swh-metadata-translator':
             return [{
                 'id': 30,
                 'tool_name': 'swh-metadata-translator',
                 'tool_version': '0.0.1',
                 'tool_configuration': {
                     'type': 'local',
                     'context': 'npm'
                 },
             }]
         elif tool['tool_name'] == 'swh-metadata-detector':
             return [{
                 'id': 7,
                 'tool_name': 'swh-metadata-detector',
                 'tool_version': '0.0.1',
                 'tool_configuration': {
                     'type': 'local',
                     'context': 'npm'
                 },
             }]
 
+    def content_metadata_missing(self, sha1s):
+        yield from []
+
+    def content_metadata_add(self, metadata, conflict_update=None):
+        self.state = metadata
+        self.conflict_update = conflict_update
+
+    def revision_metadata_add(self, metadata, conflict_update=None):
+        self.state = metadata
+        self.conflict_update = conflict_update
+
+    def content_metadata_get(self, sha1s):
+        return [{  # fixed fixture; the sha1s argument is not consulted
+            'tool': {
+                'configuration': {
+                    'type': 'local',
+                    'context': 'npm'
+                    },
+                'version': '0.0.1',
+                'id': 6,
+                'name': 'swh-metadata-translator'
+            },
+            'id': b'cde',  # equals package.json's sha1 in directory_ls
+            'translated_metadata': {
+                'issueTracker': {
+                    'url': 'https://github.com/librariesio/yarn-parser/issues'
+                },
+                'version': '1.0.0',
+                'name': 'yarn-parser',
+                'author': 'Andrew Nesbitt',
+                'url': 'https://github.com/librariesio/yarn-parser#readme',
+                'processorRequirements': {'node': '7.5'},
+                'other': {
+                    'scripts': {
+                                    'start': 'node index.js'
+                    },
+                    'main': 'index.js'
+                },
+                'license': 'AGPL-3.0',
+                'keywords': ['yarn', 'parse', 'lock', 'dependencies'],
+                'codeRepository': {
+                    'type': 'git',
+                    'url': 'git+https://github.com/librariesio/yarn-parser.git'
+                },
+                'description': 'Tiny web service for parsing yarn.lock files',
+                'softwareRequirements': {
+                    'yarn': '^0.21.0',
+                    'express': '^4.14.0',
+                    'body-parser': '^1.15.2'}
+                }
+        }]
+
+
+class MockStorage():
+    """Mock a real swh-storage storage to simplify reading indexers'
+    outputs.
+
+    """
     def revision_get(self, revisions):
         return [{
             'id': b'8dbb6aeb036e7fd80664eb8bfd1507881af1ba9f',
             'committer': {
                 'id': 26,
                 'name': b'Andrew Nesbitt',
                 'fullname': b'Andrew Nesbitt <andrewnez@gmail.com>',
                 'email': b'andrewnez@gmail.com'
             },
             'synthetic': False,
             'date': {
                 'negative_utc': False,
                 'timestamp': {
                     'seconds': 1487596456,
                     'microseconds': 0
                 },
                 'offset': 0
             },
             'directory': b'10'
         }]
 
     def directory_ls(self, directory, recursive=False, cur=None):
         # with directory: b'\x9d',
         return [{
                 'sha1_git': b'abc',
                 'name': b'index.js',
                 'target': b'abc',
                 'length': 897,
                 'status': 'visible',
                 'type': 'file',
                 'perms': 33188,
                 'dir_id': b'10',
                 'sha1': b'bcd'
                 },
                 {
                 'sha1_git': b'aab',
                 'name': b'package.json',
                 'target': b'aab',
                 'length': 712,
                 'status': 'visible',
                 'type': 'file',
                 'perms': 33188,
                 'dir_id': b'10',
                 'sha1': b'cde'
                 },
                 {
                 'dir_id': b'10',
                 'target': b'11',
                 'type': 'dir',
                 'length': None,
                 'name': b'.github',
                 'sha1': None,
                 'perms': 16384,
                 'sha1_git': None,
                 'status': None,
                 'sha256': None
                 }]
-
-    def content_metadata_get(self, sha1s):
-        return [{
-            'tool': {
-                'configuration': {
-                    'type': 'local',
-                    'context': 'npm'
-                    },
-                'version': '0.0.1',
-                'id': 6,
-                'name': 'swh-metadata-translator'
-            },
-            'id': b'cde',
-            'translated_metadata': {
-                'issueTracker': {
-                    'url': 'https://github.com/librariesio/yarn-parser/issues'
-                },
-                'version': '1.0.0',
-                'name': 'yarn-parser',
-                'author': 'Andrew Nesbitt',
-                'url': 'https://github.com/librariesio/yarn-parser#readme',
-                'processorRequirements': {'node': '7.5'},
-                'other': {
-                    'scripts': {
-                                    'start': 'node index.js'
-                    },
-                    'main': 'index.js'
-                },
-                'license': 'AGPL-3.0',
-                'keywords': ['yarn', 'parse', 'lock', 'dependencies'],
-                'codeRepository': {
-                    'type': 'git',
-                    'url': 'git+https://github.com/librariesio/yarn-parser.git'
-                },
-                'description': 'Tiny web service for parsing yarn.lock files',
-                'softwareRequirements': {
-                    'yarn': '^0.21.0',
-                    'express': '^4.14.0',
-                    'body-parser': '^1.15.2'}
-                }
-        }]