diff --git a/sql/upgrades/118.sql b/sql/upgrades/118.sql new file mode 100644 index 0000000..b2c4930 --- /dev/null +++ b/sql/upgrades/118.sql @@ -0,0 +1,11 @@ +-- SWH Indexer DB schema upgrade +-- from_version: 117 +-- to_version: 118 +-- description: content_mimetype: Migrate bytea columns to text + +insert into dbversion(version, release, description) +values(118, now(), 'Work In Progress'); + +alter table content_mimetype + alter column mimetype set data type text using convert_from(mimetype, 'utf-8'), + alter column encoding set data type text using convert_from(encoding, 'utf-8'); diff --git a/swh/indexer/mimetype.py b/swh/indexer/mimetype.py index ee5e735..1877644 100644 --- a/swh/indexer/mimetype.py +++ b/swh/indexer/mimetype.py @@ -1,153 +1,153 @@ # Copyright (C) 2016-2018 The Software Heritage developers # See the AUTHORS file at the top-level directory of this distribution # License: GNU General Public License version 3, or any later version # See top-level LICENSE file for more information import magic from swh.model import hashutil from .indexer import ContentIndexer, ContentRangeIndexer def compute_mimetype_encoding(raw_content): """Determine mimetype and encoding from the raw content. Args: raw_content (bytes): content's raw data Returns: A dict with 'mimetype' and 'encoding' keys and corresponding string values. """ r = magic.detect_from_content(raw_content) return { - 'mimetype': r.mime_type.encode('utf-8'), - 'encoding': r.encoding.encode('utf-8'), + 'mimetype': r.mime_type, + 'encoding': r.encoding, } class MixinMimetypeIndexer: """Mixin mimetype indexer. See :class:`ContentMimetypeIndexer` and :class:`MimetypeRangeIndexer` """ ADDITIONAL_CONFIG = { 'tools': ('dict', { 'name': 'file', 'version': '1:5.30-1+deb9u1', 'configuration': { "type": "library", "debian-package": "python3-magic" }, }), 'write_batch_size': ('int', 1000), } CONFIG_BASE_FILENAME = 'indexer/mimetype' def prepare(self): super().prepare() self.tool = self.tools[0] def index(self, id, data): """Index sha1s' content and store result. Args: id (bytes): content's identifier data (bytes): raw content in bytes Returns: A dict, representing a content_mimetype, with keys: - id (bytes): content's identifier (sha1) - mimetype (str): detected mimetype - encoding (str): detected encoding """ try: properties = compute_mimetype_encoding(data) properties.update({ 'id': id, 'indexer_configuration_id': self.tool['id'], }) except TypeError: self.log.error('Error detecting mimetype for id %s' % ( hashutil.hash_to_hex(id), )) return None return properties def persist_index_computations(self, results, policy_update): """Persist the results in storage. Args: results ([dict]): list of content_mimetype, dict with the following keys: - id (bytes): content's identifier (sha1) - mimetype (str): detected mimetype - encoding (str): detected encoding policy_update (str): either 'update-dups' or 'ignore-dups' to respectively update duplicates or ignore them """ self.idx_storage.content_mimetype_add( results, conflict_update=(policy_update == 'update-dups')) class ContentMimetypeIndexer(MixinMimetypeIndexer, ContentIndexer): """Mimetype Indexer working on list of content identifiers. It: - (optionally) filters out content already indexed (cf. :callable:`filter`) - reads content from objstorage per the content's id (sha1) - computes {mimetype, encoding} from that content - stores result in storage FIXME: - 1. Rename redundant ContentMimetypeIndexer to MimetypeIndexer - 2. Do we keep it afterwards? ~> I think this can be used with the journal """
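# Editorial aside: a minimal sketch of what compute_mimetype_encoding above
# returns after this change; values are now plain str rather than bytes. The
# exact mimetype/encoding shown here are illustrative only (they depend on
# the libmagic build):
#
#     >>> compute_mimetype_encoding(b'def main():\n    pass\n')
#     {'mimetype': 'text/x-python', 'encoding': 'us-ascii'}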
def filter(self, ids): """Filter out known sha1s and return only missing ones. """ yield from self.idx_storage.content_mimetype_missing(( { 'id': sha1, 'indexer_configuration_id': self.tool['id'], } for sha1 in ids )) class MimetypeRangeIndexer(MixinMimetypeIndexer, ContentRangeIndexer): """Mimetype Range Indexer working on range of content identifiers. It: - (optionally) filters out content already indexed (cf. :callable:`range`) - reads content from objstorage per the content's id (sha1) - computes {mimetype, encoding} from that content - stores result in storage """ def indexed_contents_in_range(self, start, end): """Retrieve indexed content ids within the range [start, end]. Args: **start** (bytes): Starting bound of the range (inclusive) **end** (bytes): Ending bound of the range (inclusive) Returns: a dict with keys: - **ids** [bytes]: iterable of content ids within the range. - **next** (Optional[bytes]): The next range of sha1 starts at this sha1 if any """ return self.idx_storage.content_mimetype_get_range( start, end, self.tool['id']) diff --git a/swh/indexer/sql/30-swh-schema.sql b/swh/indexer/sql/30-swh-schema.sql index 62b61ea..ddd0d71 100644 --- a/swh/indexer/sql/30-swh-schema.sql +++ b/swh/indexer/sql/30-swh-schema.sql @@ -1,141 +1,141 @@ --- --- Software Heritage Indexers Data Model --- -- drop schema if exists swh cascade; -- create schema swh; -- set search_path to swh; create table dbversion ( version int primary key, release timestamptz, description text ); insert into dbversion(version, release, description) - values(117, now(), 'Work In Progress'); + values(118, now(), 'Work In Progress'); -- Computing metadata on sha1's contents -- a SHA1 checksum (not necessarily originating from Git) create domain sha1 as bytea check (length(value) = 20); -- a Git object ID, i.e., a SHA1 checksum create domain sha1_git as bytea check (length(value) = 20); create table indexer_configuration ( id serial not null, tool_name text not null, tool_version text not null, tool_configuration jsonb ); comment on table indexer_configuration is 'Indexer''s configuration version'; comment on column indexer_configuration.id is 'Tool identifier'; comment on column indexer_configuration.tool_name is 'Tool name'; comment on column indexer_configuration.tool_version is 'Tool version'; comment on column indexer_configuration.tool_configuration is 'Tool configuration: command line, flags, etc...';
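-- Editorial aside: a hedged illustration (not part of the schema itself) of
-- how rows in the property tables that follow are joined back to the tool
-- that produced them, which is the shape the storage tests in this patch
-- expect:
--
--   select m.id, m.mimetype, m.encoding,
--          i.tool_name, i.tool_version, i.tool_configuration
--   from content_mimetype m
--   inner join indexer_configuration i
--     on i.id = m.indexer_configuration_id;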
-- Properties (mimetype, encoding, etc...) create table content_mimetype ( id sha1 not null, - mimetype bytea not null, - encoding bytea not null, + mimetype text not null, + encoding text not null, indexer_configuration_id bigint not null ); comment on table content_mimetype is 'Metadata associated with a raw content'; comment on column content_mimetype.mimetype is 'Raw content Mimetype'; comment on column content_mimetype.encoding is 'Raw content encoding'; comment on column content_mimetype.indexer_configuration_id is 'Tool used to compute the information'; -- Language metadata create table content_language ( id sha1 not null, lang languages not null, indexer_configuration_id bigint not null ); comment on table content_language is 'Language information on a raw content'; comment on column content_language.lang is 'Language information'; comment on column content_language.indexer_configuration_id is 'Tool used to compute the information'; -- ctags information per content create table content_ctags ( id sha1 not null, name text not null, kind text not null, line bigint not null, lang ctags_languages not null, indexer_configuration_id bigint not null ); comment on table content_ctags is 'Ctags information on a raw content'; comment on column content_ctags.id is 'Content identifier'; comment on column content_ctags.name is 'Symbol name'; comment on column content_ctags.kind is 'Symbol kind (function, class, variable, const...)'; comment on column content_ctags.line is 'Symbol line'; comment on column content_ctags.lang is 'Language information for that content'; comment on column content_ctags.indexer_configuration_id is 'Tool used to compute the information'; create table fossology_license( id smallserial, name text not null ); comment on table fossology_license is 'Possible licenses recognized by the license indexer'; comment on column fossology_license.id is 'License identifier'; comment on column fossology_license.name is 'License name'; create table content_fossology_license ( id sha1 not null, license_id smallserial not null, indexer_configuration_id bigint not null ); comment on table content_fossology_license is 'License associated with a raw content'; comment on column content_fossology_license.id is 'Raw content identifier'; comment on column content_fossology_license.license_id is 'One of the content''s license identifiers'; comment on column content_fossology_license.indexer_configuration_id is 'Tool used to compute the information'; -- The table content_metadata provides a translation for files -- identified as potentially containing metadata, with a translation tool (indexer_configuration_id) create table content_metadata( id sha1 not null, translated_metadata jsonb not null, indexer_configuration_id bigint not null ); comment on table content_metadata is 'metadata semantically translated from a content file'; comment on column content_metadata.id is 'sha1 of content file'; comment on column content_metadata.translated_metadata is 'result of translation with defined format'; comment on column content_metadata.indexer_configuration_id is 'tool used for translation'; -- The table revision_metadata provides a minimal set of intrinsic metadata -- detected with the detection tool (indexer_configuration_id) and aggregated -- from the content_metadata translation.
create table revision_metadata( id sha1_git not null, translated_metadata jsonb not null, indexer_configuration_id bigint not null ); comment on table revision_metadata is 'metadata semantically detected and translated in a revision'; comment on column revision_metadata.id is 'sha1_git of revision'; comment on column revision_metadata.translated_metadata is 'result of detection and translation with defined format'; comment on column revision_metadata.indexer_configuration_id is 'tool used for detection'; create table origin_intrinsic_metadata( origin_id bigserial not null, metadata jsonb, indexer_configuration_id bigint not null, from_revision sha1_git not null, metadata_tsvector tsvector ); comment on table origin_intrinsic_metadata is 'keeps intrinsic metadata for an origin'; comment on column origin_intrinsic_metadata.origin_id is 'the entry id in origin'; comment on column origin_intrinsic_metadata.metadata is 'metadata extracted from a revision'; comment on column origin_intrinsic_metadata.indexer_configuration_id is 'tool used to generate this metadata'; comment on column origin_intrinsic_metadata.from_revision is 'sha1 of the revision this metadata was copied from.'; diff --git a/swh/indexer/tests/storage/test_storage.py b/swh/indexer/tests/storage/test_storage.py index 00af0e6..1127c23 100644 --- a/swh/indexer/tests/storage/test_storage.py +++ b/swh/indexer/tests/storage/test_storage.py @@ -1,1968 +1,1968 @@ # Copyright (C) 2015-2018 The Software Heritage developers # See the AUTHORS file at the top-level directory of this distribution # License: GNU General Public License version 3, or any later version # See top-level LICENSE file for more information import os import pytest import unittest from hypothesis import given from swh.model.hashutil import hash_to_bytes from swh.indexer.storage import get_indexer_storage from swh.core.tests.db_testing import SingleDbTestFixture from swh.indexer.tests.storage.generate_data_test import ( gen_content_mimetypes, gen_content_fossology_licenses ) from swh.indexer.tests.storage import SQL_DIR @pytest.mark.db class BaseTestStorage(SingleDbTestFixture): """Base test class for most indexer tests. It adds support for Storage testing to the SingleDbTestFixture class. It will also build the database from the swh-indexer/sql/*.sql files.
""" TEST_DB_NAME = 'softwareheritage-test-indexer' TEST_DB_DUMP = os.path.join(SQL_DIR, '*.sql') def setUp(self): super().setUp() self.storage_config = { 'cls': 'local', 'args': { 'db': 'dbname=%s' % self.TEST_DB_NAME, }, } self.storage = get_indexer_storage(**self.storage_config) self.sha1_1 = hash_to_bytes('34973274ccef6ab4dfaaf86599792fa9c3fe4689') self.sha1_2 = hash_to_bytes('61c2b3a30496d329e21af70dd2d7e097046d07b7') self.revision_id_1 = hash_to_bytes( '7026b7c1a2af56521e951c01ed20f255fa054238') self.revision_id_2 = hash_to_bytes( '7026b7c1a2af56521e9587659012345678904321') self.origin_id_1 = 54974445 self.origin_id_2 = 44434342 cur = self.test_db[self.TEST_DB_NAME].cursor tools = {} cur.execute(''' select tool_name, id, tool_version, tool_configuration from indexer_configuration order by id''') for row in cur.fetchall(): key = row[0] while key in tools: key = '_' + key tools[key] = { 'id': row[1], 'name': row[0], 'version': row[2], 'configuration': row[3] } self.tools = tools def tearDown(self): self.reset_storage_tables() self.storage = None super().tearDown() def reset_storage_tables(self): excluded = {'indexer_configuration'} self.reset_db_tables(self.TEST_DB_NAME, excluded=excluded) db = self.test_db[self.TEST_DB_NAME] db.conn.commit() @pytest.mark.db class CommonTestStorage(BaseTestStorage): """Base class for Indexer Storage testing. """ def test_check_config(self): self.assertTrue(self.storage.check_config(check_write=True)) self.assertTrue(self.storage.check_config(check_write=False)) def test_content_mimetype_missing(self): # given tool_id = self.tools['file']['id'] mimetypes = [ { 'id': self.sha1_1, 'indexer_configuration_id': tool_id, }, { 'id': self.sha1_2, 'indexer_configuration_id': tool_id, }] # when actual_missing = self.storage.content_mimetype_missing(mimetypes) # then self.assertEqual(list(actual_missing), [ self.sha1_1, self.sha1_2, ]) # given self.storage.content_mimetype_add([{ 'id': self.sha1_2, - 'mimetype': b'text/plain', - 'encoding': b'utf-8', + 'mimetype': 'text/plain', + 'encoding': 'utf-8', 'indexer_configuration_id': tool_id, }]) # when actual_missing = self.storage.content_mimetype_missing(mimetypes) # then self.assertEqual(list(actual_missing), [self.sha1_1]) def test_content_mimetype_add__drop_duplicate(self): # given tool_id = self.tools['file']['id'] mimetype_v1 = { 'id': self.sha1_2, - 'mimetype': b'text/plain', - 'encoding': b'utf-8', + 'mimetype': 'text/plain', + 'encoding': 'utf-8', 'indexer_configuration_id': tool_id, } # given self.storage.content_mimetype_add([mimetype_v1]) # when actual_mimetypes = list(self.storage.content_mimetype_get( [self.sha1_2])) # then expected_mimetypes_v1 = [{ 'id': self.sha1_2, - 'mimetype': b'text/plain', - 'encoding': b'utf-8', + 'mimetype': 'text/plain', + 'encoding': 'utf-8', 'tool': self.tools['file'], }] self.assertEqual(actual_mimetypes, expected_mimetypes_v1) # given mimetype_v2 = mimetype_v1.copy() mimetype_v2.update({ - 'mimetype': b'text/html', - 'encoding': b'us-ascii', + 'mimetype': 'text/html', + 'encoding': 'us-ascii', }) self.storage.content_mimetype_add([mimetype_v2]) actual_mimetypes = list(self.storage.content_mimetype_get( [self.sha1_2])) # mimetype did not change as the v2 was dropped. 
self.assertEqual(actual_mimetypes, expected_mimetypes_v1) def test_content_mimetype_add__update_in_place_duplicate(self): # given tool_id = self.tools['file']['id'] mimetype_v1 = { 'id': self.sha1_2, - 'mimetype': b'text/plain', - 'encoding': b'utf-8', + 'mimetype': 'text/plain', + 'encoding': 'utf-8', 'indexer_configuration_id': tool_id, } # given self.storage.content_mimetype_add([mimetype_v1]) # when actual_mimetypes = list(self.storage.content_mimetype_get( [self.sha1_2])) expected_mimetypes_v1 = [{ 'id': self.sha1_2, - 'mimetype': b'text/plain', - 'encoding': b'utf-8', + 'mimetype': 'text/plain', + 'encoding': 'utf-8', 'tool': self.tools['file'], }] # then self.assertEqual(actual_mimetypes, expected_mimetypes_v1) # given mimetype_v2 = mimetype_v1.copy() mimetype_v2.update({ - 'mimetype': b'text/html', - 'encoding': b'us-ascii', + 'mimetype': 'text/html', + 'encoding': 'us-ascii', }) self.storage.content_mimetype_add([mimetype_v2], conflict_update=True) actual_mimetypes = list(self.storage.content_mimetype_get( [self.sha1_2])) expected_mimetypes_v2 = [{ 'id': self.sha1_2, - 'mimetype': b'text/html', - 'encoding': b'us-ascii', + 'mimetype': 'text/html', + 'encoding': 'us-ascii', 'tool': { 'id': 2, 'name': 'file', 'version': '5.22', 'configuration': {'command_line': 'file --mime '} } }] # mimetype did change as the v2 was used to overwrite v1 self.assertEqual(actual_mimetypes, expected_mimetypes_v2) def test_content_mimetype_get(self): # given tool_id = self.tools['file']['id'] mimetypes = [self.sha1_2, self.sha1_1] mimetype1 = { 'id': self.sha1_2, - 'mimetype': b'text/plain', - 'encoding': b'utf-8', + 'mimetype': 'text/plain', + 'encoding': 'utf-8', 'indexer_configuration_id': tool_id, } # when self.storage.content_mimetype_add([mimetype1]) # then actual_mimetypes = list(self.storage.content_mimetype_get(mimetypes)) # then expected_mimetypes = [{ 'id': self.sha1_2, - 'mimetype': b'text/plain', - 'encoding': b'utf-8', + 'mimetype': 'text/plain', + 'encoding': 'utf-8', 'tool': self.tools['file'] }] self.assertEqual(actual_mimetypes, expected_mimetypes) def test_content_language_missing(self): # given tool_id = self.tools['pygments']['id'] languages = [ { 'id': self.sha1_2, 'indexer_configuration_id': tool_id, }, { 'id': self.sha1_1, 'indexer_configuration_id': tool_id, } ] # when actual_missing = list(self.storage.content_language_missing(languages)) # then self.assertEqual(list(actual_missing), [ self.sha1_2, self.sha1_1, ]) # given self.storage.content_language_add([{ 'id': self.sha1_2, 'lang': 'haskell', 'indexer_configuration_id': tool_id, }]) # when actual_missing = list(self.storage.content_language_missing(languages)) # then self.assertEqual(actual_missing, [self.sha1_1]) def test_content_language_get(self): # given tool_id = self.tools['pygments']['id'] language1 = { 'id': self.sha1_2, 'lang': 'common-lisp', 'indexer_configuration_id': tool_id, } # when self.storage.content_language_add([language1]) # then actual_languages = list(self.storage.content_language_get( [self.sha1_2, self.sha1_1])) # then expected_languages = [{ 'id': self.sha1_2, 'lang': 'common-lisp', 'tool': self.tools['pygments'] }] self.assertEqual(actual_languages, expected_languages) def test_content_language_add__drop_duplicate(self): # given tool_id = self.tools['pygments']['id'] language_v1 = { 'id': self.sha1_2, 'lang': 'emacslisp', 'indexer_configuration_id': tool_id, } # given self.storage.content_language_add([language_v1]) # when actual_languages = list(self.storage.content_language_get( [self.sha1_2])) # 
then expected_languages_v1 = [{ 'id': self.sha1_2, 'lang': 'emacslisp', 'tool': self.tools['pygments'] }] self.assertEqual(actual_languages, expected_languages_v1) # given language_v2 = language_v1.copy() language_v2.update({ 'lang': 'common-lisp', }) self.storage.content_language_add([language_v2]) actual_languages = list(self.storage.content_language_get( [self.sha1_2])) # language did not change as the v2 was dropped. self.assertEqual(actual_languages, expected_languages_v1) def test_content_language_add__update_in_place_duplicate(self): # given tool_id = self.tools['pygments']['id'] language_v1 = { 'id': self.sha1_2, 'lang': 'common-lisp', 'indexer_configuration_id': tool_id, } # given self.storage.content_language_add([language_v1]) # when actual_languages = list(self.storage.content_language_get( [self.sha1_2])) # then expected_languages_v1 = [{ 'id': self.sha1_2, 'lang': 'common-lisp', 'tool': self.tools['pygments'] }] self.assertEqual(actual_languages, expected_languages_v1) # given language_v2 = language_v1.copy() language_v2.update({ 'lang': 'emacslisp', }) self.storage.content_language_add([language_v2], conflict_update=True) actual_languages = list(self.storage.content_language_get( [self.sha1_2])) expected_languages_v2 = [{ 'id': self.sha1_2, 'lang': 'emacslisp', 'tool': self.tools['pygments'] }] # language did change as the v2 was used to overwrite v1 self.assertEqual(actual_languages, expected_languages_v2) def test_content_ctags_missing(self): # given tool_id = self.tools['universal-ctags']['id'] ctags = [ { 'id': self.sha1_2, 'indexer_configuration_id': tool_id, }, { 'id': self.sha1_1, 'indexer_configuration_id': tool_id, } ] # when actual_missing = self.storage.content_ctags_missing(ctags) # then self.assertEqual(list(actual_missing), [ self.sha1_2, self.sha1_1 ]) # given self.storage.content_ctags_add([ { 'id': self.sha1_2, 'indexer_configuration_id': tool_id, 'ctags': [{ 'name': 'done', 'kind': 'variable', 'line': 119, 'lang': 'OCaml', }] }, ]) # when actual_missing = self.storage.content_ctags_missing(ctags) # then self.assertEqual(list(actual_missing), [self.sha1_1]) def test_content_ctags_get(self): # given tool_id = self.tools['universal-ctags']['id'] ctags = [self.sha1_2, self.sha1_1] ctag1 = { 'id': self.sha1_2, 'indexer_configuration_id': tool_id, 'ctags': [ { 'name': 'done', 'kind': 'variable', 'line': 100, 'lang': 'Python', }, { 'name': 'main', 'kind': 'function', 'line': 119, 'lang': 'Python', }] } # when self.storage.content_ctags_add([ctag1]) # then actual_ctags = list(self.storage.content_ctags_get(ctags)) # then expected_ctags = [ { 'id': self.sha1_2, 'tool': self.tools['universal-ctags'], 'name': 'done', 'kind': 'variable', 'line': 100, 'lang': 'Python', }, { 'id': self.sha1_2, 'tool': self.tools['universal-ctags'], 'name': 'main', 'kind': 'function', 'line': 119, 'lang': 'Python', } ] self.assertEqual(actual_ctags, expected_ctags) def test_content_ctags_search(self): # 1. given tool = self.tools['universal-ctags'] tool_id = tool['id'] ctag1 = { 'id': self.sha1_1, 'indexer_configuration_id': tool_id, 'ctags': [ { 'name': 'hello', 'kind': 'function', 'line': 133, 'lang': 'Python', }, { 'name': 'counter', 'kind': 'variable', 'line': 119, 'lang': 'Python', }, ] } ctag2 = { 'id': self.sha1_2, 'indexer_configuration_id': tool_id, 'ctags': [ { 'name': 'hello', 'kind': 'variable', 'line': 100, 'lang': 'C', }, ] } self.storage.content_ctags_add([ctag1, ctag2]) # 1.
when actual_ctags = list(self.storage.content_ctags_search('hello', limit=1)) # 1. then self.assertEqual(actual_ctags, [ { 'id': ctag1['id'], 'tool': tool, 'name': 'hello', 'kind': 'function', 'line': 133, 'lang': 'Python', } ]) # 2. when actual_ctags = list(self.storage.content_ctags_search( 'hello', limit=1, last_sha1=ctag1['id'])) # 2. then self.assertEqual(actual_ctags, [ { 'id': ctag2['id'], 'tool': tool, 'name': 'hello', 'kind': 'variable', 'line': 100, 'lang': 'C', } ]) # 3. when actual_ctags = list(self.storage.content_ctags_search('hello')) # 3. then self.assertEqual(actual_ctags, [ { 'id': ctag1['id'], 'tool': tool, 'name': 'hello', 'kind': 'function', 'line': 133, 'lang': 'Python', }, { 'id': ctag2['id'], 'tool': tool, 'name': 'hello', 'kind': 'variable', 'line': 100, 'lang': 'C', }, ]) # 4. when actual_ctags = list(self.storage.content_ctags_search('counter')) # then self.assertEqual(actual_ctags, [{ 'id': ctag1['id'], 'tool': tool, 'name': 'counter', 'kind': 'variable', 'line': 119, 'lang': 'Python', }]) def test_content_ctags_search_no_result(self): actual_ctags = list(self.storage.content_ctags_search('counter')) self.assertEqual(actual_ctags, []) def test_content_ctags_add__add_new_ctags_added(self): # given tool = self.tools['universal-ctags'] tool_id = tool['id'] ctag_v1 = { 'id': self.sha1_2, 'indexer_configuration_id': tool_id, 'ctags': [{ 'name': 'done', 'kind': 'variable', 'line': 100, 'lang': 'Scheme', }] } # given self.storage.content_ctags_add([ctag_v1]) self.storage.content_ctags_add([ctag_v1]) # conflict does nothing # when actual_ctags = list(self.storage.content_ctags_get( [self.sha1_2])) # then expected_ctags = [{ 'id': self.sha1_2, 'name': 'done', 'kind': 'variable', 'line': 100, 'lang': 'Scheme', 'tool': tool, }] self.assertEqual(actual_ctags, expected_ctags) # given ctag_v2 = ctag_v1.copy() ctag_v2.update({ 'ctags': [ { 'name': 'defn', 'kind': 'function', 'line': 120, 'lang': 'Scheme', } ] }) self.storage.content_ctags_add([ctag_v2]) expected_ctags = [ { 'id': self.sha1_2, 'name': 'done', 'kind': 'variable', 'line': 100, 'lang': 'Scheme', 'tool': tool, }, { 'id': self.sha1_2, 'name': 'defn', 'kind': 'function', 'line': 120, 'lang': 'Scheme', 'tool': tool, } ] actual_ctags = list(self.storage.content_ctags_get( [self.sha1_2])) self.assertEqual(actual_ctags, expected_ctags) def test_content_ctags_add__update_in_place(self): # given tool = self.tools['universal-ctags'] tool_id = tool['id'] ctag_v1 = { 'id': self.sha1_2, 'indexer_configuration_id': tool_id, 'ctags': [{ 'name': 'done', 'kind': 'variable', 'line': 100, 'lang': 'Scheme', }] } # given self.storage.content_ctags_add([ctag_v1]) # when actual_ctags = list(self.storage.content_ctags_get( [self.sha1_2])) # then expected_ctags = [ { 'id': self.sha1_2, 'name': 'done', 'kind': 'variable', 'line': 100, 'lang': 'Scheme', 'tool': tool } ] self.assertEqual(actual_ctags, expected_ctags) # given ctag_v2 = ctag_v1.copy() ctag_v2.update({ 'ctags': [ { 'name': 'done', 'kind': 'variable', 'line': 100, 'lang': 'Scheme', }, { 'name': 'defn', 'kind': 'function', 'line': 120, 'lang': 'Scheme', } ] }) self.storage.content_ctags_add([ctag_v2], conflict_update=True) actual_ctags = list(self.storage.content_ctags_get( [self.sha1_2])) # ctag did change as the v2 was used to overwrite v1 expected_ctags = [ { 'id': self.sha1_2, 'name': 'done', 'kind': 'variable', 'line': 100, 'lang': 'Scheme', 'tool': tool, }, { 'id': self.sha1_2, 'name': 'defn', 'kind': 'function', 'line': 120, 'lang': 'Scheme', 'tool': tool, } ] 
self.assertEqual(actual_ctags, expected_ctags) def test_content_fossology_license_get(self): # given tool = self.tools['nomos'] tool_id = tool['id'] license1 = { 'id': self.sha1_1, 'licenses': ['GPL-2.0+'], 'indexer_configuration_id': tool_id, } # when self.storage.content_fossology_license_add([license1]) # then actual_licenses = list(self.storage.content_fossology_license_get( [self.sha1_2, self.sha1_1])) expected_license = { self.sha1_1: [{ 'licenses': ['GPL-2.0+'], 'tool': tool, }] } # then self.assertEqual(actual_licenses, [expected_license]) def test_content_fossology_license_add__new_license_added(self): # given tool = self.tools['nomos'] tool_id = tool['id'] license_v1 = { 'id': self.sha1_1, 'licenses': ['Apache-2.0'], 'indexer_configuration_id': tool_id, } # given self.storage.content_fossology_license_add([license_v1]) # conflict does nothing self.storage.content_fossology_license_add([license_v1]) # when actual_licenses = list(self.storage.content_fossology_license_get( [self.sha1_1])) # then expected_license = { self.sha1_1: [{ 'licenses': ['Apache-2.0'], 'tool': tool, }] } self.assertEqual(actual_licenses, [expected_license]) # given license_v2 = license_v1.copy() license_v2.update({ 'licenses': ['BSD-2-Clause'], }) self.storage.content_fossology_license_add([license_v2]) actual_licenses = list(self.storage.content_fossology_license_get( [self.sha1_1])) expected_license = { self.sha1_1: [{ 'licenses': ['Apache-2.0', 'BSD-2-Clause'], 'tool': tool }] } # the v2 license was appended to v1's licenses rather than dropped. self.assertEqual(actual_licenses, [expected_license]) def test_content_fossology_license_add__update_in_place_duplicate(self): # given tool = self.tools['nomos'] tool_id = tool['id'] license_v1 = { 'id': self.sha1_1, 'licenses': ['CECILL'], 'indexer_configuration_id': tool_id, } # given self.storage.content_fossology_license_add([license_v1]) # conflict does nothing self.storage.content_fossology_license_add([license_v1]) # when actual_licenses = list(self.storage.content_fossology_license_get( [self.sha1_1])) # then expected_license = { self.sha1_1: [{ 'licenses': ['CECILL'], 'tool': tool, }] } self.assertEqual(actual_licenses, [expected_license]) # given license_v2 = license_v1.copy() license_v2.update({ 'licenses': ['CECILL-2.0'] }) self.storage.content_fossology_license_add([license_v2], conflict_update=True) actual_licenses = list(self.storage.content_fossology_license_get( [self.sha1_1])) # license did change as the v2 was used to overwrite v1 expected_license = { self.sha1_1: [{ 'licenses': ['CECILL-2.0'], 'tool': tool, }] } self.assertEqual(actual_licenses, [expected_license]) def test_content_metadata_missing(self): # given tool_id = self.tools['swh-metadata-translator']['id'] metadata = [ { 'id': self.sha1_2, 'indexer_configuration_id': tool_id, }, { 'id': self.sha1_1, 'indexer_configuration_id': tool_id, } ] # when actual_missing = list(self.storage.content_metadata_missing(metadata)) # then self.assertEqual(list(actual_missing), [ self.sha1_2, self.sha1_1, ]) # given self.storage.content_metadata_add([{ 'id': self.sha1_2, 'translated_metadata': { 'other': {}, 'codeRepository': { 'type': 'git', 'url': 'https://github.com/moranegg/metadata_test' }, 'description': 'Simple package.json test for indexer', 'name': 'test_metadata', 'version': '0.0.1' }, 'indexer_configuration_id': tool_id }]) # when actual_missing = list(self.storage.content_metadata_missing(metadata)) # then self.assertEqual(actual_missing, [self.sha1_1])
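# Editorial aside: a hedged sketch (not part of the test suite) of how the
# conflict_update flag exercised by the *_add tests above is driven from the
# indexer side; this mirrors persist_index_computations in mimetype.py:
#
#     policy_update = 'update-dups'  # or 'ignore-dups'
#     storage.content_mimetype_add(
#         results, conflict_update=(policy_update == 'update-dups'))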
def test_content_metadata_get(self): # given tool_id = self.tools['swh-metadata-translator']['id'] metadata1 = { 'id': self.sha1_2, 'translated_metadata': { 'other': {}, 'codeRepository': { 'type': 'git', 'url': 'https://github.com/moranegg/metadata_test' }, 'description': 'Simple package.json test for indexer', 'name': 'test_metadata', 'version': '0.0.1' }, 'indexer_configuration_id': tool_id, } # when self.storage.content_metadata_add([metadata1]) # then actual_metadata = list(self.storage.content_metadata_get( [self.sha1_2, self.sha1_1])) expected_metadata = [{ 'id': self.sha1_2, 'translated_metadata': { 'other': {}, 'codeRepository': { 'type': 'git', 'url': 'https://github.com/moranegg/metadata_test' }, 'description': 'Simple package.json test for indexer', 'name': 'test_metadata', 'version': '0.0.1' }, 'tool': self.tools['swh-metadata-translator'] }] self.assertEqual(actual_metadata, expected_metadata) def test_content_metadata_add_drop_duplicate(self): # given tool_id = self.tools['swh-metadata-translator']['id'] metadata_v1 = { 'id': self.sha1_2, 'translated_metadata': { 'other': {}, 'name': 'test_metadata', 'version': '0.0.1' }, 'indexer_configuration_id': tool_id, } # given self.storage.content_metadata_add([metadata_v1]) # when actual_metadata = list(self.storage.content_metadata_get( [self.sha1_2])) expected_metadata_v1 = [{ 'id': self.sha1_2, 'translated_metadata': { 'other': {}, 'name': 'test_metadata', 'version': '0.0.1' }, 'tool': self.tools['swh-metadata-translator'] }] self.assertEqual(actual_metadata, expected_metadata_v1) # given metadata_v2 = metadata_v1.copy() metadata_v2.update({ 'translated_metadata': { 'other': {}, 'name': 'test_drop_duplicated_metadata', 'version': '0.0.1' }, }) self.storage.content_metadata_add([metadata_v2]) # then actual_metadata = list(self.storage.content_metadata_get( [self.sha1_2])) # metadata did not change as the v2 was dropped. self.assertEqual(actual_metadata, expected_metadata_v1) def test_content_metadata_add_update_in_place_duplicate(self): # given tool_id = self.tools['swh-metadata-translator']['id'] metadata_v1 = { 'id': self.sha1_2, 'translated_metadata': { 'other': {}, 'name': 'test_metadata', 'version': '0.0.1' }, 'indexer_configuration_id': tool_id, } # given self.storage.content_metadata_add([metadata_v1]) # when actual_metadata = list(self.storage.content_metadata_get( [self.sha1_2])) # then expected_metadata_v1 = [{ 'id': self.sha1_2, 'translated_metadata': { 'other': {}, 'name': 'test_metadata', 'version': '0.0.1' }, 'tool': self.tools['swh-metadata-translator'] }] self.assertEqual(actual_metadata, expected_metadata_v1) # given metadata_v2 = metadata_v1.copy() metadata_v2.update({ 'translated_metadata': { 'other': {}, 'name': 'test_update_duplicated_metadata', 'version': '0.0.1' }, }) self.storage.content_metadata_add([metadata_v2], conflict_update=True) actual_metadata = list(self.storage.content_metadata_get( [self.sha1_2]))
expected_metadata_v2 = [{ 'id': self.sha1_2, 'translated_metadata': { 'other': {}, 'name': 'test_update_duplicated_metadata', 'version': '0.0.1' }, 'tool': self.tools['swh-metadata-translator'] }] # metadata did change as the v2 was used to overwrite v1 self.assertEqual(actual_metadata, expected_metadata_v2) def test_revision_metadata_missing(self): # given tool_id = self.tools['swh-metadata-detector']['id'] metadata = [ { 'id': self.revision_id_1, 'indexer_configuration_id': tool_id, }, { 'id': self.revision_id_2, 'indexer_configuration_id': tool_id, } ] # when actual_missing = list(self.storage.revision_metadata_missing( metadata)) # then self.assertEqual(list(actual_missing), [ self.revision_id_1, self.revision_id_2, ]) # given self.storage.revision_metadata_add([{ 'id': self.revision_id_1, 'translated_metadata': { 'developmentStatus': None, 'version': None, 'operatingSystem': None, 'description': None, 'keywords': None, 'issueTracker': None, 'name': None, 'author': None, 'relatedLink': None, 'url': None, 'license': None, 'maintainer': None, 'email': None, 'softwareRequirements': None, 'identifier': None }, 'indexer_configuration_id': tool_id }]) # when actual_missing = list(self.storage.revision_metadata_missing( metadata)) # then self.assertEqual(actual_missing, [self.revision_id_2]) def test_revision_metadata_get(self): # given tool_id = self.tools['swh-metadata-detector']['id'] metadata_rev = { 'id': self.revision_id_2, 'translated_metadata': { 'developmentStatus': None, 'version': None, 'operatingSystem': None, 'description': None, 'keywords': None, 'issueTracker': None, 'name': None, 'author': None, 'relatedLink': None, 'url': None, 'license': None, 'maintainer': None, 'email': None, 'softwareRequirements': None, 'identifier': None }, 'indexer_configuration_id': tool_id } # when self.storage.revision_metadata_add([metadata_rev]) # then actual_metadata = list(self.storage.revision_metadata_get( [self.revision_id_2, self.revision_id_1])) expected_metadata = [{ 'id': self.revision_id_2, 'translated_metadata': metadata_rev['translated_metadata'], 'tool': self.tools['swh-metadata-detector'] }] self.assertEqual(actual_metadata, expected_metadata) def test_revision_metadata_add_drop_duplicate(self): # given tool_id = self.tools['swh-metadata-detector']['id'] metadata_v1 = { 'id': self.revision_id_1, 'translated_metadata': { 'developmentStatus': None, 'version': None, 'operatingSystem': None, 'description': None, 'keywords': None, 'issueTracker': None, 'name': None, 'author': None, 'relatedLink': None, 'url': None, 'license': None, 'maintainer': None, 'email': None, 'softwareRequirements': None, 'identifier': None }, 'indexer_configuration_id': tool_id, } # given self.storage.revision_metadata_add([metadata_v1]) # when actual_metadata = list(self.storage.revision_metadata_get( [self.revision_id_1])) expected_metadata_v1 = [{ 'id': self.revision_id_1, 'translated_metadata': metadata_v1['translated_metadata'], 'tool': self.tools['swh-metadata-detector'] }] self.assertEqual(actual_metadata, expected_metadata_v1) # given metadata_v2 = metadata_v1.copy() metadata_v2.update({ 'translated_metadata': { 'name': 'test_metadata', 'author': 'MG', }, }) self.storage.revision_metadata_add([metadata_v2]) # then actual_metadata = list(self.storage.revision_metadata_get( [self.revision_id_1])) # metadata did not change as the v2 was dropped. 
self.assertEqual(actual_metadata, expected_metadata_v1) def test_revision_metadata_add_update_in_place_duplicate(self): # given tool_id = self.tools['swh-metadata-detector']['id'] metadata_v1 = { 'id': self.revision_id_2, 'translated_metadata': { 'developmentStatus': None, 'version': None, 'operatingSystem': None, 'description': None, 'keywords': None, 'issueTracker': None, 'name': None, 'author': None, 'relatedLink': None, 'url': None, 'license': None, 'maintainer': None, 'email': None, 'softwareRequirements': None, 'identifier': None }, 'indexer_configuration_id': tool_id, } # given self.storage.revision_metadata_add([metadata_v1]) # when actual_metadata = list(self.storage.revision_metadata_get( [self.revision_id_2])) # then expected_metadata_v1 = [{ 'id': self.revision_id_2, 'translated_metadata': metadata_v1['translated_metadata'], 'tool': self.tools['swh-metadata-detector'] }] self.assertEqual(actual_metadata, expected_metadata_v1) # given metadata_v2 = metadata_v1.copy() metadata_v2.update({ 'translated_metadata': { 'name': 'test_update_duplicated_metadata', 'author': 'MG' }, }) self.storage.revision_metadata_add([metadata_v2], conflict_update=True) actual_metadata = list(self.storage.revision_metadata_get( [self.revision_id_2])) expected_metadata_v2 = [{ 'id': self.revision_id_2, 'translated_metadata': metadata_v2['translated_metadata'], 'tool': self.tools['swh-metadata-detector'] }] # metadata did change as the v2 was used to overwrite v1 self.assertEqual(actual_metadata, expected_metadata_v2) def test_origin_intrinsic_metadata_get(self): # given tool_id = self.tools['swh-metadata-detector']['id'] metadata = { 'developmentStatus': None, 'version': None, 'operatingSystem': None, 'description': None, 'keywords': None, 'issueTracker': None, 'name': None, 'author': None, 'relatedLink': None, 'url': None, 'license': None, 'maintainer': None, 'email': None, 'softwareRequirements': None, 'identifier': None, } metadata_rev = { 'id': self.revision_id_2, 'translated_metadata': metadata, 'indexer_configuration_id': tool_id, } metadata_origin = { 'origin_id': self.origin_id_1, 'metadata': metadata, 'indexer_configuration_id': tool_id, 'from_revision': self.revision_id_2, } # when self.storage.revision_metadata_add([metadata_rev]) self.storage.origin_intrinsic_metadata_add([metadata_origin]) # then actual_metadata = list(self.storage.origin_intrinsic_metadata_get( [self.origin_id_1, 42])) expected_metadata = [{ 'origin_id': self.origin_id_1, 'metadata': metadata, 'tool': self.tools['swh-metadata-detector'], 'from_revision': self.revision_id_2, }] self.assertEqual(actual_metadata, expected_metadata) def test_origin_intrinsic_metadata_add_drop_duplicate(self): # given tool_id = self.tools['swh-metadata-detector']['id'] metadata_v1 = { 'developmentStatus': None, 'version': None, 'operatingSystem': None, 'description': None, 'keywords': None, 'issueTracker': None, 'name': None, 'author': None, 'relatedLink': None, 'url': None, 'license': None, 'maintainer': None, 'email': None, 'softwareRequirements': None, 'identifier': None } metadata_rev_v1 = { 'id': self.revision_id_1, 'translated_metadata': metadata_v1.copy(), 'indexer_configuration_id': tool_id, } metadata_origin_v1 = { 'origin_id': self.origin_id_1, 'metadata': metadata_v1.copy(), 'indexer_configuration_id': tool_id, 'from_revision': self.revision_id_1, } # given self.storage.revision_metadata_add([metadata_rev_v1]) self.storage.origin_intrinsic_metadata_add([metadata_origin_v1]) # when actual_metadata = 
list(self.storage.origin_intrinsic_metadata_get( [self.origin_id_1, 42])) expected_metadata_v1 = [{ 'origin_id': self.origin_id_1, 'metadata': metadata_v1, 'tool': self.tools['swh-metadata-detector'], 'from_revision': self.revision_id_1, }] self.assertEqual(actual_metadata, expected_metadata_v1) # given metadata_v2 = metadata_v1.copy() metadata_v2.update({ 'name': 'test_metadata', 'author': 'MG', }) metadata_rev_v2 = metadata_rev_v1.copy() metadata_origin_v2 = metadata_origin_v1.copy() metadata_rev_v2['translated_metadata'] = metadata_v2 metadata_origin_v2['metadata'] = metadata_v2 self.storage.revision_metadata_add([metadata_rev_v2]) self.storage.origin_intrinsic_metadata_add([metadata_origin_v2]) # then actual_metadata = list(self.storage.origin_intrinsic_metadata_get( [self.origin_id_1])) # metadata did not change as the v2 was dropped. self.assertEqual(actual_metadata, expected_metadata_v1) def test_origin_intrinsic_metadata_add_update_in_place_duplicate(self): # given tool_id = self.tools['swh-metadata-detector']['id'] metadata_v1 = { 'developmentStatus': None, 'version': None, 'operatingSystem': None, 'description': None, 'keywords': None, 'issueTracker': None, 'name': None, 'author': None, 'relatedLink': None, 'url': None, 'license': None, 'maintainer': None, 'email': None, 'softwareRequirements': None, 'identifier': None } metadata_rev_v1 = { 'id': self.revision_id_2, 'translated_metadata': metadata_v1, 'indexer_configuration_id': tool_id, } metadata_origin_v1 = { 'origin_id': self.origin_id_1, 'metadata': metadata_v1.copy(), 'indexer_configuration_id': tool_id, 'from_revision': self.revision_id_2, } # given self.storage.revision_metadata_add([metadata_rev_v1]) self.storage.origin_intrinsic_metadata_add([metadata_origin_v1]) # when actual_metadata = list(self.storage.origin_intrinsic_metadata_get( [self.origin_id_1])) # then expected_metadata_v1 = [{ 'origin_id': self.origin_id_1, 'metadata': metadata_v1, 'tool': self.tools['swh-metadata-detector'], 'from_revision': self.revision_id_2, }] self.assertEqual(actual_metadata, expected_metadata_v1) # given metadata_v2 = metadata_v1.copy() metadata_v2.update({ 'name': 'test_update_duplicated_metadata', 'author': 'MG', }) metadata_rev_v2 = metadata_rev_v1.copy() metadata_origin_v2 = metadata_origin_v1.copy() metadata_rev_v2['translated_metadata'] = metadata_v2 metadata_origin_v2['metadata'] = metadata_v2 self.storage.revision_metadata_add([metadata_rev_v2], conflict_update=True) self.storage.origin_intrinsic_metadata_add([metadata_origin_v2], conflict_update=True) actual_metadata = list(self.storage.origin_intrinsic_metadata_get( [self.origin_id_1])) expected_metadata_v2 = [{ 'origin_id': self.origin_id_1, 'metadata': metadata_v2, 'tool': self.tools['swh-metadata-detector'], 'from_revision': self.revision_id_2, }] # metadata did change as the v2 was used to overwrite v1 self.assertEqual(actual_metadata, expected_metadata_v2) def test_origin_intrinsic_metadata_search_fulltext(self): # given tool_id = self.tools['swh-metadata-detector']['id'] metadata1 = { 'author': 'John Doe', } metadata1_rev = { 'id': self.revision_id_1, 'translated_metadata': metadata1, 'indexer_configuration_id': tool_id, } metadata1_origin = { 'origin_id': self.origin_id_1, 'metadata': metadata1, 'indexer_configuration_id': tool_id, 'from_revision': self.revision_id_1, } metadata2 = { 'author': 'Jane Doe', } metadata2_rev = { 'id': self.revision_id_2, 'translated_metadata': metadata2, 'indexer_configuration_id': tool_id, } metadata2_origin = { 'origin_id':
self.origin_id_2, 'metadata': metadata2, 'indexer_configuration_id': tool_id, 'from_revision': self.revision_id_2, } # when self.storage.revision_metadata_add([metadata1_rev]) self.storage.origin_intrinsic_metadata_add([metadata1_origin]) self.storage.revision_metadata_add([metadata2_rev]) self.storage.origin_intrinsic_metadata_add([metadata2_origin]) # then search = self.storage.origin_intrinsic_metadata_search_fulltext self.assertCountEqual( [res['origin_id'] for res in search(['Doe'])], [self.origin_id_1, self.origin_id_2]) self.assertEqual( [res['origin_id'] for res in search(['John', 'Doe'])], [self.origin_id_1]) self.assertEqual( [res['origin_id'] for res in search(['John'])], [self.origin_id_1]) self.assertEqual( [res['origin_id'] for res in search(['John', 'Jane'])], []) def test_origin_intrinsic_metadata_search_fulltext_rank(self): # given tool_id = self.tools['swh-metadata-detector']['id'] # The following authors have "Random Person" to add some more content # to the JSON data, to work around normalization quirks when there # are few words (rank/(1+ln(nb_words)) is very sensitive to nb_words # for small values of nb_words). metadata1 = { 'author': [ 'Random Person', 'John Doe', 'Jane Doe', ] } metadata1_rev = { 'id': self.revision_id_1, 'translated_metadata': metadata1, 'indexer_configuration_id': tool_id, } metadata1_origin = { 'origin_id': self.origin_id_1, 'metadata': metadata1, 'indexer_configuration_id': tool_id, 'from_revision': self.revision_id_1, } metadata2 = { 'author': [ 'Random Person', 'Jane Doe', ] } metadata2_rev = { 'id': self.revision_id_2, 'translated_metadata': metadata2, 'indexer_configuration_id': tool_id, } metadata2_origin = { 'origin_id': self.origin_id_2, 'metadata': metadata2, 'indexer_configuration_id': tool_id, 'from_revision': self.revision_id_2, } # when self.storage.revision_metadata_add([metadata1_rev]) self.storage.origin_intrinsic_metadata_add([metadata1_origin]) self.storage.revision_metadata_add([metadata2_rev]) self.storage.origin_intrinsic_metadata_add([metadata2_origin]) # then search = self.storage.origin_intrinsic_metadata_search_fulltext self.assertEqual( [res['origin_id'] for res in search(['Doe'])], [self.origin_id_1, self.origin_id_2]) self.assertEqual( [res['origin_id'] for res in search(['Doe'], limit=1)], [self.origin_id_1]) self.assertEqual( [res['origin_id'] for res in search(['John'])], [self.origin_id_1]) self.assertEqual( [res['origin_id'] for res in search(['Jane'])], [self.origin_id_2, self.origin_id_1]) self.assertEqual( [res['origin_id'] for res in search(['John', 'Jane'])], [self.origin_id_1]) def test_indexer_configuration_add(self): tool = { 'tool_name': 'some-unknown-tool', 'tool_version': 'some-version', 'tool_configuration': {"debian-package": "some-package"}, } actual_tool = self.storage.indexer_configuration_get(tool) self.assertIsNone(actual_tool) # does not exist # add it actual_tools = list(self.storage.indexer_configuration_add([tool])) self.assertEqual(len(actual_tools), 1) actual_tool = actual_tools[0] self.assertIsNotNone(actual_tool) # now it exists new_id = actual_tool.pop('id') self.assertEqual(actual_tool, tool) actual_tools2 = list(self.storage.indexer_configuration_add([tool])) actual_tool2 = actual_tools2[0] self.assertIsNotNone(actual_tool2) # now it exists new_id2 = actual_tool2.pop('id') self.assertEqual(new_id, new_id2) self.assertEqual(actual_tool, actual_tool2) def test_indexer_configuration_add_multiple(self): tool = { 'tool_name': 'some-unknown-tool', 'tool_version': 'some-version', 
'tool_configuration': {"debian-package": "some-package"}, } actual_tools = list(self.storage.indexer_configuration_add([tool])) self.assertEqual(len(actual_tools), 1) new_tools = [tool, { 'tool_name': 'yet-another-tool', 'tool_version': 'version', 'tool_configuration': {}, }] actual_tools = list(self.storage.indexer_configuration_add(new_tools)) self.assertEqual(len(actual_tools), 2) # order not guaranteed, so we iterate over results to check for tool in actual_tools: _id = tool.pop('id') self.assertIsNotNone(_id) self.assertIn(tool, new_tools) def test_indexer_configuration_get_missing(self): tool = { 'tool_name': 'unknown-tool', 'tool_version': '3.1.0rc2-31-ga2cbb8c', 'tool_configuration': {"command_line": "nomossa "}, } actual_tool = self.storage.indexer_configuration_get(tool) self.assertIsNone(actual_tool) def test_indexer_configuration_get(self): tool = { 'tool_name': 'nomos', 'tool_version': '3.1.0rc2-31-ga2cbb8c', 'tool_configuration': {"command_line": "nomossa "}, } actual_tool = self.storage.indexer_configuration_get(tool) expected_tool = tool.copy() expected_tool['id'] = 1 self.assertEqual(expected_tool, actual_tool) def test_indexer_configuration_metadata_get_missing_context(self): tool = { 'tool_name': 'swh-metadata-translator', 'tool_version': '0.0.1', 'tool_configuration': {"context": "unknown-context"}, } actual_tool = self.storage.indexer_configuration_get(tool) self.assertIsNone(actual_tool) def test_indexer_configuration_metadata_get(self): tool = { 'tool_name': 'swh-metadata-translator', 'tool_version': '0.0.1', 'tool_configuration': {"type": "local", "context": "NpmMapping"}, } actual_tool = self.storage.indexer_configuration_get(tool) expected_tool = tool.copy() expected_tool['id'] = actual_tool['id'] self.assertEqual(expected_tool, actual_tool) @pytest.mark.property_based class PropBasedTestStorage(BaseTestStorage, unittest.TestCase): """Property-based tests """ def test_generate_content_mimetype_get_range_limit_none(self): """mimetype_get_range call with wrong limit input should fail""" with self.assertRaises(ValueError) as e: self.storage.content_mimetype_get_range( start=None, end=None, indexer_configuration_id=None, limit=None) self.assertEqual(e.exception.args, ( 'Development error: limit should not be None',)) @given(gen_content_mimetypes(min_size=1, max_size=4)) def test_generate_content_mimetype_get_range_no_limit(self, mimetypes): """mimetype_get_range returns mimetypes within range provided""" self.reset_storage_tables() # add mimetypes to storage self.storage.content_mimetype_add(mimetypes) # All ids from the db content_ids = sorted([c['id'] for c in mimetypes]) start = content_ids[0] end = content_ids[-1] # retrieve mimetypes tool_id = mimetypes[0]['indexer_configuration_id'] actual_result = self.storage.content_mimetype_get_range( start, end, indexer_configuration_id=tool_id) actual_ids = actual_result['ids'] actual_next = actual_result['next'] self.assertEqual(len(mimetypes), len(actual_ids)) self.assertIsNone(actual_next) self.assertEqual(content_ids, actual_ids) @given(gen_content_mimetypes(min_size=4, max_size=4)) def test_generate_content_mimetype_get_range_limit(self, mimetypes): """mimetype_get_range paginates results if limit exceeded""" self.reset_storage_tables() # add mimetypes to storage self.storage.content_mimetype_add(mimetypes) # input the list of sha1s we want from storage content_ids = sorted([c['id'] for c in mimetypes]) start = content_ids[0] end = content_ids[-1] # retrieve mimetypes limited to 3 results limited_results =
len(mimetypes) - 1 tool_id = mimetypes[0]['indexer_configuration_id'] actual_result = self.storage.content_mimetype_get_range( start, end, indexer_configuration_id=tool_id, limit=limited_results) actual_ids = actual_result['ids'] actual_next = actual_result['next'] self.assertEqual(limited_results, len(actual_ids)) self.assertIsNotNone(actual_next) self.assertEqual(actual_next, content_ids[-1]) expected_mimetypes = content_ids[:-1] self.assertEqual(expected_mimetypes, actual_ids) # retrieve next part actual_results2 = self.storage.content_mimetype_get_range( start=end, end=end, indexer_configuration_id=tool_id) actual_ids2 = actual_results2['ids'] actual_next2 = actual_results2['next'] self.assertIsNone(actual_next2) expected_mimetypes2 = [content_ids[-1]] self.assertEqual(expected_mimetypes2, actual_ids2) def test_generate_content_fossology_license_get_range_limit_none(self): """license_get_range call with wrong limit input should fail""" with self.assertRaises(ValueError) as e: self.storage.content_fossology_license_get_range( start=None, end=None, indexer_configuration_id=None, limit=None) self.assertEqual(e.exception.args, ( 'Development error: limit should not be None',)) def prepare_mimetypes_from(self, fossology_licenses): """Fossology license tests need some consistent mimetype data in the db to run. """ mimetypes = [] for c in fossology_licenses: mimetypes.append({ 'id': c['id'], 'mimetype': 'text/plain', 'encoding': 'utf-8', 'indexer_configuration_id': c['indexer_configuration_id'], }) return mimetypes @given(gen_content_fossology_licenses(min_size=1, max_size=4)) def test_generate_content_fossology_license_get_range_no_limit( self, fossology_licenses): """license_get_range returns licenses within range provided""" self.reset_storage_tables() # craft some consistent mimetypes mimetypes = self.prepare_mimetypes_from(fossology_licenses) self.storage.content_mimetype_add(mimetypes) # add fossology_licenses to storage self.storage.content_fossology_license_add(fossology_licenses) # All ids from the db content_ids = sorted([c['id'] for c in fossology_licenses]) start = content_ids[0] end = content_ids[-1] # retrieve fossology_licenses tool_id = fossology_licenses[0]['indexer_configuration_id'] actual_result = self.storage.content_fossology_license_get_range( start, end, indexer_configuration_id=tool_id) actual_ids = actual_result['ids'] actual_next = actual_result['next'] self.assertEqual(len(fossology_licenses), len(actual_ids)) self.assertIsNone(actual_next) self.assertEqual(content_ids, actual_ids) @given(gen_content_fossology_licenses(min_size=1, max_size=4), gen_content_mimetypes(min_size=1, max_size=1)) def test_generate_content_fossology_license_get_range_no_limit_with_filter( self, fossology_licenses, mimetypes): """This filters out non-textual contents, then returns results within the range""" self.reset_storage_tables() # craft some consistent mimetypes _mimetypes = self.prepare_mimetypes_from(fossology_licenses) # add binary mimetypes which will get filtered out in results for m in mimetypes: _mimetypes.append({ 'mimetype': 'binary', **m, }) self.storage.content_mimetype_add(_mimetypes) # add fossology_licenses to storage self.storage.content_fossology_license_add(fossology_licenses) # All ids from the db content_ids = sorted([c['id'] for c in fossology_licenses]) start = content_ids[0] end = content_ids[-1] # retrieve fossology_licenses tool_id = fossology_licenses[0]['indexer_configuration_id'] actual_result = self.storage.content_fossology_license_get_range( start, end, indexer_configuration_id=tool_id)
actual_ids = actual_result['ids'] actual_next = actual_result['next'] self.assertEqual(len(fossology_licenses), len(actual_ids)) self.assertIsNone(actual_next) self.assertEqual(content_ids, actual_ids) @given(gen_content_fossology_licenses(min_size=4, max_size=4)) def test_generate_fossology_license_get_range_limit( self, fossology_licenses): """fossology_license_get_range paginates results if limit exceeded""" self.reset_storage_tables() # craft some consistent mimetypes mimetypes = self.prepare_mimetypes_from(fossology_licenses) # add fossology_licenses to storage self.storage.content_mimetype_add(mimetypes) self.storage.content_fossology_license_add(fossology_licenses) # input the list of sha1s we want from storage content_ids = sorted([c['id'] for c in fossology_licenses]) start = content_ids[0] end = content_ids[-1] # retrieve fossology_licenses limited to 3 results limited_results = len(fossology_licenses) - 1 tool_id = fossology_licenses[0]['indexer_configuration_id'] actual_result = self.storage.content_fossology_license_get_range( start, end, indexer_configuration_id=tool_id, limit=limited_results) actual_ids = actual_result['ids'] actual_next = actual_result['next'] self.assertEqual(limited_results, len(actual_ids)) self.assertIsNotNone(actual_next) self.assertEqual(actual_next, content_ids[-1]) expected_fossology_licenses = content_ids[:-1] self.assertEqual(expected_fossology_licenses, actual_ids) # retrieve next part actual_results2 = self.storage.content_fossology_license_get_range( start=end, end=end, indexer_configuration_id=tool_id) actual_ids2 = actual_results2['ids'] actual_next2 = actual_results2['next'] self.assertIsNone(actual_next2) expected_fossology_licenses2 = [content_ids[-1]] self.assertEqual(expected_fossology_licenses2, actual_ids2) class IndexerTestStorage(CommonTestStorage, unittest.TestCase): """Running the tests locally. For the client API tests (remote storage), see the :class:`swh.indexer.storage.test_api_client.TestRemoteStorage` class.
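A hedged usage sketch (editorial addition, not part of the original test suite): paging through content_mimetype_get_range with the 'next' token, as exercised by the range tests above, assuming storage, start, end and tool_id set up as in PropBasedTestStorage:

    current = start
    while current is not None:
        result = storage.content_mimetype_get_range(
            current, end, indexer_configuration_id=tool_id, limit=1000)
        for content_id in result['ids']:
            ...  # process one indexed content id within [start, end]
        current = result['next']  # None once the range is exhausted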
""" pass diff --git a/swh/indexer/tests/test_mimetype.py b/swh/indexer/tests/test_mimetype.py index 41ad9ea..40dd723 100644 --- a/swh/indexer/tests/test_mimetype.py +++ b/swh/indexer/tests/test_mimetype.py @@ -1,188 +1,188 @@ # Copyright (C) 2017-2018 The Software Heritage developers # See the AUTHORS file at the top-level directory of this distribution # License: GNU General Public License version 3, or any later version # See top-level LICENSE file for more information import unittest import logging from unittest.mock import patch from swh.indexer.mimetype import ( ContentMimetypeIndexer, MimetypeRangeIndexer, compute_mimetype_encoding ) from swh.indexer.tests.test_utils import ( MockObjStorage, BasicMockStorage, BasicMockIndexerStorage, CommonContentIndexerTest, CommonContentIndexerRangeTest, CommonIndexerWithErrorsTest, CommonIndexerNoTool ) class FakeMagicResult: def __init__(self, mimetype, encoding): self.mime_type = mimetype self.encoding = encoding class BasicTest(unittest.TestCase): @patch('swh.indexer.mimetype.magic') def test_compute_mimetype_encoding(self, mock_magic): """Compute mimetype encoding should return results""" for _input, _mimetype, _encoding in [ (b'some-content', 'text/plain', 'utf-8'), (b'raw-content', 'application/json', 'ascii')]: mock_magic.detect_from_content.return_value = FakeMagicResult( _mimetype, _encoding) actual_result = compute_mimetype_encoding(_input) self.assertEqual(actual_result, { - 'mimetype': _mimetype.encode('utf-8'), - 'encoding': _encoding.encode('utf-8'), + 'mimetype': _mimetype, + 'encoding': _encoding }) class MimetypeTestIndexer(ContentMimetypeIndexer): """Specific mimetype indexer instance whose configuration is enough to satisfy the indexing tests. """ def prepare(self): self.config = { 'tools': { 'name': 'file', 'version': '1:5.30-1+deb9u1', 'configuration': { "type": "library", "debian-package": "python3-magic" }, }, } self.idx_storage = BasicMockIndexerStorage() self.log = logging.getLogger('swh.indexer') self.objstorage = MockObjStorage() self.tools = self.register_tools(self.config['tools']) self.tool = self.tools[0] class TestMimetypeIndexer(CommonContentIndexerTest, unittest.TestCase): """Mimetype indexer test scenarios: - Known sha1s in the input list have their data indexed - Unknown sha1 in the input list are not indexed """ def setUp(self): self.indexer = MimetypeTestIndexer() self.id0 = '01c9379dfc33803963d07c1ccc748d3fe4c96bb5' self.id1 = '688a5ef812c53907562fe379d4b3851e69c7cb15' self.id2 = 'da39a3ee5e6b4b0d3255bfef95601890afd80709' tool_id = self.indexer.tool['id'] self.expected_results = { self.id0: { 'id': self.id0, 'indexer_configuration_id': tool_id, - 'mimetype': b'text/plain', - 'encoding': b'us-ascii', + 'mimetype': 'text/plain', + 'encoding': 'us-ascii', }, self.id1: { 'id': self.id1, 'indexer_configuration_id': tool_id, - 'mimetype': b'text/plain', - 'encoding': b'us-ascii', + 'mimetype': 'text/plain', + 'encoding': 'us-ascii', }, self.id2: { 'id': self.id2, 'indexer_configuration_id': tool_id, - 'mimetype': b'application/x-empty', - 'encoding': b'binary', + 'mimetype': 'application/x-empty', + 'encoding': 'binary', } } class MimetypeRangeIndexerTest(MimetypeRangeIndexer): """Specific mimetype whose configuration is enough to satisfy the indexing tests. 
""" def prepare(self): self.config = { 'tools': { 'name': 'file', 'version': '1:5.30-1+deb9u1', 'configuration': { "type": "library", "debian-package": "python3-magic" }, }, 'write_batch_size': 100, } self.idx_storage = BasicMockIndexerStorage() self.log = logging.getLogger('swh.indexer') # this hardcodes some contents, will use this to setup the storage self.objstorage = MockObjStorage() # sync objstorage and storage contents = [{'sha1': c_id} for c_id in self.objstorage] self.storage = BasicMockStorage(contents) self.tools = self.register_tools(self.config['tools']) self.tool = self.tools[0] class TestMimetypeRangeIndexer( CommonContentIndexerRangeTest, unittest.TestCase): """Range Mimetype Indexer tests. - new data within range are indexed - no data outside a range are indexed - with filtering existing indexed data prior to compute new index - without filtering existing indexed data prior to compute new index """ def setUp(self): self.indexer = MimetypeRangeIndexerTest() # will play along with the objstorage's mocked contents for now self.contents = sorted(self.indexer.objstorage) # FIXME: leverage swh.objstorage.in_memory_storage's # InMemoryObjStorage, swh.storage.tests's gen_contents, and # hypothesis to generate data to actually run indexer on those self.id0 = '01c9379dfc33803963d07c1ccc748d3fe4c96bb5' self.id1 = '02fb2c89e14f7fab46701478c83779c7beb7b069' self.id2 = '103bc087db1d26afc3a0283f38663d081e9b01e6' tool_id = self.indexer.tool['id'] self.expected_results = { self.id0: { - 'encoding': b'us-ascii', + 'encoding': 'us-ascii', 'id': self.id0, 'indexer_configuration_id': tool_id, - 'mimetype': b'text/plain'}, + 'mimetype': 'text/plain'}, self.id1: { - 'encoding': b'us-ascii', + 'encoding': 'us-ascii', 'id': self.id1, 'indexer_configuration_id': tool_id, - 'mimetype': b'text/x-python'}, + 'mimetype': 'text/x-python'}, self.id2: { - 'encoding': b'us-ascii', + 'encoding': 'us-ascii', 'id': self.id2, 'indexer_configuration_id': tool_id, - 'mimetype': b'text/plain'} + 'mimetype': 'text/plain'} } class MimetypeIndexerUnknownToolTestStorage( CommonIndexerNoTool, MimetypeTestIndexer): """Mimetype indexer with wrong configuration""" class MimetypeRangeIndexerUnknownToolTestStorage( CommonIndexerNoTool, MimetypeRangeIndexerTest): """Mimetype range indexer with wrong configuration""" class TestMimetypeIndexersErrors( CommonIndexerWithErrorsTest, unittest.TestCase): """Test the indexer raise the right errors when wrongly initialized""" Indexer = MimetypeIndexerUnknownToolTestStorage RangeIndexer = MimetypeRangeIndexerUnknownToolTestStorage