diff --git a/swh/web/api/views/content.py b/swh/web/api/views/content.py
index c327303d..661cc103 100644
--- a/swh/web/api/views/content.py
+++ b/swh/web/api/views/content.py
@@ -1,379 +1,381 @@
# Copyright (C) 2015-2018  The Software Heritage developers
# See the AUTHORS file at the top-level directory of this distribution
# License: GNU Affero General Public License version 3, or any later version
# See top-level LICENSE file for more information

import functools

from django.http import HttpResponse

from swh.web.common import service
from swh.web.common.utils import reverse
from swh.web.common.exc import NotFoundExc
from swh.web.api.apidoc import api_doc
from swh.web.api import utils
from swh.web.api.apiurls import api_route
from swh.web.api.views.utils import api_lookup


@api_route(r'/content/(?P<q>[0-9a-z_:]*[0-9a-f]+)/filetype/',
           'api-content-filetype', checksum_args=['q'])
@api_doc('/content/filetype/')
def api_content_filetype(request, q):
    """
    .. http:get:: /api/1/content/[(hash_type):](hash)/filetype/

        Get information about the detected MIME type of a content object.

        :param string hash_type: optional parameter specifying which hashing
            algorithm has been used to compute the content checksum.
            It can be either ``sha1``, ``sha1_git``, ``sha256`` or
            ``blake2s256``. If that parameter is not provided, it is assumed
            that the hashing algorithm used is ``sha1``.
        :param string hash: hexadecimal representation of the checksum value
            computed with the specified hashing algorithm.

        :>json object content_url: link to
            :http:get:`/api/1/content/[(hash_type):](hash)/` for getting
            information about the content
        :>json string encoding: the detected content encoding
        :>json string id: the **sha1** identifier of the content
        :>json string mimetype: the detected MIME type of the content
        :>json object tool: information about the tool used to detect the
            content filetype

        :reqheader Accept: the requested response content type,
            either ``application/json`` (default) or ``application/yaml``
        :resheader Content-Type: this depends on :http:header:`Accept`
            header of request

        **Allowed HTTP Methods:** :http:method:`get`, :http:method:`head`,
        :http:method:`options`

        :statuscode 200: no error
        :statuscode 400: an invalid **hash_type** or **hash** has been
            provided
        :statuscode 404: requested content can not be found in the archive

        **Example:**

        .. parsed-literal::

            :swh_web_api:`content/sha1:dc2830a9e72f23c1dfebef4413003221baa5fb62/filetype/`
    """ # noqa
    return api_lookup(
        service.lookup_content_filetype, q,
        notfound_msg='No filetype information found for content {}.'.format(q),
        enrich_fn=utils.enrich_metadata_endpoint)
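Note (illustration, not part of the patch): the ``sha1`` and ``sha1_git``
hash types accepted above differ in that ``sha1_git`` is the checksum git
assigns to a blob, i.e. it covers a small header plus the raw bytes. A
dependency-free sketch:

    import hashlib

    def sha1_git(data):
        # git hashes a blob as: b"blob <size>\0" + data
        h = hashlib.sha1()
        h.update(b'blob %d\x00' % len(data))
        h.update(data)
        return h.hexdigest()

    data = b'hello\n'
    print(hashlib.sha1(data).hexdigest())  # plain sha1 of the bytes
    print(sha1_git(data))                  # matches `git hash-object`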
@api_route(r'/content/(?P<q>[0-9a-z_:]*[0-9a-f]+)/language/',
           'api-content-language', checksum_args=['q'])
@api_doc('/content/language/')
def api_content_language(request, q):
    """
    .. http:get:: /api/1/content/[(hash_type):](hash)/language/

        Get information about the programming language used in a content
        object.

+       Note: this endpoint currently returns no data.
+
        :param string hash_type: optional parameter specifying which hashing
            algorithm has been used to compute the content checksum.
            It can be either ``sha1``, ``sha1_git``, ``sha256`` or
            ``blake2s256``. If that parameter is not provided, it is assumed
            that the hashing algorithm used is ``sha1``.
        :param string hash: hexadecimal representation of the checksum value
            computed with the specified hashing algorithm.

        :>json object content_url: link to
            :http:get:`/api/1/content/[(hash_type):](hash)/` for getting
            information about the content
        :>json string id: the **sha1** identifier of the content
        :>json string lang: the detected programming language if any
        :>json object tool: information about the tool used to detect the
            programming language

        :reqheader Accept: the requested response content type,
            either ``application/json`` (default) or ``application/yaml``
        :resheader Content-Type: this depends on :http:header:`Accept`
            header of request

        **Allowed HTTP Methods:** :http:method:`get`, :http:method:`head`,
        :http:method:`options`

        :statuscode 200: no error
        :statuscode 400: an invalid **hash_type** or **hash** has been
            provided
        :statuscode 404: requested content can not be found in the archive

        **Example:**

        .. parsed-literal::

            :swh_web_api:`content/sha1:dc2830a9e72f23c1dfebef4413003221baa5fb62/language/`
    """ # noqa
    return api_lookup(
        service.lookup_content_language, q,
        notfound_msg='No language information found for content {}.'.format(q),
        enrich_fn=utils.enrich_metadata_endpoint)


@api_route(r'/content/(?P<q>[0-9a-z_:]*[0-9a-f]+)/license/',
           'api-content-license', checksum_args=['q'])
@api_doc('/content/license/')
def api_content_license(request, q):
    """
    .. http:get:: /api/1/content/[(hash_type):](hash)/license/

        Get information about the license of a content object.

        :param string hash_type: optional parameter specifying which hashing
            algorithm has been used to compute the content checksum.
            It can be either ``sha1``, ``sha1_git``, ``sha256`` or
            ``blake2s256``. If that parameter is not provided, it is assumed
            that the hashing algorithm used is ``sha1``.
        :param string hash: hexadecimal representation of the checksum value
            computed with the specified hashing algorithm.

        :>json object content_url: link to
            :http:get:`/api/1/content/[(hash_type):](hash)/` for getting
            information about the content
        :>json string id: the **sha1** identifier of the content
        :>json array licenses: array of strings containing the detected
            license names if any
        :>json object tool: information about the tool used to detect the
            license

        :reqheader Accept: the requested response content type,
            either ``application/json`` (default) or ``application/yaml``
        :resheader Content-Type: this depends on :http:header:`Accept`
            header of request

        **Allowed HTTP Methods:** :http:method:`get`, :http:method:`head`,
        :http:method:`options`

        :statuscode 200: no error
        :statuscode 400: an invalid **hash_type** or **hash** has been
            provided
        :statuscode 404: requested content can not be found in the archive

        **Example:**

        .. parsed-literal::

            :swh_web_api:`content/sha1:dc2830a9e72f23c1dfebef4413003221baa5fb62/license/`
    """ # noqa
    return api_lookup(
        service.lookup_content_license, q,
        notfound_msg='No license information found for content {}.'.format(q),
        enrich_fn=utils.enrich_metadata_endpoint)
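Note (illustration, not part of the patch): a client-side sketch of calling
the endpoint above with ``requests``; the public instance URL is an
assumption, not something this patch defines:

    import requests

    base = 'https://archive.softwareheritage.org'
    sha1 = 'dc2830a9e72f23c1dfebef4413003221baa5fb62'
    r = requests.get('%s/api/1/content/sha1:%s/license/' % (base, sha1))
    r.raise_for_status()
    print(r.json()['licenses'])  # list of detected license names, if any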
@api_route(r'/content/(?P<q>[0-9a-z_:]*[0-9a-f]+)/ctags/',
           'api-content-ctags')
@api_doc('/content/ctags/', tags=['hidden'])
def api_content_ctags(request, q):
    """
    Get information about all `Ctags <http://ctags.sourceforge.net/>`_-style
    symbols defined in a content object.
    """
    return api_lookup(
        service.lookup_content_ctags, q,
        notfound_msg='No ctags symbol found for content {}.'.format(q),
        enrich_fn=utils.enrich_metadata_endpoint)


@api_route(r'/content/(?P<q>[0-9a-z_:]*[0-9a-f]+)/raw/',
           'api-content-raw', checksum_args=['q'])
@api_doc('/content/raw/', handle_response=True)
def api_content_raw(request, q):
    """
    .. http:get:: /api/1/content/[(hash_type):](hash)/raw/

        Get the raw content of a content object (aka a "blob"), as a byte
        sequence.

        :param string hash_type: optional parameter specifying which hashing
            algorithm has been used to compute the content checksum.
            It can be either ``sha1``, ``sha1_git``, ``sha256`` or
            ``blake2s256``. If that parameter is not provided, it is assumed
            that the hashing algorithm used is ``sha1``.
        :param string hash: hexadecimal representation of the checksum value
            computed with the specified hashing algorithm.
        :query string filename: if provided, the downloaded content will get
            that filename

        :resheader Content-Type: application/octet-stream

        **Allowed HTTP Methods:** :http:method:`get`, :http:method:`head`,
        :http:method:`options`

        :statuscode 200: no error
        :statuscode 400: an invalid **hash_type** or **hash** has been
            provided
        :statuscode 404: requested content can not be found in the archive

        **Example:**

        .. parsed-literal::

            :swh_web_api:`content/sha1:dc2830a9e72f23c1dfebef4413003221baa5fb62/raw/`
    """ # noqa
    def generate(content):
        yield content['data']

    content_raw = service.lookup_content_raw(q)
    if not content_raw:
        raise NotFoundExc('Content %s is not found.' % q)

    filename = request.query_params.get('filename')
    if not filename:
        filename = 'content_%s_raw' % q.replace(':', '_')

    response = HttpResponse(generate(content_raw),
                            content_type='application/octet-stream')
    response['Content-disposition'] = 'attachment; filename=%s' % filename
    return response
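Note (illustration, not part of the patch): a download sketch for the raw
endpoint above, assuming a reachable instance; the ``filename`` query
parameter only changes the Content-disposition header, not the bytes:

    import requests

    base = 'https://archive.softwareheritage.org'
    sha1 = 'dc2830a9e72f23c1dfebef4413003221baa5fb62'
    r = requests.get('%s/api/1/content/sha1:%s/raw/' % (base, sha1),
                     params={'filename': 'example.txt'})
    r.raise_for_status()
    with open('example.txt', 'wb') as f:
        f.write(r.content)  # the blob bytes, served as octet-stream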
@api_route(r'/content/symbol/(?P<q>.+)/', 'api-content-symbol')
@api_doc('/content/symbol/', tags=['hidden'])
def api_content_symbol(request, q=None):
    """Search content objects by `Ctags <http://ctags.sourceforge.net/>`_-style
    symbol (e.g., function name, data type, method, ...).
    """
    result = {}
    last_sha1 = request.query_params.get('last_sha1', None)
    per_page = int(request.query_params.get('per_page', '10'))

    def lookup_exp(exp, last_sha1=last_sha1, per_page=per_page):
        exp = list(service.lookup_expression(exp, last_sha1, per_page))
        return exp if exp else None

    symbols = api_lookup(
        lookup_exp, q,
        notfound_msg="No indexed raw content match expression '{}'.".format(q),
        enrich_fn=functools.partial(utils.enrich_content, top_url=True))

    if symbols:
        nb_symbols = len(symbols)

        if nb_symbols == per_page:
            query_params = {}
            new_last_sha1 = symbols[-1]['sha1']
            query_params['last_sha1'] = new_last_sha1
            if request.query_params.get('per_page'):
                query_params['per_page'] = per_page

            result['headers'] = {
                'link-next': reverse('api-content-symbol',
                                     url_args={'q': q},
                                     query_params=query_params)
            }

    result.update({
        'results': symbols
    })

    return result


@api_route(r'/content/known/search/', 'api-content-known', methods=['POST'])
@api_route(r'/content/known/(?P<q>(?!search).*)/', 'api-content-known')
@api_doc('/content/known/', tags=['hidden'])
def api_check_content_known(request, q=None):
    """
    .. http:get:: /api/1/content/known/(sha1)[,(sha1), ...,(sha1)]/

        Check whether some content(s) (aka "blob(s)") is present in the
        archive based on its **sha1** checksum.

        :param string sha1: hexadecimal representation of the **sha1**
            checksum value for the content to check existence. Multiple values
            can be provided separated by ','.

        :reqheader Accept: the requested response content type,
            either ``application/json`` (default) or ``application/yaml``
        :resheader Content-Type: this depends on :http:header:`Accept`
            header of request

        :>json array search_res: array holding the search result for each
            provided **sha1**
        :>json object search_stats: some statistics regarding the number of
            **sha1** provided and the percentage of those found in the archive

        **Allowed HTTP Methods:** :http:method:`get`, :http:method:`head`,
        :http:method:`options`

        :statuscode 200: no error
        :statuscode 400: an invalid **sha1** has been provided

        **Example:**

        .. parsed-literal::

            :swh_web_api:`content/known/dc2830a9e72f23c1dfebef4413003221baa5fb62,0c3f19cb47ebfbe643fb19fa94c874d18fa62d12/`
    """ # noqa
    response = {'search_res': None,
                'search_stats': None}
    search_stats = {'nbfiles': 0, 'pct': 0}
    search_res = None

    queries = []
    # GET: Many hash separated values request
    if q:
        hashes = q.split(',')
        for v in hashes:
            queries.append({'filename': None, 'sha1': v})

    # POST: Many hash requests in post form submission
    elif request.method == 'POST':
        data = request.data
        # Remove potential inputs with no associated value
        for k, v in data.items():
            if v is not None:
                if k == 'q' and len(v) > 0:
                    queries.append({'filename': None, 'sha1': v})
                elif v != '':
                    queries.append({'filename': k, 'sha1': v})

    if queries:
        lookup = service.lookup_multiple_hashes(queries)
        result = []
        nb_queries = len(queries)
        for el in lookup:
            res_d = {'sha1': el['sha1'],
                     'found': el['found']}
            if 'filename' in el and el['filename']:
                res_d['filename'] = el['filename']
            result.append(res_d)
        search_res = result
        nbfound = len([x for x in lookup if x['found']])
        search_stats['nbfiles'] = nb_queries
        search_stats['pct'] = (nbfound / nb_queries) * 100

    response['search_res'] = search_res
    response['search_stats'] = search_stats
    return response
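Note (illustration, not part of the patch): sketch of the POST form handled
above; per the request-parsing code, each form field name is used as a
filename (``q`` being the anonymous case) and its value as a sha1 to check.
Instance URL assumed:

    import requests

    base = 'https://archive.softwareheritage.org'
    r = requests.post(
        '%s/api/1/content/known/search/' % base,
        data={'file1.c': 'dc2830a9e72f23c1dfebef4413003221baa5fb62',
              'file2.c': '0c3f19cb47ebfbe643fb19fa94c874d18fa62d12'})
    resp = r.json()
    print(resp['search_stats'])  # e.g. {'nbfiles': 2, 'pct': 100.0}
    for res in resp['search_res']:
        print(res['filename'], res['found'])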
@api_route(r'/content/(?P<q>[0-9a-z_:]*[0-9a-f]+)/', 'api-content',
           checksum_args=['q'])
@api_doc('/content/')
def api_content_metadata(request, q):
    """
    .. http:get:: /api/1/content/[(hash_type):](hash)/

        Get information about a content (aka a "blob") object.
        In the archive, a content object is identified based on checksum
        values computed using various hashing algorithms.

        :param string hash_type: optional parameter specifying which hashing
            algorithm has been used to compute the content checksum.
            It can be either ``sha1``, ``sha1_git``, ``sha256`` or
            ``blake2s256``. If that parameter is not provided, it is assumed
            that the hashing algorithm used is ``sha1``.
        :param string hash: hexadecimal representation of the checksum value
            computed with the specified hashing algorithm.

        :reqheader Accept: the requested response content type,
            either ``application/json`` (default) or ``application/yaml``
        :resheader Content-Type: this depends on :http:header:`Accept`
            header of request

        :>json object checksums: object holding the computed checksum values
            for the requested content
        :>json string data_url: link to
            :http:get:`/api/1/content/[(hash_type):](hash)/raw/`
            for downloading the content raw bytes
        :>json string filetype_url: link to
            :http:get:`/api/1/content/[(hash_type):](hash)/filetype/`
            for getting information about the content MIME type
        :>json string language_url: link to
            :http:get:`/api/1/content/[(hash_type):](hash)/language/`
            for getting information about the programming language used in
            the content
        :>json number length: length of the content in bytes
        :>json string license_url: link to
            :http:get:`/api/1/content/[(hash_type):](hash)/license/`
            for getting information about the license of the content

        **Allowed HTTP Methods:** :http:method:`get`, :http:method:`head`,
        :http:method:`options`

        :statuscode 200: no error
        :statuscode 400: an invalid **hash_type** or **hash** has been
            provided
        :statuscode 404: requested content can not be found in the archive

        **Example:**

        .. parsed-literal::

            curl -i :swh_web_api:`content/sha1_git:fe95a46679d128ff167b7c55df5d02356c5a1ae1/`
    """ # noqa
    return api_lookup(
        service.lookup_content, q,
        notfound_msg='Content with {} not found.'.format(q),
        enrich_fn=functools.partial(utils.enrich_content, query_string=q))
diff --git a/swh/web/tests/api/views/test_content.py b/swh/web/tests/api/views/test_content.py
index ae402069..778b62c0 100644
--- a/swh/web/tests/api/views/test_content.py
+++ b/swh/web/tests/api/views/test_content.py
@@ -1,388 +1,389 @@
# Copyright (C) 2015-2018  The Software Heritage developers
# See the AUTHORS file at the top-level directory of this distribution
# License: GNU Affero General Public License version 3, or any later version
# See top-level LICENSE file for more information

import pytest

from hypothesis import given
from rest_framework.test import APITestCase

from swh.web.common.utils import reverse
from swh.web.tests.strategies import (
    content, unknown_content, contents_with_ctags
)
from swh.web.tests.testcase import (
    WebTestCase, ctags_json_missing, fossology_missing
)


class ContentApiTestCase(WebTestCase, APITestCase):

    @given(content())
    def test_api_content_filetype(self, content):
        self.content_add_mimetype(content['sha1'])
        url = reverse('api-content-filetype',
                      url_args={'q': 'sha1_git:%s' % content['sha1_git']})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 200)
        self.assertEqual(rv['Content-Type'], 'application/json')
        content_url = reverse('api-content',
                              url_args={'q': 'sha1:%s' % content['sha1']})
        expected_data = self.content_get_mimetype(content['sha1'])
        expected_data['content_url'] = content_url
        self.assertEqual(rv.data, expected_data)

    @given(unknown_content())
    def test_api_content_filetype_sha_not_found(self, unknown_content):
        url = reverse('api-content-filetype',
                      url_args={'q': 'sha1:%s' % unknown_content['sha1']})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 404)
        self.assertEqual(rv['Content-Type'], 'application/json')
        self.assertEqual(rv.data, {
            'exception': 'NotFoundExc',
            'reason': 'No filetype information found for content '
                      'sha1:%s.' % unknown_content['sha1']
        })
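Note (illustration, not part of the patch): the ``content()`` /
``unknown_content()`` strategies are imported from swh.web.tests.strategies,
which is not shown in this diff; conceptually they sample checksum dicts for
objects loaded into the in-memory test archive. A hypothetical stand-in with
the same shape:

    from hypothesis import strategies as st

    def content():
        # Stand-in only: the real strategy draws from the loaded test data
        # (see swh/web/tests/data.py later in this patch).
        known = [{'sha1': 'dc2830a9e72f23c1dfebef4413003221baa5fb62',
                  'sha1_git': 'fe95a46679d128ff167b7c55df5d02356c5a1ae1'}]
        return st.sampled_from(known)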
+   @pytest.mark.xfail  # Language indexer is disabled
    @given(content())
    def test_api_content_language(self, content):
        self.content_add_language(content['sha1'])
        url = reverse('api-content-language',
                      url_args={'q': 'sha1_git:%s' % content['sha1_git']})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 200)
        self.assertEqual(rv['Content-Type'], 'application/json')
        content_url = reverse('api-content',
                              url_args={'q': 'sha1:%s' % content['sha1']})
        expected_data = self.content_get_language(content['sha1'])
        expected_data['content_url'] = content_url
        self.assertEqual(rv.data, expected_data)

    @given(unknown_content())
    def test_api_content_language_sha_not_found(self, unknown_content):
        url = reverse('api-content-language',
                      url_args={'q': 'sha1:%s' % unknown_content['sha1']})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 404)
        self.assertEqual(rv['Content-Type'], 'application/json')
        self.assertEqual(rv.data, {
            'exception': 'NotFoundExc',
            'reason': 'No language information found for content '
                      'sha1:%s.' % unknown_content['sha1']
        })

    @pytest.mark.skipif(ctags_json_missing,
                        reason="requires ctags with json output support")
    @given(contents_with_ctags())
    def test_api_content_symbol(self, contents_with_ctags):
        expected_data = {}
        for content_sha1 in contents_with_ctags['sha1s']:
            self.content_add_ctags(content_sha1)
            for ctag in self.content_get_ctags(content_sha1):
                if ctag['name'] == contents_with_ctags['symbol_name']:
                    expected_data[content_sha1] = ctag
                    break
        url = reverse('api-content-symbol',
                      url_args={'q': contents_with_ctags['symbol_name']},
                      query_params={'per_page': 100})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 200)
        self.assertEqual(rv['Content-Type'], 'application/json')
        for entry in rv.data:
            content_sha1 = entry['sha1']
            expected_entry = expected_data[content_sha1]
            for key, view_name in (('content_url', 'api-content'),
                                   ('data_url', 'api-content-raw'),
                                   ('license_url', 'api-content-license'),
                                   ('language_url', 'api-content-language'),
                                   ('filetype_url', 'api-content-filetype')):
                expected_entry[key] = reverse(view_name,
                                              url_args={'q': 'sha1:%s' %
                                                        content_sha1})
            expected_entry['sha1'] = content_sha1
            del expected_entry['id']
            self.assertEqual(entry, expected_entry)
        self.assertFalse('Link' in rv)

        url = reverse('api-content-symbol',
                      url_args={'q': contents_with_ctags['symbol_name']},
                      query_params={'per_page': 2})

        rv = self.client.get(url)

        next_url = reverse('api-content-symbol',
                           url_args={'q': contents_with_ctags['symbol_name']},
                           query_params={'last_sha1': rv.data[1]['sha1'],
                                         'per_page': 2})

        self.assertEqual(rv['Link'], '<%s>; rel="next"' % next_url)

    def test_api_content_symbol_not_found(self):
        url = reverse('api-content-symbol', url_args={'q': 'bar'})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 404)
        self.assertEqual(rv['Content-Type'], 'application/json')
        self.assertEqual(rv.data, {
            'exception': 'NotFoundExc',
            'reason': 'No indexed raw content match expression \'bar\'.'
        })
        self.assertFalse('Link' in rv)
    @pytest.mark.skipif(ctags_json_missing,
                        reason="requires ctags with json output support")
    @given(content())
    def test_api_content_ctags(self, content):
        self.content_add_ctags(content['sha1'])
        url = reverse('api-content-ctags',
                      url_args={'q': 'sha1_git:%s' % content['sha1_git']})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 200)
        self.assertEqual(rv['Content-Type'], 'application/json')
        content_url = reverse('api-content',
                              url_args={'q': 'sha1:%s' % content['sha1']})
        expected_data = list(self.content_get_ctags(content['sha1']))
        for e in expected_data:
            e['content_url'] = content_url
        self.assertEqual(rv.data, expected_data)

    @pytest.mark.skipif(fossology_missing,
                        reason="requires fossology-nomossa installed")
    @given(content())
    def test_api_content_license(self, content):
        self.content_add_license(content['sha1'])
        url = reverse('api-content-license',
                      url_args={'q': 'sha1_git:%s' % content['sha1_git']})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 200)
        self.assertEqual(rv['Content-Type'], 'application/json')
        content_url = reverse('api-content',
                              url_args={'q': 'sha1:%s' % content['sha1']})
        expected_data = self.content_get_license(content['sha1'])
        expected_data['content_url'] = content_url
        self.assertEqual(rv.data, expected_data)

    @given(unknown_content())
    def test_api_content_license_sha_not_found(self, unknown_content):
        url = reverse('api-content-license',
                      url_args={'q': 'sha1:%s' % unknown_content['sha1']})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 404)
        self.assertEqual(rv['Content-Type'], 'application/json')
        self.assertEqual(rv.data, {
            'exception': 'NotFoundExc',
            'reason': 'No license information found for content '
                      'sha1:%s.' % unknown_content['sha1']
        })

    @given(content())
    def test_api_content_metadata(self, content):
        url = reverse('api-content', {'q': 'sha1:%s' % content['sha1']})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 200)
        self.assertEqual(rv['Content-Type'], 'application/json')
        expected_data = self.content_get_metadata(content['sha1'])
        for key, view_name in (('data_url', 'api-content-raw'),
                               ('license_url', 'api-content-license'),
                               ('language_url', 'api-content-language'),
                               ('filetype_url', 'api-content-filetype')):
            expected_data[key] = reverse(view_name,
                                         url_args={'q': 'sha1:%s' %
                                                   content['sha1']})
        self.assertEqual(rv.data, expected_data)

    @given(unknown_content())
    def test_api_content_not_found_as_json(self, unknown_content):
        url = reverse('api-content',
                      url_args={'q': 'sha1:%s' % unknown_content['sha1']})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 404)
        self.assertEqual(rv['Content-Type'], 'application/json')
        self.assertEqual(rv.data, {
            'exception': 'NotFoundExc',
            'reason': 'Content with sha1 checksum equals to %s not found!'
                      % unknown_content['sha1']
        })

    @given(unknown_content())
    def test_api_content_not_found_as_yaml(self, unknown_content):
        url = reverse('api-content',
                      url_args={'q': 'sha256:%s' % unknown_content['sha256']})

        rv = self.client.get(url, HTTP_ACCEPT='application/yaml')

        self.assertEqual(rv.status_code, 404)
        self.assertTrue('application/yaml' in rv['Content-Type'])
        self.assertEqual(rv.data, {
            'exception': 'NotFoundExc',
            'reason': 'Content with sha256 checksum equals to %s not found!'
                      % unknown_content['sha256']
        })
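Note (illustration, not part of the patch): the YAML assertions above rely
on plain HTTP content negotiation, observable with any client (instance URL
assumed):

    import requests

    base = 'https://archive.softwareheritage.org'
    sha1 = 'dc2830a9e72f23c1dfebef4413003221baa5fb62'
    r = requests.get('%s/api/1/content/sha1:%s/' % (base, sha1),
                     headers={'Accept': 'application/yaml'})
    print(r.headers['Content-Type'])  # contains 'application/yaml'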
    @given(unknown_content())
    def test_api_content_raw_ko_not_found(self, unknown_content):
        url = reverse('api-content-raw',
                      url_args={'q': 'sha1:%s' % unknown_content['sha1']})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 404)
        self.assertEqual(rv['Content-Type'], 'application/json')
        self.assertEqual(rv.data, {
            'exception': 'NotFoundExc',
            'reason': 'Content with sha1 checksum equals to %s not found!'
                      % unknown_content['sha1']
        })

    @given(content())
    def test_api_content_raw_text(self, content):
        url = reverse('api-content-raw',
                      url_args={'q': 'sha1:%s' % content['sha1']})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 200)
        self.assertEqual(rv['Content-Type'], 'application/octet-stream')
        self.assertEqual(
            rv['Content-disposition'],
            'attachment; filename=content_sha1_%s_raw' % content['sha1'])
        self.assertEqual(
            rv['Content-Type'], 'application/octet-stream')
        expected_data = self.content_get(content['sha1'])
        self.assertEqual(rv.content, expected_data['data'])

    @given(content())
    def test_api_content_raw_text_with_filename(self, content):
        url = reverse('api-content-raw',
                      url_args={'q': 'sha1:%s' % content['sha1']},
                      query_params={'filename': 'filename.txt'})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 200)
        self.assertEqual(rv['Content-Type'], 'application/octet-stream')
        self.assertEqual(
            rv['Content-disposition'],
            'attachment; filename=filename.txt')
        self.assertEqual(
            rv['Content-Type'], 'application/octet-stream')
        expected_data = self.content_get(content['sha1'])
        self.assertEqual(rv.content, expected_data['data'])

    @given(content())
    def test_api_check_content_known(self, content):
        url = reverse('api-content-known', url_args={'q': content['sha1']})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 200)
        self.assertEqual(rv['Content-Type'], 'application/json')
        self.assertEqual(rv.data, {
            'search_res': [
                {
                    'found': True,
                    'sha1': content['sha1']
                }
            ],
            'search_stats': {'nbfiles': 1, 'pct': 100.0}
        })

    @given(content())
    def test_api_check_content_known_as_yaml(self, content):
        url = reverse('api-content-known', url_args={'q': content['sha1']})

        rv = self.client.get(url, HTTP_ACCEPT='application/yaml')

        self.assertEqual(rv.status_code, 200)
        self.assertEqual(rv['Content-Type'], 'application/yaml')
        self.assertEqual(rv.data, {
            'search_res': [
                {
                    'found': True,
                    'sha1': content['sha1']
                }
            ],
            'search_stats': {'nbfiles': 1, 'pct': 100.0}
        })

    @given(content())
    def test_api_check_content_known_post_as_yaml(self, content):
        url = reverse('api-content-known')

        rv = self.client.post(
            url,
            data={
                'q': content['sha1']
            },
            HTTP_ACCEPT='application/yaml'
        )

        self.assertEqual(rv.status_code, 200)
        self.assertTrue('application/yaml' in rv['Content-Type'])
        self.assertEqual(rv.data, {
            'search_res': [
                {
                    'found': True,
                    'sha1': content['sha1']
                }
            ],
            'search_stats': {'nbfiles': 1, 'pct': 100.0}
        })

    @given(unknown_content())
    def test_api_check_content_known_not_found(self, unknown_content):
        url = reverse('api-content-known',
                      url_args={'q': unknown_content['sha1']})

        rv = self.client.get(url)

        self.assertEqual(rv.status_code, 200)
        self.assertEqual(rv['Content-Type'], 'application/json')
        self.assertEqual(rv.data, {
            'search_res': [
                {
                    'found': False,
                    'sha1': unknown_content['sha1']
                }
            ],
            'search_stats': {'nbfiles': 1, 'pct': 0.0}
        })

    @given(content())
    def test_api_content_uppercase(self, content):
        url = reverse('api-content-uppercase-checksum',
                      url_args={'q': content['sha1'].upper()})

        resp = self.client.get(url)
        self.assertEqual(resp.status_code, 302)

        redirect_url = reverse('api-content',
                               url_args={'q': content['sha1']})

        self.assertEqual(resp['location'], redirect_url)
diff --git a/swh/web/tests/common/test_service.py b/swh/web/tests/common/test_service.py
index d0ad0b8f..3a5eb0be 100644
--- a/swh/web/tests/common/test_service.py
+++ b/swh/web/tests/common/test_service.py
@@ -1,820 +1,821 @@
# Copyright (C) 2015-2019  The Software Heritage developers
# See the AUTHORS file at the top-level directory of this distribution
# License: GNU Affero General Public License version 3, or any later version
# See top-level LICENSE file for more information

import itertools
import pytest
import random

from collections import defaultdict

from hypothesis import given

from swh.model.hashutil import hash_to_bytes, hash_to_hex
from swh.web.common import service
from swh.web.common.exc import BadInputExc, NotFoundExc
from swh.web.tests.strategies import (
    content, contents, unknown_content, unknown_contents,
    contents_with_ctags, origin, new_origin, visit_dates, directory,
    release, revision, unknown_revision, revisions, unknown_revisions,
    ancestor_revisions, non_ancestor_revisions, invalid_sha1, sha256,
    revision_with_submodules, unknown_directory, empty_directory,
    new_revision, new_origins
)
from swh.web.tests.testcase import (
    WebTestCase, ctags_json_missing, fossology_missing
)


class ServiceTestCase(WebTestCase):

    @given(contents())
    def test_lookup_multiple_hashes_all_present(self, contents):
        input_data = []
        expected_output = []
        for cnt in contents:
            input_data.append({'sha1': cnt['sha1']})
            expected_output.append({'sha1': cnt['sha1'],
                                    'found': True})

        self.assertEqual(service.lookup_multiple_hashes(input_data),
                         expected_output)

    @given(contents(), unknown_contents())
    def test_lookup_multiple_hashes_some_missing(self, contents,
                                                 unknown_contents):
        input_contents = list(itertools.chain(contents, unknown_contents))
        random.shuffle(input_contents)

        input_data = []
        expected_output = []
        for cnt in input_contents:
            input_data.append({'sha1': cnt['sha1']})
            expected_output.append({'sha1': cnt['sha1'],
                                    'found': cnt in contents})

        self.assertEqual(service.lookup_multiple_hashes(input_data),
                         expected_output)

    @given(unknown_content())
    def test_lookup_hash_does_not_exist(self, unknown_content):
        actual_lookup = service.lookup_hash('sha1_git:%s' %
                                            unknown_content['sha1_git'])
        self.assertEqual(actual_lookup, {'found': None,
                                         'algo': 'sha1_git'})

    @given(content())
    def test_lookup_hash_exist(self, content):
        actual_lookup = service.lookup_hash('sha1:%s' % content['sha1'])
        content_metadata = self.content_get_metadata(content['sha1'])
        self.assertEqual({'found': content_metadata,
                          'algo': 'sha1'}, actual_lookup)

    @given(unknown_content())
    def test_search_hash_does_not_exist(self, content):
        actual_lookup = service.search_hash('sha1_git:%s' %
                                            content['sha1_git'])
        self.assertEqual({'found': False}, actual_lookup)

    @given(content())
    def test_search_hash_exist(self, content):
        actual_lookup = service.search_hash('sha1:%s' % content['sha1'])
        self.assertEqual({'found': True}, actual_lookup)

    @pytest.mark.skipif(ctags_json_missing,
                        reason="requires ctags with json output support")
    @given(contents_with_ctags())
    def test_lookup_content_ctags(self, contents_with_ctags):
        content_sha1 = random.choice(contents_with_ctags['sha1s'])
        self.content_add_ctags(content_sha1)
        actual_ctags = \
            list(service.lookup_content_ctags('sha1:%s' % content_sha1))

        expected_data = list(self.content_get_ctags(content_sha1))
        for ctag in expected_data:
            ctag['id'] = content_sha1

        self.assertEqual(actual_ctags, expected_data)
    @given(unknown_content())
    def test_lookup_content_ctags_no_hash(self, unknown_content):
        actual_ctags = \
            list(service.lookup_content_ctags('sha1:%s' %
                                              unknown_content['sha1']))

        self.assertEqual(actual_ctags, [])

    @given(content())
    def test_lookup_content_filetype(self, content):
        self.content_add_mimetype(content['sha1'])
        actual_filetype = service.lookup_content_filetype(content['sha1'])

        expected_filetype = self.content_get_mimetype(content['sha1'])
        self.assertEqual(actual_filetype, expected_filetype)

+   @pytest.mark.xfail  # Language indexer is disabled.
    @given(content())
    def test_lookup_content_language(self, content):
        self.content_add_language(content['sha1'])
        actual_language = service.lookup_content_language(content['sha1'])

        expected_language = self.content_get_language(content['sha1'])
        self.assertEqual(actual_language, expected_language)

    @given(contents_with_ctags())
    def test_lookup_expression(self, contents_with_ctags):
        per_page = 10
        expected_ctags = []

        for content_sha1 in contents_with_ctags['sha1s']:
            if len(expected_ctags) == per_page:
                break
            self.content_add_ctags(content_sha1)
            for ctag in self.content_get_ctags(content_sha1):
                if len(expected_ctags) == per_page:
                    break
                if ctag['name'] == contents_with_ctags['symbol_name']:
                    del ctag['id']
                    ctag['sha1'] = content_sha1
                    expected_ctags.append(ctag)

        actual_ctags = \
            list(service.lookup_expression(contents_with_ctags['symbol_name'],
                                           last_sha1=None, per_page=10))

        self.assertEqual(actual_ctags, expected_ctags)

    def test_lookup_expression_no_result(self):
        expected_ctags = []

        actual_ctags = \
            list(service.lookup_expression('barfoo', last_sha1=None,
                                           per_page=10))
        self.assertEqual(actual_ctags, expected_ctags)

    @pytest.mark.skipif(fossology_missing,
                        reason="requires fossology-nomossa installed")
    @given(content())
    def test_lookup_content_license(self, content):
        self.content_add_license(content['sha1'])
        actual_license = service.lookup_content_license(content['sha1'])

        expected_license = self.content_get_license(content['sha1'])
        self.assertEqual(actual_license, expected_license)

    def test_stat_counters(self):
        actual_stats = service.stat_counters()
        self.assertEqual(actual_stats, self.storage.stat_counters())

    @given(new_origin(), visit_dates())
    def test_lookup_origin_visits(self, new_origin, visit_dates):
        origin_id = self.storage.origin_add_one(new_origin)
        for ts in visit_dates:
            self.storage.origin_visit_add(origin_id, ts)

        actual_origin_visits = list(
            service.lookup_origin_visits(origin_id, per_page=100))

        expected_visits = self.origin_visit_get(origin_id)

        self.assertEqual(actual_origin_visits, expected_visits)

    @given(new_origin(), visit_dates())
    def test_lookup_origin_visit(self, new_origin, visit_dates):
        origin_id = self.storage.origin_add_one(new_origin)
        visits = []
        for ts in visit_dates:
            visits.append(self.storage.origin_visit_add(origin_id, ts))

        visit = random.choice(visits)['visit']
        actual_origin_visit = service.lookup_origin_visit(origin_id, visit)

        expected_visit = dict(self.storage.origin_visit_get_by(origin_id,
                                                               visit))
        expected_visit['date'] = expected_visit['date'].isoformat()
        expected_visit['metadata'] = {}

        self.assertEqual(actual_origin_visit, expected_visit)

    @given(new_origin())
    def test_lookup_origin(self, new_origin):
        origin_id = self.storage.origin_add_one(new_origin)

        actual_origin = service.lookup_origin({'id': origin_id})
        expected_origin = self.storage.origin_get({'id': origin_id})
        self.assertEqual(actual_origin, expected_origin)

        actual_origin = service.lookup_origin({'type': new_origin['type'],
                                               'url': new_origin['url']})
        expected_origin = self.storage.origin_get({'type': new_origin['type'],
                                                   'url': new_origin['url']})
        self.assertEqual(actual_origin, expected_origin)
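Note (illustration, not part of the patch): the service layer exercised by
these tests reads whatever storage swh-web is configured with (the suite
swaps in an in-memory one via WebTestCase). A sketch of a direct call,
assuming a configured backend:

    from swh.web.common import service

    res = service.lookup_hash(
        'sha1:dc2830a9e72f23c1dfebef4413003221baa5fb62')
    print(res['algo'])               # 'sha1'
    print(res['found'] is not None)  # True iff the content is archived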
    @given(invalid_sha1())
    def test_lookup_release_ko_id_checksum_not_a_sha1(self, invalid_sha1):
        with self.assertRaises(BadInputExc) as cm:
            service.lookup_release(invalid_sha1)
        self.assertIn('invalid checksum', cm.exception.args[0].lower())

    @given(sha256())
    def test_lookup_release_ko_id_checksum_too_long(self, sha256):
        with self.assertRaises(BadInputExc) as cm:
            service.lookup_release(sha256)
        self.assertEqual('Only sha1_git is supported.', cm.exception.args[0])

    @given(directory())
    def test_lookup_directory_with_path_not_found(self, directory):
        path = 'some/invalid/path/here'
        with self.assertRaises(NotFoundExc) as cm:
            service.lookup_directory_with_path(directory, path)
        self.assertEqual('Directory entry with path %s from %s '
                         'not found' % (path, directory),
                         cm.exception.args[0])

    @given(directory())
    def test_lookup_directory_with_path_found(self, directory):
        directory_content = self.directory_ls(directory)
        directory_entry = random.choice(directory_content)
        path = directory_entry['name']
        actual_result = service.lookup_directory_with_path(directory, path)
        self.assertEqual(actual_result, directory_entry)

    @given(release())
    def test_lookup_release(self, release):
        actual_release = service.lookup_release(release)

        self.assertEqual(actual_release,
                         self.release_get(release))

    @given(revision(), invalid_sha1(), sha256())
    def test_lookup_revision_with_context_ko_not_a_sha1(self, revision,
                                                        invalid_sha1,
                                                        sha256):
        sha1_git_root = revision
        sha1_git = invalid_sha1

        with self.assertRaises(BadInputExc) as cm:
            service.lookup_revision_with_context(sha1_git_root, sha1_git)
        self.assertIn('Invalid checksum query string', cm.exception.args[0])

        sha1_git = sha256

        with self.assertRaises(BadInputExc) as cm:
            service.lookup_revision_with_context(sha1_git_root, sha1_git)
        self.assertIn('Only sha1_git is supported', cm.exception.args[0])

    @given(revision(), unknown_revision())
    def test_lookup_revision_with_context_ko_sha1_git_does_not_exist(
            self, revision, unknown_revision):
        sha1_git_root = revision
        sha1_git = unknown_revision

        with self.assertRaises(NotFoundExc) as cm:
            service.lookup_revision_with_context(sha1_git_root, sha1_git)
        self.assertIn('Revision %s not found' % sha1_git,
                      cm.exception.args[0])

    @given(revision(), unknown_revision())
    def test_lookup_revision_with_context_ko_root_sha1_git_does_not_exist(
            self, revision, unknown_revision):
        sha1_git_root = unknown_revision
        sha1_git = revision

        with self.assertRaises(NotFoundExc) as cm:
            service.lookup_revision_with_context(sha1_git_root, sha1_git)
        self.assertIn('Revision root %s not found' % sha1_git_root,
                      cm.exception.args[0])

    @given(ancestor_revisions())
    def test_lookup_revision_with_context(self, ancestor_revisions):
        sha1_git = ancestor_revisions['sha1_git']
        root_sha1_git = ancestor_revisions['sha1_git_root']
        for sha1_git_root in (root_sha1_git,
                              {'id': hash_to_bytes(root_sha1_git)}):
            actual_revision = \
                service.lookup_revision_with_context(sha1_git_root, sha1_git)

            children = []
            for rev in self.revision_log(root_sha1_git):
                for p_rev in rev['parents']:
                    p_rev_hex = hash_to_hex(p_rev)
                    if p_rev_hex == sha1_git:
                        children.append(rev['id'])

            expected_revision = self.revision_get(sha1_git)
            expected_revision['children'] = children
            self.assertEqual(actual_revision, expected_revision)

    @given(non_ancestor_revisions())
    def test_lookup_revision_with_context_ko(self, non_ancestor_revisions):
        sha1_git = non_ancestor_revisions['sha1_git']
        root_sha1_git = non_ancestor_revisions['sha1_git_root']

        with self.assertRaises(NotFoundExc) as cm:
            service.lookup_revision_with_context(root_sha1_git, sha1_git)
        self.assertIn('Revision %s is not an ancestor of %s' %
                      (sha1_git, root_sha1_git), cm.exception.args[0])
    @given(unknown_revision())
    def test_lookup_directory_with_revision_not_found(self,
                                                      unknown_revision):
        with self.assertRaises(NotFoundExc) as cm:
            service.lookup_directory_with_revision(unknown_revision)
        self.assertIn('Revision %s not found' % unknown_revision,
                      cm.exception.args[0])

    @given(revision())
    def test_lookup_directory_with_revision_ko_path_to_nowhere(self,
                                                               revision):
        invalid_path = 'path/to/something/unknown'
        with self.assertRaises(NotFoundExc) as cm:
            service.lookup_directory_with_revision(revision, invalid_path)
        exception_text = cm.exception.args[0].lower()
        self.assertIn('directory or file', exception_text)
        self.assertIn(invalid_path, exception_text)
        self.assertIn('revision %s' % revision, exception_text)
        self.assertIn('not found', exception_text)

    @given(revision_with_submodules())
    def test_lookup_directory_with_revision_submodules(
            self, revision_with_submodules):
        rev_sha1_git = revision_with_submodules['rev_sha1_git']
        rev_dir_path = revision_with_submodules['rev_dir_rev_path']

        actual_data = service.lookup_directory_with_revision(
            rev_sha1_git, rev_dir_path)

        revision = self.revision_get(revision_with_submodules['rev_sha1_git'])
        directory = self.directory_ls(revision['directory'])
        rev_entry = next(e for e in directory if e['name'] == rev_dir_path)

        expected_data = {
            'content': self.revision_get(rev_entry['target']),
            'path': rev_dir_path,
            'revision': rev_sha1_git,
            'type': 'rev'
        }

        self.assertEqual(actual_data, expected_data)

    @given(revision())
    def test_lookup_directory_with_revision_without_path(self, revision):
        actual_directory_entries = \
            service.lookup_directory_with_revision(revision)

        revision_data = self.revision_get(revision)
        expected_directory_entries = \
            self.directory_ls(revision_data['directory'])

        self.assertEqual(actual_directory_entries['type'], 'dir')
        self.assertEqual(actual_directory_entries['content'],
                         expected_directory_entries)

    @given(revision())
    def test_lookup_directory_with_revision_with_path(self, revision):
        revision_data = self.revision_get(revision)
        dir_entries = [e for e in self.directory_ls(
                       revision_data['directory'])
                       if e['type'] in ('file', 'dir')]
        expected_dir_entry = random.choice(dir_entries)

        actual_dir_entry = \
            service.lookup_directory_with_revision(revision,
                                                   expected_dir_entry['name'])

        self.assertEqual(actual_dir_entry['type'], expected_dir_entry['type'])
        self.assertEqual(actual_dir_entry['revision'], revision)
        self.assertEqual(actual_dir_entry['path'], expected_dir_entry['name'])
        if actual_dir_entry['type'] == 'file':
            del actual_dir_entry['content']['checksums']['blake2s256']
            for key in ('checksums', 'status', 'length'):
                self.assertEqual(actual_dir_entry['content'][key],
                                 expected_dir_entry[key])
        else:
            sub_dir_entries = self.directory_ls(expected_dir_entry['target'])
            self.assertEqual(actual_dir_entry['content'], sub_dir_entries)

    @given(revision())
    def test_lookup_directory_with_revision_with_path_to_file_and_data(
            self, revision):
        revision_data = self.revision_get(revision)
        dir_entries = [e for e in self.directory_ls(
                       revision_data['directory'])
                       if e['type'] == 'file']
        expected_dir_entry = random.choice(dir_entries)
        expected_data = \
            self.content_get(expected_dir_entry['checksums']['sha1'])

        actual_dir_entry = \
            service.lookup_directory_with_revision(
                revision, expected_dir_entry['name'], with_data=True)

        self.assertEqual(actual_dir_entry['type'], expected_dir_entry['type'])
        self.assertEqual(actual_dir_entry['revision'], revision)
        self.assertEqual(actual_dir_entry['path'], expected_dir_entry['name'])
        del actual_dir_entry['content']['checksums']['blake2s256']
        for key in ('checksums', 'status', 'length'):
            self.assertEqual(actual_dir_entry['content'][key],
                             expected_dir_entry[key])
        self.assertEqual(actual_dir_entry['content']['data'],
                         expected_data['data'])
    @given(revision())
    def test_lookup_revision(self, revision):
        actual_revision = service.lookup_revision(revision)
        self.assertEqual(actual_revision, self.revision_get(revision))

    @given(new_revision())
    def test_lookup_revision_invalid_msg(self, new_revision):
        new_revision['message'] = b'elegant fix for bug \xff'
        self.storage.revision_add([new_revision])

        revision = service.lookup_revision(hash_to_hex(new_revision['id']))
        self.assertEqual(revision['message'], None)
        self.assertEqual(revision['message_decoding_failed'], True)
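Note (illustration, not part of the patch): the test above works because
``\xff`` can never appear in valid UTF-8, so decoding the message raises and
the service falls back to a null message:

    try:
        b'elegant fix for bug \xff'.decode('utf-8')
    except UnicodeDecodeError as e:
        print(e)  # "'utf-8' codec can't decode byte 0xff in position 20..."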
    @given(new_revision())
    def test_lookup_revision_msg_ok(self, new_revision):
        self.storage.revision_add([new_revision])

        revision_message = service.lookup_revision_message(
            hash_to_hex(new_revision['id']))

        self.assertEqual(revision_message,
                         {'message': new_revision['message']})

    @given(new_revision())
    def test_lookup_revision_msg_absent(self, new_revision):
        del new_revision['message']
        self.storage.revision_add([new_revision])

        new_revision_id = hash_to_hex(new_revision['id'])

        with self.assertRaises(NotFoundExc) as cm:
            service.lookup_revision_message(new_revision_id)

        self.assertEqual(
            cm.exception.args[0],
            'No message for revision with sha1_git %s.' % new_revision_id
        )

    @given(unknown_revision())
    def test_lookup_revision_msg_no_rev(self, unknown_revision):
        with self.assertRaises(NotFoundExc) as cm:
            service.lookup_revision_message(unknown_revision)

        self.assertEqual(
            cm.exception.args[0],
            'Revision with sha1_git %s not found.' % unknown_revision
        )

    @given(revisions())
    def test_lookup_revision_multiple(self, revisions):
        actual_revisions = list(service.lookup_revision_multiple(revisions))

        expected_revisions = []
        for rev in revisions:
            expected_revisions.append(self.revision_get(rev))

        self.assertEqual(actual_revisions, expected_revisions)

    @given(unknown_revisions())
    def test_lookup_revision_multiple_none_found(self, unknown_revisions):
        actual_revisions = \
            list(service.lookup_revision_multiple(unknown_revisions))

        self.assertEqual(actual_revisions, [None] * len(unknown_revisions))

    @given(revision())
    def test_lookup_revision_log(self, revision):
        actual_revision_log = \
            list(service.lookup_revision_log(revision, limit=25))

        expected_revision_log = self.revision_log(revision, limit=25)

        self.assertEqual(actual_revision_log, expected_revision_log)

    def _get_origin_branches(self, origin):
        origin_visit = self.origin_visit_get(origin['id'])[-1]
        snapshot = self.snapshot_get(origin_visit['snapshot'])
        branches = {k: v for (k, v) in snapshot['branches'].items()
                    if v['target_type'] == 'revision'}
        return branches

    @given(origin())
    def test_lookup_revision_log_by(self, origin):
        branches = self._get_origin_branches(origin)
        branch_name = random.choice(list(branches.keys()))

        actual_log = \
            list(service.lookup_revision_log_by(origin['id'], branch_name,
                                                None, limit=25))

        expected_log = \
            self.revision_log(branches[branch_name]['target'], limit=25)

        self.assertEqual(actual_log, expected_log)

    @given(origin())
    def test_lookup_revision_log_by_notfound(self, origin):
        with self.assertRaises(NotFoundExc):
            service.lookup_revision_log_by(
                origin['id'], 'unknown_branch_name', None, limit=100)

    @given(unknown_content())
    def test_lookup_content_raw_not_found(self, unknown_content):
        with self.assertRaises(NotFoundExc) as cm:
            service.lookup_content_raw('sha1:' + unknown_content['sha1'])

        self.assertIn(cm.exception.args[0],
                      'Content with %s checksum equals to %s not found!' %
                      ('sha1', unknown_content['sha1']))

    @given(content())
    def test_lookup_content_raw(self, content):
        actual_content = service.lookup_content_raw(
            'sha256:%s' % content['sha256'])

        expected_content = self.content_get(content['sha1'])

        self.assertEqual(actual_content, expected_content)

    @given(unknown_content())
    def test_lookup_content_not_found(self, unknown_content):
        with self.assertRaises(NotFoundExc) as cm:
            service.lookup_content('sha1:%s' % unknown_content['sha1'])

        self.assertIn(cm.exception.args[0],
                      'Content with %s checksum equals to %s not found!' %
                      ('sha1', unknown_content['sha1']))
    @given(content())
    def test_lookup_content_with_sha1(self, content):
        actual_content = service.lookup_content(
            'sha1:%s' % content['sha1'])

        expected_content = self.content_get_metadata(content['sha1'])

        self.assertEqual(actual_content, expected_content)

    @given(content())
    def test_lookup_content_with_sha256(self, content):
        actual_content = service.lookup_content(
            'sha256:%s' % content['sha256'])

        expected_content = self.content_get_metadata(content['sha1'])

        self.assertEqual(actual_content, expected_content)

    @given(revision())
    def test_lookup_person(self, revision):
        rev_data = self.revision_get(revision)
        actual_person = service.lookup_person(rev_data['author']['id'])
        self.assertEqual(actual_person, rev_data['author'])

    def test_lookup_directory_bad_checksum(self):
        with self.assertRaises(BadInputExc):
            service.lookup_directory('directory_id')

    @given(unknown_directory())
    def test_lookup_directory_not_found(self, unknown_directory):
        with self.assertRaises(NotFoundExc) as cm:
            service.lookup_directory(unknown_directory)
        self.assertIn('Directory with sha1_git %s not found'
                      % unknown_directory, cm.exception.args[0])

    @given(directory())
    def test_lookup_directory(self, directory):
        actual_directory_ls = list(service.lookup_directory(
            directory))

        expected_directory_ls = self.directory_ls(directory)

        self.assertEqual(actual_directory_ls, expected_directory_ls)

    @given(empty_directory())
    def test_lookup_directory_empty(self, empty_directory):
        actual_directory_ls = list(service.lookup_directory(empty_directory))

        self.assertEqual(actual_directory_ls, [])

    @given(origin())
    def test_lookup_revision_by_nothing_found(self, origin):
        with self.assertRaises(NotFoundExc):
            service.lookup_revision_by(origin['id'], 'invalid-branch-name')

    @given(origin())
    def test_lookup_revision_by(self, origin):
        branches = self._get_origin_branches(origin)
        branch_name = random.choice(list(branches.keys()))

        actual_revision = \
            service.lookup_revision_by(origin['id'], branch_name, None)

        expected_revision = \
            self.revision_get(branches[branch_name]['target'])

        self.assertEqual(actual_revision, expected_revision)

    @given(origin(), revision())
    def test_lookup_revision_with_context_by_ko(self, origin, revision):
        with self.assertRaises(NotFoundExc):
            service.lookup_revision_with_context_by(origin['id'],
                                                    'invalid-branch-name',
                                                    None, revision)

    @given(origin())
    def test_lookup_revision_with_context_by(self, origin):
        branches = self._get_origin_branches(origin)
        branch_name = random.choice(list(branches.keys()))

        root_rev = branches[branch_name]['target']
        root_rev_log = self.revision_log(root_rev)

        children = defaultdict(list)

        for rev in root_rev_log:
            for rev_p in rev['parents']:
                children[rev_p].append(rev['id'])

        rev = root_rev_log[-1]['id']

        actual_root_rev, actual_rev = service.lookup_revision_with_context_by(
            origin['id'], branch_name, None, rev)

        expected_root_rev = self.revision_get(root_rev)
        expected_rev = self.revision_get(rev)
        expected_rev['children'] = children[rev]

        self.assertEqual(actual_root_rev, expected_root_rev)
        self.assertEqual(actual_rev, expected_rev)

    def test_lookup_revision_through_ko_not_implemented(self):
        with self.assertRaises(NotImplementedError):
            service.lookup_revision_through({
                'something-unknown': 10,
            })
    @given(origin())
    def test_lookup_revision_through_with_context_by(self, origin):
        branches = self._get_origin_branches(origin)
        branch_name = random.choice(list(branches.keys()))

        root_rev = branches[branch_name]['target']
        root_rev_log = self.revision_log(root_rev)
        rev = root_rev_log[-1]['id']

        self.assertEqual(service.lookup_revision_through({
                             'origin_id': origin['id'],
                             'branch_name': branch_name,
                             'ts': None,
                             'sha1_git': rev
                         }),
                         service.lookup_revision_with_context_by(
                             origin['id'], branch_name, None, rev)
                         )

    @given(origin())
    def test_lookup_revision_through_with_revision_by(self, origin):
        branches = self._get_origin_branches(origin)
        branch_name = random.choice(list(branches.keys()))

        self.assertEqual(service.lookup_revision_through({
                             'origin_id': origin['id'],
                             'branch_name': branch_name,
                             'ts': None,
                         }),
                         service.lookup_revision_by(
                             origin['id'], branch_name, None)
                         )

    @given(ancestor_revisions())
    def test_lookup_revision_through_with_context(self, ancestor_revisions):
        sha1_git = ancestor_revisions['sha1_git']
        sha1_git_root = ancestor_revisions['sha1_git_root']

        self.assertEqual(service.lookup_revision_through({
                             'sha1_git_root': sha1_git_root,
                             'sha1_git': sha1_git,
                         }),
                         service.lookup_revision_with_context(
                             sha1_git_root, sha1_git)
                         )

    @given(revision())
    def test_lookup_revision_through_with_revision(self, revision):
        self.assertEqual(service.lookup_revision_through({
                             'sha1_git': revision
                         }),
                         service.lookup_revision(revision)
                         )

    @given(revision())
    def test_lookup_directory_through_revision_ko_not_found(self, revision):
        with self.assertRaises(NotFoundExc):
            service.lookup_directory_through_revision(
                {'sha1_git': revision}, 'some/invalid/path')

    @given(revision())
    def test_lookup_directory_through_revision_ok(self, revision):
        revision_data = self.revision_get(revision)
        dir_entries = [e for e in self.directory_ls(
                       revision_data['directory'])
                       if e['type'] == 'file']
        dir_entry = random.choice(dir_entries)

        self.assertEqual(
            service.lookup_directory_through_revision({'sha1_git': revision},
                                                      dir_entry['name']),
            (revision,
             service.lookup_directory_with_revision(
                 revision, dir_entry['name']))
        )

    @given(revision())
    def test_lookup_directory_through_revision_ok_with_data(self, revision):
        revision_data = self.revision_get(revision)
        dir_entries = [e for e in self.directory_ls(
                       revision_data['directory'])
                       if e['type'] == 'file']
        dir_entry = random.choice(dir_entries)

        self.assertEqual(
            service.lookup_directory_through_revision({'sha1_git': revision},
                                                      dir_entry['name'],
                                                      with_data=True),
            (revision,
             service.lookup_directory_with_revision(
                 revision, dir_entry['name'], with_data=True))
        )

    @given(new_origins(20))
    def test_lookup_origins(self, new_origins):
        nb_origins = len(new_origins)

        expected_origins = self.storage.origin_add(new_origins)

        origin_from_idx = random.randint(1, nb_origins-1) - 1
        origin_from = expected_origins[origin_from_idx]['id']
        max_origin_idx = expected_origins[-1]['id']
        origin_count = random.randint(1, max_origin_idx - origin_from)

        actual_origins = list(service.lookup_origins(origin_from,
                                                     origin_count))

        expected_origins = list(self.storage.origin_get_range(origin_from,
                                                              origin_count))

        self.assertEqual(actual_origins, expected_origins)
diff --git a/swh/web/tests/data.py b/swh/web/tests/data.py
index f54351f9..694c5b0e 100644
--- a/swh/web/tests/data.py
+++ b/swh/web/tests/data.py
@@ -1,304 +1,285 @@
# Copyright (C) 2018-2019  The Software Heritage developers
# See the AUTHORS file at the top-level directory of this distribution
# License: GNU Affero General Public License version 3, or any later version
# See top-level LICENSE file for more information

from copy import deepcopy
import os
import time

-from swh.indexer.language import LanguageIndexer
from swh.indexer.fossology_license import FossologyLicenseIndexer
from swh.indexer.mimetype import MimetypeIndexer
from swh.indexer.ctags import CtagsIndexer
from swh.indexer.storage import get_indexer_storage
from swh.model.hashutil import hash_to_hex, hash_to_bytes, DEFAULT_ALGORITHMS
from swh.model.identifiers import directory_identifier
from swh.loader.git.from_disk import GitLoaderFromArchive
from swh.storage.algos.dir_iterators import dir_iterator
from swh.web.browse.utils import (
    get_mimetype_and_encoding_for_content, prepare_content_for_display
)

# Module used to initialize data that will be provided as tests input

# Configuration for git loader
_TEST_LOADER_CONFIG = {
    'storage': {
        'cls': 'memory',
        'args': {}
    },
    'send_contents': True,
    'send_directories': True,
    'send_revisions': True,
    'send_releases': True,
    'send_snapshot': True,

    'content_size_limit': 100 * 1024 * 1024,
    'content_packet_size': 10,
    'content_packet_size_bytes': 100 * 1024 * 1024,
    'directory_packet_size': 10,
    'revision_packet_size': 10,
    'release_packet_size': 10,

    'save_data': False,
}

# Base content indexer configuration
_TEST_INDEXER_BASE_CONFIG = {
    'storage': {
        'cls': 'memory',
        'args': {},
    },
    'objstorage': {
        'cls': 'memory',
        'args': {},
    },
    'indexer_storage': {
        'cls': 'memory',
        'args': {},
    }
}


# MimetypeIndexer with custom configuration for tests
class _MimetypeIndexer(MimetypeIndexer):
    def parse_config_file(self, *args, **kwargs):
        return {
            **_TEST_INDEXER_BASE_CONFIG,
            'tools': {
                'name': 'file',
                'version': '1:5.30-1+deb9u1',
                'configuration': {
                    "type": "library",
                    "debian-package": "python3-magic"
                }
            }
        }


-# LanguageIndexer with custom configuration for tests
-class _LanguageIndexer(LanguageIndexer):
-    def parse_config_file(self, *args, **kwargs):
-        return {
-            **_TEST_INDEXER_BASE_CONFIG,
-            'tools': {
-                'name': 'pygments',
-                'version': '2.0.1+dfsg-1.1+deb8u1',
-                'configuration': {
-                    'type': 'library',
-                    'debian-package': 'python3-pygments',
-                    'max_content_size': 10240,
-                }
-            }
-        }
-
-
# FossologyLicenseIndexer with custom configuration for tests
class _FossologyLicenseIndexer(FossologyLicenseIndexer):
    def parse_config_file(self, *args, **kwargs):
        return {
            **_TEST_INDEXER_BASE_CONFIG,
            'workdir': '/tmp/swh/indexer.fossology.license',
            'tools': {
                'name': 'nomos',
                'version': '3.1.0rc2-31-ga2cbb8c',
                'configuration': {
                    'command_line': 'nomossa <path/to/file>',
                },
            }
        }


# CtagsIndexer with custom configuration for tests
class _CtagsIndexer(CtagsIndexer):
    def parse_config_file(self, *args, **kwargs):
        return {
            **_TEST_INDEXER_BASE_CONFIG,
            'workdir': '/tmp/swh/indexer.ctags',
            'languages': {'c': 'c'},
            'tools': {
                'name': 'universal-ctags',
                'version': '~git7859817b',
                'configuration': {
                    'command_line': '''ctags --fields=+lnz --sort=no --links=no ''' # noqa
                                    '''--output-format=json <filepath>'''
                },
            }
        }
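Note (illustration, not part of the patch): these subclasses only pin test
configuration; they are driven like any content indexer. A sketch of
indexing one content, mirroring content_add_mimetype in testcase.py below
and assuming the instance has been wired to in-memory storages the way
_init_indexers() does:

    from swh.model.hashutil import hash_to_bytes

    idx = _MimetypeIndexer()  # storages must be attached as in _init_indexers
    idx.run([hash_to_bytes('dc2830a9e72f23c1dfebef4413003221baa5fb62')],
            'update-dups')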
# Lightweight git repositories that will be loaded to generate
# input data for tests
_TEST_ORIGINS = [
    {
        'id': 1,
        'type': 'git',
        'url': 'https://github.com/wcoder/highlightjs-line-numbers.js',
        'archives': ['highlightjs-line-numbers.js.zip',
                     'highlightjs-line-numbers.js_visit2.zip']
    },
    {
        'id': 2,
        'type': 'git',
        'url': 'https://github.com/memononen/libtess2',
        'archives': ['libtess2.zip']
    },
    {
        'id': 3,
        'type': 'git',
        'url': 'repo_with_submodules',
        'archives': ['repo_with_submodules.tgz']
    }
]

_contents = {}


# Tests data initialization
def _init_tests_data():
    # Load git repositories from archives
    loader = GitLoaderFromArchive(config=_TEST_LOADER_CONFIG)

    # Get reference to the memory storage
    storage = loader.storage

    for origin in _TEST_ORIGINS:
        nb_visits = len(origin['archives'])
        for i, archive in enumerate(origin['archives']):
            origin_repo_archive = \
                os.path.join(os.path.dirname(__file__),
                             'resources/repos/%s' % archive)
            loader.load(origin['url'], origin_repo_archive, None)
            if nb_visits > 1 and i != nb_visits - 1:
                time.sleep(1)

    contents = set()
    directories = set()
    revisions = set()
    releases = set()
    snapshots = set()
    persons = set()

    content_path = {}

    # Get all objects loaded into the test archive
    for origin in _TEST_ORIGINS:
        snp = storage.snapshot_get_latest(origin['id'])
        snapshots.add(hash_to_hex(snp['id']))
        for branch_name, branch_data in snp['branches'].items():
            if branch_data['target_type'] == 'revision':
                revisions.add(branch_data['target'])
            elif branch_data['target_type'] == 'release':
                release = next(storage.release_get([branch_data['target']]))
                revisions.add(release['target'])
                releases.add(hash_to_hex(branch_data['target']))
                persons.add(release['author']['id'])

    for rev_log in storage.revision_shortlog(set(revisions)):
        rev_id = rev_log[0]
        revisions.add(rev_id)

    for rev in storage.revision_get(revisions):
        dir_id = rev['directory']
        persons.add(rev['author']['id'])
        persons.add(rev['committer']['id'])
        directories.add(hash_to_hex(dir_id))
        for entry in dir_iterator(storage, dir_id):
            content_path[entry['sha1']] = '/'.join(
                [hash_to_hex(dir_id), entry['path'].decode('utf-8')])
            if entry['type'] == 'file':
                contents.add(entry['sha1'])
            elif entry['type'] == 'dir':
                directories.add(hash_to_hex(entry['target']))

    # Get all checksums for each content
    contents_metadata = storage.content_get_metadata(contents)
    contents = []
    for content_metadata in contents_metadata:
        contents.append({
            algo: hash_to_hex(content_metadata[algo])
            for algo in DEFAULT_ALGORITHMS
        })
        path = content_path[content_metadata['sha1']]
        cnt = next(storage.content_get([content_metadata['sha1']]))
        mimetype, encoding = get_mimetype_and_encoding_for_content(
            cnt['data'])
        content_display_data = prepare_content_for_display(
            cnt['data'], mimetype, path)
        contents[-1]['path'] = path
        contents[-1]['mimetype'] = mimetype
        contents[-1]['encoding'] = encoding
        contents[-1]['hljs_language'] = content_display_data['language']
        contents[-1]['data'] = content_display_data['content_data']
        _contents[contents[-1]['sha1']] = contents[-1]

    # Create indexer storage instance that will be shared by indexers
    idx_storage = get_indexer_storage('memory', {})

    # Add the empty directory to the test archive
    empty_dir_id = directory_identifier({'entries': []})
    empty_dir_id_bin = hash_to_bytes(empty_dir_id)
    storage.directory_add([{'id': empty_dir_id_bin, 'entries': []}])

    # Return tests data
    return {
        'storage': storage,
        'idx_storage': idx_storage,
        'origins': _TEST_ORIGINS,
        'contents': contents,
        'directories': list(directories),
        'persons': list(persons),
        'releases': list(releases),
        'revisions': list(map(hash_to_hex, revisions)),
        'snapshots': list(snapshots),
        'generated_checksums': set(),
    }


def _init_indexers(tests_data):
    # Instantiate content indexers that will be used in tests
    # and force them to use the memory storages
    indexers = {}
    for idx_name, idx_class in (('mimetype_indexer', _MimetypeIndexer),
-                               ('language_indexer', _LanguageIndexer),
                                ('license_indexer', _FossologyLicenseIndexer),
                                ('ctags_indexer', _CtagsIndexer)):
        idx = idx_class()
        idx.storage = tests_data['storage']
        idx.objstorage = tests_data['storage'].objstorage
        idx.idx_storage = tests_data['idx_storage']
        idx.register_tools(idx.config['tools'])
        indexers[idx_name] = idx
    return indexers


def get_content(content_sha1):
    return _contents.get(content_sha1)


_tests_data = None
_current_tests_data = None
_indexer_loggers = {}
""" global _tests_data, _current_tests_data if _tests_data is None: _tests_data = _init_tests_data() indexers = _init_indexers(_tests_data) for (name, idx) in indexers.items(): # pytest makes the loggers use a temporary file; and deepcopy # requires serializability. So we remove them, and add them # back after the copy. _indexer_loggers[name] = idx.log del idx.log _tests_data.update(indexers) if reset or _current_tests_data is None: _current_tests_data = deepcopy(_tests_data) for (name, logger) in _indexer_loggers.items(): _current_tests_data[name].log = logger return _current_tests_data diff --git a/swh/web/tests/testcase.py b/swh/web/tests/testcase.py index d15bb62e..fc7c55dc 100644 --- a/swh/web/tests/testcase.py +++ b/swh/web/tests/testcase.py @@ -1,161 +1,161 @@ # Copyright (C) 2015-2018 The Software Heritage developers # See the AUTHORS file at the top-level directory of this distribution # License: GNU Affero General Public License version 3, or any later version # See top-level LICENSE file for more information import shutil from subprocess import run, PIPE from django.core.cache import cache from hypothesis.extra.django import TestCase from swh.model.hashutil import hash_to_bytes from swh.web import config from swh.web.common import converters, service from swh.web.tests.data import get_tests_data ctags_json_missing = \ shutil.which('ctags') is None or \ b'+json' not in run(['ctags', '--version'], stdout=PIPE).stdout fossology_missing = shutil.which('nomossa') is None class WebTestCase(TestCase): """Base TestCase class for swh-web. It is initialized with references to in-memory storages containing raw tests data. It also defines class methods to retrieve those tests data in a json serializable format in order to ease tests implementation. """ def _pre_setup(self): cache.clear() tests_data = get_tests_data(reset=True) self.storage = tests_data['storage'] self.idx_storage = tests_data['idx_storage'] self.mimetype_indexer = tests_data['mimetype_indexer'] - self.language_indexer = tests_data['language_indexer'] self.license_indexer = tests_data['license_indexer'] self.ctags_indexer = tests_data['ctags_indexer'] # Update swh-web configuration to use the in-memory storage # instantiated in the tests.data module swh_config = config.get_config() swh_config.update({'storage': self.storage}) service.storage = self.storage # Update swh-web configuration to use the in-memory indexer storage # instantiated in the tests.data modules swh_config.update({'indexer_storage': self.idx_storage}) service.idx_storage = self.idx_storage super()._pre_setup() def content_add_mimetype(self, cnt_id): self.mimetype_indexer.run([hash_to_bytes(cnt_id)], 'update-dups') def content_get_mimetype(self, cnt_id): mimetype = next(self.idx_storage.content_mimetype_get( [hash_to_bytes(cnt_id)])) return converters.from_filetype(mimetype) def content_add_language(self, cnt_id): + raise NotImplementedError('Language indexer is disabled.') self.language_indexer.run([hash_to_bytes(cnt_id)], 'update-dups') def content_get_language(self, cnt_id): lang = next(self.idx_storage.content_language_get( [hash_to_bytes(cnt_id)])) return converters.from_swh(lang, hashess={'id'}) def content_add_license(self, cnt_id): self.license_indexer.run([hash_to_bytes(cnt_id)], 'update-dups') def content_get_license(self, cnt_id): cnt_id_bytes = hash_to_bytes(cnt_id) lic = next(self.idx_storage.content_fossology_license_get( [cnt_id_bytes])) return converters.from_swh({'id': cnt_id_bytes, 'facts': lic[cnt_id_bytes]}, hashess={'id'}) def 
diff --git a/swh/web/tests/testcase.py b/swh/web/tests/testcase.py
index d15bb62e..fc7c55dc 100644
--- a/swh/web/tests/testcase.py
+++ b/swh/web/tests/testcase.py
@@ -1,161 +1,161 @@
# Copyright (C) 2015-2018 The Software Heritage developers
# See the AUTHORS file at the top-level directory of this distribution
# License: GNU Affero General Public License version 3, or any later version
# See top-level LICENSE file for more information

import shutil

from subprocess import run, PIPE

from django.core.cache import cache
from hypothesis.extra.django import TestCase

from swh.model.hashutil import hash_to_bytes
from swh.web import config
from swh.web.common import converters, service
from swh.web.tests.data import get_tests_data

ctags_json_missing = \
    shutil.which('ctags') is None or \
    b'+json' not in run(['ctags', '--version'], stdout=PIPE).stdout

fossology_missing = shutil.which('nomossa') is None


class WebTestCase(TestCase):
    """Base TestCase class for swh-web.

    It is initialized with references to in-memory storages containing
    raw tests data.

    It also defines helper methods to retrieve those tests data in a
    JSON-serializable format in order to ease tests implementation.
    """
    def _pre_setup(self):
        cache.clear()

        tests_data = get_tests_data(reset=True)
        self.storage = tests_data['storage']
        self.idx_storage = tests_data['idx_storage']
        self.mimetype_indexer = tests_data['mimetype_indexer']
-        self.language_indexer = tests_data['language_indexer']
        self.license_indexer = tests_data['license_indexer']
        self.ctags_indexer = tests_data['ctags_indexer']

        # Update swh-web configuration to use the in-memory storage
        # instantiated in the tests.data module
        swh_config = config.get_config()
        swh_config.update({'storage': self.storage})
        service.storage = self.storage

        # Update swh-web configuration to use the in-memory indexer storage
        # instantiated in the tests.data module
        swh_config.update({'indexer_storage': self.idx_storage})
        service.idx_storage = self.idx_storage

        super()._pre_setup()

    def content_add_mimetype(self, cnt_id):
        self.mimetype_indexer.run([hash_to_bytes(cnt_id)], 'update-dups')

    def content_get_mimetype(self, cnt_id):
        mimetype = next(self.idx_storage.content_mimetype_get(
                        [hash_to_bytes(cnt_id)]))
        return converters.from_filetype(mimetype)

    def content_add_language(self, cnt_id):
+        # The language indexer is no longer instantiated in the tests data.
+        raise NotImplementedError('Language indexer is disabled.')
-        self.language_indexer.run([hash_to_bytes(cnt_id)], 'update-dups')

    def content_get_language(self, cnt_id):
        lang = next(self.idx_storage.content_language_get(
                    [hash_to_bytes(cnt_id)]))
        return converters.from_swh(lang, hashess={'id'})

    def content_add_license(self, cnt_id):
        self.license_indexer.run([hash_to_bytes(cnt_id)], 'update-dups')

    def content_get_license(self, cnt_id):
        cnt_id_bytes = hash_to_bytes(cnt_id)
        lic = next(self.idx_storage.content_fossology_license_get(
                   [cnt_id_bytes]))
        return converters.from_swh({'id': cnt_id_bytes,
                                    'facts': lic[cnt_id_bytes]},
                                   hashess={'id'})

    def content_add_ctags(self, cnt_id):
        self.ctags_indexer.run([hash_to_bytes(cnt_id)], 'update-dups')

    def content_get_ctags(self, cnt_id):
        cnt_id_bytes = hash_to_bytes(cnt_id)
        ctags = self.idx_storage.content_ctags_get([cnt_id_bytes])
        for ctag in ctags:
            yield converters.from_swh(ctag, hashess={'id'})

    def content_get_metadata(self, cnt_id):
        cnt_id_bytes = hash_to_bytes(cnt_id)
        metadata = next(self.storage.content_get_metadata([cnt_id_bytes]))
        return converters.from_swh(metadata,
                                   hashess={'sha1', 'sha1_git', 'sha256',
                                            'blake2s256'})

    def content_get(self, cnt_id):
        cnt_id_bytes = hash_to_bytes(cnt_id)
        cnt = next(self.storage.content_get([cnt_id_bytes]))
        return converters.from_content(cnt)

    def directory_ls(self, dir_id):
        cnt_id_bytes = hash_to_bytes(dir_id)
        dir_content = map(converters.from_directory_entry,
                          self.storage.directory_ls(cnt_id_bytes))
        return list(dir_content)

    def release_get(self, rel_id):
        rel_id_bytes = hash_to_bytes(rel_id)
        rel_data = next(self.storage.release_get([rel_id_bytes]))
        return converters.from_release(rel_data)

    def revision_get(self, rev_id):
        rev_id_bytes = hash_to_bytes(rev_id)
        rev_data = next(self.storage.revision_get([rev_id_bytes]))
        return converters.from_revision(rev_data)

    def revision_log(self, rev_id, limit=None):
        rev_id_bytes = hash_to_bytes(rev_id)
        return list(map(converters.from_revision,
                        self.storage.revision_log([rev_id_bytes],
                                                  limit=limit)))

    def snapshot_get_latest(self, origin_id):
        snp = self.storage.snapshot_get_latest(origin_id)
        return converters.from_snapshot(snp)

    def origin_get(self, origin_info):
        origin = self.storage.origin_get(origin_info)
        return converters.from_origin(origin)

    def origin_visit_get(self, origin_id):
        visits = self.storage.origin_visit_get(origin_id)
        return list(map(converters.from_origin_visit, visits))

    def origin_visit_get_by(self, origin_id, visit_id):
        visit = self.storage.origin_visit_get_by(origin_id, visit_id)
        return converters.from_origin_visit(visit)

    def snapshot_get(self, snapshot_id):
        snp = self.storage.snapshot_get(hash_to_bytes(snapshot_id))
        return converters.from_snapshot(snp)

    def snapshot_get_branches(self, snapshot_id, branches_from='',
                              branches_count=1000, target_types=None):
        snp = self.storage.snapshot_get_branches(
            hash_to_bytes(snapshot_id), branches_from.encode(),
            branches_count, target_types)
        return converters.from_snapshot(snp)

    def person_get(self, person_id):
        person = next(self.storage.person_get([person_id]))
        return converters.from_person(person)
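For reference, a test built on this base class would exercise the helpers roughly as follows. This is a sketch only: the test class, method name, and sha1 value are hypothetical, while the helper methods are the ones defined above:

    class ContentHelpersTestCase(WebTestCase):
        def test_content_mimetype(self):
            # sha1 assumed to belong to the loaded tests data (hypothetical)
            sha1 = 'dc2830a9e72f23c1dfebef4413003221baa5fb62'
            self.content_add_mimetype(sha1)     # run the mimetype indexer
            mimetype_info = self.content_get_mimetype(sha1)
            self.assertIn('mimetype', mimetype_info)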