diff --git a/swh/search/cli.py b/swh/search/cli.py
index 26658ab..ae67b1c 100644
--- a/swh/search/cli.py
+++ b/swh/search/cli.py
@@ -1,127 +1,130 @@
 # Copyright (C) 2019-2020  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 # WARNING: do not import unnecessary things here to keep cli startup time under
 # control
 import click
 
 from swh.core.cli import CONTEXT_SETTINGS
 from swh.core.cli import swh as swh_cli_group
 
 
 @swh_cli_group.group(name="search", context_settings=CONTEXT_SETTINGS)
 @click.option(
     "--config-file",
     "-C",
     default=None,
     type=click.Path(exists=True, dir_okay=False,),
     help="Configuration file.",
 )
 @click.pass_context
 def search_cli_group(ctx, config_file):
     """Software Heritage Search tools."""
     from swh.core import config
 
     ctx.ensure_object(dict)
     conf = config.read(config_file)
     ctx.obj["config"] = conf
 
 
 @search_cli_group.command("initialize")
 @click.pass_context
 def initialize(ctx):
     """Creates Elasticsearch indices."""
     from . import get_search
 
     search = get_search(**ctx.obj["config"]["search"])
     search.initialize()
     print("Done.")
 
 
 @search_cli_group.group("journal-client")
 @click.pass_context
 def journal_client(ctx):
     """"""
     pass
 
 
 @journal_client.command("objects")
 @click.option(
     "--stop-after-objects",
     "-m",
     default=None,
     type=int,
     help="Maximum number of objects to replay. Default is to run forever.",
 )
 @click.option(
     "--object-type",
     "-o",
     multiple=True,
     help="Default list of object types to subscribe to",
 )
 @click.option(
     "--prefix", "-p", help="Topic prefix to use (e.g swh.journal.indexed)",
 )
 @click.pass_context
 def journal_client_objects(ctx, stop_after_objects, object_type, prefix):
     """Listens for new objects from the SWH Journal, and schedules tasks
     to run relevant indexers (currently, origin and origin_visit)
     on these new objects.
 
     """
     import functools
 
     from swh.journal.client import get_journal_client
 
     from . import get_search
     from .journal_client import process_journal_objects
 
     config = ctx.obj["config"]
     journal_cfg = config["journal"]
 
     journal_cfg["object_types"] = object_type or journal_cfg.get("object_types", [])
     journal_cfg["prefix"] = prefix or journal_cfg.get("prefix")
     journal_cfg["stop_after_objects"] = stop_after_objects or journal_cfg.get(
         "stop_after_objects"
     )
 
     if len(journal_cfg["object_types"]) == 0:
         raise ValueError("'object_types' must be specified by cli or configuration")
 
     if journal_cfg["prefix"] is None:
         raise ValueError("'prefix' must be specified by cli or configuration")
 
     client = get_journal_client(cls="kafka", **journal_cfg,)
     search = get_search(**config["search"])
 
     worker_fn = functools.partial(process_journal_objects, search=search,)
     nb_messages = 0
     try:
         nb_messages = client.process(worker_fn)
         print("Processed %d messages." % nb_messages)
     except KeyboardInterrupt:
         ctx.exit(0)
     else:
         print("Done.")
     finally:
         client.close()
 
 
 @search_cli_group.command("rpc-serve")
 @click.argument("config-path", required=True)
 @click.option("--host", default="0.0.0.0", help="Host to run the server")
 @click.option("--port", default=5010, type=click.INT, help="Binding port of the server")
+@click.option("--index-prefix", help="The prefix to add before the index names")
 @click.option(
     "--debug/--nodebug",
     default=True,
     help="Indicates if the server should run in debug mode",
 )
-def rpc_server(config_path, host, port, debug):
+def rpc_server(config_path, host, port, index_prefix, debug):
     """Starts a Software Heritage Indexer RPC HTTP server."""
     from .api.server import app, load_and_check_config
 
     api_cfg = load_and_check_config(config_path, type="any")
+    if index_prefix:  # CLI flag wins over the prefix set in the config file
+        api_cfg["search"].get("args", api_cfg["search"])["index_prefix"] = index_prefix
     app.config.update(api_cfg)
     app.run(host, port=int(port), debug=bool(debug))
diff --git a/swh/search/elasticsearch.py b/swh/search/elasticsearch.py
index d444bc8..fc0aa4b 100644
--- a/swh/search/elasticsearch.py
+++ b/swh/search/elasticsearch.py
@@ -1,232 +1,240 @@
 # Copyright (C) 2019-2020  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import base64
 from typing import Any, Dict, Iterable, Iterator, List, Optional
 
 from elasticsearch import Elasticsearch
 from elasticsearch.helpers import bulk, scan
 import msgpack
 
 from swh.indexer import codemeta
 from swh.model import model
 from swh.model.identifiers import origin_identifier
 from swh.search.interface import PagedResult
 
 
 def _sanitize_origin(origin):
     origin = origin.copy()
 
     # Whitelist fields to be saved in Elasticsearch
     res = {"url": origin.pop("url")}
     for field_name in ("intrinsic_metadata", "has_visits"):
         if field_name in origin:
             res[field_name] = origin.pop(field_name)
 
     # Run the JSON-LD expansion algorithm
     # <https://www.w3.org/TR/json-ld-api/#expansion>
     # to normalize the Codemeta metadata.
     # This is required as Elasticsearch will needs each field to have a consistent
     # type across documents to be searchable; and non-expanded JSON-LD documents
     # can have various types in the same field. For example, all these are
     # equivalent in JSON-LD:
     # * {"author": "Jane Doe"}
     # * {"author": ["Jane Doe"]}
     # * {"author": {"@value": "Jane Doe"}}
     # * {"author": [{"@value": "Jane Doe"}]}
     # and JSON-LD expansion will convert them all to the last one.
     if "intrinsic_metadata" in res:
         res["intrinsic_metadata"] = codemeta.expand(res["intrinsic_metadata"])
 
     return res
 
 
 def token_encode(index_to_tokenize: Dict[bytes, Any]) -> str:
     """Tokenize as string an index page result from a search
 
     """
     page_token = base64.b64encode(msgpack.dumps(index_to_tokenize))
     return page_token.decode()
 
 
 def token_decode(page_token: str) -> Dict[bytes, Any]:
     """Read the page_token
 
     """
     return msgpack.loads(base64.b64decode(page_token.encode()), raw=True)
 
 
 class ElasticSearch:
-    def __init__(self, hosts: List[str]):
+    def __init__(self, hosts: List[str], index_prefix: Optional[str] = None):
+        """Create the client for ``hosts``, optionally prefixing index names."""
         self._backend = Elasticsearch(hosts=hosts)
+        self.index_prefix = index_prefix
+
+        # Origin documents live in "origin", or in "<prefix>_origin" when a
+        # non-empty prefix is given (None and "" both mean "no prefix").
+        self.origin_index = f"{index_prefix}_origin" if index_prefix else "origin"
 
     def check(self):
         return self._backend.ping()
 
     def deinitialize(self) -> None:
         """Removes all indices from the Elasticsearch backend"""
         self._backend.indices.delete(index="*")
 
     def initialize(self) -> None:
         """Declare Elasticsearch indices and mappings"""
-        if not self._backend.indices.exists(index="origin"):
-            self._backend.indices.create(index="origin")
+        if not self._backend.indices.exists(index=self.origin_index):
+            self._backend.indices.create(index=self.origin_index)
         self._backend.indices.put_mapping(
-            index="origin",
+            index=self.origin_index,
             body={
                 "properties": {
                     # sha1 of the URL; used as the document id
                     "sha1": {"type": "keyword", "doc_values": True,},
                     # Used both to search URLs, and as the result to return
                     # as a response to queries
                     "url": {
                         "type": "text",
                         # To split URLs into token on any character
                         # that is not alphanumerical
                         "analyzer": "simple",
                         # 2-gram and partial-3-gram search (ie. with the end of the
                         # third word potentially missing)
                         "fields": {
                             "as_you_type": {
                                 "type": "search_as_you_type",
                                 "analyzer": "simple",
                             }
                         },
                     },
                     # used to filter out origins that were never visited
                     "has_visits": {"type": "boolean",},
                     "intrinsic_metadata": {
                         "type": "nested",
                         "properties": {
                             "@context": {
                                 # don't bother indexing tokens in these URIs, as the
                                 # are used as namespaces
                                 "type": "keyword",
                             }
                         },
                     },
                 }
             },
         )
 
     def flush(self) -> None:
-        self._backend.indices.refresh(index="_all")
+        self._backend.indices.refresh(index=self.origin_index)
 
     def origin_update(self, documents: Iterable[Dict]) -> None:
         documents = map(_sanitize_origin, documents)
         documents_with_sha1 = (
             (origin_identifier(document), document) for document in documents
         )
         actions = [
             {
                 "_op_type": "update",
                 "_id": sha1,
-                "_index": "origin",
+                "_index": self.origin_index,
                 "doc": {**document, "sha1": sha1,},
                 "doc_as_upsert": True,
             }
             for (sha1, document) in documents_with_sha1
         ]
-        bulk(self._backend, actions, index="origin")
+        bulk(self._backend, actions, index=self.origin_index)
 
     def origin_dump(self) -> Iterator[model.Origin]:
-        results = scan(self._backend, index="*")
+        results = scan(self._backend, index=self.origin_index)
         for hit in results:
-            yield self._backend.termvectors(index="origin", id=hit["_id"], fields=["*"])
+            yield self._backend.termvectors(
+                index=self.origin_index, id=hit["_id"], fields=["*"]
+            )
 
     def origin_search(
         self,
         *,
         url_pattern: Optional[str] = None,
         metadata_pattern: Optional[str] = None,
         with_visit: bool = False,
         page_token: Optional[str] = None,
         limit: int = 50,
     ) -> PagedResult[Dict[str, Any]]:
         query_clauses: List[Dict[str, Any]] = []
 
         if url_pattern:
             query_clauses.append(
                 {
                     "multi_match": {
                         "query": url_pattern,
                         "type": "bool_prefix",
                         "operator": "and",
                         "fields": [
                             "url.as_you_type",
                             "url.as_you_type._2gram",
                             "url.as_you_type._3gram",
                         ],
                     }
                 }
             )
 
         if metadata_pattern:
             query_clauses.append(
                 {
                     "nested": {
                         "path": "intrinsic_metadata",
                         "query": {
                             "multi_match": {
                                 "query": metadata_pattern,
                                 # Makes it so that the "foo bar" query returns
                                 # documents which contain "foo" in a field and "bar"
                                 # in a different field
                                 "type": "cross_fields",
                                 # All keywords must be found in a document for it to
                                 # be considered a match.
                                 # TODO: allow missing keywords?
                                 "operator": "and",
                                 # Searches on all fields of the intrinsic_metadata dict,
                                 # recursively.
                                 "fields": ["intrinsic_metadata.*"],
                             }
                         },
                     }
                 }
             )
 
         if not query_clauses:
             raise ValueError(
                 "At least one of url_pattern and metadata_pattern must be provided."
             )
 
         if with_visit:
             query_clauses.append({"term": {"has_visits": True,}})
 
         body = {
             "query": {"bool": {"must": query_clauses,}},
             "sort": [{"_score": "desc"}, {"sha1": "asc"},],
         }
         if page_token:
             # TODO: use ElasticSearch's scroll API?
             page_token_content = token_decode(page_token)
             body["search_after"] = [
                 page_token_content[b"score"],
                 page_token_content[b"sha1"].decode("ascii"),
             ]
 
-        res = self._backend.search(index="origin", body=body, size=limit)
+        res = self._backend.search(index=self.origin_index, body=body, size=limit)
 
         hits = res["hits"]["hits"]
 
         next_page_token: Optional[str] = None
 
         if len(hits) == limit:
             # There are more results after this page; return a pagination token
             # to get them in a future query
             last_hit = hits[-1]
             next_page_token_content = {
                 b"score": last_hit["_score"],
                 b"sha1": last_hit["_source"]["sha1"],
             }
             next_page_token = token_encode(next_page_token_content)
 
         assert len(hits) <= limit
 
         return PagedResult(
             results=[{"url": hit["_source"]["url"]} for hit in hits],
             next_page_token=next_page_token,
         )
diff --git a/swh/search/tests/conftest.py b/swh/search/tests/conftest.py
index b14e443..084c1b2 100644
--- a/swh/search/tests/conftest.py
+++ b/swh/search/tests/conftest.py
@@ -1,129 +1,131 @@
 # Copyright (C) 2019-2020  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import logging
 import socket
 import subprocess
 import time
 
 import elasticsearch
 import pytest
 
 from swh.search import get_search
 
 logger = logging.getLogger(__name__)
 
 
 def free_port():
     sock = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
     sock.bind(("127.0.0.1", 0))
     port = sock.getsockname()[1]
     sock.close()
     return port
 
 
 def wait_for_peer(addr, port):
     while True:
         try:
             sock = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
             sock.connect((addr, port))
         except ConnectionRefusedError:
             time.sleep(0.1)
         else:
             sock.close()
             break
 
 
 CONFIG_TEMPLATE = """
 node.name: node-1
 path.data: {data}
 path.logs: {logs}
 network.host: 127.0.0.1
 http.port: {http_port}
 transport.port: {transport_port}
 """
 
 
 def _run_elasticsearch(conf_dir, data_dir, logs_dir, http_port, transport_port):
     es_home = "/usr/share/elasticsearch"
 
     with open(conf_dir + "/elasticsearch.yml", "w") as fd:
         fd.write(
             CONFIG_TEMPLATE.format(
                 data=data_dir,
                 logs=logs_dir,
                 http_port=http_port,
                 transport_port=transport_port,
             )
         )
 
     with open(conf_dir + "/log4j2.properties", "w") as fd:
         pass
 
     cmd = [
         "/usr/share/elasticsearch/jdk/bin/java",
         "-Des.path.home={}".format(es_home),
         "-Des.path.conf={}".format(conf_dir),
         "-Des.bundled_jdk=true",
         "-Dlog4j2.disable.jmx=true",
         "-cp",
         "{}/lib/*".format(es_home),
         "org.elasticsearch.bootstrap.Elasticsearch",
     ]
 
     host = "127.0.0.1:{}".format(http_port)
 
     with open(logs_dir + "/output.txt", "w") as fd:
         p = subprocess.Popen(cmd)
 
     wait_for_peer("127.0.0.1", http_port)
 
     client = elasticsearch.Elasticsearch([host])
     assert client.ping()
 
     return p
 
 
 @pytest.fixture(scope="session")
 def elasticsearch_session(tmpdir_factory):
     tmpdir = tmpdir_factory.mktemp("elasticsearch")
     es_conf = tmpdir.mkdir("conf")
 
     http_port = free_port()
     transport_port = free_port()
 
     p = _run_elasticsearch(
         conf_dir=str(es_conf),
         data_dir=str(tmpdir.mkdir("data")),
         logs_dir=str(tmpdir.mkdir("logs")),
         http_port=http_port,
         transport_port=transport_port,
     )
 
     yield "127.0.0.1:{}".format(http_port)
 
     # Check ES didn't stop
     assert p.returncode is None, p.returncode
 
     p.kill()
     p.wait()
 
 
 @pytest.fixture(scope="class")
 def elasticsearch_host(elasticsearch_session):
     yield elasticsearch_session
 
 
 @pytest.fixture
 def swh_search(elasticsearch_host):
     """Instantiate a search client, initialize the elasticsearch instance,
     and returns it
 
     """
     logger.debug("swh_search: elasticsearch_host: %s", elasticsearch_host)
-    search = get_search("elasticsearch", hosts=[elasticsearch_host],)
+    search = get_search(
+        "elasticsearch", hosts=[elasticsearch_host], index_prefix="test"
+    )
     search.deinitialize()  # To reset internal state from previous runs
     search.initialize()  # install required index
     yield search
diff --git a/swh/search/tests/test_api_client.py b/swh/search/tests/test_api_client.py
index a173ebe..25a8b90 100644
--- a/swh/search/tests/test_api_client.py
+++ b/swh/search/tests/test_api_client.py
@@ -1,43 +1,45 @@
 # Copyright (C) 2019-2020  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import unittest
 
 import pytest
 
 from swh.core.api.tests.server_testing import ServerTestFixture
 from swh.search import get_search
 from swh.search.api.server import app
 
 from .test_search import CommonSearchTest
 
 
 class TestRemoteSearch(CommonSearchTest, ServerTestFixture, unittest.TestCase):
     @pytest.fixture(autouse=True)
     def _instantiate_search(self, elasticsearch_host):
         self._elasticsearch_host = elasticsearch_host
 
     def setUp(self):
         self.config = {
             "search": {
                 "cls": "elasticsearch",
-                "args": {"hosts": [self._elasticsearch_host],},
+                "args": {"hosts": [self._elasticsearch_host], "index_prefix": "test"},
             }
         }
         self.app = app
         super().setUp()
         self.reset()
         self.search = get_search("remote", url=self.url(),)
 
     def reset(self):
-        search = get_search("elasticsearch", hosts=[self._elasticsearch_host],)
+        search = get_search(
+            "elasticsearch", hosts=[self._elasticsearch_host], index_prefix="test"
+        )
         search.deinitialize()
         search.initialize()
 
     @pytest.mark.skip(
         "Elasticsearch also returns close matches, so this test would fail"
     )
     def test_origin_url_paging(self, count):
         pass
diff --git a/swh/search/tests/test_cli.py b/swh/search/tests/test_cli.py
index 297b444..d5ed883 100644
--- a/swh/search/tests/test_cli.py
+++ b/swh/search/tests/test_cli.py
@@ -1,391 +1,411 @@
 # Copyright (C) 2019-2020  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import copy
 import tempfile
 
 from click.testing import CliRunner
 from confluent_kafka import Producer
 import pytest
 import yaml
 
 from swh.journal.serializers import value_to_kafka
 from swh.model.hashutil import hash_to_bytes
+from swh.search import get_search
 from swh.search.cli import search_cli_group
 
 CLI_CONFIG = """
 search:
     cls: elasticsearch
     args:
         hosts:
         - '%(elasticsearch_host)s'
+        index_prefix: test
 """
 
 JOURNAL_OBJECTS_CONFIG_TEMPLATE = """
 journal:
     brokers:
         - {broker}
     prefix: {prefix}
     group_id: {group_id}
 """
 
 
 def invoke(catch_exceptions, args, config="", *, elasticsearch_host):
     runner = CliRunner()
     with tempfile.NamedTemporaryFile("a", suffix=".yml") as config_fd:
         config_fd.write(
             (CLI_CONFIG + config) % {"elasticsearch_host": elasticsearch_host}
         )
         config_fd.seek(0)
         result = runner.invoke(search_cli_group, ["-C" + config_fd.name] + args)
     if not catch_exceptions and result.exception:
         print(result.output)
         raise result.exception
     return result
 
 
 def test__journal_client__origin(
     swh_search, elasticsearch_host: str, kafka_prefix: str, kafka_server
 ):
     """Tests the re-indexing when origin_batch_size*task_batch_size is a
     divisor of nb_origins."""
     producer = Producer(
         {
             "bootstrap.servers": kafka_server,
             "client.id": "test search origin producer",
             "acks": "all",
         }
     )
     origin_foobar_baz = {
         "url": "http://foobar.baz",
     }
     value = value_to_kafka(origin_foobar_baz)
     topic = f"{kafka_prefix}.origin"
     producer.produce(topic=topic, key=b"bogus-origin", value=value)
 
     journal_objects_config = JOURNAL_OBJECTS_CONFIG_TEMPLATE.format(
         broker=kafka_server, prefix=kafka_prefix, group_id="test-consumer"
     )
     result = invoke(
         False,
         [
             "journal-client",
             "objects",
             "--stop-after-objects",
             "1",
             "--object-type",
             "origin",
             "--prefix",
             kafka_prefix,
         ],
         journal_objects_config,
         elasticsearch_host=elasticsearch_host,
     )
 
     # Check the output
     expected_output = "Processed 1 messages.\nDone.\n"
     assert result.exit_code == 0, result.output
     assert result.output == expected_output
 
     swh_search.flush()
 
     # searching origin without visit as requirement
     actual_page = swh_search.origin_search(url_pattern="foobar")
     # We find it
     assert actual_page.next_page_token is None
     assert actual_page.results == [origin_foobar_baz]
 
     # It's an origin with no visit, searching for it with visit
     actual_page = swh_search.origin_search(url_pattern="foobar", with_visit=True)
     # returns nothing
     assert actual_page.next_page_token is None
     assert actual_page.results == []
 
 
 def test__journal_client__origin_visit(
     swh_search, elasticsearch_host, kafka_prefix: str, kafka_server
 ):
     """Tests the re-indexing when origin_batch_size*task_batch_size is a
     divisor of nb_origins."""
     origin_foobar = {"url": "http://baz.foobar"}
     producer = Producer(
         {
             "bootstrap.servers": kafka_server,
             "client.id": "test search origin visit producer",
             "acks": "all",
         }
     )
     topic = f"{kafka_prefix}.origin_visit"
     value = value_to_kafka({"origin": origin_foobar["url"]})
     producer.produce(topic=topic, key=b"bogus-origin-visit", value=value)
 
     journal_objects_config = JOURNAL_OBJECTS_CONFIG_TEMPLATE.format(
         broker=kafka_server, prefix=kafka_prefix, group_id="test-consumer"
     )
     result = invoke(
         False,
         [
             "journal-client",
             "objects",
             "--stop-after-objects",
             "1",
             "--object-type",
             "origin_visit",
         ],
         journal_objects_config,
         elasticsearch_host=elasticsearch_host,
     )
 
     # Check the output
     expected_output = "Processed 1 messages.\nDone.\n"
     assert result.exit_code == 0, result.output
     assert result.output == expected_output
 
     swh_search.flush()
 
     # Both search returns the visit
     actual_page = swh_search.origin_search(url_pattern="foobar", with_visit=False)
     assert actual_page.next_page_token is None
     assert actual_page.results == [origin_foobar]
 
     actual_page = swh_search.origin_search(url_pattern="foobar", with_visit=True)
     assert actual_page.next_page_token is None
     assert actual_page.results == [origin_foobar]
 
 
 def test__journal_client__origin_visit_status(
     swh_search, elasticsearch_host, kafka_prefix: str, kafka_server
 ):
     """Subscribing to origin-visit-status should result in swh-search indexation
 
     """
     origin_foobar = {"url": "http://baz.foobar"}
     producer = Producer(
         {
             "bootstrap.servers": kafka_server,
             "client.id": "test search origin visit status producer",
             "acks": "all",
         }
     )
     topic = f"{kafka_prefix}.origin_visit_status"
     value = value_to_kafka(
         {
             "origin": origin_foobar["url"],
             "visit": 1,
             "snapshot": None,
             "status": "full",
         }
     )
     producer.produce(topic=topic, key=b"bogus-origin-visit-status", value=value)
 
     journal_objects_config = JOURNAL_OBJECTS_CONFIG_TEMPLATE.format(
         broker=kafka_server, prefix=kafka_prefix, group_id="test-consumer"
     )
     result = invoke(
         False,
         [
             "journal-client",
             "objects",
             "--stop-after-objects",
             "1",
             "--prefix",
             kafka_prefix,
             "--object-type",
             "origin_visit_status",
         ],
         journal_objects_config,
         elasticsearch_host=elasticsearch_host,
     )
 
     # Check the output
     expected_output = "Processed 1 messages.\nDone.\n"
     assert result.exit_code == 0, result.output
     assert result.output == expected_output
 
     swh_search.flush()
 
     # Both search returns the visit
     actual_page = swh_search.origin_search(url_pattern="foobar", with_visit=False)
     assert actual_page.next_page_token is None
     assert actual_page.results == [origin_foobar]
 
     actual_page = swh_search.origin_search(url_pattern="foobar", with_visit=True)
     assert actual_page.next_page_token is None
     assert actual_page.results == [origin_foobar]
 
 
 def test__journal_client__origin_intrinsic_metadata(
     swh_search, elasticsearch_host, kafka_prefix: str, kafka_server
 ):
     """Subscribing to origin-intrinsic-metadata should result in swh-search indexation
 
     """
     origin_foobar = {"url": "https://github.com/clojure/clojure"}
 
     origin_intrinsic_metadata = {
         "id": origin_foobar["url"],
         "metadata": {
             "name": "clojure",
             "type": "SoftwareSourceCode",
             "license": "http://opensource.org/licenses/eclipse-1.0.php",
             "version": "1.10.2-master-SNAPSHOT",
             "@context": "https://doi.org/10.5063/schema/codemeta-2.0",
             "identifier": "org.clojure",
             "description": "Clojure core environment and runtime library.",
             "codeRepository": "https://repo.maven.apache.org/maven2/org/clojure/clojure",  # noqa
         },
         "indexer_configuration_id": 1,
         "from_revision": hash_to_bytes("f47c139e20970ee0852166f48ee2a4626632b86e"),
         "mappings": ["maven"],
     }
 
     producer = Producer(
         {
             "bootstrap.servers": kafka_server,
             "client.id": "test search origin intrinsic metadata producer",
             "acks": "all",
         }
     )
     topic = f"{kafka_prefix}.origin_intrinsic_metadata"
     value = value_to_kafka(origin_intrinsic_metadata)
     producer.produce(topic=topic, key=b"bogus-origin-intrinsic-metadata", value=value)
 
     journal_objects_config = JOURNAL_OBJECTS_CONFIG_TEMPLATE.format(
         broker=kafka_server, prefix=kafka_prefix, group_id="test-consumer"
     )
     result = invoke(
         False,
         [
             "journal-client",
             "objects",
             "--stop-after-objects",
             "1",
             "--object-type",
             "origin_intrinsic_metadata",
         ],
         journal_objects_config,
         elasticsearch_host=elasticsearch_host,
     )
 
     # Check the output
     expected_output = "Processed 1 messages.\nDone.\n"
     assert result.exit_code == 0, result.output
     assert result.output == expected_output
 
     swh_search.flush()
 
     # search without visit returns the metadata
     actual_page = swh_search.origin_search(url_pattern="clojure", with_visit=False)
     assert actual_page.next_page_token is None
     assert actual_page.results == [origin_foobar]
 
     # no visit associated so it does not return anything
     actual_page = swh_search.origin_search(url_pattern="clojure", with_visit=True)
     assert actual_page.next_page_token is None
     assert actual_page.results == []
 
 
 def test__journal_client__missing_main_journal_config_key(elasticsearch_host):
     """Missing configuration on journal should raise"""
     with pytest.raises(KeyError, match="journal"):
         invoke(
             catch_exceptions=False,
             args=["journal-client", "objects", "--stop-after-objects", "1",],
             config="",  # missing config will make it raise
             elasticsearch_host=elasticsearch_host,
         )
 
 
 def test__journal_client__missing_journal_config_keys(elasticsearch_host):
     """Missing configuration on mandatory journal keys should raise"""
     kafka_prefix = "swh.journal.objects"
     journal_objects_config = JOURNAL_OBJECTS_CONFIG_TEMPLATE.format(
         broker="192.0.2.1", prefix=kafka_prefix, group_id="test-consumer"
     )
     journal_config = yaml.safe_load(journal_objects_config)
 
     for key in journal_config["journal"].keys():
         if key == "prefix":  # optional
             continue
         cfg = copy.deepcopy(journal_config)
         del cfg["journal"][key]  # make config incomplete
         yaml_cfg = yaml.dump(cfg)
 
         with pytest.raises(TypeError, match=f"{key}"):
             invoke(
                 catch_exceptions=False,
                 args=[
                     "journal-client",
                     "objects",
                     "--stop-after-objects",
                     "1",
                     "--prefix",
                     kafka_prefix,
                     "--object-type",
                     "origin_visit_status",
                 ],
                 config=yaml_cfg,  # incomplete config will make the cli raise
                 elasticsearch_host=elasticsearch_host,
             )
 
 
 def test__journal_client__missing_prefix_config_key(
     swh_search, elasticsearch_host, kafka_server
 ):
     """Missing configuration on mandatory prefix key should raise"""
 
     journal_cfg_template = """
 journal:
     brokers:
         - {broker}
     group_id: {group_id}
     """
 
     journal_cfg = journal_cfg_template.format(
         broker=kafka_server, group_id="test-consumer"
     )
 
     with pytest.raises(ValueError, match="prefix"):
         invoke(
             False,
             # Missing --prefix (and no config key) will make the cli raise
             [
                 "journal-client",
                 "objects",
                 "--stop-after-objects",
                 "1",
                 "--object-type",
                 "origin_visit_status",
             ],
             journal_cfg,
             elasticsearch_host=elasticsearch_host,
         )
 
 
 def test__journal_client__missing_object_types_config_key(
     swh_search, elasticsearch_host, kafka_server
 ):
     """Missing configuration on mandatory object-types key should raise"""
 
     journal_cfg_template = """
 journal:
     brokers:
         - {broker}
     prefix: swh.journal.objects
     group_id: {group_id}
     """
 
     journal_cfg = journal_cfg_template.format(
         broker=kafka_server, group_id="test-consumer"
     )
 
     with pytest.raises(ValueError, match="object_types"):
         invoke(
             False,
             # Missing --object-types (and no config key) will make the cli raise
             ["journal-client", "objects", "--stop-after-objects", "1"],
             journal_cfg,
             elasticsearch_host=elasticsearch_host,
         )
+
+
+def test__initialize__with_prefix(elasticsearch_host):
+    """With index_prefix="test", the backend's origin index is named test_origin"""
+
+    search = get_search(
+        "elasticsearch", hosts=[elasticsearch_host], index_prefix="test"
+    )
+
+    assert search.origin_index == "test_origin"
+
+
+def test__initialize__without_prefix(elasticsearch_host):
+    """Without index_prefix, the backend's origin index is named origin"""
+
+    search = get_search("elasticsearch", hosts=[elasticsearch_host])
+
+    assert search.origin_index == "origin"
diff --git a/swh/search/tests/test_init.py b/swh/search/tests/test_init.py
index 8008a48..153309c 100644
--- a/swh/search/tests/test_init.py
+++ b/swh/search/tests/test_init.py
@@ -1,84 +1,84 @@
 # Copyright (C) 2020 The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import inspect
 
 import pytest
 
 from swh.search import get_search
 from swh.search.api.client import RemoteSearch
 from swh.search.elasticsearch import ElasticSearch
 from swh.search.in_memory import InMemorySearch
 from swh.search.interface import SearchInterface
 
-SEARCH_IMPLEMENTATIONS_KWARGS = [
+SEARCH_IMPLEMENTATIONS_KWARGS = [  # (class_, expected_class, kwargs) per backend
     ("remote", RemoteSearch, {"url": "localhost"}),
-    ("elasticsearch", ElasticSearch, {"hosts": ["localhost"]}),
+    ("elasticsearch", ElasticSearch, {"hosts": ["localhost"], "index_prefix": "test"}),
 ]
 
-SEARCH_IMPLEMENTATIONS = SEARCH_IMPLEMENTATIONS_KWARGS + [
+SEARCH_IMPLEMENTATIONS = SEARCH_IMPLEMENTATIONS_KWARGS + [  # plus kwargs-less backends
     ("memory", InMemorySearch, None),
 ]
 
 
 def test_get_search_failure():
-    with pytest.raises(ValueError, match="Unknown search class"):
+    with pytest.raises(ValueError, match="Unknown search class"):  # no such backend
         get_search("unknown-search")
 
 
 @pytest.mark.parametrize("class_,expected_class,kwargs", SEARCH_IMPLEMENTATIONS)
 def test_get_search(mocker, class_, expected_class, kwargs):
+    """get_search(class_) should build an instance of expected_class."""
+    # Swap the Elasticsearch client class for a mock.
     mocker.patch("swh.search.elasticsearch.Elasticsearch")
-    if kwargs:
-        concrete_search = get_search(class_, **kwargs)
-    else:
-        concrete_search = get_search(class_)
-    assert isinstance(concrete_search, expected_class)
+    # A falsy kwargs (None) means get_search is called with the name only.
+    backend = get_search(class_, **(kwargs or {}))
+    assert isinstance(backend, expected_class)
 
 
 @pytest.mark.parametrize("class_,expected_class,kwargs", SEARCH_IMPLEMENTATIONS_KWARGS)
 def test_get_search_deprecation_warning(mocker, class_, expected_class, kwargs):
     with pytest.warns(DeprecationWarning):
-        concrete_search = get_search(class_, args=kwargs)
+        concrete_search = get_search(class_, args=kwargs)  # deprecated `args=` form
     assert isinstance(concrete_search, expected_class)
 
 
 @pytest.mark.parametrize("class_,expected_class,kwargs", SEARCH_IMPLEMENTATIONS)
 def test_types(mocker, class_, expected_class, kwargs):
     """Checks all methods of SearchInterface are implemented by this
     backend, and that they have the same signature.
 
     """
     mocker.patch("swh.search.elasticsearch.Elasticsearch")
-    if kwargs:
-        concrete_search = get_search(class_, **kwargs)
-    else:
-        concrete_search = get_search(class_)
+    concrete_search = get_search(class_, **(kwargs or {}))
 
     # Create an instance of the protocol (which cannot be instantiated
     # directly, so this creates a subclass, then instantiates it)
     interface = type("_", (SearchInterface,), {})()
 
+    # Accumulated over the whole loop so that every missing endpoint is reported
+    missing_methods = []
+
     for meth_name in dir(interface):
         if meth_name.startswith("_"):
             continue
         interface_meth = getattr(interface, meth_name)
 
-        missing_methods = []
-
         try:
             concrete_meth = getattr(concrete_search, meth_name)
         except AttributeError:
             if not getattr(interface_meth, "deprecated_endpoint", False):
                 # The backend is missing a (non-deprecated) endpoint
                 missing_methods.append(meth_name)
-                continue
+            # No concrete method to compare signatures with: go to the next one
+            continue
 
         expected_signature = inspect.signature(interface_meth)
         actual_signature = inspect.signature(concrete_meth)
 
         assert expected_signature == actual_signature, meth_name
 
-        assert missing_methods == []
+    # Checked once, after every interface method has been inspected
+    assert missing_methods == []