diff --git a/swh/storage/pytest_plugin.py b/swh/storage/pytest_plugin.py
index a4640a8c..877d5c87 100644
--- a/swh/storage/pytest_plugin.py
+++ b/swh/storage/pytest_plugin.py
@@ -1,211 +1,252 @@
 # Copyright (C) 2019-2020  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import glob
 from os import path, environ
-from typing import Dict, Union
+from typing import Dict, Iterable, Union
 
 import pytest
 
 import swh.storage
 
 from pytest_postgresql import factories
 from pytest_postgresql.janitor import DatabaseJanitor, psycopg2, Version
 
 from swh.core.utils import numfile_sortkey as sortkey
+from swh.model.model import (
+    BaseModel,
+    Content,
+    Directory,
+    Origin,
+    Person,
+    Release,
+    Revision,
+    SkippedContent,
+    Snapshot,
+)
 from swh.storage import get_storage
 from swh.storage.tests.storage_data import data
 
 SQL_DIR = path.join(path.dirname(swh.storage.__file__), "sql")
 
 environ["LC_ALL"] = "C.UTF-8"
 
 DUMP_FILES = path.join(SQL_DIR, "*.sql")
 
 
 @pytest.fixture
 def swh_storage_backend_config(postgresql_proc, swh_storage_postgresql):
     """Basic pg storage configuration with no journal collaborator
     (to avoid pulling optional dependency on clients of this fixture)
 
     """
     yield {
         "cls": "local",
         "db": "postgresql://{user}@{host}:{port}/{dbname}".format(
             host=postgresql_proc.host,
             port=postgresql_proc.port,
             user="postgres",
             dbname="tests",
         ),
         "objstorage": {"cls": "memory", "args": {}},
     }
 
 
 @pytest.fixture
 def swh_storage(swh_storage_backend_config):
     return get_storage(cls="validate", storage=swh_storage_backend_config)
 
 
 # the postgres_fact factory fixture below is mostly a copy of the code
 # from pytest-postgresql. We need a custom version here to be able to
 # specify our version of the DBJanitor we use.
 def postgresql_fact(process_fixture_name, db_name=None, dump_files=DUMP_FILES):
     @pytest.fixture
     def postgresql_factory(request):
         """
         Fixture factory for PostgreSQL.
 
         :param FixtureRequest request: fixture request object
         :rtype: psycopg2.connection
         :returns: postgresql client
         """
         config = factories.get_config(request)
         if not psycopg2:
             raise ImportError("No module named psycopg2. Please install it.")
         proc_fixture = request.getfixturevalue(process_fixture_name)
 
         # _, config = try_import('psycopg2', request)
         pg_host = proc_fixture.host
         pg_port = proc_fixture.port
         pg_user = proc_fixture.user
         pg_options = proc_fixture.options
         pg_db = db_name or config["dbname"]
         with SwhDatabaseJanitor(
             pg_user,
             pg_host,
             pg_port,
             pg_db,
             proc_fixture.version,
             dump_files=dump_files,
         ):
             connection = psycopg2.connect(
                 dbname=pg_db,
                 user=pg_user,
                 host=pg_host,
                 port=pg_port,
                 options=pg_options,
             )
             yield connection
             connection.close()
 
     return postgresql_factory
 
 
 swh_storage_postgresql = postgresql_fact("postgresql_proc")
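
A minimal usage sketch for the factory above (a hypothetical test, not part of
this diff; the fixture yields a plain psycopg2 connection to the
pre-initialized database, so standard cursor usage applies):

    def test_schema_is_loaded(swh_storage_postgresql):
        # The custom janitor below loads the *.sql dump files once,
        # so the schema tables should already exist here.
        with swh_storage_postgresql.cursor() as cur:
            cur.execute(
                "SELECT table_name FROM information_schema.tables "
                "WHERE table_schema = 'public'"
            )
            assert cur.fetchall()
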
 
 
 # This version of the DatabaseJanitor implements a different setup/teardown
 # behavior than the stock one: instead of dropping, creating and initializing
 # the database for each test, it creates and initializes the db only once,
 # then truncates the tables. This is needed to keep test performance
 # acceptable.
 class SwhDatabaseJanitor(DatabaseJanitor):
     def __init__(
         self,
         user: str,
         host: str,
         port: str,
         db_name: str,
         version: Union[str, float, Version],
         dump_files: str = DUMP_FILES,
     ) -> None:
         super().__init__(user, host, port, db_name, version)
         self.dump_files = sorted(glob.glob(dump_files), key=sortkey)
 
     def db_setup(self):
         with psycopg2.connect(
             dbname=self.db_name,
             user=self.user,
             host=self.host,
             port=self.port,
         ) as cnx:
             with cnx.cursor() as cur:
                 for fname in self.dump_files:
                     with open(fname) as fobj:
                         sql = fobj.read().replace("concurrently", "").strip()
                         if sql:
                             cur.execute(sql)
             cnx.commit()
 
     def db_reset(self):
         with psycopg2.connect(
             dbname=self.db_name,
             user=self.user,
             host=self.host,
             port=self.port,
         ) as cnx:
             with cnx.cursor() as cur:
                 cur.execute(
                     "SELECT table_name FROM information_schema.tables "
                     "WHERE table_schema = %s",
                     ("public",),
                 )
                 tables = set(table for (table,) in cur.fetchall())
                 for table in tables:
                     cur.execute("truncate table %s cascade" % table)
 
                 cur.execute(
                     "SELECT sequence_name FROM information_schema.sequences "
                     "WHERE sequence_schema = %s",
                     ("public",),
                 )
                 seqs = set(seq for (seq,) in cur.fetchall())
                 for seq in seqs:
                     cur.execute("ALTER SEQUENCE %s RESTART;" % seq)
             cnx.commit()
 
     def init(self):
         with self.cursor() as cur:
             cur.execute(
                 "SELECT COUNT(1) FROM pg_database WHERE datname=%s;",
                 (self.db_name,),
             )
             db_exists = cur.fetchone()[0] == 1
             if db_exists:
                 cur.execute(
                     "UPDATE pg_database SET datallowconn=true "
                     "WHERE datname = %s;",
                     (self.db_name,),
                 )
 
         if db_exists:
             self.db_reset()
         else:
             with self.cursor() as cur:
                 cur.execute('CREATE DATABASE "{}";'.format(self.db_name))
             self.db_setup()
 
     def drop(self):
         pid_column = "pid"
         with self.cursor() as cur:
             cur.execute(
                 "UPDATE pg_database SET datallowconn=false "
                 "WHERE datname = %s;",
                 (self.db_name,),
             )
             cur.execute(
                 "SELECT pg_terminate_backend(pg_stat_activity.{})"
                 "FROM pg_stat_activity "
                 "WHERE pg_stat_activity.datname = %s;".format(pid_column),
                 (self.db_name,),
             )
 
 
 @pytest.fixture
 def sample_data() -> Dict:
     """Pre-defined sample storage object data to manipulate
 
     Returns:
         Dict of data (keys: content, directory, revision, release, person, origin)
 
     """
     return {
         "content": [data.cont, data.cont2],
         "content_metadata": [data.cont3],
         "skipped_content": [data.skipped_cont, data.skipped_cont2],
         "person": [data.person],
         "directory": [data.dir2, data.dir],
         "revision": [data.revision, data.revision2, data.revision3],
         "release": [data.release, data.release2, data.release3],
         "snapshot": [data.snapshot],
         "origin": [data.origin, data.origin2],
         "fetcher": [data.metadata_fetcher],
         "authority": [data.metadata_authority],
         "origin_metadata": [data.origin_metadata, data.origin_metadata2],
     }
+
+
+# FIXME: Add the metadata keys when we can (right now, we cannot as the data model
+# changed but not the endpoints yet)
+OBJECT_FACTORY = {
+    "content": Content.from_dict,
+    "content_metadata": Content.from_dict,
+    "skipped_content": SkippedContent.from_dict,
+    "person": Person.from_dict,
+    "directory": Directory.from_dict,
+    "revision": Revision.from_dict,
+    "release": Release.from_dict,
+    "snapshot": Snapshot.from_dict,
+    "origin": Origin.from_dict,
+}
+
+
+@pytest.fixture
+def sample_data_model(sample_data) -> Dict[str, Iterable[BaseModel]]:
+    """Pre-defined sample storage model objects to manipulate
+
+    Returns:
+        Dict of data (keys: content, directory, revision, release, person, origin, ...)
+        whose values are lists of model objects of the corresponding type
+
+    """
+    return {
+        object_type: [convert_fn(obj) for obj in sample_data[object_type]]
+        for object_type, convert_fn in OBJECT_FACTORY.items()
+    }
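
A consumption sketch for the new fixture (a hypothetical test, not part of
this diff; it assumes the storage endpoints still take dicts at this stage, as
the FIXME above notes, so the model objects are converted back with
to_dict(), the inverse of from_dict()):

    def test_content_add_from_model(swh_storage, sample_data_model):
        contents = sample_data_model["content"]
        # Round-trip through dicts until the endpoints accept model objects
        swh_storage.content_add([c.to_dict() for c in contents])
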
diff --git a/swh/storage/tests/conftest.py b/swh/storage/tests/conftest.py
index 634afa4b..13615c2a 100644
--- a/swh/storage/tests/conftest.py
+++ b/swh/storage/tests/conftest.py
@@ -1,82 +1,59 @@
 # Copyright (C) 2019-2020  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import pytest
 
 import multiprocessing.util
 
 from hypothesis import settings
 
 try:
     import pytest_cov.embed
 except ImportError:
     pytest_cov = None
 
 from swh.model.tests.generate_testdata import gen_contents, gen_origins
-from swh.model.model import (
-    Content,
-    Directory,
-    Origin,
-    OriginVisit,
-    Release,
-    Revision,
-    SkippedContent,
-    Snapshot,
-)
-
-
-OBJECT_FACTORY = {
-    "content": Content.from_dict,
-    "directory": Directory.from_dict,
-    "origin": Origin.from_dict,
-    "origin_visit": OriginVisit.from_dict,
-    "release": Release.from_dict,
-    "revision": Revision.from_dict,
-    "skipped_content": SkippedContent.from_dict,
-    "snapshot": Snapshot.from_dict,
-}
-
 
 # define tests profile. Full documentation is at:
 # https://hypothesis.readthedocs.io/en/latest/settings.html#settings-profiles
 settings.register_profile("fast", max_examples=5, deadline=5000)
 settings.register_profile("slow", max_examples=20, deadline=5000)
 
 if pytest_cov is not None:
     # pytest_cov + multiprocessing can cause a segmentation fault when starting
     # the child process; so we're removing pytest-coverage's hook that runs
     # when a child process starts.
     # This means code run in child processes won't be counted in the coverage
     # report, but this is not an issue because the only code that runs only in
     # child processes is the RPC server.
     for (key, value) in multiprocessing.util._afterfork_registry.items():
         if value is pytest_cov.embed.multiprocessing_start:
             del multiprocessing.util._afterfork_registry[key]
             break
     else:
         assert False, "missing pytest_cov.embed.multiprocessing_start?"
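
Note that registering a profile does not activate it; a sketch of explicit
activation (an assumption about local usage, not something this diff adds):

    from hypothesis import settings

    # Select the "fast" profile registered above, e.g. for local development
    settings.load_profile("fast")
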
 
 
 @pytest.fixture
 def swh_contents(swh_storage):
     contents = gen_contents(n=20)
     swh_storage.content_add([c for c in contents if c["status"] != "absent"])
     swh_storage.skipped_content_add([c for c in contents if c["status"] == "absent"])
     return contents
 
 
 @pytest.fixture
 def swh_origins(swh_storage):
     origins = gen_origins(n=100)
     swh_storage.origin_add(origins)
     return origins
 
 
 @pytest.fixture
 def swh_storage_backend_config(swh_storage_backend_config):
     """storage should test with its journal writer collaborator on
 
     """
     yield {**swh_storage_backend_config, "journal_writer": {"cls": "memory",}}
diff --git a/swh/storage/tests/test_pytest_plugin.py b/swh/storage/tests/test_pytest_plugin.py
new file mode 100644
index 00000000..e0384847
--- /dev/null
+++ b/swh/storage/tests/test_pytest_plugin.py
@@ -0,0 +1,60 @@
+# Copyright (C) 2020  The Software Heritage developers
+# See the AUTHORS file at the top-level directory of this distribution
+# License: GNU General Public License version 3, or any later version
+# See top-level LICENSE file for more information
+
+
+from swh.storage.pytest_plugin import OBJECT_FACTORY
+
+
+from swh.model.model import BaseModel
+
+
+def test_sample_data(sample_data, sample_data_model):
+    assert set(sample_data.keys()) == set(
+        [
+            "content",
+            "content_metadata",
+            "skipped_content",
+            "person",
+            "directory",
+            "revision",
+            "release",
+            "snapshot",
+            "origin",
+            "fetcher",
+            "authority",
+            "origin_metadata",
+        ]
+    )
+    for object_type, objs in sample_data.items():
+        for obj in objs:
+            assert isinstance(obj, dict)
+
+        if sample_data_model.get(object_type):
+            # metadata keys are missing because conversion is not possible yet
+            assert len(objs) == len(sample_data_model[object_type])
+
+
+def test_sample_data_model(sample_data, sample_data_model):
+    assert set(sample_data_model.keys()) == set(
+        [
+            "content",
+            "content_metadata",
+            "skipped_content",
+            "person",
+            "directory",
+            "revision",
+            "release",
+            "snapshot",
+            "origin",
+        ]
+    )
+
+    for object_type, objs in sample_data_model.items():
+        assert object_type in OBJECT_FACTORY
+
+        for obj in objs:
+            assert isinstance(obj, BaseModel)
+
+        assert len(objs) == len(sample_data[object_type])
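
Finally, a quick sketch of what the conftest override buys within
swh/storage/tests (a hypothetical test, not part of this diff; the conftest
fixture wraps the plugin-level fixture of the same name, so the journal writer
is layered on top of the base configuration):

    def test_backend_config_enables_journal(swh_storage_backend_config):
        # Base keys come from the plugin fixture; the journal writer is
        # added by the conftest override.
        assert swh_storage_backend_config["cls"] == "local"
        assert swh_storage_backend_config["journal_writer"] == {"cls": "memory"}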