diff --git a/.gitignore b/.gitignore
index 700f993..be9dfa5 100644
--- a/.gitignore
+++ b/.gitignore
@@ -1,11 +1,12 @@
 *.pyc
 *.sw?
 *~
 .coverage
 .eggs/
 __pycache__
 *.egg-info/
 build/
 dist/
 version.txt
 /.hypothesis/
+/.tox/
diff --git a/PKG-INFO b/PKG-INFO
index 783edcf..cb6e42f 100644
--- a/PKG-INFO
+++ b/PKG-INFO
@@ -1,65 +1,65 @@
 Metadata-Version: 2.1
 Name: swh.scheduler
-Version: 0.0.32
+Version: 0.0.33
 Summary: Software Heritage Scheduler
 Home-page: https://forge.softwareheritage.org/diffusion/DSCH/
 Author: Software Heritage developers
 Author-email: swh-devel@inria.fr
 License: UNKNOWN
 Project-URL: Bug Reports, https://forge.softwareheritage.org/maniphest
 Project-URL: Funding, https://www.softwareheritage.org/donate
 Project-URL: Source, https://forge.softwareheritage.org/source/swh-scheduler
 Description: swh-scheduler
         =============
         
         Job scheduler for the Software Heritage project.
         
         Task manager for asynchronous/delayed tasks, used for both recurrent (e.g.,
         listing a forge, loading new stuff from a Git repository) and one-off
         activities (e.g., loading a specific version of a source package).
         
         
         # Tests
         
         ## Running test manually
         
         ### Test data
         
         To be able to run (unit) tests, you need to have the
         [[https://forge.softwareheritage.org/source/swh-storage-testdata.git|swh-storage-testdata]]
         in the parent directory. If you have set your environment following the
         [[ https://docs.softwareheritage.org/devel/getting-started.html#getting-started|Getting started]]
         document everythong should be set up just fine.
         
         Otherwise:
         
         ```
         ~/.../swh-scheduler$ git clone https://forge.softwareheritage.org/source/swh-storage-testdata.git ../swh-storage-testdata
         ```
         
         ### Required services
         
         Unit tests that require a running celery broker uses an in memory broker/result
         backend by default, but you can choose to use a true broker by setting
         `CELERY_BROKER_URL` and `CELERY_RESULT_BACKEND` environment variables up.
         
         For example:
         
         ```
         $ CELERY_BROKER_URL=amqp://localhost pifpaf run postgresql nosetests
         
         .....................................
         ----------------------------------------------------------------------
         Ran 37 tests in 15.578s
         
         OK
         ```
         
 Platform: UNKNOWN
 Classifier: Programming Language :: Python :: 3
 Classifier: Intended Audience :: Developers
 Classifier: License :: OSI Approved :: GNU General Public License v3 (GPLv3)
 Classifier: Operating System :: OS Independent
 Classifier: Development Status :: 5 - Production/Stable
 Description-Content-Type: text/markdown
 Provides-Extra: testing
diff --git a/debian/changelog b/debian/changelog
index f2694c7..64c41a7 100644
--- a/debian/changelog
+++ b/debian/changelog
@@ -1,276 +1,276 @@
-swh-scheduler (0.0.32-1~swh1~bpo9+1) stretch-swh; urgency=medium
+swh-scheduler (0.0.33-1~swh1) unstable-swh; urgency=medium
 
-  * Rebuild for stretch-backports.
+  * v0.0.33
 
- -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Mon, 22 Oct 2018 15:37:51 +0200
+ -- David Douard <david.douard@sdfa3.org>  Thu, 25 Oct 2018 16:03:16 +0200
 
 swh-scheduler (0.0.32-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.32
   * tests: Add celery fixture to ease tests
   * tests: make tests use sql/ files from the package
   * tests: Starting migration towards pytest
   * listener: Make the listener code compatible with new celery (debian
     buster)
   * Make swh_scheduler_create_tasks_from_temp use indexes
   * setup: prepare for pypi upload
   * docs: add a simple README file
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Mon, 22 Oct 2018 15:37:51 +0200
 
 swh-scheduler (0.0.31-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.31
   * sql/swh-scheduler: Make the create_tasks call idempotent
   * swh.scheduler.utils: Open create_task_dict function
   * sql/scheduler-data: Add lister gitlab task types
   * sql/scheduler-data: Reference the existing production lister data
   * swh.scheduler.backend_es: Open sniffing options
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Tue, 31 Jul 2018 06:55:39 +0200
 
 swh-scheduler (0.0.30-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.30
   * swh-scheduler-schema.sql: Archive disabled oneshot tasks as well
   * swh.scheduler.cli: Add policy to pretty printing task routine
   * swh.scheduler.cli: Fix broken cli list-pending since api change
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Fri, 22 Jun 2018 18:07:02 +0200
 
 swh-scheduler (0.0.29-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.29
   * swh.scheduler.cli: Change archival period to rolling month - 1 week
   * swh.scheduler.updater.writer: Force filter resolution to list
   * swh.scheduler.cli: Change default archival period to current month
   * swh.scheduler.cli: Improve logging message
   * swh.scheduler.updater.backend: Adapt configuration path accordingly
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Thu, 31 May 2018 11:42:51 +0200
 
 swh-scheduler (0.0.28-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.28
   * Fix wrong runtime dependencies
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Tue, 29 May 2018 14:12:15 +0200
 
 swh-scheduler (0.0.27-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.27
   * scheduler: Deal with priority in tasks
   * scheduler-update: new package python3-swh.scheduler.updater
   * Contains tools in charge of consuming events from arbitrary sources
   * and update the scheduler db
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Tue, 29 May 2018 12:27:34 +0200
 
 swh-scheduler (0.0.26-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.26
   * swh.scheduler: Fix package build
   * swh.scheduler.tests: Test remote scheduler api as well
   * swh.scheduler: Add tests around removing archivable tasks
   * swh.scheduler: Add tests around filtering archivable tasks
   * swh-scheduler-schema: Fix unneeded drop instructions
   * swh.scheduler.cli: Improve docstring
   * swh.scheduler.cli: Permit to specify the backend to use in cli
   * swh.scheduler.api: Bootstrap scheduler's remote api
   * swh.scheduler: Use `get_scheduler` api to instantiate a scheduler
   * swh.scheduler.backend: Fix docstring
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Thu, 26 Apr 2018 17:34:07 +0200
 
 swh-scheduler (0.0.25-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.25
   * swh.scheduler.cli.archive: Index arguments.kwargs as text
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Wed, 18 Apr 2018 12:34:43 +0200
 
 swh-scheduler (0.0.24-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.24
   * data/template: Do not index the arguments field (it's in _source)
   * data/README: Add a small readme to explain es install step
   * swh.scheduler.cli: Add a bulk index flag to separate read from index
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Fri, 13 Apr 2018 14:55:32 +0200
 
 swh-scheduler (0.0.23-1~swh1) unstable-swh; urgency=medium
 
   * swh.scheduler.cli.archive: Delete only completely indexed tasks
   * Prior to this commit, it could happen that we removed tasks even
   * though we did not yet index associated task_run.
   * Related T986
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Tue, 10 Apr 2018 17:43:07 +0200
 
 swh-scheduler (0.0.22-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.22
   * Update to a more recent python3-elasticsearch client
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Mon, 09 Apr 2018 16:09:16 +0200
 
 swh-scheduler (0.0.21-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.21
   * Adapt default configuration
   * Fix typo in configuration variable name
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Fri, 30 Mar 2018 15:02:55 +0200
 
 swh-scheduler (0.0.20-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.20
   * swh.scheduler.cli.archive: Open completed oneshot or disabled
   * recurring tasks archival endpoint
   * swh.core.serializer: Move to msgpack serialization format
   * swh.scheduler.cli: Unify pretty print output
   * sql/data: Add new task type for loading mercurial dump
   * swh.scheduler.cli: Add sample use case for the scheduling cli
   * swh.scheduler.cli: Open policy column to the scheduling cli
   * swh.scheduler.cli: Open the delimiter option as cli argument
   * Fix issue when updating task-type without any retry delay defined
   * swh-scheduler/data: Add new oneshot scheduling load-mercurial task
   * backend: fix default scheduling_db value for consistency
   * backend: doc: fix return value of create_tasks
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Fri, 30 Mar 2018 11:44:18 +0200
 
 swh-scheduler (0.0.19-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.19
   * swh.scheduler.utils: Open utility function to create oneshot task
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Wed, 29 Nov 2017 12:51:15 +0100
 
 swh-scheduler (0.0.18-1~swh1) unstable-swh; urgency=medium
 
   * Release swh.scheduler v0.0.18
   * Celery 4 compatibility
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Wed, 08 Nov 2017 17:06:22 +0100
 
 swh-scheduler (0.0.17-1~swh1) unstable-swh; urgency=medium
 
   * Release swh.scheduler version 0.0.17
   * Update packaging runes
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Thu, 12 Oct 2017 18:49:02 +0200
 
 swh-scheduler (0.0.16-1~swh1) unstable-swh; urgency=medium
 
   * Release swh-scheduler v0.0.16
   * add some tests
   * implement one-shot tasks
   * implement retry on temporary failure
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Mon, 07 Aug 2017 18:44:03 +0200
 
 swh-scheduler (0.0.15-1~swh1) unstable-swh; urgency=medium
 
   * Release swh-scheduler v0.0.15
   * Add some methods to get the length of task queues
   * worker: Show logs on stdout if loglevel = debug
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Mon, 19 Jun 2017 19:44:56 +0200
 
 swh-scheduler (0.0.14-1~swh1) unstable-swh; urgency=medium
 
   * Release swh.scheduler 0.0.14
   * Make the return value of tasks available in the listener
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Mon, 12 Jun 2017 17:50:32 +0200
 
 swh-scheduler (0.0.13-1~swh1) unstable-swh; urgency=medium
 
   * Release swh.scheduler v0.0.13
   * Use systemd for logging rather than PostgreSQL
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Fri, 07 Apr 2017 11:57:50 +0200
 
 swh-scheduler (0.0.12-1~swh1) unstable-swh; urgency=medium
 
   * Release swh.scheduler v0.0.12
   * Only log to database if the configuration is present
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Thu, 09 Mar 2017 11:12:45 +0100
 
 swh-scheduler (0.0.11-1~swh1) unstable-swh; urgency=medium
 
   * Release swh.scheduler v0.0.11
   * add utils.get_task
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Tue, 14 Feb 2017 19:49:34 +0100
 
 swh-scheduler (0.0.10-1~swh1) unstable-swh; urgency=medium
 
   * Release swh.scheduler v0.0.10
   * Allow disabling tasks
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Thu, 20 Oct 2016 17:20:17 +0200
 
 swh-scheduler (0.0.9-1~swh1) unstable-swh; urgency=medium
 
   * Release swh.scheduler v0.0.9
   * Revert management of one shot tasks
   * Add possibility of launching several worker instances
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Fri, 02 Sep 2016 17:09:18 +0200
 
 swh-scheduler (0.0.7-1~swh1) unstable-swh; urgency=medium
 
   * v0.0.7
   * Add oneshot task
 
  -- Antoine R. Dumont (@ardumont) <antoine.romain.dumont@gmail.com>  Fri, 01 Jul 2016 16:42:45 +0200
 
 swh-scheduler (0.0.6-1~swh1) unstable-swh; urgency=medium
 
   * Release swh-scheduler v0.0.6
   * More reliability and efficiency when scheduling a lot ot tasks
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Wed, 24 Feb 2016 18:46:57 +0100
 
 swh-scheduler (0.0.5-1~swh1) unstable-swh; urgency=medium
 
   * Release swh.scheduler v0.0.5
   * Use copy for task mass-scheduling
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Wed, 24 Feb 2016 12:13:38 +0100
 
 swh-scheduler (0.0.4-1~swh1) unstable-swh; urgency=medium
 
   * Release swh-scheduler v0.0.4
   * general cleanup of the backend
   * use arrow instead of dateutil
   * add new cli program
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Tue, 23 Feb 2016 17:46:04 +0100
 
 swh-scheduler (0.0.3-1~swh1) unstable-swh; urgency=medium
 
   * Release swh.scheduler version 0.0.3
   * Implement the timestamp arguments to the task_run functions
   * Make the celery event listener use a reliable queue
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Mon, 22 Feb 2016 15:14:28 +0100
 
 swh-scheduler (0.0.2-1~swh1) unstable-swh; urgency=medium
 
   * Release swh.scheduler v0.0.2
   * Multiple schema changes
   * Initial releases for the celery job runner and the event listener
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Fri, 19 Feb 2016 18:50:47 +0100
 
 swh-scheduler (0.0.1-1~swh1) unstable-swh; urgency=medium
 
   * Initial release
   * Release swh.scheduler v0.0.1
   * Move swh.core.scheduling and swh.core.worker to swh.scheduler
 
  -- Nicolas Dandrimont <nicolas@dandrimont.eu>  Mon, 15 Feb 2016 11:07:30 +0100
diff --git a/pytest.ini b/pytest.ini
new file mode 100644
index 0000000..afa4cf3
--- /dev/null
+++ b/pytest.ini
@@ -0,0 +1,2 @@
+[pytest]
+norecursedirs = docs
diff --git a/requirements-test.txt b/requirements-test.txt
index 8a26d2c..6c62abe 100644
--- a/requirements-test.txt
+++ b/requirements-test.txt
@@ -1,3 +1,3 @@
 hypothesis
-nose
+pytest
 celery
diff --git a/swh.scheduler.egg-info/PKG-INFO b/swh.scheduler.egg-info/PKG-INFO
index 783edcf..cb6e42f 100644
--- a/swh.scheduler.egg-info/PKG-INFO
+++ b/swh.scheduler.egg-info/PKG-INFO
@@ -1,65 +1,65 @@
 Metadata-Version: 2.1
 Name: swh.scheduler
-Version: 0.0.32
+Version: 0.0.33
 Summary: Software Heritage Scheduler
 Home-page: https://forge.softwareheritage.org/diffusion/DSCH/
 Author: Software Heritage developers
 Author-email: swh-devel@inria.fr
 License: UNKNOWN
 Project-URL: Bug Reports, https://forge.softwareheritage.org/maniphest
 Project-URL: Funding, https://www.softwareheritage.org/donate
 Project-URL: Source, https://forge.softwareheritage.org/source/swh-scheduler
 Description: swh-scheduler
         =============
         
         Job scheduler for the Software Heritage project.
         
         Task manager for asynchronous/delayed tasks, used for both recurrent (e.g.,
         listing a forge, loading new stuff from a Git repository) and one-off
         activities (e.g., loading a specific version of a source package).
         
         
         # Tests
         
         ## Running test manually
         
         ### Test data
         
         To be able to run (unit) tests, you need to have the
         [[https://forge.softwareheritage.org/source/swh-storage-testdata.git|swh-storage-testdata]]
         in the parent directory. If you have set your environment following the
         [[ https://docs.softwareheritage.org/devel/getting-started.html#getting-started|Getting started]]
         document everythong should be set up just fine.
         
         Otherwise:
         
         ```
         ~/.../swh-scheduler$ git clone https://forge.softwareheritage.org/source/swh-storage-testdata.git ../swh-storage-testdata
         ```
         
         ### Required services
         
         Unit tests that require a running celery broker uses an in memory broker/result
         backend by default, but you can choose to use a true broker by setting
         `CELERY_BROKER_URL` and `CELERY_RESULT_BACKEND` environment variables up.
         
         For example:
         
         ```
         $ CELERY_BROKER_URL=amqp://localhost pifpaf run postgresql nosetests
         
         .....................................
         ----------------------------------------------------------------------
         Ran 37 tests in 15.578s
         
         OK
         ```
         
 Platform: UNKNOWN
 Classifier: Programming Language :: Python :: 3
 Classifier: Intended Audience :: Developers
 Classifier: License :: OSI Approved :: GNU General Public License v3 (GPLv3)
 Classifier: Operating System :: OS Independent
 Classifier: Development Status :: 5 - Production/Stable
 Description-Content-Type: text/markdown
 Provides-Extra: testing
diff --git a/swh.scheduler.egg-info/SOURCES.txt b/swh.scheduler.egg-info/SOURCES.txt
index 6af5abd..a4bf015 100644
--- a/swh.scheduler.egg-info/SOURCES.txt
+++ b/swh.scheduler.egg-info/SOURCES.txt
@@ -1,87 +1,89 @@
 .gitignore
 AUTHORS
 LICENSE
 LICENSE.Celery
 MANIFEST.in
 Makefile
 README.md
+pytest.ini
 requirements-swh.txt
 requirements-test.txt
 requirements.txt
 setup.py
+tox.ini
 version.txt
 bin/swh-worker-control
 data/README.md
 data/elastic-template.json
 data/update-index-settings.json
 debian/changelog
 debian/compat
 debian/control
 debian/copyright
 debian/rules
 debian/source/format
 docs/.gitignore
 docs/Makefile
 docs/conf.py
 docs/index.rst
 docs/_static/.placeholder
 docs/_templates/.placeholder
 sql/.gitignore
 sql/Makefile
 sql/updater/sql/Makefile
 sql/updates/02.sql
 sql/updates/03.sql
 sql/updates/04.sql
 sql/updates/05.sql
 sql/updates/06.sql
 sql/updates/07.sql
 sql/updates/08.sql
 sql/updates/09.sql
 sql/updates/10.sql
 sql/updates/11.sql
 sql/updates/12.sql
 swh/__init__.py
 swh.scheduler.egg-info/PKG-INFO
 swh.scheduler.egg-info/SOURCES.txt
 swh.scheduler.egg-info/dependency_links.txt
 swh.scheduler.egg-info/entry_points.txt
 swh.scheduler.egg-info/requires.txt
 swh.scheduler.egg-info/top_level.txt
 swh/scheduler/__init__.py
 swh/scheduler/backend.py
 swh/scheduler/backend_es.py
 swh/scheduler/cli.py
 swh/scheduler/task.py
 swh/scheduler/utils.py
 swh/scheduler/api/__init__.py
 swh/scheduler/api/client.py
 swh/scheduler/api/server.py
 swh/scheduler/celery_backend/__init__.py
 swh/scheduler/celery_backend/config.py
 swh/scheduler/celery_backend/listener.py
 swh/scheduler/celery_backend/runner.py
 swh/scheduler/sql/30-swh-schema.sql
 swh/scheduler/sql/40-swh-data.sql
 swh/scheduler/sql/updater/10-swh-init.sql
 swh/scheduler/sql/updater/30-swh-schema.sql
 swh/scheduler/sql/updater/40-swh-func.sql
 swh/scheduler/tests/__init__.py
 swh/scheduler/tests/celery_testing.py
 swh/scheduler/tests/test_api_client.py
 swh/scheduler/tests/test_scheduler.py
 swh/scheduler/tests/test_task.py
 swh/scheduler/tests/test_utils.py
 swh/scheduler/tests/updater/__init__.py
 swh/scheduler/tests/updater/test_backend.py
 swh/scheduler/tests/updater/test_consumer.py
 swh/scheduler/tests/updater/test_events.py
 swh/scheduler/tests/updater/test_ghtorrent.py
 swh/scheduler/tests/updater/test_writer.py
 swh/scheduler/updater/__init__.py
 swh/scheduler/updater/backend.py
 swh/scheduler/updater/consumer.py
 swh/scheduler/updater/events.py
 swh/scheduler/updater/writer.py
 swh/scheduler/updater/ghtorrent/__init__.py
 swh/scheduler/updater/ghtorrent/cli.py
 swh/scheduler/updater/ghtorrent/fake.py
\ No newline at end of file
diff --git a/swh.scheduler.egg-info/requires.txt b/swh.scheduler.egg-info/requires.txt
index c638937..aab4582 100644
--- a/swh.scheduler.egg-info/requires.txt
+++ b/swh.scheduler.egg-info/requires.txt
@@ -1,14 +1,14 @@
 Click
 arrow
 celery
 elasticsearch>5.4
 flask
 kombu
 psycopg2
 swh.core>=0.0.44
 vcversioner
 
 [testing]
 celery
 hypothesis
-nose
+pytest
diff --git a/swh/scheduler/celery_backend/config.py b/swh/scheduler/celery_backend/config.py
index b31bfc6..b31a6f6 100644
--- a/swh/scheduler/celery_backend/config.py
+++ b/swh/scheduler/celery_backend/config.py
@@ -1,201 +1,203 @@
 # Copyright (C) 2015  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import logging
 import os
 import urllib.parse
 
 from celery import Celery
 from celery.signals import setup_logging
 from celery.utils.log import ColorFormatter
 from celery.worker.control import Panel
 
 from kombu import Exchange, Queue
 from kombu.five import monotonic as _monotonic
 
 import requests
 
 from swh.core.config import load_named_config
 from swh.core.logger import JournalHandler
 
 DEFAULT_CONFIG_NAME = 'worker'
 CONFIG_NAME_ENVVAR = 'SWH_WORKER_INSTANCE'
 CONFIG_NAME_TEMPLATE = 'worker/%s'
 
 DEFAULT_CONFIG = {
     'task_broker': ('str', 'amqp://guest@localhost//'),
     'task_modules': ('list[str]', []),
     'task_queues': ('list[str]', []),
     'task_soft_time_limit': ('int', 0),
 }
 
 
 @setup_logging.connect
 def setup_log_handler(loglevel=None, logfile=None, format=None,
                       colorize=None, **kwargs):
     """Setup logging according to Software Heritage preferences.
 
     We use the command-line loglevel for tasks only, as we never
     really care about the debug messages from celery.
     """
 
     if loglevel is None:
         loglevel = logging.DEBUG
 
     formatter = logging.Formatter(format)
 
     root_logger = logging.getLogger('')
     root_logger.setLevel(logging.INFO)
 
     if loglevel == logging.DEBUG:
         color_formatter = ColorFormatter(format) if colorize else formatter
         console = logging.StreamHandler()
         console.setLevel(logging.DEBUG)
         console.setFormatter(color_formatter)
         root_logger.addHandler(console)
 
     systemd_journal = JournalHandler()
     systemd_journal.setLevel(logging.DEBUG)
     systemd_journal.setFormatter(formatter)
     root_logger.addHandler(systemd_journal)
 
     celery_logger = logging.getLogger('celery')
     celery_logger.setLevel(logging.INFO)
 
     # Silence useless "Starting new HTTP connection" messages
     urllib3_logger = logging.getLogger('urllib3')
     urllib3_logger.setLevel(logging.WARNING)
 
     swh_logger = logging.getLogger('swh')
     swh_logger.setLevel(loglevel)
 
     # get_task_logger makes the swh tasks loggers children of celery.task
     celery_task_logger = logging.getLogger('celery.task')
     celery_task_logger.setLevel(loglevel)
 
 
 @Panel.register
 def monotonic(state):
     """Get the current value for the monotonic clock"""
     return {'monotonic': _monotonic()}
 
 
 class TaskRouter:
     """Route tasks according to the task_queue attribute in the task class"""
     def route_for_task(self, task, args=None, kwargs=None):
         task_class = app.tasks[task]
         if hasattr(task_class, 'task_queue'):
             return {'queue': task_class.task_queue}
         return None
 
 
 class CustomCelery(Celery):
     def get_queue_stats(self, queue_name):
         """Get the statistics regarding a queue on the broker.
 
         Arguments:
           queue_name: name of the queue to check
 
         Returns a dictionary raw from the RabbitMQ management API.
 
         Interesting keys:
          - consumers (number of consumers for the queue)
          - messages (number of messages in queue)
          - messages_unacknowledged (number of messages currently being
            processed)
 
         Documentation: https://www.rabbitmq.com/management.html#http-api
         """
 
         conn_info = self.connection().info()
         url = 'http://{hostname}:{port}/api/queues/{vhost}/{queue}'.format(
             hostname=conn_info['hostname'],
             port=conn_info['port'] + 10000,
             vhost=urllib.parse.quote(conn_info['virtual_host'], safe=''),
             queue=urllib.parse.quote(queue_name, safe=''),
         )
         credentials = (conn_info['userid'], conn_info['password'])
         r = requests.get(url, auth=credentials)
         if r.status_code != 200:
             raise ValueError('Got error %s when reading queue stats: %s' % (
                 r.status_code, r.json()))
         return r.json()
 
     def get_queue_length(self, queue_name):
         """Shortcut to get a queue's length"""
         return self.get_queue_stats(queue_name)['messages']
 
 
 INSTANCE_NAME = os.environ.get(CONFIG_NAME_ENVVAR)
 if INSTANCE_NAME:
     CONFIG_NAME = CONFIG_NAME_TEMPLATE % INSTANCE_NAME
 else:
     CONFIG_NAME = DEFAULT_CONFIG_NAME
 
 # Load the Celery config
 CONFIG = load_named_config(CONFIG_NAME, DEFAULT_CONFIG)
 
 # Celery Queues
 CELERY_QUEUES = [Queue('celery', Exchange('celery'), routing_key='celery')]
 
 for queue in CONFIG['task_queues']:
     CELERY_QUEUES.append(Queue(queue, Exchange(queue), routing_key=queue))
 
 # Instantiate the Celery app
 app = CustomCelery()
 app.conf.update(
     # The broker
     BROKER_URL=CONFIG['task_broker'],
     # Timezone configuration: all in UTC
     CELERY_ENABLE_UTC=True,
     CELERY_TIMEZONE='UTC',
     # Imported modules
     CELERY_IMPORTS=CONFIG['task_modules'],
     # Time (in seconds, or a timedelta object) for when after stored task
     # tombstones will be deleted. None means to never expire results.
     CELERY_TASK_RESULT_EXPIRES=None,
     # A string identifying the default serialization method to use. Can
     # be json (default), pickle, yaml, msgpack, or any custom
     # serialization methods that have been registered with
     CELERY_TASK_SERIALIZER='msgpack',
+    # Result serialization format
+    CELERY_RESULT_SERIALIZER='msgpack',
     # Late ack means the task messages will be acknowledged after the task has
     # been executed, not just before, which is the default behavior.
     CELERY_ACKS_LATE=True,
     # A string identifying the default serialization method to use.
     # Can be pickle (default), json, yaml, msgpack or any custom serialization
     # methods that have been registered with kombu.serialization.registry
     CELERY_ACCEPT_CONTENT=['msgpack', 'json', 'pickle'],
     # If True the task will report its status as “started”
     # when the task is executed by a worker.
     CELERY_TRACK_STARTED=True,
     # Default compression used for task messages. Can be gzip, bzip2
     # (if available), or any custom compression schemes registered
     # in the Kombu compression registry.
     # CELERY_MESSAGE_COMPRESSION='bzip2',
     # Disable all rate limits, even if tasks has explicit rate limits set.
     # (Disabling rate limits altogether is recommended if you don’t have any
     # tasks using them.)
     CELERY_DISABLE_RATE_LIMITS=True,
     # Task hard time limit in seconds. The worker processing the task will be
     # killed and replaced with a new one when this is exceeded.
     # CELERYD_TASK_TIME_LIMIT=3600,
     # Task soft time limit in seconds.
     # The SoftTimeLimitExceeded exception will be raised when this is exceeded.
     # The task can catch this to e.g. clean up before the hard time limit
     # comes.
     CELERYD_TASK_SOFT_TIME_LIMIT=CONFIG['task_soft_time_limit'],
     # Task routing
     CELERY_ROUTES=TaskRouter(),
     # Task queues this worker will consume from
     CELERY_QUEUES=CELERY_QUEUES,
     # Allow pool restarts from remote
     CELERYD_POOL_RESTARTS=True,
     # Do not prefetch tasks
     CELERYD_PREFETCH_MULTIPLIER=1,
     # Send events
     CELERY_SEND_EVENTS=True,
     # Do not send useless task_sent events
     CELERY_SEND_TASK_SENT_EVENT=False,
 )
diff --git a/swh/scheduler/tests/test_scheduler.py b/swh/scheduler/tests/test_scheduler.py
index caf1748..cd3fc8c 100644
--- a/swh/scheduler/tests/test_scheduler.py
+++ b/swh/scheduler/tests/test_scheduler.py
@@ -1,474 +1,474 @@
 # Copyright (C) 2017-2018  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import copy
 import datetime
 import os
 import random
 import unittest
 import uuid
 from collections import defaultdict
 
 import psycopg2
 from arrow import utcnow
-from nose.plugins.attrib import attr
+import pytest
 
 from swh.core.tests.db_testing import SingleDbTestFixture
 from swh.scheduler import get_scheduler
 
 from . import SQL_DIR
 
 
-@attr('db')
+@pytest.mark.db
 class CommonSchedulerTest(SingleDbTestFixture):
     TEST_DB_NAME = 'softwareheritage-scheduler-test'
     TEST_DB_DUMP = os.path.join(SQL_DIR, '*.sql')
 
     def setUp(self):
         super().setUp()
 
         tt = {
             'type': 'update-git',
             'description': 'Update a git repository',
             'backend_name': 'swh.loader.git.tasks.UpdateGitRepository',
             'default_interval': datetime.timedelta(days=64),
             'min_interval': datetime.timedelta(hours=12),
             'max_interval': datetime.timedelta(days=64),
             'backoff_factor': 2,
             'max_queue_length': None,
             'num_retries': 7,
             'retry_delay': datetime.timedelta(hours=2),
         }
         tt2 = tt.copy()
         tt2['type'] = 'update-hg'
         tt2['description'] = 'Update a mercurial repository'
         tt2['backend_name'] = 'swh.loader.mercurial.tasks.UpdateHgRepository'
         tt2['max_queue_length'] = 42
         tt2['num_retries'] = None
         tt2['retry_delay'] = None
 
         self.task_types = {
             tt['type']: tt,
             tt2['type']: tt2,
         }
 
         self.task1_template = t1_template = {
             'type': tt['type'],
             'arguments': {
                 'args': [],
                 'kwargs': {},
             },
             'next_run': None,
         }
         self.task2_template = t2_template = copy.deepcopy(t1_template)
         t2_template['type'] = tt2['type']
         t2_template['policy'] = 'oneshot'
 
     def tearDown(self):
         self.backend.close_connection()
         self.empty_tables()
         super().tearDown()
 
     def empty_tables(self, whitelist=["priority_ratio"]):
         query = """SELECT table_name FROM information_schema.tables
                    WHERE table_schema = %%s and
                          table_name not in (%s)
                 """ % ','.join(map(lambda t: "'%s'" % t, whitelist))
         self.cursor.execute(query, ('public', ))
 
         tables = set(table for (table,) in self.cursor.fetchall())
 
         for table in tables:
             self.cursor.execute('truncate table %s cascade' % table)
         self.conn.commit()
 
     def test_add_task_type(self):
         tt, tt2 = self.task_types.values()
         self.backend.create_task_type(tt)
         self.assertEqual(tt, self.backend.get_task_type(tt['type']))
         with self.assertRaisesRegex(psycopg2.IntegrityError,
                                     r'\(type\)=\(%s\)' % tt['type']):
             self.backend.create_task_type(tt)
         self.backend.create_task_type(tt2)
         self.assertEqual(tt, self.backend.get_task_type(tt['type']))
         self.assertEqual(tt2, self.backend.get_task_type(tt2['type']))
 
     def test_get_task_types(self):
         tt, tt2 = self.task_types.values()
         self.backend.create_task_type(tt)
         self.backend.create_task_type(tt2)
         self.assertCountEqual([tt2, tt], self.backend.get_task_types())
 
     @staticmethod
     def _task_from_template(template, next_run, priority, *args, **kwargs):
         ret = copy.deepcopy(template)
         ret['next_run'] = next_run
         if priority:
             ret['priority'] = priority
         if args:
             ret['arguments']['args'] = list(args)
         if kwargs:
             ret['arguments']['kwargs'] = kwargs
         return ret
 
     def _pop_priority(self, priorities):
         if not priorities:
             return None
         for priority, remains in priorities.items():
             if remains > 0:
                 priorities[priority] = remains - 1
                 return priority
         return None
 
     def _tasks_from_template(self, template, max_timestamp, num,
                              num_priority=0, priorities=None):
         if num_priority and priorities:
             priorities = {
                 priority: ratio * num_priority
                 for priority, ratio in priorities.items()
             }
 
         tasks = []
         for i in range(num + num_priority):
             priority = self._pop_priority(priorities)
             tasks.append(self._task_from_template(
                 template,
                 max_timestamp - datetime.timedelta(microseconds=i),
                 priority,
                 'argument-%03d' % i,
                 **{'kwarg%03d' % i: 'bogus-kwarg'}
             ))
         return tasks
 
     def _create_task_types(self):
         for tt in self.task_types.values():
             self.backend.create_task_type(tt)
 
     def test_create_tasks(self):
         priority_ratio = self._priority_ratio()
         self._create_task_types()
         num_tasks_priority = 100
         tasks_1 = self._tasks_from_template(self.task1_template, utcnow(), 100)
         tasks_2 = self._tasks_from_template(
                 self.task2_template, utcnow(), 100,
                 num_tasks_priority, priorities=priority_ratio)
         tasks = tasks_1 + tasks_2
 
         # tasks are returned only once with their ids
         ret1 = self.backend.create_tasks(tasks + tasks_1 + tasks_2)
         set_ret1 = set([t['id'] for t in ret1])
 
         # creating the same set result in the same ids
         ret = self.backend.create_tasks(tasks)
         set_ret = set([t['id'] for t in ret])
 
         # Idempotence results
         self.assertEqual(set_ret, set_ret1)
         self.assertEqual(len(ret), len(ret1))
 
         ids = set()
         actual_priorities = defaultdict(int)
 
         for task, orig_task in zip(ret, tasks):
             task = copy.deepcopy(task)
             task_type = self.task_types[orig_task['type']]
             self.assertNotIn(task['id'], ids)
             self.assertEqual(task['status'], 'next_run_not_scheduled')
             self.assertEqual(task['current_interval'],
                              task_type['default_interval'])
             self.assertEqual(task['policy'], orig_task.get('policy',
                                                            'recurring'))
             priority = task.get('priority')
             if priority:
                 actual_priorities[priority] += 1
 
             self.assertEqual(task['retries_left'],
                              task_type['num_retries'] or 0)
             ids.add(task['id'])
             del task['id']
             del task['status']
             del task['current_interval']
             del task['retries_left']
             if 'policy' not in orig_task:
                 del task['policy']
             if 'priority' not in orig_task:
                 del task['priority']
                 self.assertEqual(task, orig_task)
 
         self.assertEqual(dict(actual_priorities), {
             priority: int(ratio * num_tasks_priority)
             for priority, ratio in priority_ratio.items()
         })
 
     def test_peek_ready_tasks_no_priority(self):
         self._create_task_types()
         t = utcnow()
         task_type = self.task1_template['type']
         tasks = self._tasks_from_template(self.task1_template, t, 100)
         random.shuffle(tasks)
         self.backend.create_tasks(tasks)
 
         ready_tasks = self.backend.peek_ready_tasks(task_type)
         self.assertEqual(len(ready_tasks), len(tasks))
         for i in range(len(ready_tasks) - 1):
             self.assertLessEqual(ready_tasks[i]['next_run'],
                                  ready_tasks[i+1]['next_run'])
 
         # Only get the first few ready tasks
         limit = random.randrange(5, 5 + len(tasks)//2)
         ready_tasks_limited = self.backend.peek_ready_tasks(
             task_type, num_tasks=limit)
 
         self.assertEqual(len(ready_tasks_limited), limit)
         self.assertCountEqual(ready_tasks_limited, ready_tasks[:limit])
 
         # Limit by timestamp
         max_ts = tasks[limit-1]['next_run']
         ready_tasks_timestamped = self.backend.peek_ready_tasks(
             task_type, timestamp=max_ts)
 
         for ready_task in ready_tasks_timestamped:
             self.assertLessEqual(ready_task['next_run'], max_ts)
 
         # Make sure we get proper behavior for the first ready tasks
         self.assertCountEqual(
             ready_tasks[:len(ready_tasks_timestamped)],
             ready_tasks_timestamped,
         )
 
         # Limit by both
         ready_tasks_both = self.backend.peek_ready_tasks(
             task_type, timestamp=max_ts, num_tasks=limit//3)
         self.assertLessEqual(len(ready_tasks_both), limit//3)
         for ready_task in ready_tasks_both:
             self.assertLessEqual(ready_task['next_run'], max_ts)
             self.assertIn(ready_task, ready_tasks[:limit//3])
 
     def _priority_ratio(self):
         self.cursor.execute('select id, ratio from priority_ratio')
         priority_ratio = {}
         for row in self.cursor.fetchall():
             priority_ratio[row[0]] = row[1]
         return priority_ratio
 
     def test_peek_ready_tasks_mixed_priorities(self):
         priority_ratio = self._priority_ratio()
         self._create_task_types()
         t = utcnow()
         task_type = self.task1_template['type']
         num_tasks_priority = 100
         num_tasks_no_priority = 100
         # Create tasks with and without priorities
         tasks = self._tasks_from_template(
             self.task1_template, t,
             num=num_tasks_no_priority,
             num_priority=num_tasks_priority,
             priorities=priority_ratio)
 
         random.shuffle(tasks)
         self.backend.create_tasks(tasks)
 
         # take all available tasks
         ready_tasks = self.backend.peek_ready_tasks(
             task_type)
 
         self.assertEqual(len(ready_tasks), len(tasks))
         self.assertEqual(num_tasks_priority + num_tasks_no_priority,
                          len(ready_tasks))
 
         count_tasks_per_priority = defaultdict(int)
         for task in ready_tasks:
             priority = task.get('priority')
             if priority:
                 count_tasks_per_priority[priority] += 1
 
         self.assertEqual(dict(count_tasks_per_priority), {
             priority: int(ratio * num_tasks_priority)
             for priority, ratio in priority_ratio.items()
         })
 
         # Only get some ready tasks
         num_tasks = random.randrange(5, 5 + num_tasks_no_priority//2)
         num_tasks_priority = random.randrange(5, num_tasks_priority//2)
         ready_tasks_limited = self.backend.peek_ready_tasks(
             task_type, num_tasks=num_tasks,
             num_tasks_priority=num_tasks_priority)
 
         count_tasks_per_priority = defaultdict(int)
         for task in ready_tasks_limited:
             priority = task.get('priority')
             count_tasks_per_priority[priority] += 1
 
         import math
         for priority, ratio in priority_ratio.items():
             expected_count = math.ceil(ratio * num_tasks_priority)
             actual_prio = count_tasks_per_priority[priority]
             self.assertTrue(
                 actual_prio == expected_count or
                 actual_prio == expected_count + 1)
 
         self.assertEqual(count_tasks_per_priority[None], num_tasks)
 
     def test_grab_ready_tasks(self):
         priority_ratio = self._priority_ratio()
         self._create_task_types()
         t = utcnow()
         task_type = self.task1_template['type']
         num_tasks_priority = 100
         num_tasks_no_priority = 100
         # Create tasks with and without priorities
         tasks = self._tasks_from_template(
             self.task1_template, t,
             num=num_tasks_no_priority,
             num_priority=num_tasks_priority,
             priorities=priority_ratio)
         random.shuffle(tasks)
         self.backend.create_tasks(tasks)
 
         first_ready_tasks = self.backend.peek_ready_tasks(
             task_type, num_tasks=10, num_tasks_priority=10)
         grabbed_tasks = self.backend.grab_ready_tasks(
             task_type, num_tasks=10, num_tasks_priority=10)
 
         for peeked, grabbed in zip(first_ready_tasks, grabbed_tasks):
             self.assertEqual(peeked['status'], 'next_run_not_scheduled')
             del peeked['status']
             self.assertEqual(grabbed['status'], 'next_run_scheduled')
             del grabbed['status']
             self.assertEqual(peeked, grabbed)
             self.assertEqual(peeked['priority'], grabbed['priority'])
 
     def test_get_tasks(self):
         self._create_task_types()
         t = utcnow()
         tasks = self._tasks_from_template(self.task1_template, t, 100)
         tasks = self.backend.create_tasks(tasks)
         random.shuffle(tasks)
         while len(tasks) > 1:
             length = random.randrange(1, len(tasks))
             cur_tasks = tasks[:length]
             tasks[:length] = []
 
             ret = self.backend.get_tasks(task['id'] for task in cur_tasks)
             self.assertCountEqual(ret, cur_tasks)
 
     def test_filter_task_to_archive(self):
         """Filtering only list disabled recurring or completed oneshot tasks
 
         """
         self._create_task_types()
         _time = utcnow()
         recurring = self._tasks_from_template(self.task1_template, _time, 12)
         oneshots = self._tasks_from_template(self.task2_template, _time, 12)
         total_tasks = len(recurring) + len(oneshots)
 
         # simulate scheduling tasks
         pending_tasks = self.backend.create_tasks(recurring + oneshots)
         backend_tasks = [{
             'task': task['id'],
             'backend_id': str(uuid.uuid4()),
             'scheduled': utcnow(),
         } for task in pending_tasks]
         self.backend.mass_schedule_task_runs(backend_tasks)
 
         # we simulate the task are being done
         _tasks = []
         for task in backend_tasks:
             t = self.backend.end_task_run(
                 task['backend_id'], status='eventful')
             _tasks.append(t)
 
         # Randomly update task's status per policy
         status_per_policy = {'recurring': 0, 'oneshot': 0}
         status_choice = {
             # policy: [tuple (1-for-filtering, 'associated-status')]
             'recurring': [(1, 'disabled'),
                           (0, 'completed'),
                           (0, 'next_run_not_scheduled')],
             'oneshot': [(0, 'next_run_not_scheduled'),
                         (1, 'disabled'),
                         (1, 'completed')]
         }
 
         tasks_to_update = defaultdict(list)
         _task_ids = defaultdict(list)
         # randomize 'disabling' recurring task or 'complete' oneshot task
         for task in pending_tasks:
             policy = task['policy']
             _task_ids[policy].append(task['id'])
             status = random.choice(status_choice[policy])
             if status[0] != 1:
                 continue
             # elected for filtering
             status_per_policy[policy] += status[0]
             tasks_to_update[policy].append(task['id'])
 
         self.backend.disable_tasks(tasks_to_update['recurring'])
         # hack: change the status to something else than completed/disabled
         self.backend.set_status_tasks(
             _task_ids['oneshot'], status='next_run_not_scheduled')
         # complete the tasks to update
         self.backend.set_status_tasks(
             tasks_to_update['oneshot'], status='completed')
 
         total_tasks_filtered = (status_per_policy['recurring'] +
                                 status_per_policy['oneshot'])
 
         # retrieve tasks to archive
         after = _time.shift(days=-1).format('YYYY-MM-DD')
         before = utcnow().shift(days=1).format('YYYY-MM-DD')
         tasks_to_archive = list(self.backend.filter_task_to_archive(
             after_ts=after, before_ts=before, limit=total_tasks))
 
         self.assertEqual(len(tasks_to_archive), total_tasks_filtered)
 
         actual_filtered_per_status = {'recurring': 0, 'oneshot': 0}
         for task in tasks_to_archive:
             actual_filtered_per_status[task['task_policy']] += 1
 
         self.assertEqual(actual_filtered_per_status, status_per_policy)
 
     def test_delete_archived_tasks(self):
         self._create_task_types()
         _time = utcnow()
         recurring = self._tasks_from_template(
             self.task1_template, _time, 12)
         oneshots = self._tasks_from_template(
             self.task2_template, _time, 12)
         total_tasks = len(recurring) + len(oneshots)
         pending_tasks = self.backend.create_tasks(recurring + oneshots)
         backend_tasks = [{
             'task': task['id'],
             'backend_id': str(uuid.uuid4()),
             'scheduled': utcnow(),
         } for task in pending_tasks]
         self.backend.mass_schedule_task_runs(backend_tasks)
 
         _tasks = []
         percent = random.randint(0, 100)  # random election removal boundary
         for task in backend_tasks:
             t = self.backend.end_task_run(
                 task['backend_id'], status='eventful')
             c = random.randint(0, 100)
             if c <= percent:
                 _tasks.append({'task_id': t['task'], 'task_run_id': t['id']})
 
         self.backend.delete_archived_tasks(_tasks)
 
         self.cursor.execute('select count(*) from task')
         tasks_count = self.cursor.fetchone()
 
         self.cursor.execute('select count(*) from task_run')
         tasks_run_count = self.cursor.fetchone()
 
         self.assertEqual(tasks_count[0], total_tasks - len(_tasks))
         self.assertEqual(tasks_run_count[0], total_tasks - len(_tasks))
 
 
 class LocalSchedulerTest(CommonSchedulerTest, unittest.TestCase):
     def setUp(self):
         super().setUp()
         self.config = {'scheduling_db': 'dbname=' + self.TEST_DB_NAME}
         self.backend = get_scheduler('local', self.config)
diff --git a/swh/scheduler/tests/updater/test_backend.py b/swh/scheduler/tests/updater/test_backend.py
index f08fca7..baa8205 100644
--- a/swh/scheduler/tests/updater/test_backend.py
+++ b/swh/scheduler/tests/updater/test_backend.py
@@ -1,65 +1,65 @@
 # Copyright (C) 2018  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import os
 import unittest
 
 from arrow import utcnow
 from hypothesis import given
 from hypothesis.strategies import sets
-from nose.plugins.attrib import attr
+import pytest
 
 from swh.core.tests.db_testing import SingleDbTestFixture
 from swh.scheduler.tests import SQL_DIR
 from swh.scheduler.updater.backend import SchedulerUpdaterBackend
 from swh.scheduler.updater.events import SWHEvent
 
 from . import from_regex
 
 
-@attr('db')
+@pytest.mark.db
 class SchedulerUpdaterBackendTest(SingleDbTestFixture, unittest.TestCase):
     TEST_DB_NAME = 'softwareheritage-scheduler-updater-test'
     TEST_DB_DUMP = os.path.join(SQL_DIR, 'updater', '*.sql')
 
     def setUp(self):
         super().setUp()
         config = {
             'scheduling_updater_db': 'dbname=' + self.TEST_DB_NAME,
             'cache_read_limit': 1000,
         }
         self.backend = SchedulerUpdaterBackend(**config)
 
     def _empty_tables(self):
         self.cursor.execute(
             """SELECT table_name FROM information_schema.tables
                WHERE table_schema = %s""", ('public', ))
         tables = set(table for (table,) in self.cursor.fetchall())
         for table in tables:
             self.cursor.execute('truncate table %s cascade' % table)
         self.conn.commit()
 
     def tearDown(self):
         self.backend.close_connection()
         self._empty_tables()
         super().tearDown()
 
     @given(sets(
         from_regex(
             r'^https://somewhere[.]org/[a-z0-9]{5,7}/[a-z0-9]{3,10}$'),
         min_size=10, max_size=15))
     def test_cache_read(self, urls):
         def gen_events(urls):
             for url in urls:
                 yield SWHEvent({
                     'url': url,
                     'type': 'create',
                     'origin_type': 'git',
                 })
 
         self.backend.cache_put(gen_events(urls))
         r = self.backend.cache_read(timestamp=utcnow())
 
         self.assertNotEqual(r, [])
diff --git a/swh/scheduler/tests/updater/test_consumer.py b/swh/scheduler/tests/updater/test_consumer.py
index 463a05c..1a2f2ac 100644
--- a/swh/scheduler/tests/updater/test_consumer.py
+++ b/swh/scheduler/tests/updater/test_consumer.py
@@ -1,194 +1,195 @@
 # Copyright (C) 2018  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import unittest
 from itertools import chain
 
-from hypothesis import given
+from hypothesis import given, settings, HealthCheck
 from hypothesis.strategies import lists, sampled_from, text, tuples
 
 from swh.scheduler.updater.consumer import UpdaterConsumer
 from swh.scheduler.updater.events import LISTENED_EVENTS, SWHEvent
 
 from . import UpdaterTestUtil, from_regex
 
 
 class FakeSchedulerUpdaterBackend:
     def __init__(self):
         self.events = []
 
     def cache_put(self, events):
         self.events.append(events)
 
 
 class FakeUpdaterConsumerBase(UpdaterConsumer):
     def __init__(self, backend_class=FakeSchedulerUpdaterBackend):
         super().__init__(backend_class=backend_class)
         self.connection_opened = False
         self.connection_closed = False
         self.consume_called = False
         self.has_events_called = False
 
     def open_connection(self):
         self.connection_opened = True
 
     def close_connection(self):
         self.connection_closed = True
 
     def convert_event(self, event):
         pass
 
 
 class FakeUpdaterConsumerRaise(FakeUpdaterConsumerBase):
     def has_events(self):
         self.has_events_called = True
         return True
 
     def consume_events(self):
         self.consume_called = True
         raise ValueError('Broken stuff')
 
 
 class UpdaterConsumerRaisingTest(unittest.TestCase):
     def setUp(self):
         self.updater = FakeUpdaterConsumerRaise()
 
     def test_running_raise(self):
         """Raising during run should finish fine.
 
         """
         # given
         self.assertEqual(self.updater.count, 0)
         self.assertEqual(self.updater.seen_events, set())
         self.assertEqual(self.updater.events, [])
 
         # when
         with self.assertRaisesRegex(ValueError, 'Broken stuff'):
             self.updater.run()
 
         # then
         self.assertEqual(self.updater.count, 0)
         self.assertEqual(self.updater.seen_events, set())
         self.assertEqual(self.updater.events, [])
         self.assertTrue(self.updater.connection_opened)
         self.assertTrue(self.updater.has_events_called)
         self.assertTrue(self.updater.connection_closed)
         self.assertTrue(self.updater.consume_called)
 
 
 class FakeUpdaterConsumerNoEvent(FakeUpdaterConsumerBase):
     def has_events(self):
         self.has_events_called = True
         return False
 
     def consume_events(self):
         self.consume_called = True
 
 
 class UpdaterConsumerNoEventTest(unittest.TestCase):
     def setUp(self):
         self.updater = FakeUpdaterConsumerNoEvent()
 
     def test_running_does_not_consume(self):
         """Run with no events should do just fine"""
         # given
         self.assertEqual(self.updater.count, 0)
         self.assertEqual(self.updater.seen_events, set())
         self.assertEqual(self.updater.events, [])
 
         # when
         self.updater.run()
 
         # then
         self.assertEqual(self.updater.count, 0)
         self.assertEqual(self.updater.seen_events, set())
         self.assertEqual(self.updater.events, [])
         self.assertTrue(self.updater.connection_opened)
         self.assertTrue(self.updater.has_events_called)
         self.assertTrue(self.updater.connection_closed)
         self.assertFalse(self.updater.consume_called)
 
 
 EVENT_KEYS = ['type', 'repo', 'created_at', 'origin_type']
 
 
 class FakeUpdaterConsumer(FakeUpdaterConsumerBase):
     def __init__(self, messages):
         super().__init__()
         self.messages = messages
         self.debug = False
 
     def has_events(self):
         self.has_events_called = True
         return len(self.messages) > 0
 
     def consume_events(self):
         self.consume_called = True
         for msg in self.messages:
             yield msg
             self.messages.pop()
 
     def convert_event(self, event, keys=EVENT_KEYS):
         for k in keys:
             v = event.get(k)
             if v is None:
                 return None
 
         e = {
             'type': event['type'],
             'url': 'https://fake.url/%s' % event['repo']['name'],
             'last_seen': event['created_at'],
             'origin_type': event['origin_type'],
         }
         return SWHEvent(e)
 
 
 class UpdaterConsumerWithEventTest(UpdaterTestUtil, unittest.TestCase):
+    @settings(suppress_health_check=[HealthCheck.too_slow])
     @given(lists(tuples(sampled_from(LISTENED_EVENTS),  # event type
                         from_regex(r'^[a-z0-9]{5,10}/[a-z0-9]{7,12}$'),  # name
                         text()),                        # origin type
                  min_size=3, max_size=10),
            lists(tuples(text(),                         # event type
                         from_regex(r'^[a-z0-9]{5,7}/[a-z0-9]{3,10}$'),  # name
                         text()),                        # origin type
                  min_size=3, max_size=10),
            lists(tuples(sampled_from(LISTENED_EVENTS),  # event type
                         from_regex(r'^[a-z0-9]{5,10}/[a-z0-9]{7,12}$'),  # name
                         text(),                     # origin type
                         sampled_from(EVENT_KEYS)),  # keys to drop
                  min_size=3, max_size=10))
     def test_running(self, events, uninteresting_events, incomplete_events):
         """Interesting events are written to cache, others are dropped
 
         """
         # given
         ready_events = self._make_events(events)
         ready_uninteresting_events = self._make_events(uninteresting_events)
         ready_incomplete_events = self._make_incomplete_events(
             incomplete_events)
 
         updater = FakeUpdaterConsumer(list(chain(
             ready_events, ready_incomplete_events,
             ready_uninteresting_events)))
 
         self.assertEqual(updater.count, 0)
         self.assertEqual(updater.seen_events, set())
         self.assertEqual(updater.events, [])
 
         # when
         updater.run()
 
         # then
         self.assertEqual(updater.count, 0)
         self.assertEqual(updater.seen_events, set())
         self.assertEqual(updater.events, [])
         self.assertTrue(updater.connection_opened)
         self.assertTrue(updater.has_events_called)
         self.assertTrue(updater.connection_closed)
         self.assertTrue(updater.consume_called)
 
         self.assertEqual(updater.messages, [])
         # uninteresting or incomplete events are dropped
         self.assertTrue(len(updater.backend.events), len(events))
diff --git a/swh/scheduler/tests/updater/test_writer.py b/swh/scheduler/tests/updater/test_writer.py
index 79a6f09..1d932a5 100644
--- a/swh/scheduler/tests/updater/test_writer.py
+++ b/swh/scheduler/tests/updater/test_writer.py
@@ -1,158 +1,158 @@
 # Copyright (C) 2018  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import os
 import unittest
 from glob import glob
 
-from nose.plugins.attrib import attr
+import pytest
 
 from swh.core.utils import numfile_sortkey as sortkey
 from swh.core.tests.db_testing import DbTestFixture
 from swh.scheduler.tests import SQL_DIR
 from swh.scheduler.updater.events import LISTENED_EVENTS, SWHEvent
 from swh.scheduler.updater.writer import UpdaterWriter
 
 from . import UpdaterTestUtil
 
 
-@attr('db')
+@pytest.mark.db
 class CommonSchedulerTest(DbTestFixture):
     TEST_SCHED_DB = 'softwareheritage-scheduler-test'
     TEST_SCHED_DUMP = os.path.join(SQL_DIR, '*.sql')
 
     TEST_SCHED_UPDATER_DB = 'softwareheritage-scheduler-updater-test'
     TEST_SCHED_UPDATER_DUMP = os.path.join(SQL_DIR, 'updater', '*.sql')
 
     @classmethod
     def setUpClass(cls):
         cls.add_db(cls.TEST_SCHED_DB,
                    [(sqlfn, 'psql') for sqlfn in
                     sorted(glob(cls.TEST_SCHED_DUMP), key=sortkey)])
         cls.add_db(cls.TEST_SCHED_UPDATER_DB,
                    [(sqlfn, 'psql') for sqlfn in
                     sorted(glob(cls.TEST_SCHED_UPDATER_DUMP), key=sortkey)])
         super().setUpClass()
 
     def tearDown(self):
         self.reset_db_tables(self.TEST_SCHED_UPDATER_DB)
         self.reset_db_tables(self.TEST_SCHED_DB,
                              excluded=['task_type', 'priority_ratio'])
         super().tearDown()
 
 
 class UpdaterWriterTest(UpdaterTestUtil, CommonSchedulerTest,
                         unittest.TestCase):
     def setUp(self):
         super().setUp()
 
         config = {
             'scheduler': {
                 'cls': 'local',
                 'args': {
                     'scheduling_db': 'dbname=softwareheritage-scheduler-test',
                 },
             },
             'scheduler_updater': {
                 'scheduling_updater_db':
                 'dbname=softwareheritage-scheduler-updater-test',
                 'cache_read_limit': 5,
             },
             'pause': 0.1,
             'verbose': False,
         }
         self.writer = UpdaterWriter(**config)
         self.scheduler_backend = self.writer.scheduler_backend
         self.scheduler_updater_backend = self.writer.scheduler_updater_backend
 
     def tearDown(self):
         self.scheduler_backend.close_connection()
         self.scheduler_updater_backend.close_connection()
         super().tearDown()
 
     def test_run_ko(self):
         """Only git tasks are supported for now, other types are dismissed.
 
         """
         ready_events = [
             SWHEvent(
                 self._make_simple_event(event_type, 'origin-%s' % i,
                                         'svn'))
             for i, event_type in enumerate(LISTENED_EVENTS)
         ]
 
         expected_length = len(ready_events)
 
         self.scheduler_updater_backend.cache_put(ready_events)
         data = list(self.scheduler_updater_backend.cache_read())
         self.assertEqual(len(data), expected_length)
 
         r = self.scheduler_backend.peek_ready_tasks(
             'origin-update-git')
 
         # first read on an empty scheduling db results with nothing in it
         self.assertEqual(len(r), 0)
 
         # Read from cache to scheduler db
         self.writer.run()
 
         r = self.scheduler_backend.peek_ready_tasks(
             'origin-update-git')
 
         # other reads after writes are still empty since it's not supported
         self.assertEqual(len(r), 0)
 
     def test_run_ok(self):
         """Only git origin are supported for now
 
         """
         ready_events = [
             SWHEvent(
                 self._make_simple_event(event_type, 'origin-%s' % i, 'git'))
             for i, event_type in enumerate(LISTENED_EVENTS)
         ]
 
         expected_length = len(ready_events)
 
         self.scheduler_updater_backend.cache_put(ready_events)
 
         data = list(self.scheduler_updater_backend.cache_read())
         self.assertEqual(len(data), expected_length)
 
         r = self.scheduler_backend.peek_ready_tasks(
             'origin-update-git')
 
         # first read on an empty scheduling db results with nothing in it
         self.assertEqual(len(r), 0)
 
         # Read from cache to scheduler db
         self.writer.run()
 
         # now, we should have scheduling task ready
         r = self.scheduler_backend.peek_ready_tasks(
             'origin-update-git')
 
-        self.assertEquals(len(r), expected_length)
+        self.assertEqual(len(r), expected_length)
 
         # Check the task has been scheduled
         for t in r:
-            self.assertEquals(t['type'], 'origin-update-git')
-            self.assertEquals(t['priority'], 'normal')
-            self.assertEquals(t['policy'], 'oneshot')
-            self.assertEquals(t['status'], 'next_run_not_scheduled')
+            self.assertEqual(t['type'], 'origin-update-git')
+            self.assertEqual(t['priority'], 'normal')
+            self.assertEqual(t['policy'], 'oneshot')
+            self.assertEqual(t['status'], 'next_run_not_scheduled')
 
         # writer has nothing to do now
         self.writer.run()
 
         # so no more data in cache
         data = list(self.scheduler_updater_backend.cache_read())
 
         self.assertEqual(len(data), 0)
 
         # provided, no runner is ran, still the same amount of scheduling tasks
         r = self.scheduler_backend.peek_ready_tasks(
             'origin-update-git')
 
-        self.assertEquals(len(r), expected_length)
+        self.assertEqual(len(r), expected_length)
diff --git a/swh/scheduler/updater/consumer.py b/swh/scheduler/updater/consumer.py
index e0a0760..e0465f2 100644
--- a/swh/scheduler/updater/consumer.py
+++ b/swh/scheduler/updater/consumer.py
@@ -1,140 +1,140 @@
 # Copyright (C) 2018  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import logging
 
 from abc import ABCMeta, abstractmethod
 
 from swh.scheduler.updater.backend import SchedulerUpdaterBackend
 
 
 class UpdaterConsumer(metaclass=ABCMeta):
     """Event consumer
 
     """
     def __init__(self, batch=1000, backend_class=SchedulerUpdaterBackend,
                  log_class='swh.scheduler.updater.consumer.UpdaterConsumer'):
         super().__init__()
         self._reset_cache()
         self.backend = backend_class()
         self.batch = batch
         logging.basicConfig(level=logging.DEBUG)
         self.log = logging.getLogger(log_class)
 
     def _reset_cache(self):
         """Reset internal cache.
 
         """
         self.count = 0
         self.seen_events = set()
         self.events = []
 
     def is_interesting(self, event):
         """Determine if an event is interesting or not.
 
         Args:
             event (SWHEvent): SWH event
 
         """
         return event.is_interesting()
 
     @abstractmethod
     def convert_event(self, event):
         """Parse an event into an SWHEvent.
 
         """
         pass
 
     def process_event(self, event):
         """Process converted and interesting event.
 
         Args:
             event (SWHEvent): Event to process if deemed interesting
 
         """
         try:
             if event.url in self.seen_events:
                 event.cnt += 1
             else:
                 self.events.append(event)
                 self.seen_events.add(event.url)
                 self.count += 1
         finally:
             if self.count >= self.batch:
                 if self.events:
                     self.backend.cache_put(self.events)
                 self._reset_cache()
 
     def _flush(self):
         """Flush remaining internal cache if any.
 
         """
         if self.events:
             self.backend.cache_put(self.events)
             self._reset_cache()
 
     @abstractmethod
     def has_events(self):
         """Determine if there remains events to consume.
 
         Returns
             boolean value, true for remaining events, False otherwise
 
         """
         pass
 
     @abstractmethod
     def consume_events(self):
         """The main entry point to consume events.
 
         This should either yield or return message for consumption.
 
         """
         pass
 
     @abstractmethod
     def open_connection(self):
         """Open a connection to the remote system we are supposed to consume
            from.
 
         """
         pass
 
     @abstractmethod
     def close_connection(self):
         """Close opened connection to the remote system.
 
         """
         pass
 
     def run(self):
         """The main entry point to consume events.
 
         """
         try:
             self.open_connection()
             while self.has_events():
                 for _event in self.consume_events():
                     event = self.convert_event(_event)
                     if not event:
-                        self.log.warn(
+                        self.log.warning(
                             'Incomplete event dropped %s' % _event)
                         continue
                     if not self.is_interesting(event):
                         continue
                     if self.debug:
                         self.log.debug('Event: %s' % event)
                     try:
                         self.process_event(event)
                     except Exception:
                         self.log.exception(
                             'Problem when processing event %s' % _event)
                         continue
         except Exception as e:
             self.log.error('Error raised during consumption: %s' % e)
             raise e
         finally:
             self.close_connection()
             self._flush()
diff --git a/swh/scheduler/updater/writer.py b/swh/scheduler/updater/writer.py
index cb10825..829f31c 100644
--- a/swh/scheduler/updater/writer.py
+++ b/swh/scheduler/updater/writer.py
@@ -1,122 +1,122 @@
 # Copyright (C) 2018  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 import click
 import logging
 import time
 
 from arrow import utcnow
 
 from swh.core.config import SWHConfig
 from swh.core import utils
 from swh.scheduler import get_scheduler
 from swh.scheduler.utils import create_oneshot_task_dict
 from swh.scheduler.updater.backend import SchedulerUpdaterBackend
 
 
 class UpdaterWriter(SWHConfig):
     """Updater writer in charge of updating the scheduler db with latest
        prioritized oneshot tasks
 
        In effect, this:
        - reads the events from scheduler updater's db
        - converts those events into priority oneshot tasks
        - dumps them into the scheduler db
 
     """
     CONFIG_BASE_FILENAME = 'backend/scheduler-updater-writer'
     DEFAULT_CONFIG = {
         # access to the scheduler backend
         'scheduler': ('dict', {
             'cls': 'local',
             'args': {
                 'scheduling_db': 'dbname=softwareheritage-scheduler-dev',
             },
         }),
         # access to the scheduler updater cache
         'scheduler_updater': ('dict', {
             'scheduling_updater_db':
             'dbname=softwareheritage-scheduler-updater-dev',
             'cache_read_limit': 1000,
         }),
         # waiting time between db reads
         'pause': ('int', 10),
         # verbose or not
         'verbose': ('bool', False),
     }
 
     def __init__(self, **config):
         if config:
             self.config = config
         else:
             self.config = self.parse_config_file()
 
         self.scheduler_updater_backend = SchedulerUpdaterBackend(
             **self.config['scheduler_updater'])
         self.scheduler_backend = get_scheduler(**self.config['scheduler'])
         self.pause = self.config['pause']
         self.log = logging.getLogger(
             'swh.scheduler.updater.writer.UpdaterWriter')
         self.log.setLevel(
             logging.DEBUG if self.config['verbose'] else logging.INFO)
 
     def convert_to_oneshot_task(self, event):
         """Given an event, convert it into oneshot task with priority
 
         Args:
             event (dict): The event to convert to task
 
         """
         if event['origin_type'] == 'git':
             return create_oneshot_task_dict(
                 'origin-update-git',
                 event['url'],
                 priority='normal')
-        self.log.warn('Type %s is not supported for now, only git' % (
+        self.log.warning('Type %s is not supported for now, only git' % (
             event['origin_type'], ))
         return None
 
     def write_event_to_scheduler(self, events):
         """Write events to the scheduler and yield ids when done"""
         # convert events to oneshot tasks
         oneshot_tasks = filter(lambda e: e is not None,
                                map(self.convert_to_oneshot_task, events))
         # write event to scheduler
         self.scheduler_backend.create_tasks(list(oneshot_tasks))
         for e in events:
             yield e['url']
 
     def run(self):
         """First retrieve events from cache (including origin_type, cnt),
            then convert them into oneshot tasks with priority, then
            write them to the scheduler db, at last remove them from
            cache.
 
         """
         while True:
             timestamp = utcnow()
             events = list(self.scheduler_updater_backend.cache_read(timestamp))
             if not events:
                 break
             for urls in utils.grouper(self.write_event_to_scheduler(events),
                                       n=100):
                 self.scheduler_updater_backend.cache_remove(urls)
             time.sleep(self.pause)
 
 
 @click.command()
 @click.option('--verbose/--no-verbose', '-v', default=False,
               help='Verbose mode')
 def main(verbose):
     log = logging.getLogger('swh.scheduler.updater.writer')
     log.addHandler(logging.StreamHandler())
     _loglevel = logging.DEBUG if verbose else logging.INFO
     log.setLevel(_loglevel)
 
     UpdaterWriter().run()
 
 
 if __name__ == '__main__':
     main()
diff --git a/tox.ini b/tox.ini
new file mode 100644
index 0000000..70265ee
--- /dev/null
+++ b/tox.ini
@@ -0,0 +1,17 @@
+[tox]
+envlist=flake8,py3
+
+[testenv:py3]
+deps =
+  .[testing]
+  pytest-cov
+  pifpaf
+commands =
+  pifpaf run postgresql -- pytest --cov=swh --cov-branch {posargs}
+
+[testenv:flake8]
+skip_install = true
+deps =
+  flake8
+commands =
+  {envpython} -m flake8
diff --git a/version.txt b/version.txt
index 565ae72..ce82f77 100644
--- a/version.txt
+++ b/version.txt
@@ -1 +1 @@
-v0.0.32-0-g8df816a
\ No newline at end of file
+v0.0.33-0-g923e0b5
\ No newline at end of file