Page Menu Home Software Heritage

Jenkins > .tox.py3.lib.python3.7.site-packages.swh.storage.tests.test_backfill::test_backfiller
Failed

TEST RESULT

Run At
Jan 12 2021, 6:34 PM
Details
swh_storage_backend_config = {'check_config': {'check_write': True}, 'cls': 'local', 'db': "dbname=storage user=postgres host=127.0.0.1 port=17381 ...riter': {'brokers': ['127.0.0.1:34429'], 'client_id': 'kafka_writer-1', 'cls': 'kafka', 'prefix': 'myphavtsnz-1'}, ...}
kafka_prefix = 'myphavtsnz', kafka_consumer_group = 'test-consumer-myphavtsnz'
kafka_server = '127.0.0.1:34429'

    @patch("swh.storage.backfill.RANGE_GENERATORS", RANGE_GENERATORS)
    def test_backfiller(
        swh_storage_backend_config,
        kafka_prefix: str,
        kafka_consumer_group: str,
        kafka_server: str,
    ):
        prefix1 = f"{kafka_prefix}-1"
        prefix2 = f"{kafka_prefix}-2"

        journal1 = {
            "cls": "kafka",
            "brokers": [kafka_server],
            "client_id": "kafka_writer-1",
            "prefix": prefix1,
        }
        swh_storage_backend_config["journal_writer"] = journal1
        storage = get_storage(**swh_storage_backend_config)

        # fill the storage and the journal (under prefix1)
        for object_type, objects in TEST_OBJECTS.items():
            method = getattr(storage, object_type + "_add")
            method(objects)

        # now apply the backfiller on the storage to fill the journal under prefix2
        backfiller_config = {
            "journal_writer": {
                "brokers": [kafka_server],
                "client_id": "kafka_writer-2",
                "prefix": prefix2,
            },
            "storage": swh_storage_backend_config,
        }

        # Backfilling
        backfiller = JournalBackfiller(backfiller_config)
        for object_type in TEST_OBJECTS:
            backfiller.run(object_type, None, None)

        # now check journal content are the same under both topics
        # use the replayer scaffolding to fill storages to make is a bit easier
        # Replaying #1
        sto1 = get_storage(cls="memory")
        replayer1 = JournalClient(
            brokers=kafka_server,
            group_id=f"{kafka_consumer_group}-1",
            prefix=prefix1,
            stop_on_eof=True,
        )
        worker_fn1 = functools.partial(process_replay_objects, storage=sto1)
>       replayer1.process(worker_fn1)

.tox/py3/lib/python3.7/site-packages/swh/storage/tests/test_backfill.py:234:
_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
.tox/py3/lib/python3.7/site-packages/swh/journal/client.py:265: in process
    batch_processed, at_eof = self.handle_messages(messages, worker_fn)
.tox/py3/lib/python3.7/site-packages/swh/journal/client.py:292: in handle_messages
    worker_fn(dict(objects))
.tox/py3/lib/python3.7/site-packages/swh/storage/replay.py:60: in process_replay_objects
    _insert_objects(object_type, objects, storage)
.tox/py3/lib/python3.7/site-packages/swh/storage/replay.py:139: in _insert_objects
    method(model_objs)
.tox/py3/lib/python3.7/site-packages/swh/storage/cassandra/storage.py:892: in origin_visit_add
    snapshot=None,
.tox/py3/lib/python3.7/site-packages/swh/storage/cassandra/storage.py:902: in _origin_visit_status_add
    converters.visit_status_to_row(visit_status)
.tox/py3/lib/python3.7/site-packages/swh/storage/cassandra/converters.py:113: in visit_status_to_row
    return OriginVisitStatusRow.from_dict({**d, "metadata": json.dumps(d["metadata"])})
_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _

cls = <class 'swh.storage.cassandra.model.OriginVisitStatusRow'>
d = {'date': datetime.datetime(2018, 11, 27, 17, 20, 39, tzinfo=datetime.timezone.utc), 'metadata': 'null', 'origin': 'https://somewhere.org/den/fox', 'snapshot': None, ...}

    @classmethod
    def from_dict(cls: Type[T], d: Dict[str, Any]) -> T:
>       return cls(**d)  # type: ignore
E       TypeError: __init__() missing 1 required positional argument: 'type'

.tox/py3/lib/python3.7/site-packages/swh/storage/cassandra/model.py:45: TypeError