cli_runner = <click.testing.CliRunner object at 0x7fcb1467da90>
swh_config = '/tmp/pytest-of-jenkins/pytest-0/test_cli_journal_client_index_4/indexer.yml'
kafka_prefix = 'farusiwnpa', kafka_server = '127.0.0.1:40417'
consumer = <cimpl.Consumer object at 0x7fcb16a51b88>
idx_storage = <swh.indexer.storage.IndexerStorage object at 0x7fcb145915f8>
obj_storage = <swh.objstorage.backends.in_memory.InMemoryObjStorage object at 0x7fcb145919e8>
storage = <swh.storage.postgresql.storage.Storage object at 0x7fcb1466ab38>
mocker = <pytest_mock.plugin.MockerFixture object at 0x7fcb14591048>
swh_indexer_config = {'compute_checksums': ['blake2b512'], 'indexer_storage': {'cls': 'local', 'db': "user=postgres password=xxx dbname=tes...cheduler': {'cls': 'local', 'db': "user=postgres password=xxx dbname=tests host=127.0.0.1 port=16585 options=''"}, ...}
def test_cli_journal_client_index__content_mimetype(
cli_runner,
swh_config,
kafka_prefix: str,
kafka_server,
consumer: Consumer,
idx_storage,
obj_storage,
storage,
mocker,
swh_indexer_config,
):
"""Test the 'swh indexer journal-client' cli tool."""
journal_writer = get_journal_writer(
"kafka",
brokers=[kafka_server],
prefix=kafka_prefix,
client_id="test producer",
value_sanitizer=lambda object_type, value: value,
flush_timeout=3, # fail early if something is going wrong
)
contents = []
expected_results = []
content_ids = []
for content_id, (raw_content, mimetypes, encoding) in RAW_CONTENTS.items():
content = Content.from_data(raw_content)
assert content_id == content.sha1
contents.append(content)
content_ids.append(content_id)
# Older libmagic versions (e.g. buster: 1:5.35-4+deb10u2, bullseye: 1:5.39-3)
# returns different results. This allows to deal with such a case when executing
# tests on different environments machines (e.g. ci tox, ci debian, dev machine,
# ...)
all_mimetypes = mimetypes if isinstance(mimetypes, tuple) else [mimetypes]
expected_results.extend(
[
ContentMimetypeRow(
id=content.sha1,
tool={"id": 1, **swh_indexer_config["tools"]},
mimetype=mimetype,
encoding=encoding,
)
for mimetype in all_mimetypes
]
)
assert len(contents) == len(RAW_CONTENTS)
journal_writer.write_additions("content", contents)
result = cli_runner.invoke(
indexer_cli_group,
[
"-C",
swh_config,
"journal-client",
"content_mimetype",
"--broker",
kafka_server,
"--prefix",
kafka_prefix,
"--group-id",
"test-consumer",
"--stop-after-objects",
len(contents),
],
> catch_exceptions=False,
)
.tox/py3/lib/python3.7/site-packages/swh/indexer/tests/test_cli.py:830:
_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
.tox/py3/lib/python3.7/site-packages/click/testing.py:408: in invoke
return_value = cli.main(args=args or (), prog_name=prog_name, **extra)
.tox/py3/lib/python3.7/site-packages/click/core.py:1055: in main
rv = self.invoke(ctx)
.tox/py3/lib/python3.7/site-packages/click/core.py:1657: in invoke
return _process_result(sub_ctx.command.invoke(sub_ctx))
.tox/py3/lib/python3.7/site-packages/click/core.py:1404: in invoke
return ctx.invoke(self.callback, **ctx.params)
.tox/py3/lib/python3.7/site-packages/click/core.py:760: in invoke
return __callback(*args, **kwargs)
.tox/py3/lib/python3.7/site-packages/click/decorators.py:26: in new_func
return f(get_current_context(), *args, **kwargs)
.tox/py3/lib/python3.7/site-packages/swh/indexer/cli.py:367: in journal_client
batch_size=batch_size,
.tox/py3/lib/python3.7/site-packages/swh/journal/client.py:67: in get_journal_client
return JournalClient(**kwargs)
_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _
self = <swh.journal.client.JournalClient object at 0x7fcb1466ae10>
brokers = ('127.0.0.1:40417',), group_id = 'test-consumer'
prefix = 'farusiwnpa', object_types = ['content'], privileged = False
stop_after_objects = 3, batch_size = None, process_timeout = None
auto_offset_reset = 'earliest', stop_on_eof = False, value_deserializer = None
kwargs = {}
def __init__(
self,
brokers: Union[str, List[str]],
group_id: str,
prefix: Optional[str] = None,
object_types: Optional[List[str]] = None,
privileged: bool = False,
stop_after_objects: Optional[int] = None,
batch_size: int = 200,
process_timeout: Optional[float] = None,
auto_offset_reset: str = "earliest",
stop_on_eof: bool = False,
value_deserializer: Optional[Callable[[str, bytes], Any]] = None,
**kwargs,
):
if prefix is None:
prefix = DEFAULT_PREFIX
if auto_offset_reset not in ACCEPTED_OFFSET_RESET:
raise ValueError(
"Option 'auto_offset_reset' only accept %s, not %s"
% (ACCEPTED_OFFSET_RESET, auto_offset_reset)
)
> if batch_size <= 0:
E TypeError: '<=' not supported between instances of 'NoneType' and 'int'
.tox/py3/lib/python3.7/site-packages/swh/journal/client.py:152: TypeError
TEST RESULT
TEST RESULT
- Run At
- Aug 31 2022, 5:26 PM