diff --git a/swh/dataset/exporters/orc.py b/swh/dataset/exporters/orc.py --- a/swh/dataset/exporters/orc.py +++ b/swh/dataset/exporters/orc.py @@ -8,6 +8,7 @@ from typing import Any, Optional, Tuple, Type, cast import uuid +from pkg_resources import get_distribution from pyorc import ( BigInt, Binary, @@ -132,6 +133,13 @@ }, ) ) + self.writers[table_name].set_user_metadata( + swh_object_type=table_name.encode(), + swh_uuid=unique_id.encode(), + swh_model_version=get_distribution("swh.model").version.encode(), + swh_dataset_version=get_distribution("swh.dataset").version.encode(), + # maybe put a copy of the config (redacted) also? + ) return self.writers[table_name] def process_origin(self, origin):