Changeset View
Changeset View
Standalone View
Standalone View
swh/indexer/fossology_license.py
Show First 20 Lines • Show All 154 Lines • ▼ Show 20 Lines | |||||
class FossologyLicenseRangeIndexer( | class FossologyLicenseRangeIndexer( | ||||
MixinFossologyLicenseIndexer, DiskIndexer, ContentRangeIndexer): | MixinFossologyLicenseIndexer, DiskIndexer, ContentRangeIndexer): | ||||
"""FossologyLicense Range Indexer working on range of content identifiers. | """FossologyLicense Range Indexer working on range of content identifiers. | ||||
It: | It: | ||||
- filters out the non textual content | - filters out the non textual content | ||||
- (optionally) filters out content already indexed (cf :callable:`range`) | - (optionally) filters out content already indexed (cf | ||||
:func:`indexed_contents_in_range`) | |||||
- reads content from objstorage per the content's id (sha1) | - reads content from objstorage per the content's id (sha1) | ||||
- computes the license(s) from that content | - computes the license(s) from that content | ||||
- stores result in storage | - stores result in storage | ||||
""" | """ | ||||
def indexed_contents_in_range(self, start, end): | def indexed_contents_in_range(self, start, end): | ||||
"""Retrieve indexed content id within range [start, end]. | """Retrieve indexed content id within range [start, end]. | ||||
Show All 13 Lines |