diff --git a/swh/indexer/metadata.py b/swh/indexer/metadata.py
index fd44a5f..5b7783a 100644
--- a/swh/indexer/metadata.py
+++ b/swh/indexer/metadata.py
@@ -1,300 +1,300 @@
 # Copyright (C) 2017 The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information

 import click
 import logging

 from swh.indexer.indexer import ContentIndexer, RevisionIndexer
 from swh.indexer.metadata_dictionary import compute_metadata
 from swh.indexer.metadata_detector import detect_metadata
 from swh.indexer.metadata_detector import extract_minimal_metadata_dict
 from swh.indexer.storage import INDEXER_CFG_KEY

 from swh.model import hashutil


 class ContentMetadataIndexer(ContentIndexer):
     """Content-level indexer

     This indexer is in charge of:

     - filtering out content already indexed in content_metadata
     - reading content from objstorage with the content's id sha1
     - computing translated_metadata for the given context
     - using the metadata_dictionary as the 'swh-metadata-translator' tool
     - storing the result in the content_metadata table

     """
     CONFIG_BASE_FILENAME = 'indexer/metadata'

     def __init__(self, tool, config):
         # workaround to reuse the exact same config as the
         # RevisionMetadataIndexer that drives this indexer internally
         self.config = config
         self.config['tools'] = tool
         super().__init__()

     def prepare(self):
         self.results = []
         if self.config[INDEXER_CFG_KEY]:
             self.idx_storage = self.config[INDEXER_CFG_KEY]
         if self.config['objstorage']:
             self.objstorage = self.config['objstorage']
         urllib3_logger = logging.getLogger(
             'requests.packages.urllib3.connectionpool')
         urllib3_logger.setLevel(logging.WARNING)
         self.log = logging.getLogger('swh.indexer')
         self.tools = self.register_tools(self.config['tools'])
         # NOTE: only one tool so far, change when no longer true
         self.tool = self.tools[0]

     def filter(self, ids):
         """Filter out known sha1s and return only missing ones.

         """
         yield from self.idx_storage.content_metadata_missing((
             {
                 'id': sha1,
                 'indexer_configuration_id': self.tool['id'],
             } for sha1 in ids
         ))

     def index(self, id, data):
         """Index a single content item and store the result.

         Args:
             id (bytes): content's identifier
             data (bytes): raw content in bytes

         Returns:
             dict: dictionary representing a content_metadata. If the
             translation wasn't successful, translated_metadata is None

         """
         result = {
             'id': id,
             'indexer_configuration_id': self.tool['id'],
             'translated_metadata': None
         }
         try:
             context = self.tool['tool_configuration']['context']
             result['translated_metadata'] = compute_metadata(context, data)
             # keep the result on the indexer object so get_results()
             # can hand it back to the caller
             self.results.append(result)
-        except:
+        except Exception:
             self.log.exception(
                 "Problem during tool retrieval of metadata translation")
         return result
     def persist_index_computations(self, results, policy_update):
         """Persist the results in storage.

         Args:
             results ([dict]): list of content_metadata, dicts with the
               following keys:

               - id (bytes): content's identifier (sha1)
               - translated_metadata (jsonb): detected metadata

             policy_update (str): either 'update-dups' or 'ignore-dups' to
               respectively update duplicates or ignore them

         """
         self.idx_storage.content_metadata_add(
             results, conflict_update=(policy_update == 'update-dups'))

     def get_results(self):
         """Return the computed results; can only be called after the run
         method was called.

         Returns:
             list: list of content_metadata entries calculated by the
               current indexer

         """
         return self.results
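
For context: a sketch of how ContentMetadataIndexer is meant to be driven,
mirroring the way translate_revision_metadata() below instantiates it. The
storage objects and the sha1s list are illustrative placeholders, not part
of this change:

    tool = {
        'name': 'swh-metadata-translator',
        'version': '0.0.1',
        'configuration': {'type': 'local', 'context': 'npm'},
    }
    config = {
        INDEXER_CFG_KEY: idx_storage,  # placeholder indexer storage instance
        'objstorage': objstorage,      # placeholder objstorage instance
    }
    c_metadata_indexer = ContentMetadataIndexer(tool, config)
    c_metadata_indexer.run(sha1s, policy_update='ignore-dups')
    results = c_metadata_indexer.get_results()
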
 class RevisionMetadataIndexer(RevisionIndexer):
     """Revision-level indexer

     This indexer is in charge of:

     - filtering revisions already indexed in the revision_metadata table
       with the defined computation tool
     - retrieving all entry_files in the root directory
     - using metadata_detector for file_names containing metadata
     - computing metadata translation if necessary and possible
       (depends on tool)
     - sending sha1s to content indexing if possible
     - storing the results for the revision

     """
     CONFIG_BASE_FILENAME = 'indexer/metadata'

     ADDITIONAL_CONFIG = {
         'storage': ('dict', {
             'cls': 'remote',
             'args': {
                 'url': 'http://localhost:5002/',
             }
         }),
         'tools': ('dict', {
             'name': 'swh-metadata-detector',
             'version': '0.0.1',
             'configuration': {
                 'type': 'local',
                 'context': ['npm', 'codemeta']
             },
         }),
     }

     def prepare(self):
         super().prepare()
         self.tool = self.tools[0]

     def filter(self, sha1_gits):
         """Filter out known sha1s and return only missing ones.

         """
         yield from self.idx_storage.revision_metadata_missing((
             {
                 'id': sha1_git,
                 'indexer_configuration_id': self.tool['id'],
             } for sha1_git in sha1_gits
         ))

     def index(self, rev):
         """Index rev by processing it and organizing the result.

         Uses metadata_detector to iterate on filenames:

         - if one filename is detected -> sends the file to content indexing
         - if multiple files are detected -> translation is needed at the
           revision level

         Args:
             rev (dict): revision artifact from storage

         Returns:
             dict: dictionary representing a revision_metadata, with keys:

             - id (bytes): rev's identifier (sha1_git)
             - indexer_configuration_id (int): tool used
             - translated_metadata (jsonb): dict of retrieved metadata

         """
         # build the result first so a failure still yields a row with
         # translated_metadata set to None
         result = {
             'id': rev['id'],
             'indexer_configuration_id': self.tool['id'],
             'translated_metadata': None
         }
         try:
             root_dir = rev['directory']
             dir_ls = self.storage.directory_ls(root_dir, recursive=False)
             files = (entry for entry in dir_ls if entry['type'] == 'file')
             detected_files = detect_metadata(files)
             result['translated_metadata'] = self.translate_revision_metadata(
                 detected_files)
         except Exception:
             self.log.exception(
                 'Problem when indexing rev')
         return result

     def persist_index_computations(self, results, policy_update):
         """Persist the results in storage.

         Args:
             results ([dict]): list of revision_metadata, dicts with the
               following keys:

               - id (bytes): revision's identifier (sha1_git)
               - translated_metadata (jsonb): detected metadata

             policy_update (str): either 'update-dups' or 'ignore-dups' to
               respectively update duplicates or ignore them

         """
         # TODO: add functions in storage to keep data in revision_metadata
         self.idx_storage.revision_metadata_add(
             results, conflict_update=(policy_update == 'update-dups'))

     def translate_revision_metadata(self, detected_files):
         """Determine how to translate metadata from the detected files,
         whether one or multiple files were detected.

         Args:
             detected_files (dict): dictionary mapping context names (e.g.,
               "npm", "authors") to lists of sha1

         Returns:
             dict: dict with translated metadata according to the CodeMeta
             vocabulary

         """
         translated_metadata = []
         tool = {
             'name': 'swh-metadata-translator',
             'version': '0.0.1',
             'configuration': {
                 'type': 'local',
                 'context': None
             },
         }
         # TODO: iterate on each context, on each file
         # -> get raw_contents
         # -> translate each content
         config = {
             INDEXER_CFG_KEY: self.idx_storage,
             'objstorage': self.objstorage
         }
         for context in detected_files.keys():
             tool['configuration']['context'] = context
             c_metadata_indexer = ContentMetadataIndexer(tool, config)
             # sha1s that are already in the content_metadata table
             sha1s_in_storage = []
             metadata_generator = self.idx_storage.content_metadata_get(
                 detected_files[context])
             for c in metadata_generator:
                 # extracting translated_metadata
                 sha1 = c['id']
                 sha1s_in_storage.append(sha1)
                 local_metadata = c['translated_metadata']
                 # local metadata is aggregated
                 if local_metadata:
                     translated_metadata.append(local_metadata)

             sha1s_filtered = [item for item in detected_files[context]
                               if item not in sha1s_in_storage]

             if sha1s_filtered:
                 # schedule indexation of content
                 try:
                     c_metadata_indexer.run(sha1s_filtered,
                                            policy_update='ignore-dups')
                     # on the fly possibility:
                     results = c_metadata_indexer.get_results()
                     for result in results:
                         local_metadata = result['translated_metadata']
                         translated_metadata.append(local_metadata)
                 except Exception as e:
                     self.log.warning(
                         'Exception while indexing content: %s', e)

         # transform translated_metadata into min set with
         # swh-metadata-detector
         min_metadata = extract_minimal_metadata_dict(translated_metadata)
         return min_metadata


 @click.command()
 @click.option('--revs', '-i',
               default=['8dbb6aeb036e7fd80664eb8bfd1507881af1ba9f',
                        '026040ea79dec1b49b4e3e7beda9132b6b26b51b',
                        '9699072e21eded4be8d45e3b8d543952533fa190'],
               help='Default sha1_git to lookup', multiple=True)
 def main(revs):
     _git_sha1s = list(map(hashutil.hash_to_bytes, revs))
     rev_metadata_indexer = RevisionMetadataIndexer()
     rev_metadata_indexer.run(_git_sha1s, 'update-dups')


 if __name__ == '__main__':
     logging.basicConfig(level=logging.INFO)
     main()
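
detect_metadata() returns a dictionary mapping each recognized context to
the sha1s of the files that matched it, and translate_revision_metadata()
consumes exactly that shape. A sketch of the flow, given a prepared
RevisionMetadataIndexer instance (the sha1 values and variable names are
placeholders):

    detected_files = {
        'npm': [sha1_of_package_json],   # placeholder sha1 (bytes)
        'codemeta': [sha1_of_codemeta],  # placeholder sha1 (bytes)
    }
    # sha1s already present in content_metadata are read back; the missing
    # ones are indexed on the fly; the aggregated translations are then
    # reduced by extract_minimal_metadata_dict()
    min_metadata = rev_metadata_indexer.translate_revision_metadata(
        detected_files)
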
diff --git a/swh/indexer/metadata_dictionary.py b/swh/indexer/metadata_dictionary.py
index 56a0e54..3ed9fc5 100644
--- a/swh/indexer/metadata_dictionary.py
+++ b/swh/indexer/metadata_dictionary.py
@@ -1,210 +1,210 @@
 # Copyright (C) 2017 The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information

 import json
 import logging


 def convert(raw_content):
     """Convert raw_content recursively:

     - from bytes to string
     - from string to dict

     Args:
         raw_content (bytes / string / dict)

     Returns:
         dict: the decoded content if the string was valid json, otherwise
         the string itself

     """
     if isinstance(raw_content, bytes):
         return convert(raw_content.decode())
     if isinstance(raw_content, str):
         try:
             content = json.loads(raw_content)
             if content:
                 return content
             else:
                 return raw_content
         except json.decoder.JSONDecodeError:
             return raw_content
     if isinstance(raw_content, dict):
         return raw_content


 class BaseMapping():
     """Base class for mappings to inherit from

     To implement a new mapping:

     - inherit this class
     - add a local property self.mapping
     - override the translate function
     """
     def __init__(self):
         # each mapping carries its own logger, used in translate()
         self.log = logging.getLogger(__name__)

     def translate(self, content_dict):
         """Translate content by mapping its keys through self.mapping
         (for now a hard-coded mapping per subclass).

         Args:
             content_dict (dict): content to translate

         Returns:
             dict: translated metadata in jsonb form needed for the indexer

         """
         translated_metadata = {}
         default = 'other'
         translated_metadata['other'] = {}
         try:
             for k, v in content_dict.items():
                 try:
                     term = self.mapping.get(k, default)
                     if term not in translated_metadata:
                         translated_metadata[term] = v
                         continue
                     if isinstance(translated_metadata[term], str):
                         in_value = translated_metadata[term]
                         translated_metadata[term] = [in_value, v]
                         continue
                     if isinstance(translated_metadata[term], list):
                         translated_metadata[term].append(v)
                         continue
                     if isinstance(translated_metadata[term], dict):
                         translated_metadata[term][k] = v
                         continue
                 except KeyError:
                     self.log.exception(
                         "Problem during item mapping")
                     continue
-        except:
+        except Exception:
             return None
         return translated_metadata


 class NpmMapping(BaseMapping):
     """
     dedicated class for NPM (package.json) mapping and translation
     """
     mapping = {
         'repository': 'codeRepository',
         'os': 'operatingSystem',
         'cpu': 'processorRequirements',
         'engines': 'processorRequirements',
         'dependencies': 'softwareRequirements',
         'bundleDependencies': 'softwareRequirements',
         'peerDependencies': 'softwareRequirements',
         'author': 'author',
         'contributor': 'contributor',
         'keywords': 'keywords',
         'license': 'license',
         'version': 'version',
         'description': 'description',
         'name': 'name',
         'devDependencies': 'softwareSuggestions',
         'optionalDependencies': 'softwareSuggestions',
         'bugs': 'issueTracker',
         'homepage': 'url'
     }

     def translate(self, raw_content):
         content_dict = convert(raw_content)
         return super().translate(content_dict)


 class MavenMapping(BaseMapping):
     """
     dedicated class for Maven (pom.xml) mapping and translation
     """
     mapping = {
         'license': 'license',
         'version': 'version',
         'description': 'description',
         'name': 'name',
         'prerequisites': 'softwareRequirements',
         'repositories': 'codeRepository',
         'groupId': 'identifier',
         'ciManagement': 'contIntegration',
         'issuesManagement': 'issueTracker',
     }

     def translate(self, raw_content):
         content = convert(raw_content)
         # TODO: parse content from xml to dict
         return super().translate(content)


 class DoapMapping(BaseMapping):
     mapping = {
     }

     def translate(self, raw_content):
         content = convert(raw_content)
         # TODO: parse content from xml to dict
         return super().translate(content)


 def parse_xml(content):
     """Parse content from xml to a python dict

     Args:
         content (text): the string form of the raw_content (in xml)

     Returns:
         dict: a python dict of the content after parsing

     """
     # TODO: check if xml
     # TODO: use an xml parser to build the dict
     return content


 mapping_tool_fn = {
     "npm": NpmMapping(),
     "maven": MavenMapping(),
     "doap_xml": DoapMapping()
 }
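
Adding support for a new ecosystem follows the pattern above: subclass
BaseMapping, define a crosswalk in a mapping property, and register an
instance in mapping_tool_fn. A sketch for illustration only; PypiMapping
and its terms are hypothetical and not part of this change:

    class PypiMapping(BaseMapping):
        """Hypothetical mapping for PKG-INFO metadata."""
        mapping = {
            'name': 'name',
            'version': 'version',
            'summary': 'description',
            'home_page': 'url',
            'license': 'license',
        }

        def translate(self, raw_content):
            # decode/parse first, then map keys via BaseMapping.translate
            return super().translate(convert(raw_content))

    mapping_tool_fn['pypi'] = PypiMapping()
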
 def compute_metadata(context, raw_content):
     """First landing method: a dispatcher that sends the content to the
     right function, which carries out the actual parsing of syntax and
     translation of terms

     Args:
         context (text): defines to which function/tool the content is sent
         raw_content (bytes / text): the string form of the raw_content

     Returns:
         dict: translated metadata jsonb dictionary needed for the indexer
         to store in storage

     """
     if not raw_content:
         # no content (None or empty): nothing to translate
         return None

     # TODO: keep mapping not in code (maybe fetch crosswalk from storage?)
     # if fetched from storage should be done once for batch of sha1s
     dictionary = mapping_tool_fn[context]
     translated_metadata = dictionary.translate(raw_content)
     return translated_metadata


 def main():
     raw_content = """{"name": "test_name", "unknown_term": "ut"}"""
     raw_content1 = b"""{"name": "test_name",
                         "unknown_term": "ut",
                         "prerequisites": "packageXYZ"}"""
     result = compute_metadata("npm", raw_content)
     result1 = compute_metadata("maven", raw_content1)

     print(result)
     print(result1)


 if __name__ == "__main__":
     main()
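
The parse_xml() stub above could be completed with an XML parser so that
MavenMapping and DoapMapping receive dicts. A minimal sketch assuming the
third-party xmltodict package, which is one possible choice and not a
dependency declared by this diff:

    import xmltodict

    def parse_xml(content):
        """Parse raw XML content into a python dict."""
        try:
            return xmltodict.parse(content)
        except Exception:
            # not well-formed xml: hand the raw text back, mirroring
            # convert()'s behavior for non-json strings
            return content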