diff --git a/swh/loader/git/converters.py b/swh/loader/git/converters.py
index 11c9c0e..4beaf04 100644
--- a/swh/loader/git/converters.py
+++ b/swh/loader/git/converters.py
@@ -1,361 +1,363 @@
 # Copyright (C) 2015  The Software Heritage developers
 # See the AUTHORS file at the top-level directory of this distribution
 # License: GNU General Public License version 3, or any later version
 # See top-level LICENSE file for more information
 
 """Convert pygit2 objects to dictionaries suitable for swh.storage"""
 
 from pygit2 import GIT_OBJ_COMMIT
 
 from swh.core import hashutil
 
 from .utils import format_date
 
 HASH_ALGORITHMS = ['sha1', 'sha256']
 
 
 def blob_to_content(id, repo, log=None, max_content_size=None, origin_id=None):
     """Format a blob as a content"""
     blob = repo[id]
     size = blob.size
     ret = {
         'sha1_git': id.raw,
         'length': blob.size,
         'status': 'absent'
     }
 
     if max_content_size:
         if size > max_content_size:
             if log:
                 log.info('Skipping content %s, too large (%s > %s)' %
                          (id.hex, size, max_content_size), extra={
                              'swh_type': 'loader_git_content_skip',
                              'swh_repo': repo.path,
                              'swh_id': id.hex,
                              'swh_size': size,
                          })
             ret['reason'] = 'Content too large'
             ret['origin'] = origin_id
             return ret
 
     data = blob.data
     hashes = hashutil.hashdata(data, HASH_ALGORITHMS)
     ret.update(hashes)
     ret['data'] = data
     ret['status'] = 'visible'
 
     return ret
 
 
 def tree_to_directory(id, repo, log=None):
     """Format a tree as a directory"""
     ret = {
         'id': id.raw,
     }
     entries = []
     ret['entries'] = entries
 
     entry_type_map = {
         'tree': 'dir',
         'blob': 'file',
         'commit': 'rev',
     }
 
     for entry in repo[id]:
         entries.append({
             'type': entry_type_map[entry.type],
             'perms': entry.filemode,
             'name': entry._name,
             'target': entry.id.raw,
         })
 
     return ret
 
 
 def commit_to_revision(id, repo, log=None):
     """Format a commit as a revision"""
     commit = repo[id]
 
     author = commit.author
     committer = commit.committer
     return {
         'id': id.raw,
         'date': format_date(author),
         'committer_date': format_date(committer),
         'type': 'git',
         'directory': commit.tree_id.raw,
         'message': commit.raw_message,
         'metadata': None,
         'author': {
             'name': author.raw_name,
             'email': author.raw_email,
         },
         'committer': {
             'name': committer.raw_name,
             'email': committer.raw_email,
         },
         'synthetic': False,
         'parents': [p.raw for p in commit.parent_ids],
     }
 
 
 def annotated_tag_to_release(id, repo, log=None):
     """Format an annotated tag as a release"""
     tag = repo[id]
 
     tag_pointer = repo[tag.target]
     if tag_pointer.type != GIT_OBJ_COMMIT:
         if log:
             log.warn("Ignoring tag %s pointing at %s %s" % (
                 tag.id.hex, tag_pointer.__class__.__name__,
                 tag_pointer.id.hex), extra={
                     'swh_type': 'loader_git_tag_ignore',
                     'swh_repo': repo.path,
                     'swh_tag_id': tag.id.hex,
                     'swh_tag_dest': {
                         'type': tag_pointer.__class__.__name__,
                         'id': tag_pointer.id.hex,
                     },
                 })
         return
 
     if not tag.tagger:
         if log:
             log.warn("Tag %s has no author, using default values"
                      % id.hex,  extra={
                          'swh_type': 'loader_git_tag_author_default',
                          'swh_repo': repo.path,
                          'swh_tag_id': tag.id.hex,
                      })
         author = None
         date = None
     else:
         author = {
             'name': tag.tagger.raw_name,
             'email': tag.tagger.raw_email,
         }
         date = format_date(tag.tagger)
 
     return {
         'id': id.raw,
         'date': date,
         'target': tag.target.raw,
         'target_type': 'revision',
         'message': tag._message,
         'name': tag.name.raw,
         'author': author,
         'metadata': None,
         'synthetic': False,
     }
 
 
 def ref_to_occurrence(ref):
     """Format a reference as an occurrence"""
     occ = ref.copy()
     if 'branch' in ref:
         branch = ref['branch']
         if isinstance(branch, str):
             occ['branch'] = branch.encode('utf-8')
         else:
             occ['branch'] = branch
     return occ
 
 
 def origin_url_to_origin(origin_url):
     """Format a pygit2.Repository as an origin suitable for swh.storage"""
     return {
         'type': 'git',
         'url': origin_url,
     }
 
 
 def dulwich_blob_to_content(blob, log=None, max_content_size=None,
                             origin_id=None):
     """Convert a dulwich blob to a Software Heritage content"""
 
     if blob.type_name != b'blob':
         return
 
     size = blob.raw_length()
 
     ret = {
         'sha1_git': blob.sha().digest(),
         'length': size,
         'status': 'absent'
     }
 
     if max_content_size:
         if size > max_content_size:
             if log:
                 log.info('Skipping content %s, too large (%s > %s)' %
                          (blob.id.encode(), size, max_content_size), extra={
                              'swh_type': 'loader_git_content_skip',
                              'swh_id': id.hex,
                              'swh_size': size,
                          })
             ret['reason'] = 'Content too large'
             ret['origin'] = origin_id
             return ret
 
     data = blob.as_raw_string()
     hashes = hashutil.hashdata(data, HASH_ALGORITHMS)
     ret.update(hashes)
     ret['data'] = data
     ret['status'] = 'visible'
 
     return ret
 
 
 def dulwich_tree_to_directory(tree, log=None):
     """Format a tree as a directory"""
     if tree.type_name != b'tree':
         return
 
     ret = {
         'id': tree.sha().digest(),
     }
     entries = []
     ret['entries'] = entries
 
     entry_mode_map = {
         0o040000: 'dir',
         0o160000: 'rev',
         0o100644: 'file',
         0o100755: 'file',
         0o120000: 'file',
     }
 
     for entry in tree.iteritems():
         entries.append({
             'type': entry_mode_map.get(entry.mode, 'file'),
             'perms': entry.mode,
             'name': entry.path,
             'target': hashutil.hex_to_hash(entry.sha.decode('ascii')),
         })
 
     return ret
 
 
 def parse_author(name_email):
     """Parse an author line"""
 
     if name_email is None:
         return None
 
     try:
         open_bracket = name_email.index(b'<')
     except ValueError:
         name = email = None
     else:
         raw_name = name_email[:open_bracket]
         raw_email = name_email[open_bracket+1:]
 
         if not raw_name:
             name = None
         elif raw_name.endswith(b' '):
             name = raw_name[:-1]
         else:
             name = raw_name
 
         try:
             close_bracket = raw_email.index(b'>')
         except ValueError:
             email = None
         else:
             email = raw_email[:close_bracket]
 
     return {
         'name': name,
         'email': email,
         'fullname': name_email,
     }
 
 
 def dulwich_tsinfo_to_timestamp(timestamp, timezone, timezone_neg_utc):
     """Convert the dulwich timestamp information to a structure compatible with
     Software Heritage"""
     return {
         'timestamp': timestamp,
         'offset': timezone // 60,
         'negative_utc': timezone_neg_utc if timezone == 0 else None,
     }
 
 
 def dulwich_commit_to_revision(commit, log=None):
     if commit.type_name != b'commit':
         return
 
     ret = {
         'id': commit.sha().digest(),
         'author': parse_author(commit.author),
         'date': dulwich_tsinfo_to_timestamp(
             commit.author_time,
             commit.author_timezone,
             commit._author_timezone_neg_utc,
         ),
         'committer': parse_author(commit.committer),
         'committer_date': dulwich_tsinfo_to_timestamp(
             commit.commit_time,
             commit.commit_timezone,
             commit._commit_timezone_neg_utc,
         ),
         'type': 'git',
         'directory': bytes.fromhex(commit.tree.decode()),
         'message': commit.message,
         'metadata': None,
         'synthetic': False,
         'parents': [bytes.fromhex(p.decode()) for p in commit.parents],
     }
 
     git_metadata = []
+    if commit.encoding is not None:
+        git_metadata.append(['encoding', commit.encoding])
     if commit.mergetag:
         for mergetag in commit.mergetag:
             git_metadata.append(['mergetag', mergetag.as_raw_string()])
 
     if commit.extra:
-        git_metadata.extend([k, v] for k, v in commit.extra)
+        git_metadata.extend([k.decode('utf-8'), v] for k, v in commit.extra)
 
     if commit.gpgsig:
         git_metadata.append(['gpgsig', commit.gpgsig])
 
     if git_metadata:
         ret['metadata'] = {
-            'extra_git_headers': git_metadata,
+            'extra_headers': git_metadata,
         }
 
     return ret
 
 
 DULWICH_TYPES = {
     b'blob': 'content',
     b'tree': 'directory',
     b'commit': 'revision',
     b'tag': 'release',
 }
 
 
 def dulwich_tag_to_release(tag, log=None):
     if tag.type_name != b'tag':
         return
 
     target_type, target = tag.object
     ret = {
         'id': tag.sha().digest(),
         'name': tag.name,
         'target': bytes.fromhex(target.decode()),
         'target_type': DULWICH_TYPES[target_type.type_name],
         'message': tag._message,
         'metadata': None,
         'synthetic': False,
     }
     if tag.tagger:
         ret['author'] = parse_author(tag.tagger)
         ret['date'] = dulwich_tsinfo_to_timestamp(
             tag.tag_time,
             tag.tag_timezone,
             tag._tag_timezone_neg_utc,
         )
     else:
         ret['author'] = ret['date'] = None
 
     return ret