diff --git a/dulwich/index.py b/dulwich/index.py
index f1a49f7e..2d4a3545 100644
--- a/dulwich/index.py
+++ b/dulwich/index.py
@@ -1,791 +1,796 @@
 # index.py -- File parser/writer for the git index file
 # Copyright (C) 2008-2013 Jelmer Vernooij <jelmer@jelmer.uk>
 #
 # Dulwich is dual-licensed under the Apache License, Version 2.0 and the GNU
 # General Public License as public by the Free Software Foundation; version 2.0
 # or (at your option) any later version. You can redistribute it and/or
 # modify it under the terms of either of these two licenses.
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #
 # You should have received a copy of the licenses; if not, see
 # <http://www.gnu.org/licenses/> for a copy of the GNU General Public License
 # and <http://www.apache.org/licenses/LICENSE-2.0> for a copy of the Apache
 # License, Version 2.0.
 #
 
 """Parser for the git index file format."""
 
 import collections
 import errno
 import os
 import stat
 import struct
 import sys
 
 from dulwich.file import GitFile
 from dulwich.objects import (
     Blob,
     S_IFGITLINK,
     S_ISGITLINK,
     Tree,
     hex_to_sha,
     sha_to_hex,
     )
 from dulwich.pack import (
     SHA1Reader,
     SHA1Writer,
     )
 
 
 IndexEntry = collections.namedtuple(
     'IndexEntry', [
         'ctime', 'mtime', 'dev', 'ino', 'mode', 'uid', 'gid', 'size', 'sha',
         'flags'])
 
 
 FLAG_STAGEMASK = 0x3000
 FLAG_VALID = 0x8000
 FLAG_EXTENDED = 0x4000
 
 
 def pathsplit(path):
     """Split a /-delimited path into a directory part and a basename.
 
     :param path: The path to split.
     :return: Tuple with directory name and basename
     """
     try:
         (dirname, basename) = path.rsplit(b"/", 1)
     except ValueError:
         return (b"", path)
     else:
         return (dirname, basename)
 
 
 def pathjoin(*args):
     """Join a /-delimited path.
 
     """
     return b"/".join([p for p in args if p])
 
 
 def read_cache_time(f):
     """Read a cache time.
 
     :param f: File-like object to read from
     :return: Tuple with seconds and nanoseconds
     """
     return struct.unpack(">LL", f.read(8))
 
 
 def write_cache_time(f, t):
     """Write a cache time.
 
     :param f: File-like object to write to
     :param t: Time to write (as int, float or tuple with secs and nsecs)
     """
     if isinstance(t, int):
         t = (t, 0)
     elif isinstance(t, float):
         (secs, nsecs) = divmod(t, 1.0)
         t = (int(secs), int(nsecs * 1000000000))
     elif not isinstance(t, tuple):
         raise TypeError(t)
     f.write(struct.pack(">LL", *t))
 
 
 def read_cache_entry(f):
     """Read an entry from a cache file.
 
     :param f: File-like object to read from
     :return: tuple with: device, inode, mode, uid, gid, size, sha, flags
     """
     beginoffset = f.tell()
     ctime = read_cache_time(f)
     mtime = read_cache_time(f)
     (dev, ino, mode, uid, gid, size, sha, flags, ) = \
         struct.unpack(">LLLLLL20sH", f.read(20 + 4 * 6 + 2))
     name = f.read((flags & 0x0fff))
     # Padding:
     real_size = ((f.tell() - beginoffset + 8) & ~7)
     f.read((beginoffset + real_size) - f.tell())
     return (name, ctime, mtime, dev, ino, mode, uid, gid, size,
             sha_to_hex(sha), flags & ~0x0fff)
 
 
 def write_cache_entry(f, entry):
     """Write an index entry to a file.
 
     :param f: File object
     :param entry: Entry to write, tuple with:
         (name, ctime, mtime, dev, ino, mode, uid, gid, size, sha, flags)
     """
     beginoffset = f.tell()
     (name, ctime, mtime, dev, ino, mode, uid, gid, size, sha, flags) = entry
     write_cache_time(f, ctime)
     write_cache_time(f, mtime)
     flags = len(name) | (flags & ~0x0fff)
     f.write(struct.pack(
             b'>LLLLLL20sH', dev & 0xFFFFFFFF, ino & 0xFFFFFFFF,
             mode, uid, gid, size, hex_to_sha(sha), flags))
     f.write(name)
     real_size = ((f.tell() - beginoffset + 8) & ~7)
     f.write(b'\0' * ((beginoffset + real_size) - f.tell()))
 
 
 def read_index(f):
     """Read an index file, yielding the individual entries."""
     header = f.read(4)
     if header != b'DIRC':
         raise AssertionError("Invalid index file header: %r" % header)
     (version, num_entries) = struct.unpack(b'>LL', f.read(4 * 2))
     assert version in (1, 2)
     for i in range(num_entries):
         yield read_cache_entry(f)
 
 
 def read_index_dict(f):
     """Read an index file and return it as a dictionary.
 
     :param f: File object to read from
     """
     ret = {}
     for x in read_index(f):
         ret[x[0]] = IndexEntry(*x[1:])
     return ret
 
 
 def write_index(f, entries):
     """Write an index file.
 
     :param f: File-like object to write to
     :param entries: Iterable over the entries to write
     """
     f.write(b'DIRC')
     f.write(struct.pack(b'>LL', 2, len(entries)))
     for x in entries:
         write_cache_entry(f, x)
 
 
 def write_index_dict(f, entries):
     """Write an index file based on the contents of a dictionary.
 
     """
     entries_list = []
     for name in sorted(entries):
         entries_list.append((name,) + tuple(entries[name]))
     write_index(f, entries_list)
 
 
 def cleanup_mode(mode):
     """Cleanup a mode value.
 
     This will return a mode that can be stored in a tree object.
 
     :param mode: Mode to clean up.
     """
     if stat.S_ISLNK(mode):
         return stat.S_IFLNK
     elif stat.S_ISDIR(mode):
         return stat.S_IFDIR
     elif S_ISGITLINK(mode):
         return S_IFGITLINK
     ret = stat.S_IFREG | 0o644
     ret |= (mode & 0o111)
     return ret
 
 
 class Index(object):
     """A Git Index file."""
 
     def __init__(self, filename):
         """Open an index file.
 
         :param filename: Path to the index file
         """
         self._filename = filename
         self.clear()
         self.read()
 
     @property
     def path(self):
         return self._filename
 
     def __repr__(self):
         return "%s(%r)" % (self.__class__.__name__, self._filename)
 
     def write(self):
         """Write current contents of index to disk."""
         f = GitFile(self._filename, 'wb')
         try:
             f = SHA1Writer(f)
             write_index_dict(f, self._byname)
         finally:
             f.close()
 
     def read(self):
         """Read current contents of index from disk."""
         if not os.path.exists(self._filename):
             return
         f = GitFile(self._filename, 'rb')
         try:
             f = SHA1Reader(f)
             for x in read_index(f):
                 self[x[0]] = IndexEntry(*x[1:])
             # FIXME: Additional data?
             f.read(os.path.getsize(self._filename)-f.tell()-20)
             f.check_sha()
         finally:
             f.close()
 
     def __len__(self):
         """Number of entries in this index file."""
         return len(self._byname)
 
     def __getitem__(self, name):
         """Retrieve entry by relative path.
 
         :return: tuple with (ctime, mtime, dev, ino, mode, uid, gid, size, sha,
             flags)
         """
         return self._byname[name]
 
     def __iter__(self):
         """Iterate over the paths in this index."""
         return iter(self._byname)
 
     def get_sha1(self, path):
         """Return the (git object) SHA1 for the object at a path."""
         return self[path].sha
 
     def get_mode(self, path):
         """Return the POSIX file mode for the object at a path."""
         return self[path].mode
 
     def iterobjects(self):
         """Iterate over path, sha, mode tuples for use with commit_tree."""
         for path in self:
             entry = self[path]
             yield path, entry.sha, cleanup_mode(entry.mode)
 
     def iterblobs(self):
         import warnings
         warnings.warn('Use iterobjects() instead.', PendingDeprecationWarning)
         return self.iterobjects()
 
     def clear(self):
         """Remove all contents from this index."""
         self._byname = {}
 
     def __setitem__(self, name, x):
         assert isinstance(name, bytes)
         assert len(x) == 10
         # Remove the old entry if any
         self._byname[name] = IndexEntry(*x)
 
     def __delitem__(self, name):
         assert isinstance(name, bytes)
         del self._byname[name]
 
     def iteritems(self):
         return self._byname.items()
 
     def items(self):
         return self._byname.items()
 
     def update(self, entries):
         for name, value in entries.items():
             self[name] = value
 
     def changes_from_tree(self, object_store, tree, want_unchanged=False):
         """Find the differences between the contents of this index and a tree.
 
         :param object_store: Object store to use for retrieving tree contents
         :param tree: SHA1 of the root tree
         :param want_unchanged: Whether unchanged files should be reported
         :return: Iterator over tuples with (oldpath, newpath), (oldmode,
             newmode), (oldsha, newsha)
         """
         def lookup_entry(path):
             entry = self[path]
             return entry.sha, entry.mode
         for (name, mode, sha) in changes_from_tree(
                 self._byname.keys(), lookup_entry, object_store, tree,
                 want_unchanged=want_unchanged):
             yield (name, mode, sha)
 
     def commit(self, object_store):
         """Create a new tree from an index.
 
         :param object_store: Object store to save the tree in
         :return: Root tree SHA
         """
         return commit_tree(object_store, self.iterobjects())
 
 
 def commit_tree(object_store, blobs):
     """Commit a new tree.
 
     :param object_store: Object store to add trees to
     :param blobs: Iterable over blob path, sha, mode entries
     :return: SHA1 of the created tree.
     """
 
     trees = {b'': {}}
 
     def add_tree(path):
         if path in trees:
             return trees[path]
         dirname, basename = pathsplit(path)
         t = add_tree(dirname)
         assert isinstance(basename, bytes)
         newtree = {}
         t[basename] = newtree
         trees[path] = newtree
         return newtree
 
     for path, sha, mode in blobs:
         tree_path, basename = pathsplit(path)
         tree = add_tree(tree_path)
         tree[basename] = (mode, sha)
 
     def build_tree(path):
         tree = Tree()
         for basename, entry in trees[path].items():
             if isinstance(entry, dict):
                 mode = stat.S_IFDIR
                 sha = build_tree(pathjoin(path, basename))
             else:
                 (mode, sha) = entry
             tree.add(basename, mode, sha)
         object_store.add_object(tree)
         return tree.id
     return build_tree(b'')
 
 
 def commit_index(object_store, index):
     """Create a new tree from an index.
 
     :param object_store: Object store to save the tree in
     :param index: Index file
     :note: This function is deprecated, use index.commit() instead.
     :return: Root tree sha.
     """
     return commit_tree(object_store, index.iterobjects())
 
 
 def changes_from_tree(names, lookup_entry, object_store, tree,
                       want_unchanged=False):
     """Find the differences between the contents of a tree and
     a working copy.
 
     :param names: Iterable of names in the working copy
     :param lookup_entry: Function to lookup an entry in the working copy
     :param object_store: Object store to use for retrieving tree contents
     :param tree: SHA1 of the root tree, or None for an empty tree
     :param want_unchanged: Whether unchanged files should be reported
     :return: Iterator over tuples with (oldpath, newpath), (oldmode, newmode),
         (oldsha, newsha)
     """
     # TODO(jelmer): Support a include_trees option
     other_names = set(names)
 
     if tree is not None:
         for (name, mode, sha) in object_store.iter_tree_contents(tree):
             try:
                 (other_sha, other_mode) = lookup_entry(name)
             except KeyError:
                 # Was removed
                 yield ((name, None), (mode, None), (sha, None))
             else:
                 other_names.remove(name)
                 if (want_unchanged or other_sha != sha or other_mode != mode):
                     yield ((name, name), (mode, other_mode), (sha, other_sha))
 
     # Mention added files
     for name in other_names:
         try:
             (other_sha, other_mode) = lookup_entry(name)
         except KeyError:
             pass
         else:
             yield ((None, name), (None, other_mode), (None, other_sha))
 
 
 def index_entry_from_stat(stat_val, hex_sha, flags, mode=None):
     """Create a new index entry from a stat value.
 
     :param stat_val: POSIX stat_result instance
     :param hex_sha: Hex sha of the object
     :param flags: Index flags
     """
     if mode is None:
         mode = cleanup_mode(stat_val.st_mode)
 
     return IndexEntry(
             stat_val.st_ctime, stat_val.st_mtime, stat_val.st_dev,
             stat_val.st_ino, mode, stat_val.st_uid,
             stat_val.st_gid, stat_val.st_size, hex_sha, flags)
 
 
 def build_file_from_blob(blob, mode, target_path, honor_filemode=True):
     """Build a file or symlink on disk based on a Git object.
 
-    :param obj: The git object
+    :param blob: The git object
     :param mode: File mode
     :param target_path: Path to write to
     :param honor_filemode: An optional flag to honor core.filemode setting in
         config file, default is core.filemode=True, change executable bit
     :return: stat object for the file
     """
     try:
         oldstat = os.lstat(target_path)
     except OSError as e:
         if e.errno == errno.ENOENT:
             oldstat = None
         else:
             raise
     contents = blob.as_raw_string()
     if stat.S_ISLNK(mode):
         # FIXME: This will fail on Windows. What should we do instead?
         if oldstat:
             os.unlink(target_path)
         if sys.platform == 'win32' and sys.version_info[0] == 3:
             # os.readlink on Python3 on Windows requires a unicode string.
             # TODO(jelmer): Don't assume tree_encoding == fs_encoding
             tree_encoding = sys.getfilesystemencoding()
             contents = contents.decode(tree_encoding)
             target_path = target_path.decode(tree_encoding)
         os.symlink(contents, target_path)
     else:
         if oldstat is not None and oldstat.st_size == len(contents):
             with open(target_path, 'rb') as f:
                 if f.read() == contents:
                     return oldstat
 
         with open(target_path, 'wb') as f:
             # Write out file
             f.write(contents)
 
         if honor_filemode:
             os.chmod(target_path, mode)
 
     return os.lstat(target_path)
 
 
 INVALID_DOTNAMES = (b".git", b".", b"..", b"")
 
 
 def validate_path_element_default(element):
     return element.lower() not in INVALID_DOTNAMES
 
 
 def validate_path_element_ntfs(element):
     stripped = element.rstrip(b". ").lower()
     if stripped in INVALID_DOTNAMES:
         return False
     if stripped == b"git~1":
         return False
     return True
 
 
 def validate_path(path, element_validator=validate_path_element_default):
     """Default path validator that just checks for .git/."""
     parts = path.split(b"/")
     for p in parts:
         if not element_validator(p):
             return False
     else:
         return True
 
 
 def build_index_from_tree(root_path, index_path, object_store, tree_id,
                           honor_filemode=True,
                           validate_path_element=validate_path_element_default):
     """Generate and materialize index from a tree
 
     :param tree_id: Tree to materialize
     :param root_path: Target dir for materialized index files
     :param index_path: Target path for generated index
     :param object_store: Non-empty object store holding tree contents
     :param honor_filemode: An optional flag to honor core.filemode setting in
         config file, default is core.filemode=True, change executable bit
     :param validate_path_element: Function to validate path elements to check
         out; default just refuses .git and .. directories.
 
     :note:: existing index is wiped and contents are not merged
         in a working dir. Suitable only for fresh clones.
     """
 
     index = Index(index_path)
     if not isinstance(root_path, bytes):
         root_path = root_path.encode(sys.getfilesystemencoding())
 
     for entry in object_store.iter_tree_contents(tree_id):
         if not validate_path(entry.path, validate_path_element):
             continue
         full_path = _tree_to_fs_path(root_path, entry.path)
 
         if not os.path.exists(os.path.dirname(full_path)):
             os.makedirs(os.path.dirname(full_path))
 
         # TODO(jelmer): Merge new index into working tree
         if S_ISGITLINK(entry.mode):
             if not os.path.isdir(full_path):
                 os.mkdir(full_path)
             st = os.lstat(full_path)
             # TODO(jelmer): record and return submodule paths
         else:
             obj = object_store[entry.sha]
             st = build_file_from_blob(
                 obj, entry.mode, full_path, honor_filemode=honor_filemode)
         # Add file to index
         if not honor_filemode or S_ISGITLINK(entry.mode):
             # we can not use tuple slicing to build a new tuple,
             # because on windows that will convert the times to
             # longs, which causes errors further along
             st_tuple = (entry.mode, st.st_ino, st.st_dev, st.st_nlink,
                         st.st_uid, st.st_gid, st.st_size, st.st_atime,
                         st.st_mtime, st.st_ctime)
             st = st.__class__(st_tuple)
         index[entry.path] = index_entry_from_stat(st, entry.sha, 0)
 
     index.write()
 
 
 def blob_from_path_and_stat(fs_path, st):
     """Create a blob from a path and a stat object.
 
     :param fs_path: Full file system path to file
     :param st: A stat object
     :return: A `Blob` object
     """
     assert isinstance(fs_path, bytes)
     blob = Blob()
     if not stat.S_ISLNK(st.st_mode):
         with open(fs_path, 'rb') as f:
             blob.data = f.read()
     else:
         if sys.platform == 'win32' and sys.version_info[0] == 3:
             # os.readlink on Python3 on Windows requires a unicode string.
             # TODO(jelmer): Don't assume tree_encoding == fs_encoding
             tree_encoding = sys.getfilesystemencoding()
             fs_path = fs_path.decode(tree_encoding)
             blob.data = os.readlink(fs_path).encode(tree_encoding)
         else:
             blob.data = os.readlink(fs_path)
     return blob
 
 
 def read_submodule_head(path):
     """Read the head commit of a submodule.
 
     :param path: path to the submodule
     :return: HEAD sha, None if not a valid head/repository
     """
     from dulwich.errors import NotGitRepository
     from dulwich.repo import Repo
     # Repo currently expects a "str", so decode if necessary.
     # TODO(jelmer): Perhaps move this into Repo() ?
     if not isinstance(path, str):
         path = path.decode(sys.getfilesystemencoding())
     try:
         repo = Repo(path)
     except NotGitRepository:
         return None
     try:
         return repo.head()
     except KeyError:
         return None
 
 
-def get_unstaged_changes(index, root_path):
+def get_unstaged_changes(index, root_path, filter_blob_callback=None):
     """Walk through an index and check for differences against working tree.
 
     :param index: index to check
     :param root_path: path in which to find files
+    :param filter_blob_callback: Optional callable taking (blob, tree_path)
+        and returning the blob whose id is compared with the index entry
     :return: iterator over paths with unstaged changes
     """
     # For each entry in the index check the sha1 & ensure not staged
     if not isinstance(root_path, bytes):
         root_path = root_path.encode(sys.getfilesystemencoding())
 
     for tree_path, entry in index.iteritems():
         full_path = _tree_to_fs_path(root_path, tree_path)
         try:
-            blob = blob_from_path_and_stat(full_path, os.lstat(full_path))
+            blob = blob_from_path_and_stat(
+                full_path, os.lstat(full_path)
+            )
+            if filter_blob_callback is not None:
+                blob = filter_blob_callback(blob, tree_path)
-        except OSError as e:
-            if e.errno != errno.ENOENT:
-                raise
-            # The file was removed, so we assume that counts as
-            # different from whatever file used to exist.
-            yield tree_path
-        except IOError as e:
-            if e.errno != errno.EISDIR:
-                raise
-            # This is actually a directory
-            if os.path.exists(os.path.join(tree_path, '.git')):
+        except EnvironmentError as e:
+            # OSError and IOError are one class on Python 3, so a single
+            # handler has to tell "missing" and "is a directory" apart.
+            if e.errno == errno.ENOENT:
+                # The file was removed, so we assume that counts as
+                # different from whatever file used to exist.
+                yield tree_path
+            elif e.errno != errno.EISDIR:
+                raise
+            elif os.path.exists(os.path.join(full_path, b'.git')):
                 # Submodule
-                head = read_submodule_head(tree_path)
+                head = read_submodule_head(full_path)
                 if entry.sha != head:
                     yield tree_path
             else:
                 # The file was changed to a directory, so consider it removed.
                 yield tree_path
         else:
             if blob.id != entry.sha:
                 yield tree_path
 
 
 os_sep_bytes = os.sep.encode('ascii')
 
 
 def _tree_to_fs_path(root_path, tree_path):
     """Convert a git tree path to a file system path.
 
     :param root_path: Root filesystem path
     :param tree_path: Git tree path as bytes
 
     :return: File system path.
     """
     assert isinstance(tree_path, bytes)
     if os_sep_bytes != b'/':
         sep_corrected_path = tree_path.replace(b'/', os_sep_bytes)
     else:
         sep_corrected_path = tree_path
     return os.path.join(root_path, sep_corrected_path)
 
 
 def _fs_to_tree_path(fs_path, fs_encoding=None):
     """Convert a file system path to a git tree path.
 
     :param fs_path: File system path.
     :param fs_encoding: File system encoding
 
     :return:  Git tree path as bytes
     """
     if fs_encoding is None:
         fs_encoding = sys.getfilesystemencoding()
     if not isinstance(fs_path, bytes):
         fs_path_bytes = fs_path.encode(fs_encoding)
     else:
         fs_path_bytes = fs_path
     if os_sep_bytes != b'/':
         tree_path = fs_path_bytes.replace(os_sep_bytes, b'/')
     else:
         tree_path = fs_path_bytes
     return tree_path
 
 
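 def index_entry_from_path(path, object_store=None):
-    """Create an index from a filesystem path.
+    """Create an index entry from a filesystem path.
 
     This returns an index value for files, symlinks
-    and tree references. for directories and
-    non-existant files it returns None
+    and tree references. For directories and
+    non-existent files it returns None.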
 
     :param path: Path to create an index entry for
     :param object_store: Optional object store to
         save new blobs in
     :return: An index entry
     """
     assert isinstance(path, bytes)
     try:
         st = os.lstat(path)
         blob = blob_from_path_and_stat(path, st)
     except EnvironmentError as e:
         if e.errno == errno.EISDIR:
             if os.path.exists(os.path.join(path, b'.git')):
                 head = read_submodule_head(path)
                 if head is None:
                     return None
                 return index_entry_from_stat(
                     st, head, 0, mode=S_IFGITLINK)
             else:
                 raise
         else:
             raise
     else:
         if object_store is not None:
             object_store.add_object(blob)
         return index_entry_from_stat(st, blob.id, 0)
 
 
 def iter_fresh_entries(paths, root_path, object_store=None):
     """Iterate over current versions of index entries on disk.
 
     :param paths: Paths to iterate over
     :param root_path: Root path to access from
-    :param store: Optional store to save new blobs in
+    :param object_store: Optional store to save new blobs in
     :return: Iterator over path, index_entry
     """
     for path in paths:
         p = _tree_to_fs_path(root_path, path)
         try:
             entry = index_entry_from_path(p, object_store=object_store)
         except EnvironmentError as e:
             if e.errno in (errno.ENOENT, errno.EISDIR):
                 entry = None
             else:
                 raise
         yield path, entry
 
 
 def iter_fresh_blobs(index, root_path):
     """Iterate over versions of blobs on disk referenced by index.
 
     Don't use this function; it removes missing entries from index.
 
     :param index: Index file
     :param root_path: Root path to access from
-    :param include_deleted: Include deleted entries with sha and
-        mode set to None
+    :note: Paths are snapshotted first, so deleting missing entries
+        does not disturb the iteration over the index.
     :return: Iterator over path, sha, mode
     """
     import warnings
-    warnings.warn(PendingDeprecationWarning,
-                  "Use iter_fresh_objects instead.")
+    warnings.warn("Use iter_fresh_objects instead.",
+                  PendingDeprecationWarning)
     for entry in iter_fresh_objects(
-            index, root_path, include_deleted=True):
+            list(index), root_path, include_deleted=True):
         if entry[1] is None:
             del index[entry[0]]
         else:
             yield entry
 
 
 def iter_fresh_objects(paths, root_path, include_deleted=False,
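                        object_store=None):
-    """Iterate over versions of objecs on disk referenced by index.
+    """Iterate over versions of objects on disk referenced by index.
 
-    :param index: Index file
+    :param paths: Paths to iterate over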
     :param root_path: Root path to access from
     :param include_deleted: Include deleted entries with sha and
         mode set to None
     :param object_store: Optional object store to report new items to
     :return: Iterator over path, sha, mode
     """
     for path, entry in iter_fresh_entries(paths, root_path,
                                           object_store=object_store):
         if entry is None:
             if include_deleted:
                 yield path, None, None
         else:
             entry = IndexEntry(*entry)
             yield path, entry.sha, cleanup_mode(entry.mode)
 
 
 def refresh_index(index, root_path):
     """Refresh the contents of an index.
 
     This is the equivalent to running 'git commit -a'.
 
     :param index: Index to update
     :param root_path: Root filesystem path
     """
-    for path, entry in iter_fresh_entries(index, root_path):
-        index[path] = path
+    fresh = iter_fresh_entries(index, root_path)
+    index.update({p: e for p, e in fresh if e is not None})
diff --git a/dulwich/line_ending.py b/dulwich/line_ending.py
index 08e200d4..d16564b7 100644
--- a/dulwich/line_ending.py
+++ b/dulwich/line_ending.py
@@ -1,207 +1,241 @@
 # line_ending.py -- Line ending conversion functions
 # Copyright (C) 2018-2018 Boris Feld <boris.feld@comet.ml>
 #
 # Dulwich is dual-licensed under the Apache License, Version 2.0 and the GNU
 # General Public License as public by the Free Software Foundation; version 2.0
 # or (at your option) any later version. You can redistribute it and/or
 # modify it under the terms of either of these two licenses.
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #
 # You should have received a copy of the licenses; if not, see
 # <http://www.gnu.org/licenses/> for a copy of the GNU General Public License
 # and <http://www.apache.org/licenses/LICENSE-2.0> for a copy of the Apache
 # License, Version 2.0.
 #
 """ All line-ending related functions, from conversions to config processing
 
 Line-ending normalization is a complex beast. Here is some notes and details
 about how it seems to work.
 
 The normalization is a two-fold process that happens at two moments:
 
 - When reading a file from the index and to the working directory. For example
   when doing a `git clone` or `git checkout` call. We call this process the
   read filter in this module.
 - When writing a file to the index from the working directory. For example
   when doing a `git add` call. We call this process the write filter in this
   module.
 
 One thing to know is that Git does line-ending normalization only on text
 files. How does Git know that a file is text? We can either mark a file as a
 text file, a binary file or ask Git to automatically decides. Git has an
 heuristic to detect if a file is a text file or a binary file. It seems based
 on the percentage of non-printable characters in files.
 
 The code for this heuristic is here:
 https://git.kernel.org/pub/scm/git/git.git/tree/convert.c#n46
 
 Dulwich have an implementation with a slightly different heuristic, the
 `is_binary` function in `dulwich.patch`.
 
 The binary detection heuristic implementation is close to the one in JGit:
 https://github.com/eclipse/jgit/blob/f6873ffe522bbc3536969a3a3546bf9a819b92bf/org.eclipse.jgit/src/org/eclipse/jgit/diff/RawText.java#L300
 
 There is multiple variables that impact the normalization.
 
 First, a repository can contains a `.gitattributes` file (or more than one...)
 that can further customize the operation on some file patterns, for example:
 
     *.txt text
 
 Force all `.txt` files to be treated as text files and to have their lines
 endings normalized.
 
     *.jpg -text
 
 Force all `.jpg` files to be treated as binary files and to not have their
 lines endings converted.
 
     *.vcproj text eol=crlf
 
 Force all `.vcproj` files to be treated as text files and to have their lines
 endings converted into `CRLF` in working directory no matter the native EOL of
 the platform.
 
     *.sh text eol=lf
 
 Force all `.sh` files to be treated as text files and to have their lines
 endings converted into `LF` in working directory no matter the native EOL of
 the platform.
 
 If the `eol` attribute is not defined, Git uses the `core.eol` configuration
 value described later.
 
     * text=auto
 
 Force all files to be scanned by the text file heuristic detection and to have
 their line endings normalized in case they are detected as text files.
 
 Git also have a obsolete attribute named `crlf` that can be translated to the
 corresponding text attribute value.
 
 Then there are some configuration option (that can be defined at the
 repository or user level):
 
 - core.autocrlf
 - core.eol
 
 `core.autocrlf` is taken into account for all files that doesn't have a `text`
 attribute defined in `.gitattributes`; it takes three possible values:
 
     - `true`: This forces all files on the working directory to have CRLF
       line-endings in the working directory and convert line-endings to LF
       when writing to the index. When autocrlf is set to true, eol value is
       ignored.
     - `input`: Quite similar to the `true` value but only force the write
       filter, ie line-ending of new files added to the index will get their
       line-endings converted to LF.
     - `false` (default): No normalization is done.
 
 `core.eol` is the top-level configuration to define the line-ending to use
-when applying the read_filer. It takes three possible values:
+when applying the read filter. It takes three possible values:
 
     - `lf`: When normalization is done, force line-endings to be `LF` in the
       working directory.
     - `crlf`: When normalization is done, force line-endings to be `CRLF` in
       the working directory.
     - `native` (default): When normalization is done, force line-endings to be
       the platform's native line ending.
 
 One thing to remember is when line-ending normalization is done on a file, Git
 always normalize line-ending to `LF` when writing to the index.
 
 There are sources that seems to indicate that Git won't do line-ending
 normalization when a file contains mixed line-endings. I think this logic
 might be in text / binary detection heuristic but couldn't find it yet.
 
 Sources:
 - https://git-scm.com/docs/git-config#git-config-coreeol
 - https://git-scm.com/docs/git-config#git-config-coreautocrlf
 - https://git-scm.com/docs/gitattributes#_checking_out_and_checking_in
 - https://adaptivepatchwork.com/2012/03/01/mind-the-end-of-your-line/
 """
 
 from dulwich.objects import Blob
 
 CRLF = b"\r\n"
 LF = b"\n"
 
 
 def convert_crlf_to_lf(text_hunk):
     """Convert CRLF in text hunk into LF
 
     :param text_hunk: A bytes string representing a text hunk
     :return: The text hunk with the same type, with CRLF replaced into LF
     """
     return text_hunk.replace(CRLF, LF)
 
 
 def convert_lf_to_crlf(text_hunk):
     """Convert LF in text hunk into CRLF
 
     :param text_hunk: A bytes string representing a text hunk
     :return: The text hunk with the same type, with LF replaced into CRLF
     """
     # TODO find a more efficient way of doing it
     intermediary = text_hunk.replace(CRLF, LF)
     return intermediary.replace(LF, CRLF)
 
 
 def get_checkout_filter_autocrlf(core_autocrlf):
     """ Returns the correct checkout filter base on autocrlf value
 
     :param core_autocrlf: The bytes configuration value of core.autocrlf.
         Valid values are: b'true', b'false' or b'input'.
     :return: Either None if no filter has to be applied or a function
         accepting a single argument, a binary text hunk
     """
 
     if core_autocrlf == b"true":
         return convert_lf_to_crlf
 
     return None
 
 
 def get_checkin_filter_autocrlf(core_autocrlf):
     """ Returns the correct checkin filter base on autocrlf value
 
     :param core_autocrlf: The bytes configuration value of core.autocrlf.
         Valid values are: b'true', b'false' or b'input'.
     :return: Either None if no filter has to be applied or a function
         accepting a single argument, a binary text hunk
     """
 
     if core_autocrlf == b"true" or core_autocrlf == b"input":
         return convert_crlf_to_lf
 
     # Checking filter should never be `convert_lf_to_crlf`
     return None
 
 
+class BlobNormalizer(object):
+    """ Normalizes blobs with the line-ending filter of each operation.
+
+    config_stack and gitattributes are stored but not consulted yet; the
+    read and write filters given by the caller are used as-is.
+    """
+
+    def __init__(self, config_stack, gitattributes, read_filter, write_filter):
+        self.config_stack = config_stack
+        self.gitattributes = gitattributes
+
+        # TODO compute them based on passed values
+        self.fallback_read_filter = read_filter
+        self.fallback_write_filter = write_filter
+
+    def checkin_normalize(self, blob, tree_path):
+        """ Return blob run through the write filter, or blob if there is none
+        """
+        conversion = self.fallback_write_filter
+        if conversion is None:
+            return blob
+
+        return normalize_blob(blob, conversion, binary_detection=False)
+
+    def checkout_normalize(self, blob, tree_path):
+        """ Return blob run through the read filter, or blob if there is none
+        """
+        conversion = self.fallback_read_filter
+        if conversion is None:
+            return blob
+
+        return normalize_blob(blob, conversion, binary_detection=False)
+
+
 def normalize_blob(blob, conversion, binary_detection):
     """ Takes a blob as input returns either the original blob if
     binary_detection is True and the blob content looks like binary, else
     return a new blob with converted data
     """
     # Read the original blob
     data = blob.data
 
-    # If we need to detect if a file is binary and the file is detected as
-    # binary, do not apply the conversion function and return the original
-    # chunked text
+    # With binary detection on, content that looks binary is returned
+    # as the original blob; the conversion is never applied to it.
     if binary_detection is True:
+        from dulwich.patch import is_binary
         if is_binary(data):
             return blob
 
     # Now apply the conversion
     converted_data = conversion(data)
 
     new_blob = Blob()
     new_blob.data = converted_data
 
     return new_blob
diff --git a/dulwich/porcelain.py b/dulwich/porcelain.py
index 187b9863..a29f69d7 100644
--- a/dulwich/porcelain.py
+++ b/dulwich/porcelain.py
@@ -1,1423 +1,1427 @@
 # porcelain.py -- Porcelain-like layer on top of Dulwich
 # Copyright (C) 2013 Jelmer Vernooij <jelmer@jelmer.uk>
 #
 # Dulwich is dual-licensed under the Apache License, Version 2.0 and the GNU
 # General Public License as public by the Free Software Foundation; version 2.0
 # or (at your option) any later version. You can redistribute it and/or
 # modify it under the terms of either of these two licenses.
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #
 # You should have received a copy of the licenses; if not, see
 # <http://www.gnu.org/licenses/> for a copy of the GNU General Public License
 # and <http://www.apache.org/licenses/LICENSE-2.0> for a copy of the Apache
 # License, Version 2.0.
 #
 
 """Simple wrapper that provides porcelain-like functions on top of Dulwich.
 
 Currently implemented:
  * archive
  * add
  * branch{_create,_delete,_list}
  * check-ignore
  * checkout
  * clone
  * commit
  * commit-tree
  * daemon
  * describe
  * diff-tree
  * fetch
  * init
  * ls-files
  * ls-remote
  * ls-tree
  * pull
  * push
  * rm
  * remote{_add}
  * receive-pack
  * reset
  * rev-list
  * tag{_create,_delete,_list}
  * upload-pack
  * update-server-info
  * status
  * symbolic-ref
 
 These functions are meant to behave similarly to the git subcommands.
 Differences in behaviour are considered bugs.
 
 Functions should generally accept both unicode strings and bytestrings
 """
 
 from collections import namedtuple
 from contextlib import (
     closing,
     contextmanager,
 )
 from io import BytesIO, RawIOBase
 import datetime
 import os
 import posixpath
 import stat
 import sys
 import time
 
 from dulwich.archive import (
     tar_stream,
     )
 from dulwich.client import (
     get_transport_and_path,
     )
 from dulwich.config import (
     StackedConfig,
     )
 from dulwich.diff_tree import (
     CHANGE_ADD,
     CHANGE_DELETE,
     CHANGE_MODIFY,
     CHANGE_RENAME,
     CHANGE_COPY,
     RENAME_CHANGE_TYPES,
     )
 from dulwich.errors import (
     SendPackError,
     UpdateRefsError,
     )
 from dulwich.ignore import IgnoreFilterManager
 from dulwich.index import (
     blob_from_path_and_stat,
     get_unstaged_changes,
     )
 from dulwich.object_store import (
     tree_lookup_path,
     )
 from dulwich.objects import (
     Commit,
     Tag,
     format_timezone,
     parse_timezone,
     pretty_format_tree_entry,
     )
 from dulwich.objectspec import (
     parse_commit,
     parse_object,
     parse_ref,
     parse_reftuples,
     parse_tree,
     )
 from dulwich.pack import (
     write_pack_index,
     write_pack_objects,
     )
 from dulwich.patch import write_tree_diff
 from dulwich.protocol import (
     Protocol,
     ZERO_SHA,
     )
 from dulwich.refs import (
     ANNOTATED_TAG_SUFFIX,
     strip_peeled_refs,
 )
 from dulwich.repo import (BaseRepo, Repo)
 from dulwich.server import (
     FileSystemBackend,
     TCPGitServer,
     ReceivePackHandler,
     UploadPackHandler,
     update_server_info as server_update_server_info,
     )
 
 
 # Module level tuple definition for status output
 GitStatus = namedtuple('GitStatus', 'staged unstaged untracked')
 
 
 class NoneStream(RawIOBase):
     """Fallback if stdout or stderr are unavailable, does nothing."""
     def read(self, size=-1):
         return None
 
     def readall(self):
         return None
 
     def readinto(self, b):
         return None
 
     def write(self, b):
         return None
 
 
 default_bytes_out_stream = getattr(
         sys.stdout, 'buffer', sys.stdout
     ) or NoneStream()
 default_bytes_err_stream = getattr(
         sys.stderr, 'buffer', sys.stderr
     ) or NoneStream()
 
 
 DEFAULT_ENCODING = 'utf-8'
 
 
 class RemoteExists(Exception):
     """Raised when the remote already exists."""
 
 
 def open_repo(path_or_repo):
     """Open an argument that can be a repository or a path for a repository."""
     if isinstance(path_or_repo, BaseRepo):
         return path_or_repo
     return Repo(path_or_repo)
 
 
 @contextmanager
 def _noop_context_manager(obj):
     """Context manager that has the same api as closing but does nothing."""
     yield obj
 
 
 def open_repo_closing(path_or_repo):
     """Open an argument that can be a repository or a path for a repository.
     returns a context manager that will close the repo on exit if the argument
     is a path, else does nothing if the argument is a repo.
     """
     if isinstance(path_or_repo, BaseRepo):
         return _noop_context_manager(path_or_repo)
     return closing(Repo(path_or_repo))
 
 
 def path_to_tree_path(repopath, path):
     """Convert a path to a path usable in an index, e.g. bytes and relative to
     the repository root.
 
     :param repopath: Repository path, absolute or relative to the cwd
     :param path: A path, absolute or relative to the cwd
     :return: A path formatted for use in e.g. an index
     """
     if not isinstance(path, bytes):
         path = path.encode(sys.getfilesystemencoding())
     if not isinstance(repopath, bytes):
         repopath = repopath.encode(sys.getfilesystemencoding())
     treepath = os.path.relpath(path, repopath)
     if treepath.startswith(b'..'):
         raise ValueError('Path not in repo')
     if os.path.sep != '/':
         treepath = treepath.replace(os.path.sep.encode('ascii'), b'/')
     return treepath
 
 
 def archive(repo, committish=None, outstream=default_bytes_out_stream,
             errstream=default_bytes_err_stream):
     """Create an archive.
 
     :param repo: Path of repository for which to generate an archive.
     :param committish: Commit SHA1 or ref to use
     :param outstream: Output stream (defaults to stdout)
     :param errstream: Error stream (defaults to stderr)
     """
 
     if committish is None:
         committish = "HEAD"
     with open_repo_closing(repo) as repo_obj:
         c = repo_obj[committish]
         for chunk in tar_stream(
                 repo_obj.object_store, repo_obj.object_store[c.tree],
                 c.commit_time):
             outstream.write(chunk)
 
 
 def update_server_info(repo="."):
     """Update server info files for a repository.
 
     :param repo: path to the repository
     """
     with open_repo_closing(repo) as r:
         server_update_server_info(r)
 
 
 def symbolic_ref(repo, ref_name, force=False):
     """Set git symbolic ref into HEAD.
 
     :param repo: path to the repository
     :param ref_name: short name of the new ref
     :param force: force settings without checking if it exists in refs/heads
     """
     with open_repo_closing(repo) as repo_obj:
         ref_path = _make_branch_ref(ref_name)
         if not force and ref_path not in repo_obj.refs.keys():
             raise ValueError('fatal: ref `%s` is not a ref' % ref_name)
         repo_obj.refs.set_symbolic_ref(b'HEAD', ref_path)
 
 
 def commit(repo=".", message=None, author=None, committer=None, encoding=None):
     """Create a new commit.
 
     :param repo: Path to repository
     :param message: Optional commit message
     :param author: Optional author name and email
     :param committer: Optional committer name and email
     :return: SHA1 of the new commit
     """
     # FIXME: Support --all argument
     # FIXME: Support --signoff argument
     if getattr(message, 'encode', None):
         message = message.encode(encoding or DEFAULT_ENCODING)
     if getattr(author, 'encode', None):
         author = author.encode(encoding or DEFAULT_ENCODING)
     if getattr(committer, 'encode', None):
         committer = committer.encode(encoding or DEFAULT_ENCODING)
     with open_repo_closing(repo) as r:
         return r.do_commit(
                 message=message, author=author, committer=committer,
                 encoding=encoding)
 
 
 def commit_tree(repo, tree, message=None, author=None, committer=None):
     """Create a new commit object.
 
     :param repo: Path to repository
     :param tree: An existing tree object
     :param author: Optional author name and email
     :param committer: Optional committer name and email
     """
     with open_repo_closing(repo) as r:
         return r.do_commit(
             message=message, tree=tree, committer=committer, author=author)
 
 
 def init(path=".", bare=False):
     """Create a new git repository.
 
     :param path: Path to repository.
     :param bare: Whether to create a bare repository.
     :return: A Repo instance
     """
     if not os.path.exists(path):
         os.mkdir(path)
 
     if bare:
         return Repo.init_bare(path)
     else:
         return Repo.init(path)
 
 
 def clone(source, target=None, bare=False, checkout=None,
           errstream=default_bytes_err_stream, outstream=None,
           origin=b"origin", depth=None, **kwargs):
     """Clone a local or remote git repository.
 
     :param source: Path or URL for source repository
     :param target: Path to target repository (optional)
     :param bare: Whether or not to create a bare repository
     :param checkout: Whether or not to check-out HEAD after cloning
     :param errstream: Optional stream to write progress to
     :param outstream: Optional stream to write progress to (deprecated)
     :param origin: Name of remote from the repository used to clone
     :param depth: Depth to fetch at
     :return: The new repository
     """
     # TODO(jelmer): This code overlaps quite a bit with Repo.clone
     if outstream is not None:
         import warnings
         warnings.warn(
             "outstream= has been deprecated in favour of errstream=.",
             DeprecationWarning, stacklevel=3)
         errstream = outstream
 
     if checkout is None:
         checkout = (not bare)
     if checkout and bare:
         raise ValueError("checkout and bare are incompatible")
 
     if target is None:
         target = source.split("/")[-1]
 
     if not os.path.exists(target):
         os.mkdir(target)
 
     if bare:
         r = Repo.init_bare(target)
     else:
         r = Repo.init(target)
 
     reflog_message = b'clone: from ' + source.encode('utf-8')
     try:
         fetch_result = fetch(
             r, source, origin, errstream=errstream, message=reflog_message,
             depth=depth, **kwargs)
         target_config = r.get_config()
         if not isinstance(source, bytes):
             source = source.encode(DEFAULT_ENCODING)
         target_config.set((b'remote', origin), b'url', source)
         target_config.set(
             (b'remote', origin), b'fetch',
             b'+refs/heads/*:refs/remotes/' + origin + b'/*')
         target_config.write_to_path()
         # TODO(jelmer): Support symref capability,
         # https://github.com/jelmer/dulwich/issues/485
         try:
             head = r[fetch_result[b'HEAD']]
         except KeyError:
             head = None
         else:
             r[b'HEAD'] = head.id
         if checkout and not bare and head is not None:
             errstream.write(b'Checking out ' + head.id + b'\n')
             r.reset_index(head.tree)
     except BaseException:
         r.close()
         raise
 
     return r
 
 
 def add(repo=".", paths=None):
     """Add files to the staging area.
 
     :param repo: Repository for the files
     :param paths: Paths to add.  No value passed stages all modified files.
     :return: Tuple with set of added files and ignored files
     """
     ignored = set()
     with open_repo_closing(repo) as r:
         ignore_manager = IgnoreFilterManager.from_repo(r)
         if not paths:
             paths = list(
                 get_untracked_paths(os.getcwd(), r.path, r.open_index()))
         relpaths = []
         if not isinstance(paths, list):
             paths = [paths]
         for p in paths:
             relpath = os.path.relpath(p, r.path)
             if relpath.startswith('..' + os.path.sep):
                 raise ValueError('path %r is not in repo' % relpath)
             # FIXME: Support patterns, directories.
             if ignore_manager.is_ignored(relpath):
                 ignored.add(relpath)
                 continue
             relpaths.append(relpath)
         r.stage(relpaths)
     return (relpaths, ignored)
 
 
 def remove(repo=".", paths=None, cached=False):
     """Remove files from the staging area.
 
     :param repo: Repository for the files
     :param paths: Paths to remove
     """
     with open_repo_closing(repo) as r:
         index = r.open_index()
         for p in paths:
             full_path = os.path.abspath(p).encode(sys.getfilesystemencoding())
             tree_path = path_to_tree_path(r.path, p)
             try:
                 index_sha = index[tree_path].sha
             except KeyError:
                 raise Exception('%s did not match any files' % p)
 
             if not cached:
                 try:
                     st = os.lstat(full_path)
                 except OSError:
                     pass
                 else:
                     try:
                         blob = blob_from_path_and_stat(full_path, st)
                     except IOError:
                         pass
                     else:
                         try:
                             committed_sha = tree_lookup_path(
                                 r.__getitem__, r[r.head()].tree, tree_path)[1]
                         except KeyError:
                             committed_sha = None
 
                         if blob.id != index_sha and index_sha != committed_sha:
                             raise Exception(
                                 'file has staged content differing '
                                 'from both the file and head: %s' % p)
 
                         if index_sha != committed_sha:
                             raise Exception(
                                 'file has staged changes: %s' % p)
                         os.remove(full_path)
             del index[tree_path]
         index.write()
 
 
 rm = remove
 
 
 def commit_decode(commit, contents, default_encoding=DEFAULT_ENCODING):
     if commit.encoding is not None:
         return contents.decode(commit.encoding, "replace")
     return contents.decode(default_encoding, "replace")
 
 
 def print_commit(commit, decode, outstream=sys.stdout):
     """Write a human-readable commit log entry.
 
     :param commit: A `Commit` object
     :param outstream: A stream file to write to
     """
     outstream.write("-" * 50 + "\n")
     outstream.write("commit: " + commit.id.decode('ascii') + "\n")
     if len(commit.parents) > 1:
         outstream.write(
             "merge: " +
             "...".join([c.decode('ascii') for c in commit.parents[1:]]) + "\n")
     outstream.write("Author: " + decode(commit.author) + "\n")
     if commit.author != commit.committer:
         outstream.write("Committer: " + decode(commit.committer) + "\n")
 
     time_tuple = time.gmtime(commit.author_time + commit.author_timezone)
     time_str = time.strftime("%a %b %d %Y %H:%M:%S", time_tuple)
     timezone_str = format_timezone(commit.author_timezone).decode('ascii')
     outstream.write("Date:   " + time_str + " " + timezone_str + "\n")
     outstream.write("\n")
     outstream.write(decode(commit.message) + "\n")
     outstream.write("\n")
 
 
 def print_tag(tag, decode, outstream=sys.stdout):
     """Write a human-readable tag.
 
     :param tag: A `Tag` object
     :param decode: Function for decoding bytes to unicode string
     :param outstream: A stream to write to
     """
     outstream.write("Tagger: " + decode(tag.tagger) + "\n")
     outstream.write("Date:   " + decode(tag.tag_time) + "\n")
     outstream.write("\n")
     outstream.write(decode(tag.message) + "\n")
     outstream.write("\n")
 
 
 def show_blob(repo, blob, decode, outstream=sys.stdout):
     """Write a blob to a stream.
 
     :param repo: A `Repo` object
     :param blob: A `Blob` object
     :param decode: Function for decoding bytes to unicode string
     :param outstream: A stream file to write to
     """
     outstream.write(decode(blob.data))
 
 
 def show_commit(repo, commit, decode, outstream=sys.stdout):
     """Show a commit to a stream.
 
     :param repo: A `Repo` object
     :param commit: A `Commit` object
     :param decode: Function for decoding bytes to unicode string
     :param outstream: Stream to write to
     """
     print_commit(commit, decode=decode, outstream=outstream)
     if commit.parents:
         parent_commit = repo[commit.parents[0]]
         base_tree = parent_commit.tree
     else:
         base_tree = None
     diffstream = BytesIO()
     write_tree_diff(
         diffstream,
         repo.object_store, base_tree, commit.tree)
     diffstream.seek(0)
     outstream.write(
         diffstream.getvalue().decode(
                 commit.encoding or DEFAULT_ENCODING, 'replace'))
 
 
 def show_tree(repo, tree, decode, outstream=sys.stdout):
     """Print a tree to a stream.
 
     :param repo: A `Repo` object
     :param tree: A `Tree` object
     :param decode: Function for decoding bytes to unicode string
     :param outstream: Stream to write to
     """
     for n in tree:
         outstream.write(decode(n) + "\n")
 
 
 def show_tag(repo, tag, decode, outstream=sys.stdout):
     """Print a tag to a stream.
 
     :param repo: A `Repo` object
     :param tag: A `Tag` object
     :param decode: Function for decoding bytes to unicode string
     :param outstream: Stream to write to
     """
     print_tag(tag, decode, outstream)
     show_object(repo, repo[tag.object[1]], outstream)
 
 
 def show_object(repo, obj, decode, outstream):
     return {
         b"tree": show_tree,
         b"blob": show_blob,
         b"commit": show_commit,
         b"tag": show_tag,
             }[obj.type_name](repo, obj, decode, outstream)
 
 
 def print_name_status(changes):
     """Print a simple status summary, listing changed files.
     """
     for change in changes:
         if not change:
             continue
         if isinstance(change, list):
             change = change[0]
         if change.type == CHANGE_ADD:
             path1 = change.new.path
             path2 = ''
             kind = 'A'
         elif change.type == CHANGE_DELETE:
             path1 = change.old.path
             path2 = ''
             kind = 'D'
         elif change.type == CHANGE_MODIFY:
             path1 = change.new.path
             path2 = ''
             kind = 'M'
         elif change.type in RENAME_CHANGE_TYPES:
             path1 = change.old.path
             path2 = change.new.path
             if change.type == CHANGE_RENAME:
                 kind = 'R'
             elif change.type == CHANGE_COPY:
                 kind = 'C'
         yield '%-8s%-20s%-20s' % (kind, path1, path2)
 
 
 def log(repo=".", paths=None, outstream=sys.stdout, max_entries=None,
         reverse=False, name_status=False):
     """Write commit logs.
 
     :param repo: Path to repository
     :param paths: Optional set of specific paths to print entries for
     :param outstream: Stream to write log output to
     :param reverse: Reverse order in which entries are printed
     :param name_status: Print name status
     :param max_entries: Optional maximum number of entries to display
     """
     with open_repo_closing(repo) as r:
         walker = r.get_walker(
             max_entries=max_entries, paths=paths, reverse=reverse)
         for entry in walker:
             def decode(x):
                 return commit_decode(entry.commit, x)
             print_commit(entry.commit, decode, outstream)
             if name_status:
                 outstream.writelines(
                     [l+'\n' for l in print_name_status(entry.changes())])
 
 
 # TODO(jelmer): better default for encoding?
 def show(repo=".", objects=None, outstream=sys.stdout,
          default_encoding=DEFAULT_ENCODING):
     """Print the changes in a commit.
 
     :param repo: Path to repository
     :param objects: Objects to show (defaults to [HEAD])
     :param outstream: Stream to write to
     :param default_encoding: Default encoding to use if none is set in the
         commit
     """
     if objects is None:
         objects = ["HEAD"]
     if not isinstance(objects, list):
         objects = [objects]
     with open_repo_closing(repo) as r:
         for objectish in objects:
             o = parse_object(r, objectish)
             if isinstance(o, Commit):
                 def decode(x):
                     return commit_decode(o, x, default_encoding)
             else:
                 def decode(x):
                     return x.decode(default_encoding)
             show_object(r, o, decode, outstream)
 
 
 def diff_tree(repo, old_tree, new_tree, outstream=sys.stdout):
     """Compares the content and mode of blobs found via two tree objects.
 
     :param repo: Path to repository
     :param old_tree: Id of old tree
     :param new_tree: Id of new tree
     :param outstream: Stream to write to
     """
     with open_repo_closing(repo) as r:
         write_tree_diff(outstream, r.object_store, old_tree, new_tree)
 
 
 def rev_list(repo, commits, outstream=sys.stdout):
     """Lists commit objects in reverse chronological order.
 
     :param repo: Path to repository
     :param commits: Commits over which to iterate
     :param outstream: Stream to write to
     """
     with open_repo_closing(repo) as r:
         for entry in r.get_walker(include=[r[c].id for c in commits]):
             outstream.write(entry.commit.id + b"\n")
 
 
 def tag(*args, **kwargs):
     import warnings
     warnings.warn("tag has been deprecated in favour of tag_create.",
                   DeprecationWarning)
     return tag_create(*args, **kwargs)
 
 
 def tag_create(
         repo, tag, author=None, message=None, annotated=False,
         objectish="HEAD", tag_time=None, tag_timezone=None):
     """Creates a tag in git via dulwich calls:
 
     :param repo: Path to repository
     :param tag: tag string
     :param author: tag author (optional, if annotated is set)
     :param message: tag message (optional)
     :param annotated: whether to create an annotated tag
     :param objectish: object the tag should point at, defaults to HEAD
     :param tag_time: Optional time for annotated tag
     :param tag_timezone: Optional timezone for annotated tag
     """
 
     with open_repo_closing(repo) as r:
         object = parse_object(r, objectish)
 
         if annotated:
             # Create the tag object
             tag_obj = Tag()
             if author is None:
                 # TODO(jelmer): Don't use repo private method.
                 author = r._get_user_identity()
             tag_obj.tagger = author
             tag_obj.message = message
             tag_obj.name = tag
             tag_obj.object = (type(object), object.id)
             if tag_time is None:
                 tag_time = int(time.time())
             tag_obj.tag_time = tag_time
             if tag_timezone is None:
                 # TODO(jelmer) Use current user timezone rather than UTC
                 tag_timezone = 0
             elif isinstance(tag_timezone, str):
                 tag_timezone = parse_timezone(tag_timezone)
             tag_obj.tag_timezone = tag_timezone
             r.object_store.add_object(tag_obj)
             tag_id = tag_obj.id
         else:
             tag_id = object.id
 
         r.refs[_make_tag_ref(tag)] = tag_id
 
 
 def list_tags(*args, **kwargs):
     import warnings
     warnings.warn("list_tags has been deprecated in favour of tag_list.",
                   DeprecationWarning)
     return tag_list(*args, **kwargs)
 
 
 def tag_list(repo, outstream=sys.stdout):
     """List all tags.
 
     :param repo: Path to repository
     :param outstream: Stream to write tags to
     """
     with open_repo_closing(repo) as r:
         tags = sorted(r.refs.as_dict(b"refs/tags"))
         return tags
 
 
 def tag_delete(repo, name):
     """Remove a tag.
 
     :param repo: Path to repository
     :param name: Name of tag to remove
     """
     with open_repo_closing(repo) as r:
         if isinstance(name, bytes):
             names = [name]
         elif isinstance(name, list):
             names = name
         else:
             raise TypeError("Unexpected tag name type %r" % name)
         for name in names:
             del r.refs[_make_tag_ref(name)]
 
 
 def reset(repo, mode, treeish="HEAD"):
     """Reset current HEAD to the specified state.
 
     :param repo: Path to repository
     :param mode: Mode ("hard", "soft", "mixed")
     :param treeish: Treeish to reset to
     """
 
     if mode != "hard":
         raise ValueError("hard is the only mode currently supported")
 
     with open_repo_closing(repo) as r:
         tree = parse_tree(r, treeish)
         r.reset_index(tree.id)
 
 
 def push(repo, remote_location, refspecs,
          outstream=default_bytes_out_stream,
          errstream=default_bytes_err_stream, **kwargs):
     """Remote push with dulwich via dulwich.client
 
     :param repo: Path to repository
     :param remote_location: Location of the remote
     :param refspecs: Refs to push to remote
     :param outstream: A stream file to write output
     :param errstream: A stream file to write errors
     """
 
     # Open the repo
     with open_repo_closing(repo) as r:
 
         # Get the client and path
         client, path = get_transport_and_path(
                 remote_location, config=r.get_config_stack(), **kwargs)
 
         selected_refs = []
 
         def update_refs(refs):
             selected_refs.extend(parse_reftuples(r.refs, refs, refspecs))
             new_refs = {}
             # TODO: Handle selected_refs == {None: None}
             for (lh, rh, force) in selected_refs:
                 if lh is None:
                     new_refs[rh] = ZERO_SHA
                 else:
                     new_refs[rh] = r.refs[lh]
             return new_refs
 
         err_encoding = getattr(errstream, 'encoding', None) or DEFAULT_ENCODING
         remote_location_bytes = client.get_url(path).encode(err_encoding)
         try:
             client.send_pack(
                 path, update_refs,
                 generate_pack_data=r.object_store.generate_pack_data,
                 progress=errstream.write)
             errstream.write(
                 b"Push to " + remote_location_bytes + b" successful.\n")
         except (UpdateRefsError, SendPackError) as e:
             errstream.write(b"Push to " + remote_location_bytes +
                             b" failed -> " + e.message.encode(err_encoding) +
                             b"\n")
 
 
 def pull(repo, remote_location=None, refspecs=None,
          outstream=default_bytes_out_stream,
          errstream=default_bytes_err_stream, **kwargs):
     """Pull from remote via dulwich.client
 
     :param repo: Path to repository
     :param remote_location: Location of the remote
     :param refspec: refspecs to fetch
     :param outstream: A stream file to write to output
     :param errstream: A stream file to write to errors
     """
     # Open the repo
     with open_repo_closing(repo) as r:
         if remote_location is None:
             # TODO(jelmer): Lookup 'remote' for current branch in config
             raise NotImplementedError(
                 "looking up remote from branch config not supported yet")
         if refspecs is None:
             refspecs = [b"HEAD"]
         selected_refs = []
 
         def determine_wants(remote_refs):
             selected_refs.extend(
                 parse_reftuples(remote_refs, r.refs, refspecs))
             return [remote_refs[lh] for (lh, rh, force) in selected_refs]
         client, path = get_transport_and_path(
                 remote_location, config=r.get_config_stack(), **kwargs)
         fetch_result = client.fetch(
             path, r, progress=errstream.write, determine_wants=determine_wants)
         for (lh, rh, force) in selected_refs:
             r.refs[rh] = fetch_result.refs[lh]
         if selected_refs:
             r[b'HEAD'] = fetch_result.refs[selected_refs[0][1]]
 
         # Perform 'git checkout .' - syncs staged changes
         tree = r[b"HEAD"].tree
         r.reset_index(tree=tree)
 
 
 def status(repo=".", ignored=False):
     """Returns staged, unstaged, and untracked changes relative to the HEAD.
 
     :param repo: Path to repository or repository object
     :param ignored: Whether to include ignored files in `untracked`
     :return: GitStatus tuple,
         staged -    list of staged paths (diff index/HEAD)
         unstaged -  list of unstaged paths (diff index/working-tree)
         untracked - list of untracked, un-ignored & non-.git paths
     """
     with open_repo_closing(repo) as r:
         # 1. Get status of staged
         tracked_changes = get_tree_changes(r)
         # 2. Get status of unstaged
         index = r.open_index()
-        unstaged_changes = list(get_unstaged_changes(index, r.path))
+        normalizer = r.get_blob_normalizer()
+        filter_callback = normalizer.checkin_normalize
+        unstaged_changes = list(
+            get_unstaged_changes(index, r.path, filter_callback)
+        )
         ignore_manager = IgnoreFilterManager.from_repo(r)
         untracked_paths = get_untracked_paths(r.path, r.path, index)
         if ignored:
             untracked_changes = list(untracked_paths)
         else:
             untracked_changes = [
                     p for p in untracked_paths
                     if not ignore_manager.is_ignored(p)]
         return GitStatus(tracked_changes, unstaged_changes, untracked_changes)
 
 
 def get_untracked_paths(frompath, basepath, index):
     """Get untracked paths.
 
     ;param frompath: Path to walk
     :param basepath: Path to compare to
     :param index: Index to check against
     """
     # If nothing is specified, add all non-ignored files.
     for dirpath, dirnames, filenames in os.walk(frompath):
         # Skip .git and below.
         if '.git' in dirnames:
             dirnames.remove('.git')
             if dirpath != basepath:
                 continue
         if '.git' in filenames:
             filenames.remove('.git')
             if dirpath != basepath:
                 continue
         for filename in filenames:
             ap = os.path.join(dirpath, filename)
             ip = path_to_tree_path(basepath, ap)
             if ip not in index:
                 yield os.path.relpath(ap, frompath)
 
 
 def get_tree_changes(repo):
     """Return add/delete/modify changes to tree by comparing index to HEAD.
 
     :param repo: repo path or object
     :return: dict with lists for each type of change
     """
     with open_repo_closing(repo) as r:
         index = r.open_index()
 
         # Compares the Index to the HEAD & determines changes
         # Iterate through the changes and report add/delete/modify
         # TODO: call out to dulwich.diff_tree somehow.
         tracked_changes = {
             'add': [],
             'delete': [],
             'modify': [],
         }
         try:
             tree_id = r[b'HEAD'].tree
         except KeyError:
             tree_id = None
 
         for change in index.changes_from_tree(r.object_store, tree_id):
             if not change[0][0]:
                 tracked_changes['add'].append(change[0][1])
             elif not change[0][1]:
                 tracked_changes['delete'].append(change[0][0])
             elif change[0][0] == change[0][1]:
                 tracked_changes['modify'].append(change[0][0])
             else:
                 raise AssertionError('git mv ops not yet supported')
         return tracked_changes
 
 
 def daemon(path=".", address=None, port=None):
     """Serve Git requests over TCP/IP until interrupted.
 
     :param path: Path to the directory to serve.
     :param address: Optional address to listen on (defaults to ::)
     :param port: Optional port to listen on (defaults to TCP_GIT_PORT)
     """
     # TODO(jelmer): Support git-daemon-export-ok and --export-all.
     fs_backend = FileSystemBackend(path)
     TCPGitServer(fs_backend, address, port).serve_forever()
 
 
 def web_daemon(path=".", address=None, port=None):
     """Serve Git requests over HTTP until interrupted.
 
     :param path: Path to the directory to serve
     :param address: Optional address to listen on (defaults to ::)
     :param port: Optional port to listen on (defaults to 80)
     """
     from dulwich.web import (
         make_wsgi_chain,
         make_server,
         WSGIRequestHandlerLogger,
         WSGIServerLogger)
 
     wsgi_app = make_wsgi_chain(FileSystemBackend(path))
     http_server = make_server(
         address, port, wsgi_app,
         handler_class=WSGIRequestHandlerLogger,
         server_class=WSGIServerLogger)
     http_server.serve_forever()
 
 
 def upload_pack(path=".", inf=None, outf=None):
     """Upload a pack file after negotiating its contents using smart protocol.
 
     :param path: Path to the repository
     :param inf: Input stream to communicate with client (defaults to the
         binary buffer of stdin when it has one)
     :param outf: Output stream to communicate with client (defaults to the
         binary buffer of stdout when it has one)
     :return: 0
     """
     if inf is None:
         inf = getattr(sys.stdin, 'buffer', sys.stdin)
     if outf is None:
         outf = getattr(sys.stdout, 'buffer', sys.stdout)
     repo_path = os.path.expanduser(path)
     fs_backend = FileSystemBackend(repo_path)
 
     def write_and_flush(chunk):
         # Flush after every write so the peer sees each packet immediately.
         outf.write(chunk)
         outf.flush()
 
     protocol = Protocol(inf.read, write_and_flush)
     # FIXME: Catch exceptions and write a single-line summary to outf.
     UploadPackHandler(fs_backend, [repo_path], protocol).handle()
     return 0
 
 
 def receive_pack(path=".", inf=None, outf=None):
     """Receive a pack file after negotiating its contents using smart protocol.
 
     :param path: Path to the repository
     :param inf: Input stream to communicate with client (defaults to the
         binary buffer of stdin when it has one)
     :param outf: Output stream to communicate with client (defaults to the
         binary buffer of stdout when it has one)
     :return: 0
     """
     if inf is None:
         inf = getattr(sys.stdin, 'buffer', sys.stdin)
     if outf is None:
         outf = getattr(sys.stdout, 'buffer', sys.stdout)
     repo_path = os.path.expanduser(path)
     fs_backend = FileSystemBackend(repo_path)
 
     def write_and_flush(chunk):
         # Flush after every write so the peer sees each packet immediately.
         outf.write(chunk)
         outf.flush()
 
     protocol = Protocol(inf.read, write_and_flush)
     # FIXME: Catch exceptions and write a single-line summary to outf.
     ReceivePackHandler(fs_backend, [repo_path], protocol).handle()
     return 0
 
 
 def _make_branch_ref(name):
     if getattr(name, 'encode', None):
         name = name.encode(DEFAULT_ENCODING)
     return b"refs/heads/" + name
 
 
 def _make_tag_ref(name):
     if getattr(name, 'encode', None):
         name = name.encode(DEFAULT_ENCODING)
     return b"refs/tags/" + name
 
 
 def branch_delete(repo, name):
     """Delete one or more branches.
 
     :param repo: Path to the repository
     :param name: Name of the branch, or a list of branch names
     """
     with open_repo_closing(repo) as r:
         branch_names = name if isinstance(name, list) else [name]
         for branch_name in branch_names:
             del r.refs[_make_branch_ref(branch_name)]
 
 
 def branch_create(repo, name, objectish=None, force=False):
     """Create a branch.
 
     :param repo: Path to the repository
     :param name: Name of the new branch
     :param objectish: Target object to point new branch at (defaults to HEAD)
     :param force: Force creation of branch, even if it already exists
     :raise KeyError: if the branch already exists and ``force`` is not set
     """
     with open_repo_closing(repo) as r:
         if objectish is None:
             objectish = "HEAD"
         target = parse_object(r, objectish)
         refname = _make_branch_ref(name)
         # objectish may already be a bytestring, which has no encode() on
         # Python 3; only text needs encoding for the reflog message.
         if isinstance(objectish, bytes):
             origin = objectish
         else:
             origin = objectish.encode('utf-8')
         ref_message = b"branch: Created from " + origin
         if force:
             r.refs.set_if_equals(refname, None, target.id, message=ref_message)
         else:
             if not r.refs.add_if_new(refname, target.id, message=ref_message):
                 raise KeyError("Branch with name %s already exists." % name)
 
 
 def branch_list(repo):
     """Return the keys of all refs below ``refs/heads/``.
 
     :param repo: Path to the repository
     """
     with open_repo_closing(repo) as r:
         refs = r.refs
         return refs.keys(base=b"refs/heads/")
 
 
 def fetch(repo, remote_location, remote_name=b'origin', outstream=sys.stdout,
           errstream=default_bytes_err_stream, message=None, depth=None,
           **kwargs):
     """Fetch objects from a remote server.
 
     Remote branches are imported below ``refs/remotes/<remote_name>`` and
     remote tags (except peeled annotated-tag entries) below ``refs/tags``.
 
     :param repo: Path to the repository
     :param remote_location: String identifying a remote server
     :param remote_name: Name for remote server
     :param outstream: Output stream (defaults to stdout); not used by this
         function
     :param errstream: Error stream (defaults to stderr); its ``write``
         method receives progress output
     :param message: Reflog message (defaults to
         b"fetch: from <remote_location>")
     :param depth: Depth to fetch at
     :return: Dictionary with refs on the remote
     """
     if message is None:
         message = b'fetch: from ' + remote_location.encode("utf-8")
     heads_prefix = b'refs/heads/'
     tags_prefix = b'refs/tags/'
     with open_repo_closing(repo) as r:
         client, path = get_transport_and_path(
             remote_location, config=r.get_config_stack(), **kwargs)
         fetch_result = client.fetch(path, r, progress=errstream.write,
                                     depth=depth)
         stripped_refs = strip_peeled_refs(fetch_result.refs)
 
         branches = {}
         for ref, sha in stripped_refs.items():
             if ref.startswith(heads_prefix):
                 branches[ref[len(heads_prefix):]] = sha
         r.refs.import_refs(
             b'refs/remotes/' + remote_name, branches, message=message)
 
         tags = {}
         for ref, sha in stripped_refs.items():
             if not ref.startswith(tags_prefix):
                 continue
             if ref.endswith(ANNOTATED_TAG_SUFFIX):
                 continue
             tags[ref[len(tags_prefix):]] = sha
         r.refs.import_refs(b'refs/tags', tags, message=message)
     return fetch_result.refs
 
 
 def ls_remote(remote, config=None, **kwargs):
     """List the refs in a remote.
 
     :param remote: Remote repository location
     :param config: Configuration to use (defaults to
         ``StackedConfig.default()``)
     :param kwargs: Extra keyword arguments forwarded to
         ``get_transport_and_path``
     :return: Dictionary with remote refs
     """
     effective_config = StackedConfig.default() if config is None else config
     client, host_path = get_transport_and_path(
         remote, config=effective_config, **kwargs)
     return client.get_refs(host_path)
 
 
 def repack(repo):
     """Repack loose files in a repository.
 
     Currently this only packs loose objects.
 
     :param repo: Path to the repository
     """
     with open_repo_closing(repo) as r:
         store = r.object_store
         store.pack_loose_objects()
 
 
 def pack_objects(repo, object_ids, packf, idxf, delta_window_size=None):
     """Pack objects into a file.
 
     :param repo: Path to the repository
     :param object_ids: List of object ids to write
     :param packf: File-like object to write to
     :param idxf: File-like object to write to (can be None)
     :param delta_window_size: Forwarded unchanged to ``write_pack_objects``
     """
     with open_repo_closing(repo) as r:
         wanted = ((oid, None) for oid in object_ids)
         entries, data_sum = write_pack_objects(
             packf,
             r.object_store.iter_shas(wanted),
             delta_window_size=delta_window_size)
     if idxf is None:
         return
     # The index is written from (key, first, second) triples in sorted order.
     index_entries = sorted(
         (key, info[0], info[1]) for (key, info) in entries.items())
     write_pack_index(idxf, index_entries, data_sum)
 
 
 def ls_tree(repo, treeish=b"HEAD", outstream=sys.stdout, recursive=False,
             name_only=False):
     """List contents of a tree.
 
     :param repo: Path to the repository
     :param treeish: Tree id to list
     :param outstream: Output stream (defaults to stdout)
     :param recursive: Whether to recursively list files
     :param name_only: Only print item name
     """
     def emit_entries(store, tree_id, prefix):
         for (name, mode, sha) in store[tree_id].iteritems():
             full_name = posixpath.join(prefix, name) if prefix else name
             if name_only:
                 line = full_name + b"\n"
             else:
                 line = pretty_format_tree_entry(full_name, mode, sha)
             outstream.write(line)
             if recursive and stat.S_ISDIR(mode):
                 emit_entries(store, sha, full_name)
 
     with open_repo_closing(repo) as r:
         root = parse_tree(r, treeish)
         emit_entries(r.object_store, root.id, "")
 
 
 def remote_add(repo, name, url):
     """Add a remote.
 
     :param repo: Path to the repository
     :param name: Remote name
     :param url: Remote URL
     :raise RemoteExists: if the config already has a section for the remote
     """
     def as_bytes(value):
         if isinstance(value, bytes):
             return value
         return value.encode(DEFAULT_ENCODING)
 
     name = as_bytes(name)
     url = as_bytes(url)
     with open_repo_closing(repo) as r:
         config = r.get_config()
         section = (b'remote', name)
         if config.has_section(section):
             raise RemoteExists(section)
         config.set(section, b"url", url)
         config.write_to_path()
 
 
 def check_ignore(repo, paths, no_index=False):
     """Debug gitignore files.
 
     :param repo: Path to the repository
     :param paths: List of paths to check for
     :param no_index: Don't check index
     :return: Iterator over the ignored paths; absolute input paths are
         yielded relative to the repository path
     """
     with open_repo_closing(repo) as r:
         index = r.open_index()
         ignore_manager = IgnoreFilterManager.from_repo(r)
         consult_index = not no_index
         for candidate in paths:
             # Paths already in the index are skipped unless no_index is set.
             if consult_index and path_to_tree_path(r.path, candidate) in index:
                 continue
             if os.path.isabs(candidate):
                 candidate = os.path.relpath(candidate, r.path)
             if ignore_manager.is_ignored(candidate):
                 yield candidate
 
 
 def update_head(repo, target, detached=False, new_branch=None):
     """Update HEAD to point at a new branch/commit.
 
     Note that this does not actually update the working tree.
 
     :param repo: Path to the repository
     :param target: Branch or committish to switch to
     :param detached: Create a detached head
     :param new_branch: New branch to create
     """
     with open_repo_closing(repo) as r:
         if new_branch is None:
             to_set = b"HEAD"
         else:
             to_set = _make_branch_ref(new_branch)
         if not detached:
             r.refs.set_symbolic_ref(to_set, parse_ref(r, target))
         else:
             # TODO(jelmer): Provide some way so that the actual ref gets
             # updated rather than what it points to, so the delete isn't
             # necessary.
             del r.refs[to_set]
             r.refs[to_set] = parse_commit(r, target).id
         if new_branch is not None:
             r.refs.set_symbolic_ref(b"HEAD", to_set)
 
 
 def check_mailmap(repo, contact):
     """Check canonical name and email of contact.
 
     :param repo: Path to the repository
     :param contact: Contact name and/or email
     :return: Canonical contact data
     """
     with open_repo_closing(repo) as r:
         from dulwich.mailmap import Mailmap
         import errno
         mailmap_path = os.path.join(r.path, '.mailmap')
         try:
             mailmap = Mailmap.from_path(mailmap_path)
         except IOError as e:
             if e.errno == errno.ENOENT:
                 # No .mailmap file: look the contact up in an empty map.
                 mailmap = Mailmap()
             else:
                 raise
         return mailmap.lookup(contact)
 
 
 def fsck(repo):
     """Check a repository.
 
     :param repo: A path to the repository
     :return: Iterator over ``(sha, exception)`` pairs, one for every object
         whose ``check()`` raised
     """
     with open_repo_closing(repo) as r:
         # TODO(jelmer): check pack files
         # TODO(jelmer): check graph
         # TODO(jelmer): check refs
         store = r.object_store
         for sha in store:
             obj = store[sha]
             try:
                 obj.check()
             except Exception as err:
                 yield (sha, err)
 
 
 def stash_list(repo):
     """Enumerate all stashes in a repository.
 
     :param repo: Path to the repository
     :return: ``enumerate`` object over the stashes
     """
     with open_repo_closing(repo) as r:
         from dulwich.stash import Stash
         entries = list(Stash.from_repo(r).stashes())
         return enumerate(entries)
 
 
 def stash_push(repo):
     """Push a new stash onto the stack.
 
     :param repo: Path to the repository
     """
     with open_repo_closing(repo) as r:
         from dulwich.stash import Stash
         Stash.from_repo(r).push()
 
 
 def stash_pop(repo):
     """Pop a stash from the stack.
 
     :param repo: Path to the repository
     """
     with open_repo_closing(repo) as r:
         from dulwich.stash import Stash
         Stash.from_repo(r).pop()
 
 
 def ls_files(repo):
     """Return the sorted entries obtained by iterating the index.
 
     :param repo: Path to the repository
     """
     with open_repo_closing(repo) as r:
         index = r.open_index()
         return sorted(index)
 
 
 def describe(repo):
     """Describe the repository version.
 
     :param repo: Repository to describe (handed to ``open_repo_closing``)
     :returns: a string description of the current git revision
 
     Examples: "gabcdefh", "v0.1" or "v0.1-5-gabcdefh".
     """
     with open_repo_closing(repo) as r:
         # Collect the annotated tags: name -> [commit datetime, commit id]
         tags = {}
         for key, value in r.get_refs().items():
             key = key.decode()
             # Filter before touching the object store, so refs that are not
             # tags are never loaded.
             if u'tags' not in key:
                 continue
             obj = r.get_object(value)
 
             _, tag = key.rsplit(u'/', 1)
 
             try:
                 commit = obj.object
             except AttributeError:
                 # Objects without an ``object`` attribute are ignored here.
                 continue
             else:
                 commit = r.get_object(commit[1])
             tags[tag] = [
                 datetime.datetime(*time.gmtime(commit.commit_time)[:6]),
                 commit.id.decode('ascii'),
             ]
 
         sorted_tags = sorted(tags.items(),
                              key=lambda tag: tag[1][0],
                              reverse=True)
 
         # If there are no tags, return the current commit
         if len(sorted_tags) == 0:
             return 'g{}'.format(r[r.head()].id.decode('ascii')[:7])
 
         # Map commit id -> tag name. setdefault keeps the first tag in
         # sorted order, the same one a linear scan of sorted_tags would hit.
         tag_by_commit = {}
         for tag_name, (_, tag_commit) in sorted_tags:
             tag_by_commit.setdefault(tag_commit, tag_name)
 
         # We're now 0 commits from the top
         commit_count = 0
 
         # Get the latest commit
         latest_commit = r[r.head()]
 
         # Walk through all commits until one carries a tag
         for entry in r.get_walker():
             commit_id = entry.commit.id.decode('ascii')
             tag_name = tag_by_commit.get(commit_id)
             if tag_name is not None:
                 if commit_count == 0:
                     return tag_name
                 return '{}-{}-g{}'.format(
                     tag_name,
                     commit_count,
                     latest_commit.id.decode('ascii')[:7])
 
             commit_count += 1
 
         # Return plain commit if no parent tag can be found
         return 'g{}'.format(latest_commit.id.decode('ascii')[:7])
 
 
 def get_object_by_path(repo, path, committish=None):
     """Get an object by path.
 
     :param repo: A path to the repository
     :param path: Path to look up; text is encoded with the commit's encoding
         (or DEFAULT_ENCODING when the commit has none)
     :param committish: Commit to look up path in (defaults to "HEAD")
     :return: A `ShaFile` object
     """
     if committish is None:
         committish = "HEAD"
     with open_repo_closing(repo) as r:
         # Resolve against the opened repository, not the raw ``repo``
         # argument, which may be just a path.
         commit = parse_commit(r, committish)
         base_tree = commit.tree
         if not isinstance(path, bytes):
             path = path.encode(commit.encoding or DEFAULT_ENCODING)
         (mode, sha) = tree_lookup_path(
             r.object_store.__getitem__,
             base_tree, path)
         return r[sha]
 
 
 def write_tree(repo):
     """Write a tree object from the index.
 
     :param repo: Repository for which to write tree
     :return: tree id for the tree that was written
     """
     with open_repo_closing(repo) as r:
         index = r.open_index()
         return index.commit(r.object_store)
diff --git a/dulwich/repo.py b/dulwich/repo.py
index e6f2f214..f5151cfa 100644
--- a/dulwich/repo.py
+++ b/dulwich/repo.py
@@ -1,1356 +1,1370 @@
 # repo.py -- For dealing with git repositories.
 # Copyright (C) 2007 James Westby <jw+debian@jameswestby.net>
 # Copyright (C) 2008-2013 Jelmer Vernooij <jelmer@jelmer.uk>
 #
 # Dulwich is dual-licensed under the Apache License, Version 2.0 and the GNU
 # General Public License as public by the Free Software Foundation; version 2.0
 # or (at your option) any later version. You can redistribute it and/or
 # modify it under the terms of either of these two licenses.
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #
 # You should have received a copy of the licenses; if not, see
 # <http://www.gnu.org/licenses/> for a copy of the GNU General Public License
 # and <http://www.apache.org/licenses/LICENSE-2.0> for a copy of the Apache
 # License, Version 2.0.
 #
 
 
 """Repository access.
 
 This module contains the base class for git repositories
 (BaseRepo) and an implementation which uses a repository on
 local disk (Repo).
 
 """
 
 from io import BytesIO
 import errno
 import os
 import sys
 import stat
 import time
 
 from dulwich.errors import (
     NoIndexPresent,
     NotBlobError,
     NotCommitError,
     NotGitRepository,
     NotTreeError,
     NotTagError,
     CommitError,
     RefFormatError,
     HookError,
     )
 from dulwich.file import (
     GitFile,
     )
 from dulwich.object_store import (
     DiskObjectStore,
     MemoryObjectStore,
     ObjectStoreGraphWalker,
     )
 from dulwich.objects import (
     check_hexsha,
     Blob,
     Commit,
     ShaFile,
     Tag,
     Tree,
     )
 from dulwich.pack import (
     pack_objects_to_data,
     )
 
 from dulwich.hooks import (
     PreCommitShellHook,
     PostCommitShellHook,
     CommitMsgShellHook,
     )
 
+from dulwich.line_ending import BlobNormalizer
+
 from dulwich.refs import (  # noqa: F401
     ANNOTATED_TAG_SUFFIX,
     check_ref_format,
     RefsContainer,
     DictRefsContainer,
     InfoRefsContainer,
     DiskRefsContainer,
     read_packed_refs,
     read_packed_refs_with_peeled,
     write_packed_refs,
     SYMREF,
     )
 
 
 import warnings
 
 
 CONTROLDIR = '.git'
 OBJECTDIR = 'objects'
 REFSDIR = 'refs'
 REFSDIR_TAGS = 'tags'
 REFSDIR_HEADS = 'heads'
 INDEX_FILENAME = "index"
 COMMONDIR = 'commondir'
 GITDIR = 'gitdir'
 WORKTREES = 'worktrees'
 
 BASE_DIRECTORIES = [
     ["branches"],
     [REFSDIR],
     [REFSDIR, REFSDIR_TAGS],
     [REFSDIR, REFSDIR_HEADS],
     ["hooks"],
     ["info"]
     ]
 
 DEFAULT_REF = b'refs/heads/master'
 
 
 class InvalidUserIdentity(Exception):
     """User identity is not of the format 'user <email>'"""
 
     def __init__(self, identity):
         # Keep the offending identity available to whoever catches this.
         self.identity = identity
 
 
 def check_user_identity(identity):
     """Verify that a user identity is formatted correctly.
 
     The identity must contain ``b' <'``, with a ``b'>'`` somewhere after it.
 
     :param identity: User identity bytestring
     :raise InvalidUserIdentity: Raised when identity is invalid
     """
     try:
         _, remainder = identity.split(b' <', 1)
     except ValueError:
         raise InvalidUserIdentity(identity)
     if b'>' in remainder:
         return
     raise InvalidUserIdentity(identity)
 
 
 def parse_graftpoints(graftpoints):
     """Convert a list of graftpoints into a dict
 
     :param graftpoints: Iterator of graftpoint lines
     :return: Dictionary mapping each commit to its list of graft parents
 
     Each line is formatted as:
         <commit sha1> <parent sha1> [<parent sha1>]*
 
     Resulting dictionary is:
         <commit sha1>: [<parent sha1>*]
 
     Lines that are empty or contain only whitespace are skipped. Every sha
     is validated with ``check_hexsha``.
 
     https://git.wiki.kernel.org/index.php/GraftPoint
     """
     grafts = {}
     for line in graftpoints:
         fields = line.split()
         if not fields:
             # Blank line: nothing to record (and no fields[0] to index).
             continue
 
         commit = fields[0]
         parents = fields[1:]
 
         for sha in [commit] + parents:
             check_hexsha(sha, 'Invalid graftpoint')
 
         grafts[commit] = parents
     return grafts
 
 
 def serialize_graftpoints(graftpoints):
     """Convert a dictionary of grafts into a bytestring
 
     The graft dictionary is:
         <commit sha1>: [<parent sha1>*]
 
     Each line is formatted as:
         <commit sha1> <parent sha1> [<parent sha1>]*
 
     Lines are joined with newlines; there is no trailing newline.
 
     https://git.wiki.kernel.org/index.php/GraftPoint
 
     """
     return b'\n'.join(
         (commit + b' ' + b' '.join(parents)) if parents else commit
         for commit, parents in graftpoints.items())
 
 
 class BaseRepo(object):
     """Base class for a git repository.
 
     :ivar object_store: Dictionary-like object for accessing
         the objects
     :ivar refs: Dictionary-like object with the refs in this
         repository
     """
 
     def __init__(self, object_store, refs):
         """Open a repository.
 
         This shouldn't be called directly, but rather through one of the
         base classes, such as MemoryRepo or Repo.
 
         :param object_store: Object store to use
         :param refs: Refs container to use
         """
         self.object_store = object_store
         self.refs = refs
 
         self._graftpoints = {}
         self.hooks = {}
 
     def _determine_file_mode(self):
         """Probe the file-system to determine whether permissions can be trusted.
 
         :return: True if permissions can be trusted, False otherwise.
         :raise NotImplementedError: always in this base class
         """
         raise NotImplementedError(self._determine_file_mode)
 
     def _init_files(self, bare):
         """Initialize a default set of named files.
 
         Writes 'description', 'config' and 'info/exclude' through
         ``_put_named_file``.
 
         :param bare: Value stored as ``core.bare`` in the generated config
         """
         from dulwich.config import ConfigFile
         self._put_named_file('description', b"Unnamed repository")
         config = ConfigFile()
         config.set("core", "repositoryformatversion", "0")
         trust_filemode = True if self._determine_file_mode() else False
         config.set("core", "filemode", trust_filemode)
 
         config.set("core", "bare", bare)
         config.set("core", "logallrefupdates", True)
         buf = BytesIO()
         config.write_to_file(buf)
         self._put_named_file('config', buf.getvalue())
         self._put_named_file(os.path.join('info', 'exclude'), b'')
 
     def get_named_file(self, path):
         """Get a file from the control dir with a specific name.
 
         Although the filename should be interpreted as a filename relative to
         the control dir in a disk-based Repo, the object returned need not be
         pointing to a file in that location.
 
         :param path: The path to the file, relative to the control dir.
         :return: An open file object, or None if the file does not exist.
         :raise NotImplementedError: always in this base class
         """
         raise NotImplementedError(self.get_named_file)
 
     def _put_named_file(self, path, contents):
         """Write a file to the control dir with the given name and contents.
 
         :param path: The path to the file, relative to the control dir.
         :param contents: A string to write to the file.
         :raise NotImplementedError: always in this base class
         """
         raise NotImplementedError(self._put_named_file)
 
     def _del_named_file(self, path):
         """Delete a file in the control directory with the given name.
 
         :param path: Name of the file to delete
         :raise NotImplementedError: always in this base class
         """
         raise NotImplementedError(self._del_named_file)
 
     def open_index(self):
         """Open the index for this repository.
 
         :raise NoIndexPresent: If no index is present
         :raise NotImplementedError: always in this base class
         :return: The matching `Index`
         """
         raise NotImplementedError(self.open_index)
 
     def fetch(self, target, determine_wants=None, progress=None, depth=None):
         """Fetch objects into another repository.
 
         :param target: The target repository
         :param determine_wants: Optional function to determine what refs to
             fetch.
         :param progress: Optional progress function
         :param depth: Optional shallow fetch depth
         :return: The local refs
         """
         if determine_wants is None:
             determine_wants = target.object_store.determine_wants_all
         count, pack_data = self.fetch_pack_data(
                 determine_wants, target.get_graph_walker(), progress=progress,
                 depth=depth)
         target.object_store.add_pack_data(count, pack_data, progress)
         return self.get_refs()
 
     def fetch_pack_data(self, determine_wants, graph_walker, progress,
                         get_tagged=None, depth=None):
         """Fetch the pack data required for a set of revisions.
 
         :param determine_wants: Function that takes a dictionary with heads
             and returns the list of heads to fetch.
         :param graph_walker: Object that can iterate over the list of revisions
             to fetch and has an "ack" method that will be called to acknowledge
             that a revision is present.
         :param progress: Simple progress function that will be called with
             updated progress strings.
         :param get_tagged: Function that returns a dict of pointed-to sha ->
             tag sha for including tags.
         :param depth: Shallow fetch depth
         :return: count and iterator over pack data
         """
         # TODO(jelmer): Fetch pack data directly, don't create objects first.
         return pack_objects_to_data(
             self.fetch_objects(
                 determine_wants, graph_walker, progress, get_tagged,
                 depth=depth))
 
     def fetch_objects(self, determine_wants, graph_walker, progress,
                       get_tagged=None, depth=None):
         """Fetch the missing objects required for a set of revisions.
 
         :param determine_wants: Function that takes a dictionary with heads
             and returns the list of heads to fetch.
         :param graph_walker: Object that can iterate over the list of revisions
             to fetch and has an "ack" method that will be called to acknowledge
             that a revision is present.
         :param progress: Simple progress function that will be called with
             updated progress strings.
         :param get_tagged: Function that returns a dict of pointed-to sha ->
             tag sha for including tags.
         :param depth: Shallow fetch depth
         :return: iterator over objects, with __len__ implemented; ``[]`` when
             nothing is wanted, or ``None`` when nothing is wanted but the
             graph walker carries shallow/unshallow commits
         :raise NotImplementedError: if ``depth`` is neither None nor 0
         :raise TypeError: if ``determine_wants`` does not return a list
         """
         if depth not in (None, 0):
             raise NotImplementedError("depth not supported yet")
 
         # Build the ref dictionary handed to determine_wants, skipping refs
         # whose target object is not in the object store.
         refs = {}
         for ref, sha in self.get_refs().items():
             try:
                 obj = self.object_store[sha]
             except KeyError:
                 warnings.warn(
                     'ref %s points at non-present sha %s' % (
                         ref.decode('utf-8', 'replace'), sha.decode('ascii')),
                     UserWarning)
                 continue
             else:
                 # Tag objects get an extra entry, under the suffixed ref
                 # name, holding the sha of the object they point at.
                 if isinstance(obj, Tag):
                     refs[ref + ANNOTATED_TAG_SUFFIX] = obj.object[1]
                 refs[ref] = sha
 
         wants = determine_wants(refs)
         if not isinstance(wants, list):
             raise TypeError("determine_wants() did not return a list")
 
         # Graph walkers without these attributes are treated as having no
         # shallow/unshallow commits.
         shallows = getattr(graph_walker, 'shallow', frozenset())
         unshallows = getattr(graph_walker, 'unshallow', frozenset())
 
         if wants == []:
             # TODO(dborowitz): find a way to short-circuit that doesn't change
             # this interface.
 
             if shallows or unshallows:
                 # Do not send a pack in shallow short-circuit path
                 return None
 
             return []
 
         # If the graph walker is set up with an implementation that can
         # ACK/NAK to the wire, it will write data to the client through
         # this call as a side-effect.
         haves = self.object_store.find_common_revisions(graph_walker)
 
         # Deal with shallow requests separately because the haves do
         # not reflect what objects are missing
         if shallows or unshallows:
             # TODO: filter the haves commits from iter_shas. the specific
             # commits aren't missing.
             haves = []
 
         def get_parents(commit):
             # Shallow commits are reported as having no parents.
             if commit.id in shallows:
                 return []
             return self.get_parents(commit.id, commit)
 
         return self.object_store.iter_shas(
           self.object_store.find_missing_objects(
               haves, wants, progress,
               get_tagged,
               get_parents=get_parents))
 
     def get_graph_walker(self, heads=None):
         """Retrieve a graph walker.
 
         A graph walker is used by a remote repository (or proxy)
         to find out which objects are present in this repository.
 
         :param heads: Repository heads to use (optional; defaults to the
             values of the refs below ``refs/heads``)
         :return: A graph walker object
         """
         if heads is None:
             heads = self.refs.as_dict(b'refs/heads').values()
         shallow = self.get_shallow()
         return ObjectStoreGraphWalker(
             heads, self.get_parents, shallow=shallow)
 
     def get_refs(self):
         """Get dictionary with all refs.
 
         Delegates to ``self.refs.as_dict()``.
 
         :return: A ``dict`` mapping ref names to SHA1s
         """
         return self.refs.as_dict()
 
     def head(self):
         """Return the SHA1 pointed at by HEAD.
 
         Looks up ``b'HEAD'`` in ``self.refs``.
         """
         return self.refs[b'HEAD']
 
     def _get_object(self, sha, cls):
         assert len(sha) in (20, 40)
         ret = self.get_object(sha)
         if not isinstance(ret, cls):
             if cls is Commit:
                 raise NotCommitError(ret)
             elif cls is Blob:
                 raise NotBlobError(ret)
             elif cls is Tree:
                 raise NotTreeError(ret)
             elif cls is Tag:
                 raise NotTagError(ret)
             else:
                 raise Exception("Type invalid: %r != %r" % (
                   ret.type_name, cls.type_name))
         return ret
 
     def get_object(self, sha):
         """Retrieve the object with the specified SHA.
 
         Looks the SHA up in ``self.object_store``.
 
         :param sha: SHA to retrieve
         :return: A ShaFile object
         :raise KeyError: when the object can not be found
         """
         return self.object_store[sha]
 
     def get_parents(self, sha, commit=None):
         """Retrieve the parents of a specific commit.
 
         If the specific commit is a graftpoint, the graft parents
         will be returned instead.
 
         :param sha: SHA of the commit for which to retrieve the parents
         :param commit: Optional commit matching the sha
         :return: List of parents
         """
 
         try:
             return self._graftpoints[sha]
         except KeyError:
             if commit is None:
                 commit = self[sha]
             return commit.parents
 
     def get_config(self):
         """Retrieve the config object.
 
         :return: `ConfigFile` object for the ``.git/config`` file.
         :raise NotImplementedError: always in this base class
         """
         raise NotImplementedError(self.get_config)
 
     def get_description(self):
         """Retrieve the description for this repository.
 
         :return: String with the description of the repository
             as set by the user.
         :raise NotImplementedError: always in this base class
         """
         raise NotImplementedError(self.get_description)
 
     def set_description(self, description):
         """Set the description for this repository.
 
         :param description: Text to set as description for this repository.
         :raise NotImplementedError: always in this base class
         """
         raise NotImplementedError(self.set_description)
 
     def get_config_stack(self):
         """Return a config stack for this repository.
 
         This stack accesses the configuration for both this repository
         itself (.git/config) and the global configuration, which usually
         lives in ~/.gitconfig.
 
         The repository's own config comes first in the stack and is the
         writable backend.
 
         :return: `Config` instance for this repository
         """
         from dulwich.config import StackedConfig
         local_config = self.get_config()
         backends = [local_config] + StackedConfig.default_backends()
         return StackedConfig(backends, writable=local_config)
 
     def get_shallow(self):
         """Read the shallow commits recorded for this repository.
 
         Each line of the ``shallow`` named file, stripped of surrounding
         whitespace, is one entry.
 
         :return: Set of shallow commits (empty when the file is absent).
         """
         shallow_file = self.get_named_file('shallow')
         if shallow_file is None:
             return set()
         with shallow_file:
             return {line.strip() for line in shallow_file}
 
     def update_shallow(self, new_shallow, new_unshallow):
         """Rewrite the ``shallow`` file after a change in shallow commits.
 
         :param new_shallow: Newly shallow objects (may be empty or None)
         :param new_unshallow: Newly no longer shallow objects (may be
             empty or None)
         """
         current = self.get_shallow()
         if new_shallow:
             current |= set(new_shallow)
         if new_unshallow:
             current -= set(new_unshallow)
         # One SHA per line, each terminated by a newline.
         payload = b''.join(sha + b'\n' for sha in current)
         self._put_named_file('shallow', payload)
 
     def get_peeled(self, ref):
         """Resolve a ref to its fully-peeled SHA1.
 
         The refs container is asked for a cached peeled value first; only
         when it has none is the object store asked to peel the ref's
         target.
 
         :param ref: The refname to peel.
         :return: The fully-peeled SHA1 of a tag object, after peeling all
             intermediate tags; if the original ref does not point to a tag,
             this will equal the original SHA1.
         """
         peeled = self.refs.get_peeled(ref)
         if peeled is None:
             peeled = self.object_store.peel_sha(self.refs[ref]).id
         return peeled
 
     def get_walker(self, include=None, *args, **kwargs):
         """Obtain a walker for this repository.
 
         :param include: Iterable of SHAs of commits to include along with their
             ancestors. Defaults to [HEAD]. A single SHA given as a
             bytestring (or ``str``) is accepted and treated as a one-element
             list.
         :param exclude: Iterable of SHAs of commits to exclude along with their
             ancestors, overriding includes.
         :param order: ORDER_* constant specifying the order of results.
             Anything other than ORDER_DATE may result in O(n) memory usage.
         :param reverse: If True, reverse the order of output, requiring O(n)
             memory.
         :param max_entries: The maximum number of entries to yield, or None for
             no limit.
         :param paths: Iterable of file or subtree paths to show entries for.
         :param rename_detector: diff.RenameDetector object for detecting
             renames.
         :param follow: If True, follow path across renames/copies. Forces a
             default rename_detector.
         :param since: Timestamp to list commits after.
         :param until: Timestamp to list commits before.
         :param queue_cls: A class to use for a queue of commits, supporting the
             iterator protocol. The constructor takes a single argument, the
             Walker.
         :return: A `Walker` object
         """
         from dulwich.walk import Walker
         if include is None:
             include = [self.head()]
         elif isinstance(include, (bytes, str)):
             # A lone SHA must be wrapped: on Python 3 SHAs are bytes, and
             # iterating a bytes object would yield integers, not SHAs.
             include = [include]
 
         # Route parent lookups through get_parents().
         kwargs['get_parents'] = lambda commit: self.get_parents(
             commit.id, commit)
 
         return Walker(self.object_store, include, *args, **kwargs)
 
     def __getitem__(self, name):
         """Look up a Git object by SHA1 or by ref name.
 
         Names that are 20 or 40 bytes long are first tried as object ids;
         if that lookup fails the name is resolved as a ref.
 
         :param name: A Git object SHA1 or a ref name
         :return: A `ShaFile` object, such as a Commit or Blob
         :raise TypeError: when ``name`` is not a bytestring
         :raise KeyError: when the specified ref or object does not exist
         """
         if not isinstance(name, bytes):
             type_name = type(name).__name__
             raise TypeError(
                 "'name' must be bytestring, not %.80s" % type_name)
         looks_like_sha = len(name) == 20 or len(name) == 40
         if looks_like_sha:
             try:
                 return self.object_store[name]
             except (KeyError, ValueError):
                 # Not a known object id; fall through to the ref lookup.
                 pass
         try:
             target = self.refs[name]
             return self.object_store[target]
         except RefFormatError:
             raise KeyError(name)
 
     def __contains__(self, name):
         """Tell whether a Git object or ref with this name exists.
 
         The object store is only consulted for names that are 20 or 40
         bytes long; every name is checked against the refs.
 
         :param name: Git object SHA1 or ref name
         """
         if len(name) in (20, 40) and name in self.object_store:
             return True
         return name in self.refs
 
     def __setitem__(self, name, value):
         """Point a ref at an object.
 
         :param name: ref name; must be ``HEAD`` or start with ``refs/``
         :param value: Ref value - either a ShaFile object, or a hex sha
         :raise ValueError: when ``name`` is not an accepted ref name
         :raise TypeError: when ``value`` is neither a ShaFile nor bytes
         """
         if not (name.startswith(b"refs/") or name == b'HEAD'):
             raise ValueError(name)
         if isinstance(value, ShaFile):
             self.refs[name] = value.id
         elif isinstance(value, bytes):
             self.refs[name] = value
         else:
             raise TypeError(value)
 
     def __delitem__(self, name):
         """Delete a ref.
 
         :param name: Name of the ref to remove; must be ``HEAD`` or start
             with ``refs/``
         :raise ValueError: when ``name`` is not an accepted ref name
         """
         if not (name.startswith(b"refs/") or name == b"HEAD"):
             raise ValueError(name)
         del self.refs[name]
 
     def _get_user_identity(self, config):
         """Determine the identity to use for new commits.
 
         Name and e-mail are each taken from the first source that provides
         them: the ``GIT_COMMITTER_NAME`` / ``GIT_COMMITTER_EMAIL``
         environment variables, then ``user.name`` / ``user.email`` in
         ``config``, then the login name (and ``login@hostname`` for the
         e-mail).
 
         :param config: Config object queried with
             ``config.get(("user", ), ...)``; a ``KeyError`` is treated as
             "not configured"
         :return: Bytestring of the form ``b"Name <email>"``
         """
         encoding = sys.getdefaultencoding()
 
         def _env_bytes(variable):
             # On Python 3 environment values are text; the identity is
             # assembled from bytes, so encode them up front.
             value = os.environ.get(variable)
             if value is not None and not isinstance(value, bytes):
                 value = value.encode(encoding)
             return value
 
         user = _env_bytes("GIT_COMMITTER_NAME")
         email = _env_bytes("GIT_COMMITTER_EMAIL")
         if user is None:
             try:
                 user = config.get(("user", ), "name")
             except KeyError:
                 user = None
         if email is None:
             try:
                 email = config.get(("user", ), "email")
             except KeyError:
                 email = None
         if user is None:
             import getpass
             user = getpass.getuser().encode(encoding)
         if email is None:
             import getpass
             import socket
             email = ("{}@{}".format(getpass.getuser(), socket.gethostname())
                      .encode(encoding))
         return (user + b" <" + email + b">")
 
     def _add_graftpoints(self, updated_graftpoints):
         """Register new graftpoints or replace existing ones.
 
         Every commit sha and every parent sha is passed through
         ``check_hexsha`` before anything is stored.
 
         :param updated_graftpoints: Dict of commit shas to list of parent shas
         """
         # Simple validation
         for commit_sha, parent_shas in updated_graftpoints.items():
             candidates = [commit_sha] + parent_shas
             for candidate in candidates:
                 check_hexsha(candidate, 'Invalid graftpoint')
 
         self._graftpoints.update(updated_graftpoints)
 
     def _remove_graftpoints(self, to_remove=()):
         """Remove graftpoints.
 
         :param to_remove: Iterable of commit shas whose graftpoints should
             be dropped (defaults to nothing)
         :raise KeyError: when a sha has no registered graftpoint
         """
         # The default is an immutable empty tuple rather than a shared
         # mutable list.
         for sha in to_remove:
             del self._graftpoints[sha]
 
     def _read_heads(self, name):
         """Read the non-blank, stripped lines of a named file.
 
         :param name: Name passed to ``get_named_file``
         :return: List of stripped lines; empty when the file is absent
         """
         heads_file = self.get_named_file(name)
         if heads_file is None:
             return []
         heads = []
         with heads_file:
             for raw_line in heads_file.readlines():
                 head = raw_line.strip()
                 if head:
                     heads.append(head)
         return heads
 
     def do_commit(self, message=None, committer=None,
                   author=None, commit_timestamp=None,
                   commit_timezone=None, author_timestamp=None,
                   author_timezone=None, tree=None, encoding=None,
                   ref=b'HEAD', merge_heads=None):
         """Create a new commit.
 
         The ``pre-commit`` hook runs before the commit is populated, the
         ``commit-msg`` hook may replace the message, and the ``post-commit``
         hook runs after the ref has been updated; a failing post-commit
         hook only produces a warning.
 
         :param message: Commit message
         :param committer: Committer fullname
         :param author: Author fullname (defaults to committer)
         :param commit_timestamp: Commit timestamp (defaults to now)
         :param commit_timezone: Commit timestamp timezone (defaults to GMT)
         :param author_timestamp: Author timestamp (defaults to commit
             timestamp)
         :param author_timezone: Author timestamp timezone
             (defaults to commit timestamp timezone)
         :param tree: SHA1 of the tree root to use (if not specified the
             current index will be committed).
         :param encoding: Encoding
         :param ref: Optional ref to commit to (defaults to current branch).
             When None, a dangling commit is created and no ref is updated.
         :param merge_heads: Merge heads (defaults to .git/MERGE_HEADS)
         :return: New commit SHA1
         :raise ValueError: when ``tree`` is not 40 bytes long or no message
             is given
         :raise CommitError: when the pre-commit or commit-msg hook fails,
             or when ``ref`` changed while the commit was being created
         """
         import time
         c = Commit()
         if tree is None:
             # No explicit tree: commit whatever the index currently holds.
             index = self.open_index()
             c.tree = index.commit(self.object_store)
         else:
             if len(tree) != 40:
                 raise ValueError("tree must be a 40-byte hex sha string")
             c.tree = tree
 
         # A failing pre-commit hook aborts the commit.
         try:
             self.hooks['pre-commit'].execute()
         except HookError as e:
             raise CommitError(e)
         except KeyError:  # no hook defined, silent fallthrough
             pass
 
         config = self.get_config_stack()
         if merge_heads is None:
             merge_heads = self._read_heads('MERGE_HEADS')
         if committer is None:
             committer = self._get_user_identity(config)
         check_user_identity(committer)
         c.committer = committer
         if commit_timestamp is None:
             # FIXME: Support GIT_COMMITTER_DATE environment variable
             commit_timestamp = time.time()
         c.commit_time = int(commit_timestamp)
         if commit_timezone is None:
             # FIXME: Use current user timezone rather than UTC
             commit_timezone = 0
         c.commit_timezone = commit_timezone
         if author is None:
             # FIXME: Support GIT_AUTHOR_NAME/GIT_AUTHOR_EMAIL environment
             # variables
             author = committer
         c.author = author
         check_user_identity(author)
         if author_timestamp is None:
             # FIXME: Support GIT_AUTHOR_DATE environment variable
             author_timestamp = commit_timestamp
         c.author_time = int(author_timestamp)
         if author_timezone is None:
             author_timezone = commit_timezone
         c.author_timezone = author_timezone
         if encoding is None:
             try:
                 encoding = config.get(('i18n', ), 'commitEncoding')
             except KeyError:
                 pass  # No dice
         if encoding is not None:
             c.encoding = encoding
         if message is None:
             # FIXME: Try to read commit message from .git/MERGE_MSG
             raise ValueError("No commit message specified")
 
         # The commit-msg hook may return a replacement message; a None
         # result keeps the caller's message.
         try:
             c.message = self.hooks['commit-msg'].execute(message)
             if c.message is None:
                 c.message = message
         except HookError as e:
             raise CommitError(e)
         except KeyError:  # no hook defined, message not modified
             c.message = message
 
         if ref is None:
             # Create a dangling commit
             c.parents = merge_heads
             self.object_store.add_object(c)
         else:
             try:
                 # Existing ref: the old head becomes the first parent and
                 # the ref is only moved if it still equals old_head.
                 old_head = self.refs[ref]
                 c.parents = [old_head] + merge_heads
                 self.object_store.add_object(c)
                 ok = self.refs.set_if_equals(
                     ref, old_head, c.id, message=b"commit: " + message,
                     committer=committer, timestamp=commit_timestamp,
                     timezone=commit_timezone)
             except KeyError:
                 # The ref does not exist yet: only the merge heads are
                 # parents and the ref is created if still absent.
                 c.parents = merge_heads
                 self.object_store.add_object(c)
                 ok = self.refs.add_if_new(
                         ref, c.id, message=b"commit: " + message,
                         committer=committer, timestamp=commit_timestamp,
                         timezone=commit_timezone)
             if not ok:
                 # Fail if the atomic compare-and-swap failed, leaving the
                 # commit and all its objects as garbage.
                 raise CommitError("%s changed during commit" % (ref,))
 
         # The recorded merge heads have been consumed by this commit.
         self._del_named_file('MERGE_HEADS')
 
         try:
             self.hooks['post-commit'].execute()
         except HookError as e:  # silent failure
             warnings.warn("post-commit hook failed: %s" % e, UserWarning)
         except KeyError:  # no hook defined, silent fallthrough
             pass
 
         return c.id
 
 
 def read_gitfile(f):
     """Parse a ``.git`` file and return the path it points at.
 
     The whole content is read; it has to begin with "gitdir: ". Trailing
     newline characters are removed from the returned path.
 
     :param f: File-like object to read from
     :return: A path
     :raise ValueError: when the content does not start with "gitdir: "
     """
     prefix = "gitdir: "
     contents = f.read()
     if contents.startswith(prefix):
         return contents[len(prefix):].rstrip("\n")
     raise ValueError("Expected file to start with 'gitdir: '")
 
 
 class Repo(BaseRepo):
     """A git repository backed by local disk.
 
     To open an existing repository, call the constructor with
     the path of the repository.
 
     To create a new repository, use the Repo.init class method.
     """
 
     def __init__(self, root):
         """Open the repository located at ``root``.
 
         :param root: Path of the repository
         :raise NotGitRepository: when ``root`` matches none of the layouts
             probed below
         """
         hidden_path = os.path.join(root, CONTROLDIR)
         if os.path.isdir(os.path.join(hidden_path, OBJECTDIR)):
             # Control directory inside root: non-bare repository.
             self.bare = False
             self._controldir = hidden_path
         elif (os.path.isdir(os.path.join(root, OBJECTDIR)) and
               os.path.isdir(os.path.join(root, REFSDIR))):
             # Objects and refs directly under root: bare repository.
             self.bare = True
             self._controldir = root
         elif os.path.isfile(hidden_path):
             # The control entry is a file: read the control directory
             # location from it with read_gitfile().
             self.bare = False
             with open(hidden_path, 'r') as f:
                 path = read_gitfile(f)
             self.bare = False
             self._controldir = os.path.join(root, path)
         else:
             raise NotGitRepository(
                 "No git repository was found at %(path)s" % dict(path=root)
             )
         # An optional COMMONDIR file names the common directory, resolved
         # against the control directory.
         commondir = self.get_named_file(COMMONDIR)
         if commondir is not None:
             with commondir:
                 self._commondir = os.path.join(
                     self.controldir(),
                     commondir.read().rstrip(b"\r\n").decode(
                         sys.getfilesystemencoding()))
         else:
             self._commondir = self._controldir
         self.path = root
         # Objects and refs are rooted at the common directory.
         object_store = DiskObjectStore(
             os.path.join(self.commondir(), OBJECTDIR))
         refs = DiskRefsContainer(self.commondir(), self._controldir,
                                  logger=self._write_reflog)
         BaseRepo.__init__(self, object_store, refs)
 
         # Graftpoints are loaded from info/grafts and from the shallow
         # file, both looked up in the common directory.
         self._graftpoints = {}
         graft_file = self.get_named_file(os.path.join("info", "grafts"),
                                          basedir=self.commondir())
         if graft_file:
             with graft_file:
                 self._graftpoints.update(parse_graftpoints(graft_file))
         graft_file = self.get_named_file("shallow",
                                          basedir=self.commondir())
         if graft_file:
             with graft_file:
                 self._graftpoints.update(parse_graftpoints(graft_file))
 
         self.hooks['pre-commit'] = PreCommitShellHook(self.controldir())
         self.hooks['commit-msg'] = CommitMsgShellHook(self.controldir())
         self.hooks['post-commit'] = PostCommitShellHook(self.controldir())
 
+        # Line ending convert filters
+        # TODO: Set them based on configuration
+        self.read_filter = None
+        self.write_filter = None
+
     def _write_reflog(self, ref, old_sha, new_sha, committer, timestamp,
                       timezone, message):
         """Append one entry to the reflog of ``ref``.
 
         The log lives at ``logs/<ref>`` under the control directory; the
         parent directories are created on demand. Missing committer,
         timestamp and timezone are filled in with the configured identity,
         the current time and 0 respectively.
 
         :param ref: Name of the ref (bytestring)
         :param old_sha: Previous value of the ref
         :param new_sha: New value of the ref
         :param committer: Committer identity, or None
         :param timestamp: Timestamp of the change, or None
         :param timezone: Timezone offset, or None
         :param message: Reflog message
         """
         from .reflog import format_reflog_line
         ref_name = ref.decode(sys.getfilesystemencoding())
         log_path = os.path.join(self.controldir(), 'logs', ref_name)
         try:
             os.makedirs(os.path.dirname(log_path))
         except OSError as e:
             # An already existing directory is fine.
             if e.errno != errno.EEXIST:
                 raise
         if committer is None:
             committer = self._get_user_identity(self.get_config_stack())
         check_user_identity(committer)
         if timestamp is None:
             timestamp = int(time.time())
         if timezone is None:
             timezone = 0  # FIXME
         entry = format_reflog_line(old_sha, new_sha, committer,
                                    timestamp, timezone, message)
         with open(log_path, 'ab') as log_file:
             log_file.write(entry + b'\n')
 
     @classmethod
     def discover(cls, start='.'):
         """Find the repository that contains a directory.
 
         Starting at ``start`` and walking up one directory at a time, the
         first directory that can be opened as a repository is returned.
 
         :param start: The directory to start discovery from (defaults to '.')
         :raise NotGitRepository: when no directory up to the root can be
             opened
         """
         candidate = os.path.abspath(start)
         while True:
             try:
                 return cls(candidate)
             except NotGitRepository:
                 candidate, tail = os.path.split(candidate)
                 if not tail:
                     # Nothing left to strip: the root has been tried.
                     break
         raise NotGitRepository(
             "No git repository was found at %(path)s" % dict(path=start)
         )
 
     def controldir(self):
         """Return the path of the control directory.
 
         This is the value stored in ``self._controldir``.
         """
         return self._controldir
 
     def commondir(self):
         """Return the path of the common directory.
 
         For a main working tree, it is identical to controldir().
 
         For a linked working tree, it is the control directory of the
         main working tree.
 
         This is the value stored in ``self._commondir``."""
 
         return self._commondir
 
     def _determine_file_mode(self):
         """Probe the file-system to determine whether permissions can be trusted.
 
         A temporary ``.probe-permissions`` file is created in ``self.path``,
         its user-executable bit is flipped, and the mode is read back. The
         probe file is removed again even when the probing itself fails.
 
         :return: True if permissions can be trusted, False otherwise.
         """
         fname = os.path.join(self.path, '.probe-permissions')
         with open(fname, 'w') as f:
             f.write('')
 
         try:
             st1 = os.lstat(fname)
             os.chmod(fname, st1.st_mode ^ stat.S_IXUSR)
             st2 = os.lstat(fname)
         finally:
             # Never leave the probe file behind in the working tree.
             os.unlink(fname)
 
         # Trust permissions only if the flip was recorded and left the
         # executable bit set.
         mode_differs = st1.st_mode != st2.st_mode
         st2_has_exec = (st2.st_mode & stat.S_IXUSR) != 0
 
         return mode_differs and st2_has_exec
 
     def _put_named_file(self, path, contents):
         """Store ``contents`` in a file below the control directory.
 
         Leading path separators are stripped from ``path`` before it is
         joined to the control directory.
 
         :param path: The path to the file, relative to the control dir.
         :param contents: A string to write to the file.
         """
         relative = path.lstrip(os.path.sep)
         target = os.path.join(self.controldir(), relative)
         with GitFile(target, 'wb') as named_file:
             named_file.write(contents)
 
     def _del_named_file(self, path):
         """Delete a file below the control directory, if it exists.
 
         :param path: The path to the file, relative to the control dir.
         """
         try:
             os.unlink(os.path.join(self.controldir(), path))
         except (IOError, OSError) as e:
             # A file that is already gone is not an error.
             if e.errno != errno.ENOENT:
                 raise
 
     def get_named_file(self, path, basedir=None):
         """Open a named file from the control dir for binary reading.
 
         Although the filename should be interpreted as a filename relative to
         the control dir in a disk-based Repo, the object returned need not be
         pointing to a file in that location.
 
         :param path: The path to the file, relative to the control dir.
         :param basedir: Optional argument that specifies an alternative to the
             control dir.
         :return: An open file object, or None if the file does not exist.
         """
         # TODO(dborowitz): sanitize filenames, since this is used directly by
         # the dumb web serving code.
         base = self.controldir() if basedir is None else basedir
         relative = path.lstrip(os.path.sep)
         try:
             return open(os.path.join(base, relative), 'rb')
         except (IOError, OSError) as e:
             if e.errno != errno.ENOENT:
                 raise
             return None
 
     def index_path(self):
         """Return path to the index file.
 
         The path is ``INDEX_FILENAME`` joined to the control directory.
         """
         return os.path.join(self.controldir(), INDEX_FILENAME)
 
     def open_index(self):
         """Return the `Index` stored at ``index_path()``.
 
         :raise NoIndexPresent: If no index is present
         :return: The matching `Index`
         """
         from dulwich.index import Index
         if self.has_index():
             return Index(self.index_path())
         raise NoIndexPresent()
 
     def has_index(self):
         """Check if an index is present.
 
         :return: True for a non-bare repository, False for a bare one; the
             file system is not consulted.
         """
         # Bare repos must never have index files; non-bare repos may have a
         # missing index file, which is treated as empty.
         return not self.bare
 
     def stage(self, fs_paths):
         """Bring the index in line with the working tree for some paths.
 
         Regular entries are stored as blobs and recorded in the index;
         paths that no longer exist, or that are directories, are dropped
         from the index. The index is written back once at the end.
 
         :param fs_paths: List of paths, relative to the repository path
             (a single path is accepted as well)
         :raise ValueError: when a path is absolute
         """
 
         root_path_bytes = self.path.encode(sys.getfilesystemencoding())
 
         if not isinstance(fs_paths, list):
             fs_paths = [fs_paths]
         from dulwich.index import (
             blob_from_path_and_stat,
             index_entry_from_stat,
             _fs_to_tree_path,
             )
         index = self.open_index()
 
         def drop_entry(key):
             # Remove ``key`` from the index; a missing entry is fine.
             try:
                 del index[key]
             except KeyError:
                 pass
 
         for fs_path in fs_paths:
             if not isinstance(fs_path, bytes):
                 fs_path = fs_path.encode(sys.getfilesystemencoding())
             if os.path.isabs(fs_path):
                 raise ValueError(
                     "path %r should be relative to "
                     "repository root, not absolute" % fs_path)
             tree_path = _fs_to_tree_path(fs_path)
             full_path = os.path.join(root_path_bytes, fs_path)
             try:
                 st = os.lstat(full_path)
             except OSError:
                 # File no longer exists
                 drop_entry(tree_path)
                 continue
             if stat.S_ISDIR(st.st_mode):
                 drop_entry(tree_path)
                 continue
             blob = blob_from_path_and_stat(full_path, st)
             self.object_store.add_object(blob)
             index[tree_path] = index_entry_from_stat(st, blob.id, 0)
         index.write()
 
     def clone(self, target_path, mkdir=True, bare=False,
               origin=b"origin", checkout=None):
         """Clone this repository.
 
         :param target_path: Target path
         :param mkdir: Create the target directory
         :param bare: Whether to create a bare repository
         :param origin: Base name for refs in target repository
             cloned from this repository
         :param checkout: Whether to check out HEAD in the target; None
             means "check out unless bare"
         :return: Created repository as `Repo`
         :raise ValueError: when both ``bare`` and ``checkout`` are requested
         """
         if not bare:
             target = self.init(target_path, mkdir=mkdir)
         else:
             if checkout:
                 raise ValueError("checkout and bare are incompatible")
             target = self.init_bare(target_path, mkdir=mkdir)
         self.fetch(target)
         encoded_path = self.path
         if not isinstance(encoded_path, bytes):
             encoded_path = encoded_path.encode(sys.getfilesystemencoding())
         ref_message = b"clone: from " + encoded_path
         # Branches of this repository become remote-tracking refs under
         # refs/remotes/<origin>; tags are copied as-is.
         target.refs.import_refs(
             b'refs/remotes/' + origin, self.refs.as_dict(b'refs/heads'),
             message=ref_message)
         target.refs.import_refs(
             b'refs/tags', self.refs.as_dict(b'refs/tags'),
             message=ref_message)
         try:
             target.refs.add_if_new(
                     DEFAULT_REF, self.refs[DEFAULT_REF],
                     message=ref_message)
         except KeyError:
             # This repository has no DEFAULT_REF to copy.
             pass
         # NOTE(review): the remote section and fetch refspec below use the
         # literal name 'origin' and do not follow the ``origin`` argument
         # -- confirm whether that is intended.
         target_config = target.get_config()
         target_config.set(('remote', 'origin'), 'url', encoded_path)
         target_config.set(('remote', 'origin'), 'fetch',
                           '+refs/heads/*:refs/remotes/origin/*')
         target_config.write_to_path()
 
         # Update target head
         head_chain, head_sha = self.refs.follow(b'HEAD')
         if head_chain and head_sha is not None:
             target.refs.set_symbolic_ref(b'HEAD', head_chain[-1],
                                          message=ref_message)
             target[b'HEAD'] = head_sha
 
             if checkout is None:
                 checkout = (not bare)
             if checkout:
                 # Checkout HEAD to target dir
                 target.reset_index()
 
         return target
 
     def reset_index(self, tree=None):
         """Reset the index back to a specific tree.
 
         The ``core.filemode`` and ``core.protectNTFS`` settings of the
         repository config are honoured; both default according to whether
         ``os.name`` is ``"nt"``.
 
         :param tree: Tree SHA to reset to, None for current HEAD tree.
         :return: Whatever ``build_index_from_tree`` returns
         """
         from dulwich.index import (
             build_index_from_tree,
             validate_path_element_default,
             validate_path_element_ntfs,
             )
         if tree is None:
             tree = self[b'HEAD'].tree
         config = self.get_config()
         honor_filemode = config.get_boolean(
             b'core', b'filemode', os.name != "nt")
         # The setting is named "protectNTFS" within the "core" section;
         # repeating the section in the name would never match it.
         if config.get_boolean(b'core', b'protectNTFS', os.name == "nt"):
             validate_path_element = validate_path_element_ntfs
         else:
             validate_path_element = validate_path_element_default
         return build_index_from_tree(
             self.path, self.index_path(), self.object_store, tree,
             honor_filemode=honor_filemode,
             validate_path_element=validate_path_element)
 
     def get_config(self):
         """Load the repository's own configuration file.
 
         When the ``config`` file in the control directory does not exist,
         an empty `ConfigFile` bound to that path is returned instead.
 
         :return: `ConfigFile` object for the ``.git/config`` file.
         """
         from dulwich.config import ConfigFile
         config_path = os.path.join(self._controldir, 'config')
         try:
             config = ConfigFile.from_path(config_path)
         except (IOError, OSError) as e:
             if e.errno != errno.ENOENT:
                 raise
             config = ConfigFile()
             config.path = config_path
         return config
 
     def get_description(self):
         """Read the ``description`` file of this repository.
 
         :return: The raw content of the file, or None when the file does
             not exist.
         """
         description_path = os.path.join(self._controldir, 'description')
         try:
             with GitFile(description_path, 'rb') as description_file:
                 contents = description_file.read()
         except (IOError, OSError) as e:
             if e.errno != errno.ENOENT:
                 raise
             return None
         return contents
 
     def __repr__(self):
         """Return a debugging representation that includes ``self.path``."""
         return "<Repo at %r>" % self.path
 
     def set_description(self, description):
         """Set the description for this repository.
 
         The text is written to the ``description`` named file via
         ``_put_named_file``.
 
         :param description: Text to set as description for this repository.
         """
 
         self._put_named_file('description', description)
 
     @classmethod
     def _init_maybe_bare(cls, path, bare):
         """Create the on-disk skeleton of a repository and open it.
 
         :param path: Directory that becomes the control directory
         :param bare: Passed on to ``_init_files``
         :return: The opened repository
         """
         for parts in BASE_DIRECTORIES:
             os.mkdir(os.path.join(path, *parts))
         objects_path = os.path.join(path, OBJECTDIR)
         DiskObjectStore.init(objects_path)
         repo = cls(path)
         repo.refs.set_symbolic_ref(b'HEAD', DEFAULT_REF)
         repo._init_files(bare)
         return repo
 
     @classmethod
     def init(cls, path, mkdir=False):
         """Create a new non-bare repository.
 
         The control directory is created inside ``path`` and initialised,
         after which the repository is opened from ``path``.
 
         :param path: Path in which to create the repository
         :param mkdir: Whether to create the directory
         :return: `Repo` instance
         """
         if mkdir:
             os.mkdir(path)
         control_path = os.path.join(path, CONTROLDIR)
         os.mkdir(control_path)
         cls._init_maybe_bare(control_path, False)
         return cls(path)
 
     @classmethod
     def _init_new_working_directory(cls, path, main_repo, identifier=None,
                                     mkdir=False):
         """Set up an additional working tree for an existing repository.
 
         A ``gitdir:`` pointer file is written into ``path``; the matching
         control directory is created below the main repository's worktrees
         directory and populated with its gitdir, commondir and HEAD files.
         Finally the new working tree is opened and its index reset.
 
         :param path: Path in which to create the working tree.
         :param main_repo: Main repository to reference
         :param identifier: Worktree identifier (defaults to the basename of
             ``path``)
         :param mkdir: Whether to create the directory
         :return: `Repo` instance
         """
         if mkdir:
             os.mkdir(path)
         if identifier is None:
             identifier = os.path.basename(path)
         fs_encoding = sys.getfilesystemencoding()
         main_worktreesdir = os.path.join(main_repo.controldir(), WORKTREES)
         worktree_controldir = os.path.join(main_worktreesdir, identifier)
         gitdirfile = os.path.join(path, CONTROLDIR)
         pointer = b'gitdir: ' + worktree_controldir.encode(fs_encoding) + b'\n'
         with open(gitdirfile, 'wb') as f:
             f.write(pointer)
         # Create both directory levels, tolerating ones that already exist.
         for directory in (main_worktreesdir, worktree_controldir):
             try:
                 os.mkdir(directory)
             except OSError as e:
                 if e.errno != errno.EEXIST:
                     raise
         control_files = (
             (GITDIR, gitdirfile.encode(fs_encoding) + b'\n'),
             (COMMONDIR, b'../..\n'),
             )
         for filename, payload in control_files:
             with open(os.path.join(worktree_controldir, filename), 'wb') as f:
                 f.write(payload)
         with open(os.path.join(worktree_controldir, 'HEAD'), 'wb') as f:
             f.write(main_repo.head() + b'\n')
         worktree = cls(path)
         worktree.reset_index()
         return worktree
 
     @classmethod
     def init_bare(cls, path, mkdir=False):
         """Create a new bare repository.
 
         ``path`` should already exist and be an empty directory, unless
         ``mkdir`` is true, in which case it is created first.
 
         :param path: Path to create bare repository in
         :param mkdir: Whether to create the directory
         :return: a `Repo` instance
         """
         if mkdir:
             os.mkdir(path)
         return cls._init_maybe_bare(path, True)
 
     create = init_bare
 
     def close(self):
         """Close any files opened by this repository.
 
         Delegates to ``self.object_store.close()``.
         """
         self.object_store.close()
 
     def __enter__(self):
         """Enter a ``with`` block; the repository itself is the target."""
         return self
 
     def __exit__(self, exc_type, exc_val, exc_tb):
         """Leave a ``with`` block by calling ``close()``.
 
         The exception arguments are ignored and nothing is returned, so
         an exception raised inside the block is not suppressed.
         """
         self.close()
 
+    def get_blob_normalizer(self):
+        """Return a BlobNormalizer object.
+
+        The normalizer is constructed from this repository's config stack,
+        a git attributes mapping (currently always empty) and the
+        ``read_filter`` / ``write_filter`` attributes of this repository.
+        """
+        # TODO Parse the git attributes files
+        git_attributes = {}
+        return BlobNormalizer(self.get_config_stack(), git_attributes, self.read_filter, self.write_filter)
+
 
 class MemoryRepo(BaseRepo):
     """Repo that stores refs, objects, and named files in memory.
 
     MemoryRepos are always bare: they have no working tree and no index, since
     those have a stronger dependency on the filesystem.
     """
 
     def __init__(self):
         """Create an empty in-memory repository."""
         from dulwich.config import ConfigFile
         # Reflog entries are collected as argument tuples, in call order.
         self._reflog = []
         refs_container = DictRefsContainer({}, logger=self._append_reflog)
         BaseRepo.__init__(self, MemoryObjectStore(), refs_container)
         # Maps named-file path -> contents.
         self._named_files = {}
         self.bare = True
         self._config = ConfigFile()
         self._description = None
 
     def _append_reflog(self, *args):
         """Record a reflog entry; used as the refs container's logger."""
         self._reflog.append(args)
 
     def set_description(self, description):
         """Set the description for this repository.
 
         :param description: Text to set as description for this repository.
         """
         self._description = description
 
     def get_description(self):
         """Retrieve the description for this repository.
 
         :return: The value last passed to ``set_description``, or None.
         """
         return self._description
 
     def _determine_file_mode(self):
         """Probe the file-system to determine whether permissions can be trusted.
 
         No file system is involved here; the answer is derived from
         ``sys.platform`` alone.
 
         :return: True if permissions can be trusted, False otherwise.
         """
         return sys.platform != 'win32'
 
     def _put_named_file(self, path, contents):
         """Write a file to the control dir with the given name and contents.
 
         :param path: The path to the file, relative to the control dir.
         :param contents: A string to write to the file.
         """
         self._named_files[path] = contents
 
     def _del_named_file(self, path):
         """Forget a named file; a missing file is silently ignored.
 
         :param path: The path to the file, relative to the control dir.
         """
         try:
             del self._named_files[path]
         except KeyError:
             pass
 
     def get_named_file(self, path, basedir=None):
         """Get a file from the control dir with a specific name.
 
         Although the filename should be interpreted as a filename relative to
         the control dir in a disk-backed Repo, the object returned need not be
         pointing to a file in that location.
 
         :param path: The path to the file, relative to the control dir.
         :param basedir: Accepted for signature compatibility with
             ``Repo.get_named_file``; ignored, since all named files of an
             in-memory repository live in a single mapping.
         :return: An open file object, or None if the file does not exist.
         """
         contents = self._named_files.get(path, None)
         if contents is None:
             return None
         return BytesIO(contents)
 
     def open_index(self):
         """Fail to open index for this repo, since it is bare.
 
         :raise NoIndexPresent: Raised when no index is present
         """
         raise NoIndexPresent()
 
     def get_config(self):
         """Retrieve the config object.
 
         :return: `ConfigFile` object.
         """
         return self._config
 
     @classmethod
     def init_bare(cls, objects, refs):
         """Create a new bare repository in memory.
 
         :param objects: Objects for the new repository,
             as iterable
         :param refs: Refs as dictionary, mapping names
             to object SHA1s
         :return: The populated `MemoryRepo`
         """
         ret = cls()
         for obj in objects:
             ret.object_store.add_object(obj)
         for refname, sha in refs.items():
             ret.refs.add_if_new(refname, sha)
         ret._init_files(bare=True)
         return ret
diff --git a/dulwich/tests/test_porcelain.py b/dulwich/tests/test_porcelain.py
index feed11f7..3b7ce5ed 100644
--- a/dulwich/tests/test_porcelain.py
+++ b/dulwich/tests/test_porcelain.py
@@ -1,1576 +1,1626 @@
 # test_porcelain.py -- porcelain tests
 # Copyright (C) 2013 Jelmer Vernooij <jelmer@jelmer.uk>
 #
 # Dulwich is dual-licensed under the Apache License, Version 2.0 and the GNU
 # General Public License as public by the Free Software Foundation; version 2.0
 # or (at your option) any later version. You can redistribute it and/or
 # modify it under the terms of either of these two licenses.
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #
 # You should have received a copy of the licenses; if not, see
 # <http://www.gnu.org/licenses/> for a copy of the GNU General Public License
 # and <http://www.apache.org/licenses/LICENSE-2.0> for a copy of the Apache
 # License, Version 2.0.
 #
 
 """Tests for dulwich.porcelain."""
 
 from io import BytesIO
 try:
     from StringIO import StringIO
 except ImportError:
     from io import StringIO
 import os
 import shutil
 import tarfile
 import tempfile
 import time
 
 from dulwich import porcelain
 from dulwich.diff_tree import tree_changes
+from dulwich.line_ending import convert_crlf_to_lf
 from dulwich.objects import (
     Blob,
     Tag,
     Tree,
     ZERO_SHA,
     )
 from dulwich.repo import (
     NoIndexPresent,
     Repo,
     )
 from dulwich.tests import (
     TestCase,
     )
 from dulwich.tests.utils import (
     build_commit_graph,
     make_commit,
     make_object,
     )
 
 
 class PorcelainTestCase(TestCase):
     """Base class giving each test a scratch directory and a repository.
 
     ``self.test_dir`` is a temporary directory that is removed on cleanup;
     ``self.repo`` is a repository initialised in its ``repo`` subdirectory
     and closed on cleanup.
     """
 
     def setUp(self):
         super(PorcelainTestCase, self).setUp()
         scratch_dir = tempfile.mkdtemp()
         self.test_dir = scratch_dir
         self.addCleanup(shutil.rmtree, scratch_dir)
         repo_path = os.path.join(scratch_dir, 'repo')
         self.repo = Repo.init(repo_path, mkdir=True)
         self.addCleanup(self.repo.close)
 
 
 class ArchiveTests(PorcelainTestCase):
     """Tests for the archive command."""
 
     def test_simple(self):
         """Archiving master writes no errors and a tarball without members."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"refs/heads/master"] = tip.id
         archive_stream = BytesIO()
         error_stream = BytesIO()
         porcelain.archive(
             self.repo.path, b"refs/heads/master",
             outstream=archive_stream, errstream=error_stream)
         self.assertEqual(b"", error_stream.getvalue())
         tarball = tarfile.TarFile(fileobj=archive_stream)
         self.addCleanup(tarball.close)
         self.assertEqual([], tarball.getnames())
 
 
 class UpdateServerInfoTests(PorcelainTestCase):
     """Tests for the update_server_info command."""
 
     def test_simple(self):
         """After the call, ``info/refs`` exists in the control dir."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"refs/heads/foo"] = tip.id
         porcelain.update_server_info(self.repo.path)
         info_refs = os.path.join(self.repo.controldir(), 'info', 'refs')
         self.assertTrue(os.path.exists(info_refs))
 
 
 class CommitTests(PorcelainTestCase):
     """Tests for the commit command."""
 
     def test_custom_author(self):
         """Bytes message/author/committer yield a bytes id of length 40."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"refs/heads/foo"] = tip.id
         commit_id = porcelain.commit(
                 self.repo.path,
                 message=b"Some message",
                 author=b"Joe <joe@example.com>",
                 committer=b"Bob <bob@example.com>")
         self.assertTrue(isinstance(commit_id, bytes))
         self.assertEqual(len(commit_id), 40)
 
     def test_unicode(self):
         """Text message/author/committer yield a bytes id of length 40."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"refs/heads/foo"] = tip.id
         commit_id = porcelain.commit(
                 self.repo.path,
                 message="Some message",
                 author="Joe <joe@example.com>",
                 committer="Bob <bob@example.com>")
         self.assertTrue(isinstance(commit_id, bytes))
         self.assertEqual(len(commit_id), 40)
 
 
 class CloneTests(PorcelainTestCase):
     """Tests for the clone command."""
 
     def test_simple_local(self):
         """Clone without checkout: refs and remote config, but no files."""
         f1_1 = make_object(Blob, data=b'f1')
         commit_spec = [[1], [2, 1], [3, 1, 2]]
         trees = {1: [(b'f1', f1_1), (b'f2', f1_1)],
                  2: [(b'f1', f1_1), (b'f2', f1_1)],
                  3: [(b'f1', f1_1), (b'f2', f1_1)], }
 
         c1, c2, c3 = build_commit_graph(self.repo.object_store,
                                         commit_spec, trees)
         self.repo.refs[b"refs/heads/master"] = c3.id
         self.repo.refs[b"refs/tags/foo"] = c3.id
         target_path = tempfile.mkdtemp()
         errstream = BytesIO()
         self.addCleanup(shutil.rmtree, target_path)
         r = porcelain.clone(self.repo.path, target_path,
                             checkout=False, errstream=errstream)
         self.addCleanup(r.close)
         self.assertEqual(r.path, target_path)
         # Open the clone a second time and make sure that handle is closed.
         with Repo(target_path) as target_repo:
             self.assertEqual(0, len(target_repo.open_index()))
             self.assertEqual(c3.id, target_repo.refs[b'refs/tags/foo'])
         # os.listdir() on a str path returns str names on Python 3, so the
         # names checked must be str; bytes names would never match and the
         # assertions would pass vacuously.
         entries = os.listdir(target_path)
         self.assertNotIn('f1', entries)
         self.assertNotIn('f2', entries)
         c = r.get_config()
         encoded_path = self.repo.path
         if not isinstance(encoded_path, bytes):
             encoded_path = encoded_path.encode('utf-8')
         self.assertEqual(encoded_path, c.get((b'remote', b'origin'), b'url'))
         self.assertEqual(
             b'+refs/heads/*:refs/remotes/origin/*',
             c.get((b'remote', b'origin'), b'fetch'))
 
     def test_simple_local_with_checkout(self):
         """Clone with checkout: HEAD matches and the files are written."""
         f1_1 = make_object(Blob, data=b'f1')
         commit_spec = [[1], [2, 1], [3, 1, 2]]
         trees = {1: [(b'f1', f1_1), (b'f2', f1_1)],
                  2: [(b'f1', f1_1), (b'f2', f1_1)],
                  3: [(b'f1', f1_1), (b'f2', f1_1)], }
 
         c1, c2, c3 = build_commit_graph(self.repo.object_store,
                                         commit_spec, trees)
         self.repo.refs[b"refs/heads/master"] = c3.id
         target_path = tempfile.mkdtemp()
         errstream = BytesIO()
         self.addCleanup(shutil.rmtree, target_path)
         with porcelain.clone(self.repo.path, target_path,
                              checkout=True,
                              errstream=errstream) as r:
             self.assertEqual(r.path, target_path)
         with Repo(target_path) as r:
             self.assertEqual(r.head(), c3.id)
         self.assertTrue('f1' in os.listdir(target_path))
         self.assertTrue('f2' in os.listdir(target_path))
 
     def test_bare_local_with_checkout(self):
         """Bare clone: HEAD resolves, there is no index and no files."""
         f1_1 = make_object(Blob, data=b'f1')
         commit_spec = [[1], [2, 1], [3, 1, 2]]
         trees = {1: [(b'f1', f1_1), (b'f2', f1_1)],
                  2: [(b'f1', f1_1), (b'f2', f1_1)],
                  3: [(b'f1', f1_1), (b'f2', f1_1)], }
 
         c1, c2, c3 = build_commit_graph(self.repo.object_store,
                                         commit_spec, trees)
         self.repo.refs[b"refs/heads/master"] = c3.id
         target_path = tempfile.mkdtemp()
         errstream = BytesIO()
         self.addCleanup(shutil.rmtree, target_path)
         with porcelain.clone(
                 self.repo.path, target_path, bare=True,
                 errstream=errstream) as r:
             self.assertEqual(r.path, target_path)
         with Repo(target_path) as r:
             r.head()
             self.assertRaises(NoIndexPresent, r.open_index)
         # Compare against str names: os.listdir() of a str path yields str
         # on Python 3, so a bytes name could never be found.
         entries = os.listdir(target_path)
         self.assertNotIn('f1', entries)
         self.assertNotIn('f2', entries)
 
     def test_no_checkout_with_bare(self):
         """Asking for both checkout=True and bare=True raises ValueError."""
         f1_1 = make_object(Blob, data=b'f1')
         commit_spec = [[1]]
         trees = {1: [(b'f1', f1_1), (b'f2', f1_1)]}
 
         (c1, ) = build_commit_graph(self.repo.object_store, commit_spec, trees)
         self.repo.refs[b"refs/heads/master"] = c1.id
         self.repo.refs[b"HEAD"] = c1.id
         target_path = tempfile.mkdtemp()
         errstream = BytesIO()
         self.addCleanup(shutil.rmtree, target_path)
         self.assertRaises(
             ValueError, porcelain.clone, self.repo.path,
             target_path, checkout=True, bare=True, errstream=errstream)
 
     def test_no_head_no_checkout(self):
         """Clone with checkout=True and a BytesIO errstream does not raise."""
         f1_1 = make_object(Blob, data=b'f1')
         commit_spec = [[1]]
         trees = {1: [(b'f1', f1_1), (b'f2', f1_1)]}
 
         (c1, ) = build_commit_graph(self.repo.object_store, commit_spec, trees)
         self.repo.refs[b"refs/heads/master"] = c1.id
         target_path = tempfile.mkdtemp()
         self.addCleanup(shutil.rmtree, target_path)
         errstream = BytesIO()
         r = porcelain.clone(
             self.repo.path, target_path, checkout=True, errstream=errstream)
         r.close()
 
     def test_no_head_no_checkout_outstream_errstream_autofallback(self):
         """Clone with checkout=True and a NoneStream errstream does not raise.
         """
         f1_1 = make_object(Blob, data=b'f1')
         commit_spec = [[1]]
         trees = {1: [(b'f1', f1_1), (b'f2', f1_1)]}
 
         (c1, ) = build_commit_graph(self.repo.object_store, commit_spec, trees)
         self.repo.refs[b"refs/heads/master"] = c1.id
         target_path = tempfile.mkdtemp()
         self.addCleanup(shutil.rmtree, target_path)
         errstream = porcelain.NoneStream()
         r = porcelain.clone(
             self.repo.path, target_path, checkout=True, errstream=errstream)
         r.close()
 
 
 class InitTests(TestCase):
     """Smoke tests for the init command."""
 
     def test_non_bare(self):
         """init runs in a fresh temporary directory with default options."""
         target = tempfile.mkdtemp()
         self.addCleanup(shutil.rmtree, target)
         porcelain.init(target)
 
     def test_bare(self):
         """init runs in a fresh temporary directory with bare=True."""
         target = tempfile.mkdtemp()
         self.addCleanup(shutil.rmtree, target)
         porcelain.init(target, bare=True)
 
 
 class AddTests(PorcelainTestCase):
     """Tests for the add command."""
 
     def test_add_default_paths(self):
         """Without explicit paths, add run from the repo root stages all."""
         root = self.repo.path
 
         # Initial commit containing a single file.
         first_file = os.path.join(root, 'blah')
         with open(first_file, 'w') as out:
             out.write("\n")
         porcelain.add(repo=root, paths=[first_file])
         porcelain.commit(repo=root, message=b'test',
                          author=b'test <email>', committer=b'test <email>')
 
         # One more file at the top level and one inside a directory.
         with open(os.path.join(root, 'foo'), 'w') as out:
             out.write("\n")
         os.mkdir(os.path.join(root, 'adir'))
         with open(os.path.join(root, 'adir', 'afile'), 'w') as out:
             out.write("\n")
         previous_cwd = os.getcwd()
         try:
             os.chdir(self.repo.path)
             porcelain.add(self.repo.path)
         finally:
             os.chdir(previous_cwd)
 
         # Exactly the three working-tree files are in the index.
         staged = sorted(self.repo.open_index())
         self.assertEqual(staged, [b'adir/afile', b'blah', b'foo'])
 
     def test_add_default_paths_subdir(self):
         """Without explicit paths, add run from ``foo`` stages foo/blie only.
         """
         root = self.repo.path
         os.mkdir(os.path.join(root, 'foo'))
         with open(os.path.join(root, 'blah'), 'w') as out:
             out.write("\n")
         with open(os.path.join(root, 'foo', 'blie'), 'w') as out:
             out.write("\n")
 
         previous_cwd = os.getcwd()
         try:
             os.chdir(os.path.join(self.repo.path, 'foo'))
             porcelain.add(repo=self.repo.path)
             porcelain.commit(repo=self.repo.path, message=b'test',
                              author=b'test <email>',
                              committer=b'test <email>')
         finally:
             os.chdir(previous_cwd)
 
         staged = sorted(self.repo.open_index())
         self.assertEqual(staged, [b'foo/blie'])
 
     def test_add_file(self):
         """Adding one file by its full path puts it in the index."""
         target = os.path.join(self.repo.path, 'foo')
         with open(target, 'w') as out:
             out.write("BAR")
         porcelain.add(self.repo.path, paths=[target])
         self.assertIn(b"foo", self.repo.open_index())
 
     def test_add_ignored(self):
         """A path matched by .gitignore is reported as ignored, not added."""
         root = self.repo.path
         for name, text in (('.gitignore', "foo"),
                            ('foo', "BAR"),
                            ('bar', "BAR")):
             with open(os.path.join(root, name), 'w') as out:
                 out.write(text)
         requested = [os.path.join(self.repo.path, "foo"),
                      os.path.join(self.repo.path, "bar")]
         (added, ignored) = porcelain.add(self.repo.path, paths=requested)
         self.assertIn(b"bar", self.repo.open_index())
         self.assertEqual({'bar'}, set(added))
         self.assertEqual({'foo'}, ignored)
 
     def test_add_file_absolute_path(self):
         """add accepts a Repo object plus a full path inside the repo."""
         with open(os.path.join(self.repo.path, 'foo'), 'w') as out:
             out.write("BAR")
         target = os.path.join(self.repo.path, "foo")
         porcelain.add(self.repo, paths=[target])
         self.assertIn(b"foo", self.repo.open_index())
 
     def test_add_not_in_repo(self):
         """Paths outside the repository raise ValueError and stage nothing."""
         outside = os.path.join(self.test_dir, 'foo')
         with open(outside, 'w') as out:
             out.write("BAR")
         self.assertRaises(
             ValueError,
             porcelain.add, self.repo,
             paths=[os.path.join(self.test_dir, "foo")])
         self.assertRaises(
             ValueError,
             porcelain.add, self.repo,
             paths=["../foo"])
         self.assertEqual([], list(self.repo.open_index()))
 
 
 class RemoveTests(PorcelainTestCase):
     """Tests for the remove/rm command."""
 
     def test_remove_file(self):
         """Removing a committed file deletes it from the working tree."""
         target = os.path.join(self.repo.path, 'foo')
         with open(target, 'w') as out:
             out.write("BAR")
         porcelain.add(self.repo.path, paths=[target])
         porcelain.commit(repo=self.repo, message=b'test',
                          author=b'test <email>',
                          committer=b'test <email>')
         self.assertTrue(os.path.exists(os.path.join(self.repo.path, 'foo')))
         previous_cwd = os.getcwd()
         try:
             os.chdir(self.repo.path)
             porcelain.remove(self.repo.path, paths=["foo"])
         finally:
             os.chdir(previous_cwd)
         self.assertFalse(os.path.exists(os.path.join(self.repo.path, 'foo')))
 
     def test_remove_file_staged(self):
         """rm on a file that is staged but not committed raises."""
         target = os.path.join(self.repo.path, 'foo')
         with open(target, 'w') as out:
             out.write("BAR")
         previous_cwd = os.getcwd()
         try:
             os.chdir(self.repo.path)
             porcelain.add(self.repo.path, paths=[target])
             self.assertRaises(
                 Exception, porcelain.rm, self.repo.path, paths=["foo"])
         finally:
             os.chdir(previous_cwd)
 
 
 class LogTests(PorcelainTestCase):
     """Tests for the log command."""
 
     def test_simple(self):
         """The log of a three-commit graph has three separator lines."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"HEAD"] = tip.id
         captured = StringIO()
         porcelain.log(self.repo.path, outstream=captured)
         separators = captured.getvalue().count("-" * 50)
         self.assertEqual(3, separators)
 
     def test_max_entries(self):
         """With max_entries=1 the log has a single separator line."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"HEAD"] = tip.id
         captured = StringIO()
         porcelain.log(self.repo.path, outstream=captured, max_entries=1)
         separators = captured.getvalue().count("-" * 50)
         self.assertEqual(1, separators)
 
 
 class ShowTests(PorcelainTestCase):
     """Tests for the show command."""
 
     def test_nolist(self):
         """A single object id (not in a list) is accepted by show."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"HEAD"] = tip.id
         captured = StringIO()
         porcelain.show(self.repo.path, objects=tip.id, outstream=captured)
         self.assertTrue(captured.getvalue().startswith("-" * 50))
 
     def test_simple(self):
         """Showing a commit starts the output with a separator line."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"HEAD"] = tip.id
         captured = StringIO()
         porcelain.show(self.repo.path, objects=[tip.id], outstream=captured)
         self.assertTrue(captured.getvalue().startswith("-" * 50))
 
     def test_blob(self):
         """Showing a blob writes the blob contents as text."""
         blob = Blob.from_string(b"The Foo\n")
         self.repo.object_store.add_object(blob)
         captured = StringIO()
         porcelain.show(self.repo.path, objects=[blob.id], outstream=captured)
         self.assertEqual(captured.getvalue(), "The Foo\n")
 
     def test_commit_no_parent(self):
         """A parentless commit is shown with a diff against /dev/null."""
         blob = Blob.from_string(b"The Foo\n")
         tree = Tree()
         tree.add(b"somename", 0o100644, blob.id)
         commit = make_commit(tree=tree.id)
         self.repo.object_store.add_objects(
             [(blob, None), (tree, None), (commit, None)])
         captured = StringIO()
         porcelain.show(self.repo.path, objects=[commit.id],
                        outstream=captured)
         shown = captured.getvalue()
         expected = """\
 --------------------------------------------------
 commit: 344da06c1bb85901270b3e8875c988a027ec087d
 Author: Test Author <test@nodomain.com>
 Committer: Test Committer <test@nodomain.com>
 Date:   Fri Jan 01 2010 00:00:00 +0000
 
 Test message.
 
 diff --git /dev/null b/somename
 new mode 100644
 index 0000000..ea5c7bf 100644
 --- /dev/null
 +++ b/somename
 @@ -0,0 +1 @@
 +The Foo
 """
         self.assertMultiLineEqual(shown, expected)
 
     def test_commit_with_change(self):
         """A commit with a parent is shown with a diff against that parent."""
         old_blob = Blob.from_string(b"The Foo\n")
         old_tree = Tree()
         old_tree.add(b"somename", 0o100644, old_blob.id)
         old_commit = make_commit(tree=old_tree.id)
         new_blob = Blob.from_string(b"The Bar\n")
         new_tree = Tree()
         new_tree.add(b"somename", 0o100644, new_blob.id)
         new_commit = make_commit(tree=new_tree.id, parents=[old_commit.id])
         self.repo.object_store.add_objects(
             [(old_blob, None), (new_blob, None),
              (old_tree, None), (new_tree, None),
              (old_commit, None), (new_commit, None)])
         captured = StringIO()
         porcelain.show(self.repo.path, objects=[new_commit.id],
                        outstream=captured)
         shown = captured.getvalue()
         expected = """\
 --------------------------------------------------
 commit: 2c6b6c9cb72c130956657e1fdae58e5b103744fa
 Author: Test Author <test@nodomain.com>
 Committer: Test Committer <test@nodomain.com>
 Date:   Fri Jan 01 2010 00:00:00 +0000
 
 Test message.
 
 diff --git a/somename b/somename
 index ea5c7bf..fd38bcb 100644
 --- a/somename
 +++ b/somename
 @@ -1 +1 @@
 -The Foo
 +The Bar
 """
         self.assertMultiLineEqual(shown, expected)
 
 
 class SymbolicRefTests(PorcelainTestCase):
     """Tests for the symbolic_ref command."""
 
     def test_set_wrong_symbolic_ref(self):
         """Pointing HEAD at the name ``foobar`` without force raises."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"HEAD"] = tip.id
 
         self.assertRaises(
             ValueError, porcelain.symbolic_ref, self.repo.path, b'foobar')
 
     def test_set_force_wrong_symbolic_ref(self):
         """With force=True the HEAD file is rewritten to the given name."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"HEAD"] = tip.id
 
         porcelain.symbolic_ref(self.repo.path, b'force_foobar', force=True)
 
         # Read HEAD back to confirm the file was really changed.
         with self.repo.get_named_file('HEAD') as head_file:
             head_contents = head_file.read()
         self.assertEqual(head_contents, b'ref: refs/heads/force_foobar\n')
 
     def test_set_symbolic_ref(self):
         """Pointing HEAD at ``master`` does not raise."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"HEAD"] = tip.id
 
         porcelain.symbolic_ref(self.repo.path, b'master')
 
     def test_set_symbolic_ref_other_than_master(self):
         """Pointing HEAD at an existing ``develop`` branch rewrites HEAD."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]],
                 attrs={'refs': 'develop'})
         self.repo.refs[b"HEAD"] = tip.id
         self.repo.refs[b"refs/heads/develop"] = tip.id
 
         porcelain.symbolic_ref(self.repo.path, b'develop')
 
         # Read HEAD back to confirm the file was really changed.
         with self.repo.get_named_file('HEAD') as head_file:
             head_contents = head_file.read()
         self.assertEqual(head_contents, b'ref: refs/heads/develop\n')
 
 
 class DiffTreeTests(PorcelainTestCase):
     """Tests for the diff_tree command."""
 
     def test_empty(self):
         """Diffing the trees of the last two commits writes nothing."""
         _, parent, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"HEAD"] = tip.id
         captured = BytesIO()
         porcelain.diff_tree(
             self.repo.path, parent.tree, tip.tree, outstream=captured)
         self.assertEqual(captured.getvalue(), b"")
 
 
 class CommitTreeTests(PorcelainTestCase):
     """Tests for the commit_tree command."""
 
     def test_simple(self):
         """Committing a stored tree returns a bytes id of length 40."""
         build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         blob = Blob()
         blob.data = b"foo the bar"
         tree = Tree()
         tree.add(b"somename", 0o100644, blob.id)
         store = self.repo.object_store
         store.add_object(tree)
         store.add_object(blob)
         commit_id = porcelain.commit_tree(
             self.repo.path, tree.id,
             message=b"Withcommit.",
             author=b"Joe <joe@example.com>",
             committer=b"Jane <jane@example.com>")
         self.assertTrue(isinstance(commit_id, bytes))
         self.assertEqual(len(commit_id), 40)
 
 
 class RevListTests(PorcelainTestCase):
     """Tests for the rev_list command."""
 
     def test_simple(self):
         """rev_list from the tip writes c3, c2, c1, one id per line."""
         first, second, third = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         captured = BytesIO()
         porcelain.rev_list(
             self.repo.path, [third.id], outstream=captured)
         expected = b"".join(
             commit.id + b"\n" for commit in (third, second, first))
         self.assertEqual(expected, captured.getvalue())
 
 
 class TagCreateTests(PorcelainTestCase):
     """Tests for the tag_create command."""
 
     def test_annotated(self):
         """An annotated tag is stored as a Tag with tagger and message."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"HEAD"] = tip.id
 
         porcelain.tag_create(self.repo.path, b"tryme", b'foo <foo@bar.com>',
                              b'bar', annotated=True)
 
         tag_refs = self.repo.refs.as_dict(b"refs/tags")
         self.assertEqual(list(tag_refs.keys()), [b"tryme"])
         tag_object = self.repo[b'refs/tags/tryme']
         self.assertTrue(isinstance(tag_object, Tag))
         self.assertEqual(b"foo <foo@bar.com>", tag_object.tagger)
         self.assertEqual(b"bar", tag_object.message)
         # The tag time must be within five seconds of now.
         self.assertLess(time.time() - tag_object.tag_time, 5)
 
     def test_unannotated(self):
         """An unannotated tag given as bytes points at the current head."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"HEAD"] = tip.id
 
         porcelain.tag_create(self.repo.path, b"tryme", annotated=False)
 
         tag_refs = self.repo.refs.as_dict(b"refs/tags")
         self.assertEqual(list(tag_refs.keys()), [b"tryme"])
         # Look the ref up through the repo; the result itself is not used.
         self.repo[b'refs/tags/tryme']
         self.assertEqual(list(tag_refs.values()), [self.repo.head()])
 
     def test_unannotated_unicode(self):
         """An unannotated tag given as text points at the current head."""
         _, _, tip = build_commit_graph(
                 self.repo.object_store, [[1], [2, 1], [3, 1, 2]])
         self.repo.refs[b"HEAD"] = tip.id
 
         porcelain.tag_create(self.repo.path, "tryme", annotated=False)
 
         tag_refs = self.repo.refs.as_dict(b"refs/tags")
         self.assertEqual(list(tag_refs.keys()), [b"tryme"])
         # Look the ref up through the repo; the result itself is not used.
         self.repo[b'refs/tags/tryme']
         self.assertEqual(list(tag_refs.values()), [self.repo.head()])
 
 
 class TagListTests(PorcelainTestCase):
     """Tests for the tag_list command."""
 
     def test_empty(self):
         """A repository without tag refs lists no tags."""
         listed = porcelain.tag_list(self.repo.path)
         self.assertEqual([], listed)
 
     def test_simple(self):
         """Tag names are listed without the ``refs/tags/`` prefix."""
         refs = self.repo.refs
         refs[b"refs/tags/foo"] = b"aa" * 20
         refs[b"refs/tags/bar/bla"] = b"bb" * 20
         listed = porcelain.tag_list(self.repo.path)
 
         self.assertEqual([b"bar/bla", b"foo"], listed)
 
 
 class TagDeleteTests(PorcelainTestCase):
     """Tests for the tag_delete command."""
 
     def test_simple(self):
         """A created tag is listed, and no longer listed once deleted."""
         (only_commit, ) = build_commit_graph(self.repo.object_store, [[1]])
         self.repo[b"HEAD"] = only_commit.id
         porcelain.tag_create(self.repo, b'foo')
         listed_before = porcelain.tag_list(self.repo)
         self.assertTrue(b"foo" in listed_before)
         porcelain.tag_delete(self.repo, b'foo')
         listed_after = porcelain.tag_list(self.repo)
         self.assertFalse(b"foo" in listed_after)
 
 
 class ResetTests(PorcelainTestCase):
     """Tests for the reset command."""
 
     def test_hard_head(self):
         """After a hard reset to HEAD the index tree equals HEAD's tree."""
         target = os.path.join(self.repo.path, 'foo')
         with open(target, 'w') as out:
             out.write("BAR")
         porcelain.add(self.repo.path, paths=[target])
         porcelain.commit(self.repo.path, message=b"Some message",
                          committer=b"Jane <jane@example.com>",
                          author=b"John <john@example.com>")
 
         # Change the working copy after the commit.
         with open(os.path.join(self.repo.path, 'foo'), 'wb') as out:
             out.write(b"OOH")
 
         porcelain.reset(self.repo, "hard", b"HEAD")
 
         index = self.repo.open_index()
         index_tree = index.commit(self.repo.object_store)
         head_tree = self.repo[b'HEAD'].tree
         differences = list(tree_changes(self.repo, index_tree, head_tree))
 
         self.assertEqual([], differences)
 
     def test_hard_commit(self):
         """After a hard reset to an older commit the index matches it."""
         target = os.path.join(self.repo.path, 'foo')
         with open(target, 'w') as out:
             out.write("BAR")
         porcelain.add(self.repo.path, paths=[target])
         first_sha = porcelain.commit(
             self.repo.path, message=b"Some message",
             committer=b"Jane <jane@example.com>",
             author=b"John <john@example.com>")
 
         # Second commit with different contents for the same file.
         with open(target, 'wb') as out:
             out.write(b"BAZ")
         porcelain.add(self.repo.path, paths=[target])
         porcelain.commit(self.repo.path, message=b"Some other message",
                          committer=b"Jane <jane@example.com>",
                          author=b"John <john@example.com>")
 
         porcelain.reset(self.repo, "hard", first_sha)
 
         index = self.repo.open_index()
         index_tree = index.commit(self.repo.object_store)
         first_tree = self.repo[first_sha].tree
         differences = list(tree_changes(self.repo, index_tree, first_tree))
 
         self.assertEqual([], differences)
 
 
 class PushTests(PorcelainTestCase):
     """Tests for the push command."""
 
     def test_simple(self):
         """Push a new commit from a clone back to a branch of the remote.
 
         self.repo acts as the remote: it is cloned, a file is committed in
         the clone, and the clone's HEAD is pushed to ``refs/heads/foo``.
         """
         out_stream = BytesIO()
         err_stream = BytesIO()
 
         porcelain.commit(repo=self.repo.path, message=b'init',
                          author=b'author <email>',
                          committer=b'committer <email>')
 
         # Clone the temporary test repo into a fresh directory.
         clone_path = tempfile.mkdtemp()
         self.addCleanup(shutil.rmtree, clone_path)
         with porcelain.clone(self.repo.path, target=clone_path,
                              errstream=err_stream) as cloned:
             self.assertEqual(cloned[b'HEAD'], self.repo[b'HEAD'])
 
         # Commit a second file in the clone, to be pushed back to origin.
         fd, new_file = tempfile.mkstemp(dir=clone_path)
         os.close(fd)
         porcelain.add(repo=clone_path, paths=[new_file])
         porcelain.commit(repo=clone_path, message=b'push',
                          author=b'author <email>',
                          committer=b'committer <email>')
 
         # Create a branch in the remote that is not checked out.
         branch_ref = b"refs/heads/foo"
         remote_head_id = self.repo[b'HEAD'].id
         self.assertNotEqual(remote_head_id, ZERO_SHA)
         self.repo.refs[branch_ref] = remote_head_id
 
         # Push the clone's HEAD to that branch.
         porcelain.push(clone_path, self.repo.path, b"HEAD:" + branch_ref,
                        outstream=out_stream, errstream=err_stream)
 
         # Check that the remote's refs now reflect the pushed commit.
         with Repo(clone_path) as r_clone:
             expected_refs = {
                 b'HEAD': remote_head_id,
                 b'refs/heads/foo': r_clone[b'HEAD'].id,
                 b'refs/heads/master': remote_head_id,
                 }
             self.assertEqual(expected_refs, self.repo.get_refs())
             self.assertEqual(r_clone[b'HEAD'].id, self.repo[branch_ref].id)
 
             # The first change between HEAD and the foo branch in the
             # remote must be the file that was added in the clone.
             changes = list(tree_changes(
                 self.repo, self.repo[b'HEAD'].tree,
                 self.repo[b'refs/heads/foo'].tree))
             first_change = changes[0]
             self.assertEqual(os.path.basename(new_file),
                              first_change.new.path.decode('ascii'))
 
     def test_delete(self):
         """Pushing ``:refs/heads/foo`` removes that branch from the remote.
         """
         out_stream = BytesIO()
         err_stream = BytesIO()
 
         porcelain.commit(repo=self.repo.path, message=b'init',
                          author=b'author <email>',
                          committer=b'committer <email>')
 
         # Clone the temporary test repo into a fresh directory.
         clone_path = tempfile.mkdtemp()
         self.addCleanup(shutil.rmtree, clone_path)
         cloned = porcelain.clone(self.repo.path, target=clone_path,
                                  errstream=err_stream)
         cloned.close()
 
         # Create a branch in the remote that is not checked out.
         branch_ref = b"refs/heads/foo"
         remote_head_id = self.repo[b'HEAD'].id
         self.assertNotEqual(remote_head_id, ZERO_SHA)
         self.repo.refs[branch_ref] = remote_head_id
 
         # Push an empty source to the branch.
         porcelain.push(clone_path, self.repo.path, b":" + branch_ref,
                        outstream=out_stream, errstream=err_stream)
 
         expected_refs = {
             b'HEAD': remote_head_id,
             b'refs/heads/master': remote_head_id,
             }
         self.assertEqual(expected_refs, self.repo.get_refs())
 
 
 class PullTests(PorcelainTestCase):
     """Tests for the pull command."""
 
     def setUp(self):
         """Create a source repo that is one commit ahead of its clone."""
         super(PullTests, self).setUp()
         source_path = self.repo.path
 
         # First file and the initial commit.
         fd, first_file = tempfile.mkstemp(dir=source_path)
         os.close(fd)
         porcelain.add(repo=self.repo.path, paths=first_file)
         porcelain.commit(repo=self.repo.path, message=b'test',
                          author=b'test <email>',
                          committer=b'test <email>')
 
         # Clone the source at this point; the clone is the pull target.
         self.target_path = tempfile.mkdtemp()
         self.addCleanup(shutil.rmtree, self.target_path)
         target_repo = porcelain.clone(self.repo.path, target=self.target_path,
                                       errstream=BytesIO())
         target_repo.close()
 
         # Second file and commit, made in the source after the clone.
         fd, second_file = tempfile.mkstemp(dir=self.repo.path)
         os.close(fd)
         porcelain.add(repo=self.repo.path, paths=second_file)
         porcelain.commit(repo=self.repo.path, message=b'test2',
                          author=b'test2 <email>',
                          committer=b'test2 <email>')
 
         for repo in (self.repo, target_repo):
             self.assertTrue(b'refs/heads/master' in repo.refs)
 
     def test_simple(self):
         """Pulling master with an explicit refspec brings HEAD up to date."""
         out_stream = BytesIO()
         err_stream = BytesIO()
 
         # Pull the source's changes into the clone.
         porcelain.pull(self.target_path, self.repo.path, b'refs/heads/master',
                        outstream=out_stream, errstream=err_stream)
 
         # The clone's HEAD must now match the source's HEAD.
         with Repo(self.target_path) as pulled:
             self.assertEqual(pulled[b'HEAD'].id, self.repo[b'HEAD'].id)
 
     def test_no_refspec(self):
         """Pulling without a refspec also brings HEAD up to date."""
         out_stream = BytesIO()
         err_stream = BytesIO()
 
         # Pull the source's changes into the clone.
         porcelain.pull(self.target_path, self.repo.path, outstream=out_stream,
                        errstream=err_stream)
 
         # The clone's HEAD must now match the source's HEAD.
         with Repo(self.target_path) as pulled:
             self.assertEqual(pulled[b'HEAD'].id, self.repo[b'HEAD'].id)
 
 
 class StatusTests(PorcelainTestCase):
 
     def test_empty(self):
         """A fresh repository reports nothing staged and nothing unstaged."""
         status = porcelain.status(self.repo)
         nothing_staged = {'add': [], 'delete': [], 'modify': []}
         self.assertEqual(nothing_staged, status.staged)
         self.assertEqual([], status.unstaged)
 
     def test_status_base(self):
         """Integration test for `status` functionality."""
 
         # Commit a dummy file then modify it
         fullpath = os.path.join(self.repo.path, 'foo')
         with open(fullpath, 'w') as f:
             f.write('origstuff')
 
         porcelain.add(repo=self.repo.path, paths=[fullpath])
         porcelain.commit(repo=self.repo.path, message=b'test status',
                          author=b'author <email>',
                          committer=b'committer <email>')
 
         # modify access and modify time of path
         os.utime(fullpath, (0, 0))
 
         with open(fullpath, 'wb') as f:
             f.write(b'stuff')
 
         # Make a dummy file and stage it
         filename_add = 'bar'
         fullpath = os.path.join(self.repo.path, filename_add)
         with open(fullpath, 'w') as f:
             f.write('stuff')
         porcelain.add(repo=self.repo.path, paths=fullpath)
 
         results = porcelain.status(self.repo)
 
         self.assertEqual(results.staged['add'][0],
                          filename_add.encode('ascii'))
         self.assertEqual(results.unstaged, [b'foo'])
 
     def test_status_all(self):
         del_path = os.path.join(self.repo.path, 'foo')
         mod_path = os.path.join(self.repo.path, 'bar')
         add_path = os.path.join(self.repo.path, 'baz')
         us_path = os.path.join(self.repo.path, 'blye')
         ut_path = os.path.join(self.repo.path, 'blyat')
         with open(del_path, 'w') as f:
             f.write('origstuff')
         with open(mod_path, 'w') as f:
             f.write('origstuff')
         with open(us_path, 'w') as f:
             f.write('origstuff')
         porcelain.add(repo=self.repo.path, paths=[del_path, mod_path, us_path])
         porcelain.commit(repo=self.repo.path, message=b'test status',
                          author=b'author <email>',
                          committer=b'committer <email>')
         porcelain.remove(self.repo.path, [del_path])
         with open(add_path, 'w') as f:
             f.write('origstuff')
         with open(mod_path, 'w') as f:
             f.write('more_origstuff')
         with open(us_path, 'w') as f:
             f.write('more_origstuff')
         porcelain.add(repo=self.repo.path, paths=[add_path, mod_path])
         with open(us_path, 'w') as f:
             f.write('\norigstuff')
         with open(ut_path, 'w') as f:
             f.write('origstuff')
         results = porcelain.status(self.repo.path)
         self.assertDictEqual(
             {'add': [b'baz'], 'delete': [b'foo'], 'modify': [b'bar']},
             results.staged)
         self.assertListEqual(results.unstaged, [b'blye'])
         self.assertListEqual(results.untracked, ['blyat'])
 
+    def test_status_crlf_mismatch(self):
+        # Commit the file with LF line endings, as it would be stored when
+        # added on a Linux system or with core.autocrlf=true.
+        file_path = os.path.join(self.repo.path, 'crlf')
+        with open(file_path, 'wb') as f:
+            f.write(b'line1\nline2')
+        porcelain.add(repo=self.repo.path, paths=[file_path])
+        porcelain.commit(repo=self.repo.path, message=b'test status',
+                         author=b'author <email>',
+                         committer=b'committer <email>')
+
+        # Rewrite the working copy with CRLF endings, as CGit on a Windows
+        # system with core.autocrlf=true would; no write filter is set here.
+        with open(file_path, 'wb') as f:
+            f.write(b'line1\r\nline2')
+
+        results = porcelain.status(self.repo)
+        self.assertDictEqual(
+            {'add': [], 'delete': [], 'modify': []},
+            results.staged)
+        self.assertListEqual(results.unstaged, [b'crlf'])
+        self.assertListEqual(results.untracked, [])
+
+    def test_status_crlf_convert(self):
+        # Commit the file with LF line endings, as it would be stored when
+        # added on a Linux system or with core.autocrlf=true.
+        file_path = os.path.join(self.repo.path, 'crlf')
+        with open(file_path, 'wb') as f:
+            f.write(b'line1\nline2')
+        porcelain.add(repo=self.repo.path, paths=[file_path])
+        porcelain.commit(repo=self.repo.path, message=b'test status',
+                         author=b'author <email>',
+                         committer=b'committer <email>')
+
+        # Rewrite the working copy with CRLF endings, as CGit on a Windows
+        # system with core.autocrlf=true would.
+        with open(file_path, 'wb') as f:
+            f.write(b'line1\r\nline2')
+
+        # TODO: derive this filter from the repo configuration automatically
+        self.repo.write_filter = convert_crlf_to_lf
+
+        results = porcelain.status(self.repo)
+        self.assertDictEqual(
+            {'add': [], 'delete': [], 'modify': []},
+            results.staged)
+        self.assertListEqual(results.unstaged, [])
+        self.assertListEqual(results.untracked, [])
+
     def test_get_tree_changes_add(self):
         """Unit test for get_tree_changes add."""
 
         # Make a dummy file, stage
         filename = 'bar'
         fullpath = os.path.join(self.repo.path, filename)
         with open(fullpath, 'w') as f:
             f.write('stuff')
         porcelain.add(repo=self.repo.path, paths=fullpath)
         porcelain.commit(repo=self.repo.path, message=b'test status',
                          author=b'author <email>',
                          committer=b'committer <email>')
 
         filename = 'foo'
         fullpath = os.path.join(self.repo.path, filename)
         with open(fullpath, 'w') as f:
             f.write('stuff')
         porcelain.add(repo=self.repo.path, paths=fullpath)
         changes = porcelain.get_tree_changes(self.repo.path)
 
         self.assertEqual(changes['add'][0], filename.encode('ascii'))
         self.assertEqual(len(changes['add']), 1)
         self.assertEqual(len(changes['modify']), 0)
         self.assertEqual(len(changes['delete']), 0)
 
     def test_get_tree_changes_modify(self):
         """Unit test for get_tree_changes modify."""
 
         # Make a dummy file, stage, commit, modify
         filename = 'foo'
         fullpath = os.path.join(self.repo.path, filename)
         with open(fullpath, 'w') as f:
             f.write('stuff')
         porcelain.add(repo=self.repo.path, paths=fullpath)
         porcelain.commit(repo=self.repo.path, message=b'test status',
                          author=b'author <email>',
                          committer=b'committer <email>')
         with open(fullpath, 'w') as f:
             f.write('otherstuff')
         porcelain.add(repo=self.repo.path, paths=fullpath)
         changes = porcelain.get_tree_changes(self.repo.path)
 
         self.assertEqual(changes['modify'][0], filename.encode('ascii'))
         self.assertEqual(len(changes['add']), 0)
         self.assertEqual(len(changes['modify']), 1)
         self.assertEqual(len(changes['delete']), 0)
 
     def test_get_tree_changes_delete(self):
         """Unit test for get_tree_changes delete."""
 
         # Make a dummy file, stage, commit, remove
         filename = 'foo'
         fullpath = os.path.join(self.repo.path, filename)
         with open(fullpath, 'w') as f:
             f.write('stuff')
         porcelain.add(repo=self.repo.path, paths=fullpath)
         porcelain.commit(repo=self.repo.path, message=b'test status',
                          author=b'author <email>',
                          committer=b'committer <email>')
         cwd = os.getcwd()
         try:
             os.chdir(self.repo.path)
             porcelain.remove(repo=self.repo.path, paths=[filename])
         finally:
             os.chdir(cwd)
         changes = porcelain.get_tree_changes(self.repo.path)
 
         self.assertEqual(changes['delete'][0], filename.encode('ascii'))
         self.assertEqual(len(changes['add']), 0)
         self.assertEqual(len(changes['modify']), 0)
         self.assertEqual(len(changes['delete']), 1)
 
     def test_get_untracked_paths(self):
         with open(os.path.join(self.repo.path, '.gitignore'), 'w') as f:
             f.write('ignored\n')
         with open(os.path.join(self.repo.path, 'ignored'), 'w') as f:
             f.write('blah\n')
         with open(os.path.join(self.repo.path, 'notignored'), 'w') as f:
             f.write('blah\n')
         self.assertEqual(
             set(['ignored', 'notignored', '.gitignore']),
             set(porcelain.get_untracked_paths(self.repo.path, self.repo.path,
                                               self.repo.open_index())))
         self.assertEqual(set(['.gitignore', 'notignored']),
                          set(porcelain.status(self.repo).untracked))
         self.assertEqual(set(['.gitignore', 'notignored', 'ignored']),
                          set(porcelain.status(self.repo, ignored=True)
                              .untracked))
 
     def test_get_untracked_paths_nested(self):
         with open(os.path.join(self.repo.path, 'notignored'), 'w') as f:
             f.write('blah\n')
         subrepo = Repo.init(os.path.join(self.repo.path, 'nested'), mkdir=True)
         with open(os.path.join(subrepo.path, 'another'), 'w') as f:
             f.write('foo\n')
 
         self.assertEqual(
             set(['notignored']),
             set(porcelain.get_untracked_paths(self.repo.path, self.repo.path,
                                               self.repo.open_index())))
         self.assertEqual(
             set(['another']),
             set(porcelain.get_untracked_paths(subrepo.path, subrepo.path,
                                               subrepo.open_index())))
 
 
 # TODO(jelmer): Add test for dulwich.porcelain.daemon
 
 
 class UploadPackTests(PorcelainTestCase):
     """Tests for upload_pack."""
 
     def test_upload_pack(self):
         outf = BytesIO()
         exitcode = porcelain.upload_pack(
                 self.repo.path, BytesIO(b"0000"), outf)
         outlines = outf.getvalue().splitlines()
         self.assertEqual([b"0000"], outlines)
         self.assertEqual(0, exitcode)
 
 
 class ReceivePackTests(PorcelainTestCase):
     """Tests for receive_pack."""
 
     def test_receive_pack(self):
         filename = 'foo'
         fullpath = os.path.join(self.repo.path, filename)
         with open(fullpath, 'w') as f:
             f.write('stuff')
         porcelain.add(repo=self.repo.path, paths=fullpath)
         self.repo.do_commit(message=b'test status',
                             author=b'author <email>',
                             committer=b'committer <email>',
                             author_timestamp=1402354300,
                             commit_timestamp=1402354300, author_timezone=0,
                             commit_timezone=0)
         outf = BytesIO()
         exitcode = porcelain.receive_pack(
                 self.repo.path, BytesIO(b"0000"), outf)
         outlines = outf.getvalue().splitlines()
         self.assertEqual([
             b'0091319b56ce3aee2d489f759736a79cc552c9bb86d9 HEAD\x00 report-status '  # noqa: E501
             b'delete-refs quiet ofs-delta side-band-64k '
             b'no-done symref=HEAD:refs/heads/master',
            b'003f319b56ce3aee2d489f759736a79cc552c9bb86d9 refs/heads/master',
             b'0000'], outlines)
         self.assertEqual(0, exitcode)
 
 
 class BranchListTests(PorcelainTestCase):
 
     def test_standard(self):
         self.assertEqual(set([]), set(porcelain.branch_list(self.repo)))
 
     def test_new_branch(self):
         [c1] = build_commit_graph(self.repo.object_store, [[1]])
         self.repo[b"HEAD"] = c1.id
         porcelain.branch_create(self.repo, b"foo")
         self.assertEqual(
             set([b"master", b"foo"]),
             set(porcelain.branch_list(self.repo)))
 
 
 class BranchCreateTests(PorcelainTestCase):
 
     def test_branch_exists(self):
         [c1] = build_commit_graph(self.repo.object_store, [[1]])
         self.repo[b"HEAD"] = c1.id
         porcelain.branch_create(self.repo, b"foo")
         self.assertRaises(KeyError, porcelain.branch_create, self.repo, b"foo")
         porcelain.branch_create(self.repo, b"foo", force=True)
 
     def test_new_branch(self):
         [c1] = build_commit_graph(self.repo.object_store, [[1]])
         self.repo[b"HEAD"] = c1.id
         porcelain.branch_create(self.repo, b"foo")
         self.assertEqual(
             set([b"master", b"foo"]),
             set(porcelain.branch_list(self.repo)))
 
 
 class BranchDeleteTests(PorcelainTestCase):
 
     def test_simple(self):
         [c1] = build_commit_graph(self.repo.object_store, [[1]])
         self.repo[b"HEAD"] = c1.id
         porcelain.branch_create(self.repo, b'foo')
         self.assertTrue(b"foo" in porcelain.branch_list(self.repo))
         porcelain.branch_delete(self.repo, b'foo')
         self.assertFalse(b"foo" in porcelain.branch_list(self.repo))
 
     def test_simple_unicode(self):
         [c1] = build_commit_graph(self.repo.object_store, [[1]])
         self.repo[b"HEAD"] = c1.id
         porcelain.branch_create(self.repo, 'foo')
         self.assertTrue(b"foo" in porcelain.branch_list(self.repo))
         porcelain.branch_delete(self.repo, 'foo')
         self.assertFalse(b"foo" in porcelain.branch_list(self.repo))
 
 
 class FetchTests(PorcelainTestCase):
 
     def test_simple(self):
         outstream = BytesIO()
         errstream = BytesIO()
 
         # create a file for initial commit
         handle, fullpath = tempfile.mkstemp(dir=self.repo.path)
         os.close(handle)
         porcelain.add(repo=self.repo.path, paths=fullpath)
         porcelain.commit(repo=self.repo.path, message=b'test',
                          author=b'test <email>',
                          committer=b'test <email>')
 
         # Setup target repo
         target_path = tempfile.mkdtemp()
         self.addCleanup(shutil.rmtree, target_path)
         target_repo = porcelain.clone(self.repo.path, target=target_path,
                                       errstream=errstream)
 
         # create a second file to be pushed
         handle, fullpath = tempfile.mkstemp(dir=self.repo.path)
         os.close(handle)
         porcelain.add(repo=self.repo.path, paths=fullpath)
         porcelain.commit(repo=self.repo.path, message=b'test2',
                          author=b'test2 <email>',
                          committer=b'test2 <email>')
 
         self.assertFalse(self.repo[b'HEAD'].id in target_repo)
         target_repo.close()
 
         # Fetch changes into the cloned repo
         porcelain.fetch(target_path, self.repo.path,
                         outstream=outstream, errstream=errstream)
 
         # Assert that fetch updated the local image of the remote
         self.assert_correct_remote_refs(
             target_repo.get_refs(), self.repo.get_refs())
 
         # Check the target repo for pushed changes
         with Repo(target_path) as r:
             self.assertTrue(self.repo[b'HEAD'].id in r)
 
     def test_with_remote_name(self):
         remote_name = b'origin'
         outstream = BytesIO()
         errstream = BytesIO()
 
         # create a file for initial commit
         handle, fullpath = tempfile.mkstemp(dir=self.repo.path)
         os.close(handle)
         porcelain.add(repo=self.repo.path, paths=fullpath)
         porcelain.commit(repo=self.repo.path, message=b'test',
                          author=b'test <email>',
                          committer=b'test <email>')
 
         # Setup target repo
         target_path = tempfile.mkdtemp()
         self.addCleanup(shutil.rmtree, target_path)
         target_repo = porcelain.clone(self.repo.path, target=target_path,
                                       errstream=errstream)
 
         # Capture current refs
         target_refs = target_repo.get_refs()
 
         # create a second file to be pushed
         handle, fullpath = tempfile.mkstemp(dir=self.repo.path)
         os.close(handle)
         porcelain.add(repo=self.repo.path, paths=fullpath)
         porcelain.commit(repo=self.repo.path, message=b'test2',
                          author=b'test2 <email>',
                          committer=b'test2 <email>')
 
         self.assertFalse(self.repo[b'HEAD'].id in target_repo)
         target_repo.close()
 
         # Fetch changes into the cloned repo
         porcelain.fetch(target_path, self.repo.path, remote_name=remote_name,
                         outstream=outstream, errstream=errstream)
 
         # Assert that fetch updated the local image of the remote
         self.assert_correct_remote_refs(
             target_repo.get_refs(), self.repo.get_refs())
 
         # Check the target repo for pushed changes, as well as updates
         # for the refs
         with Repo(target_path) as r:
             self.assertTrue(self.repo[b'HEAD'].id in r)
             self.assertNotEqual(self.repo.get_refs(), target_refs)
 
     def assert_correct_remote_refs(
             self, local_refs, remote_refs, remote_name=b'origin'):
         """Assert that known remote refs corresponds to actual remote refs."""
         local_ref_prefix = b'refs/heads'
         remote_ref_prefix = b'refs/remotes/' + remote_name
 
         locally_known_remote_refs = {
             k[len(remote_ref_prefix) + 1:]: v for k, v in local_refs.items()
             if k.startswith(remote_ref_prefix)}
 
         normalized_remote_refs = {
             k[len(local_ref_prefix) + 1:]: v for k, v in remote_refs.items()
             if k.startswith(local_ref_prefix)}
 
         self.assertEqual(locally_known_remote_refs, normalized_remote_refs)
 
 
 class RepackTests(PorcelainTestCase):
 
     def test_empty(self):
         porcelain.repack(self.repo)
 
     def test_simple(self):
         handle, fullpath = tempfile.mkstemp(dir=self.repo.path)
         os.close(handle)
         porcelain.add(repo=self.repo.path, paths=fullpath)
         porcelain.repack(self.repo)
 
 
 class LsTreeTests(PorcelainTestCase):
 
     def test_empty(self):
         porcelain.commit(repo=self.repo.path, message=b'test status',
                          author=b'author <email>',
                          committer=b'committer <email>')
 
         f = StringIO()
         porcelain.ls_tree(self.repo, b"HEAD", outstream=f)
         self.assertEqual(f.getvalue(), "")
 
     def test_simple(self):
         # Commit a dummy file then modify it
         fullpath = os.path.join(self.repo.path, 'foo')
         with open(fullpath, 'w') as f:
             f.write('origstuff')
 
         porcelain.add(repo=self.repo.path, paths=[fullpath])
         porcelain.commit(repo=self.repo.path, message=b'test status',
                          author=b'author <email>',
                          committer=b'committer <email>')
 
         f = StringIO()
         porcelain.ls_tree(self.repo, b"HEAD", outstream=f)
         self.assertEqual(
                 f.getvalue(),
                 '100644 blob 8b82634d7eae019850bb883f06abf428c58bc9aa\tfoo\n')
 
     def test_recursive(self):
         # Create a directory then write a dummy file in it
         dirpath = os.path.join(self.repo.path, 'adir')
         filepath = os.path.join(dirpath, 'afile')
         os.mkdir(dirpath)
         with open(filepath, 'w') as f:
             f.write('origstuff')
         porcelain.add(repo=self.repo.path, paths=[filepath])
         porcelain.commit(repo=self.repo.path, message=b'test status',
                          author=b'author <email>',
                          committer=b'committer <email>')
         f = StringIO()
         porcelain.ls_tree(self.repo, b"HEAD", outstream=f)
         self.assertEqual(
                 f.getvalue(),
                 '40000 tree b145cc69a5e17693e24d8a7be0016ed8075de66d\tadir\n')
         f = StringIO()
         porcelain.ls_tree(self.repo, b"HEAD", outstream=f, recursive=True)
         self.assertEqual(
                 f.getvalue(),
                 '40000 tree b145cc69a5e17693e24d8a7be0016ed8075de66d\tadir\n'
                 '100644 blob 8b82634d7eae019850bb883f06abf428c58bc9aa\tadir'
                 '/afile\n')
 
 
 class LsRemoteTests(PorcelainTestCase):
 
     def test_empty(self):
         self.assertEqual({}, porcelain.ls_remote(self.repo.path))
 
     def test_some(self):
         cid = porcelain.commit(repo=self.repo.path, message=b'test status',
                                author=b'author <email>',
                                committer=b'committer <email>')
 
         self.assertEqual({
             b'refs/heads/master': cid,
             b'HEAD': cid},
             porcelain.ls_remote(self.repo.path))
 
 
 class LsFilesTests(PorcelainTestCase):
 
     def test_empty(self):
         self.assertEqual([], list(porcelain.ls_files(self.repo)))
 
     def test_simple(self):
         # Commit a dummy file then modify it
         fullpath = os.path.join(self.repo.path, 'foo')
         with open(fullpath, 'w') as f:
             f.write('origstuff')
 
         porcelain.add(repo=self.repo.path, paths=[fullpath])
         self.assertEqual([b'foo'], list(porcelain.ls_files(self.repo)))
 
 
 class RemoteAddTests(PorcelainTestCase):
 
     def test_new(self):
         porcelain.remote_add(
             self.repo, 'jelmer', 'git://jelmer.uk/code/dulwich')
         c = self.repo.get_config()
         self.assertEqual(
             c.get((b'remote', b'jelmer'), b'url'),
             b'git://jelmer.uk/code/dulwich')
 
     def test_exists(self):
         porcelain.remote_add(
             self.repo, 'jelmer', 'git://jelmer.uk/code/dulwich')
         self.assertRaises(porcelain.RemoteExists, porcelain.remote_add,
                           self.repo, 'jelmer', 'git://jelmer.uk/code/dulwich')
 
 
 class CheckIgnoreTests(PorcelainTestCase):
 
     def test_check_ignored(self):
         with open(os.path.join(self.repo.path, '.gitignore'), 'w') as f:
             f.write('foo')
         foo_path = os.path.join(self.repo.path, 'foo')
         with open(foo_path, 'w') as f:
             f.write('BAR')
         bar_path = os.path.join(self.repo.path, 'bar')
         with open(bar_path, 'w') as f:
             f.write('BAR')
         self.assertEqual(
             ['foo'],
             list(porcelain.check_ignore(self.repo, [foo_path])))
         self.assertEqual(
             [], list(porcelain.check_ignore(self.repo, [bar_path])))
 
     def test_check_added_abs(self):
         path = os.path.join(self.repo.path, 'foo')
         with open(path, 'w') as f:
             f.write('BAR')
         self.repo.stage(['foo'])
         with open(os.path.join(self.repo.path, '.gitignore'), 'w') as f:
             f.write('foo\n')
         self.assertEqual(
             [], list(porcelain.check_ignore(self.repo, [path])))
         self.assertEqual(
             ['foo'],
             list(porcelain.check_ignore(self.repo, [path], no_index=True)))
 
     def test_check_added_rel(self):
         with open(os.path.join(self.repo.path, 'foo'), 'w') as f:
             f.write('BAR')
         self.repo.stage(['foo'])
         with open(os.path.join(self.repo.path, '.gitignore'), 'w') as f:
             f.write('foo\n')
         cwd = os.getcwd()
         os.mkdir(os.path.join(self.repo.path, 'bar'))
         os.chdir(os.path.join(self.repo.path, 'bar'))
         try:
             self.assertEqual(
                 list(porcelain.check_ignore(self.repo, ['../foo'])), [])
             self.assertEqual(['../foo'], list(
                porcelain.check_ignore(self.repo, ['../foo'], no_index=True)))
         finally:
             os.chdir(cwd)
 
 
 class UpdateHeadTests(PorcelainTestCase):
 
     def test_set_to_branch(self):
         [c1] = build_commit_graph(self.repo.object_store, [[1]])
         self.repo.refs[b"refs/heads/blah"] = c1.id
         porcelain.update_head(self.repo, "blah")
         self.assertEqual(c1.id, self.repo.head())
         self.assertEqual(b'ref: refs/heads/blah',
                          self.repo.refs.read_ref(b'HEAD'))
 
     def test_set_to_branch_detached(self):
         [c1] = build_commit_graph(self.repo.object_store, [[1]])
         self.repo.refs[b"refs/heads/blah"] = c1.id
         porcelain.update_head(self.repo, "blah", detached=True)
         self.assertEqual(c1.id, self.repo.head())
         self.assertEqual(c1.id, self.repo.refs.read_ref(b'HEAD'))
 
     def test_set_to_commit_detached(self):
         [c1] = build_commit_graph(self.repo.object_store, [[1]])
         self.repo.refs[b"refs/heads/blah"] = c1.id
         porcelain.update_head(self.repo, c1.id, detached=True)
         self.assertEqual(c1.id, self.repo.head())
         self.assertEqual(c1.id, self.repo.refs.read_ref(b'HEAD'))
 
     def test_set_new_branch(self):
         [c1] = build_commit_graph(self.repo.object_store, [[1]])
         self.repo.refs[b"refs/heads/blah"] = c1.id
         porcelain.update_head(self.repo, "blah", new_branch="bar")
         self.assertEqual(c1.id, self.repo.head())
         self.assertEqual(b'ref: refs/heads/bar',
                          self.repo.refs.read_ref(b'HEAD'))
 
 
 class MailmapTests(PorcelainTestCase):
 
     def test_no_mailmap(self):
         self.assertEqual(
             b'Jelmer Vernooij <jelmer@samba.org>',
             porcelain.check_mailmap(
                 self.repo, b'Jelmer Vernooij <jelmer@samba.org>'))
 
     def test_mailmap_lookup(self):
         with open(os.path.join(self.repo.path, '.mailmap'), 'wb') as f:
             f.write(b"""\
 Jelmer Vernooij <jelmer@debian.org>
 """)
         self.assertEqual(
             b'Jelmer Vernooij <jelmer@debian.org>',
             porcelain.check_mailmap(
                 self.repo, b'Jelmer Vernooij <jelmer@samba.org>'))
 
 
 class FsckTests(PorcelainTestCase):
 
     def test_none(self):
         self.assertEqual(
                 [],
                 list(porcelain.fsck(self.repo)))
 
     def test_git_dir(self):
         obj = Tree()
         a = Blob()
         a.data = b"foo"
         obj.add(b".git", 0o100644, a.id)
         self.repo.object_store.add_objects(
             [(a, None), (obj, None)])
         self.assertEqual(
                 [(obj.id, 'invalid name .git')],
                 [(sha, str(e)) for (sha, e) in porcelain.fsck(self.repo)])
 
 
 class DescribeTests(PorcelainTestCase):
 
     def test_no_commits(self):
         self.assertRaises(KeyError, porcelain.describe, self.repo.path)
 
     def test_single_commit(self):
         fullpath = os.path.join(self.repo.path, 'foo')
         with open(fullpath, 'w') as f:
             f.write("BAR")
         porcelain.add(repo=self.repo.path, paths=[fullpath])
         sha = porcelain.commit(
                 self.repo.path, message=b"Some message",
                 author=b"Joe <joe@example.com>",
                 committer=b"Bob <bob@example.com>")
         self.assertEqual(
                 'g{}'.format(sha[:7].decode('ascii')),
                 porcelain.describe(self.repo.path))
 
     def test_tag(self):
         fullpath = os.path.join(self.repo.path, 'foo')
         with open(fullpath, 'w') as f:
             f.write("BAR")
         porcelain.add(repo=self.repo.path, paths=[fullpath])
         porcelain.commit(
                 self.repo.path, message=b"Some message",
                 author=b"Joe <joe@example.com>",
                 committer=b"Bob <bob@example.com>")
         porcelain.tag_create(self.repo.path, b"tryme", b'foo <foo@bar.com>',
                              b'bar', annotated=True)
         self.assertEqual(
                 "tryme",
                 porcelain.describe(self.repo.path))
 
     def test_tag_and_commit(self):
         fullpath = os.path.join(self.repo.path, 'foo')
         with open(fullpath, 'w') as f:
             f.write("BAR")
         porcelain.add(repo=self.repo.path, paths=[fullpath])
         porcelain.commit(
                 self.repo.path, message=b"Some message",
                 author=b"Joe <joe@example.com>",
                 committer=b"Bob <bob@example.com>")
         porcelain.tag_create(self.repo.path, b"tryme", b'foo <foo@bar.com>',
                              b'bar', annotated=True)
         with open(fullpath, 'w') as f:
             f.write("BAR2")
         porcelain.add(repo=self.repo.path, paths=[fullpath])
         sha = porcelain.commit(
                 self.repo.path, message=b"Some message",
                 author=b"Joe <joe@example.com>",
                 committer=b"Bob <bob@example.com>")
         self.assertEqual(
                 'tryme-1-g{}'.format(sha[:7].decode('ascii')),
                 porcelain.describe(self.repo.path))
 
 
 class HelperTests(PorcelainTestCase):
 
     def test_path_to_tree_path_base(self):
         self.assertEqual(
             b'bar', porcelain.path_to_tree_path('/home/foo', '/home/foo/bar'))
         self.assertEqual(b'bar', porcelain.path_to_tree_path('.', './bar'))
         self.assertEqual(b'bar', porcelain.path_to_tree_path('.', 'bar'))
         cwd = os.getcwd()
         self.assertEqual(
             b'bar', porcelain.path_to_tree_path('.', os.path.join(cwd, 'bar')))
         self.assertEqual(b'bar', porcelain.path_to_tree_path(cwd, 'bar'))
 
     def test_path_to_tree_path_syntax(self):
         self.assertEqual(b'bar', porcelain.path_to_tree_path(b'.', './bar'))
         self.assertEqual(b'bar', porcelain.path_to_tree_path('.', b'./bar'))
         self.assertEqual(b'bar', porcelain.path_to_tree_path(b'.', b'./bar'))
 
     def test_path_to_tree_path_error(self):
         with self.assertRaises(ValueError):
             porcelain.path_to_tree_path('/home/foo/', '/home/bar/baz')
 
     def test_path_to_tree_path_rel(self):
         cwd = os.getcwd()
         os.mkdir(os.path.join(self.repo.path, 'foo'))
         os.mkdir(os.path.join(self.repo.path, 'foo/bar'))
         try:
             os.chdir(os.path.join(self.repo.path, 'foo/bar'))
             self.assertEqual(b'bar/baz', porcelain.path_to_tree_path(
                 '..', 'baz'))
             self.assertEqual(b'bar/baz', porcelain.path_to_tree_path(
                 os.path.join(os.getcwd(), '..'),
                 os.path.join(os.getcwd(), 'baz')))
             self.assertEqual(b'bar/baz', porcelain.path_to_tree_path(
                 '..', os.path.join(os.getcwd(), 'baz')))
             self.assertEqual(b'bar/baz', porcelain.path_to_tree_path(
                 os.path.join(os.getcwd(), '..'), 'baz'))
         finally:
             os.chdir(cwd)
 
 
 class GetObjectBypathTests(PorcelainTestCase):
 
     def test_simple(self):
         fullpath = os.path.join(self.repo.path, 'foo')
         with open(fullpath, 'w') as f:
             f.write("BAR")
         porcelain.add(repo=self.repo.path, paths=[fullpath])
         porcelain.commit(
                 self.repo.path, message=b"Some message",
                 author=b"Joe <joe@example.com>",
                 committer=b"Bob <bob@example.com>")
         self.assertEqual(
             b"BAR",
             porcelain.get_object_by_path(self.repo, 'foo').data)
 
     def test_missing(self):
         self.assertRaises(
             KeyError,
             porcelain.get_object_by_path, self.repo, 'foo')
 
 
 class WriteTreeTests(PorcelainTestCase):
 
     def test_simple(self):
         fullpath = os.path.join(self.repo.path, 'foo')
         with open(fullpath, 'w') as f:
             f.write("BAR")
         porcelain.add(repo=self.repo.path, paths=[fullpath])
         self.assertEqual(
             b'd2092c8a9f311f0311083bf8d177f2ca0ab5b241',
             porcelain.write_tree(self.repo))