Browse Source

porcelain: add untracked_files kwarg to status

This kwarg is intended to match `git`'s `-u/--untracked-file`:
- `untracked_files="no"` returns no untracked files
- `untracked_files="all"` (dulwich default) returns all untracked files
- `untracked_files="normal"` (git default) is not implemented

Using `untracked_files="no"` can speed up `status` for worktrees with
large untracked directories
Daniele Trifirò 2 years ago
parent
commit
526dc0ef32
2 changed files with 54 additions and 9 deletions
  1. 32 8
      dulwich/porcelain.py
  2. 22 1
      dulwich/tests/test_porcelain.py

+ 32 - 8
dulwich/porcelain.py

@@ -1156,12 +1156,20 @@ def pull(
             _import_remote_refs(r.refs, remote_name, fetch_result.refs)
             _import_remote_refs(r.refs, remote_name, fetch_result.refs)
 
 
 
 
-def status(repo=".", ignored=False):
+def status(repo=".", ignored=False, untracked_files="all"):
     """Returns staged, unstaged, and untracked changes relative to the HEAD.
     """Returns staged, unstaged, and untracked changes relative to the HEAD.
 
 
     Args:
     Args:
       repo: Path to repository or repository object
       repo: Path to repository or repository object
       ignored: Whether to include ignored files in untracked
       ignored: Whether to include ignored files in untracked
+      untracked_files: How to handle untracked files, defaults to "all":
+          "no": do not return untracked files
+          "all": include all files in untracked directories
+        Using `untracked_files="no"` can be faster than "all" when the worktreee
+          contains many untracked files/directories.
+
+    Note: `untracked_files="normal" (`git`'s default) is not implemented.
+
     Returns: GitStatus tuple,
     Returns: GitStatus tuple,
         staged -  dict with lists of staged paths (diff index/HEAD)
         staged -  dict with lists of staged paths (diff index/HEAD)
         unstaged -  list of unstaged paths (diff index/working-tree)
         unstaged -  list of unstaged paths (diff index/working-tree)
@@ -1177,7 +1185,11 @@ def status(repo=".", ignored=False):
         unstaged_changes = list(get_unstaged_changes(index, r.path, filter_callback))
         unstaged_changes = list(get_unstaged_changes(index, r.path, filter_callback))
 
 
         untracked_paths = get_untracked_paths(
         untracked_paths = get_untracked_paths(
-            r.path, r.path, index, exclude_ignored=not ignored
+            r.path,
+            r.path,
+            index,
+            exclude_ignored=not ignored,
+            untracked_files=untracked_files,
         )
         )
         untracked_changes = list(untracked_paths)
         untracked_changes = list(untracked_paths)
 
 
@@ -1216,7 +1228,9 @@ def _walk_working_dir_paths(frompath, basepath, prune_dirnames=None):
             dirnames[:] = prune_dirnames(dirpath, dirnames)
             dirnames[:] = prune_dirnames(dirpath, dirnames)
 
 
 
 
-def get_untracked_paths(frompath, basepath, index, exclude_ignored=False):
+def get_untracked_paths(
+    frompath, basepath, index, exclude_ignored=False, untracked_files="all"
+):
     """Get untracked paths.
     """Get untracked paths.
 
 
     Args:
     Args:
@@ -1224,11 +1238,24 @@ def get_untracked_paths(frompath, basepath, index, exclude_ignored=False):
       basepath: Path to compare to
       basepath: Path to compare to
       index: Index to check against
       index: Index to check against
       exclude_ignored: Whether to exclude ignored paths
       exclude_ignored: Whether to exclude ignored paths
+      untracked_files: How to handle untracked files:
+        - "no": return an empty list
+        - "all": return all files in untracked directories
+        - "normal": Not implemented
 
 
     Note: ignored directories will never be walked for performance reasons.
     Note: ignored directories will never be walked for performance reasons.
       If exclude_ignored is False, only the path to an ignored directory will
       If exclude_ignored is False, only the path to an ignored directory will
       be yielded, no files inside the directory will be returned
       be yielded, no files inside the directory will be returned
     """
     """
+    if untracked_files == "normal":
+        raise NotImplementedError("normal is not yet supported")
+
+    if untracked_files not in ("no", "all"):
+        raise ValueError("untracked_files must be one of (no, all)")
+
+    if untracked_files == "no":
+        return
+
     with open_repo_closing(basepath) as r:
     with open_repo_closing(basepath) as r:
         ignore_manager = IgnoreFilterManager.from_repo(r)
         ignore_manager = IgnoreFilterManager.from_repo(r)
 
 
@@ -1252,11 +1279,8 @@ def get_untracked_paths(frompath, basepath, index, exclude_ignored=False):
         if not is_dir:
         if not is_dir:
             ip = path_to_tree_path(basepath, ap)
             ip = path_to_tree_path(basepath, ap)
             if ip not in index:
             if ip not in index:
-                if (
-                    not exclude_ignored
-                    or not ignore_manager.is_ignored(
-                        os.path.relpath(ap, basepath)
-                    )
+                if not exclude_ignored or not ignore_manager.is_ignored(
+                    os.path.relpath(ap, basepath)
                 ):
                 ):
                     yield os.path.relpath(ap, frompath)
                     yield os.path.relpath(ap, frompath)
 
 

+ 22 - 1
dulwich/tests/test_porcelain.py

@@ -1874,7 +1874,12 @@ class StatusTests(PorcelainTestCase):
             results.staged,
             results.staged,
         )
         )
         self.assertListEqual(results.unstaged, [b"blye"])
         self.assertListEqual(results.unstaged, [b"blye"])
-        self.assertListEqual(results.untracked, ["blyat"])
+        results_no_untracked = porcelain.status(self.repo.path, untracked_files="no")
+        self.assertListEqual(results_no_untracked.untracked, [])
+
+    def test_status_wrong_untracked_files_value(self):
+        with self.assertRaises(ValueError):
+            porcelain.status(self.repo.path, untracked_files="antani")
 
 
     def test_status_crlf_mismatch(self):
     def test_status_crlf_mismatch(self):
         # First make a commit as if the file has been added on a Linux system
         # First make a commit as if the file has been added on a Linux system
@@ -2170,6 +2175,22 @@ class StatusTests(PorcelainTestCase):
             )
             )
         )
         )
 
 
+    def test_get_untracked_paths_invalid_untracked_files(self):
+        with self.assertRaises(ValueError):
+            list(
+                porcelain.get_untracked_paths(
+                    self.repo.path,
+                    self.repo.path,
+                    self.repo.open_index(),
+                    untracked_files="invalid_value",
+                )
+            )
+
+    def test_get_untracked_paths_normal(self):
+        with self.assertRaises(NotImplementedError):
+            _, _, _ = porcelain.status(
+                repo=self.repo.path, untracked_files="normal"
+            )
 
 
 # TODO(jelmer): Add test for dulwich.porcelain.daemon
 # TODO(jelmer): Add test for dulwich.porcelain.daemon