diff --git a/terrarium/dl_gitmanager/README.md b/terrarium/dl_gitmanager/README.md
index fdeada893..fd10683e6 100644
--- a/terrarium/dl_gitmanager/README.md
+++ b/terrarium/dl_gitmanager/README.md
@@ -47,12 +47,13 @@ List files that have changed between two given revisions including the changes i
dl-git range-diff-paths --base --head
dl-git range-diff-paths --base --head --absolute
dl-git range-diff-paths --base --head --only-added-commits
+dl-git range-diff-paths --base --head --without-deleted-files
```
Here `base` and `head` can be a commit ID, branch name, `HEAD~3` or any similar notation
that is usually accepted by git.
These arguments are optional. By default `head` is `HEAD` and `base` is `HEAD~1`.
-Thgis means you can use the following command to see the diff of the last commit in the current branch:
+This means you can use the following command to see the diff of the last commit in the current branch:
```
dl-git diff-paths
```
@@ -63,13 +64,16 @@ By default they are printed relative to the repository root.
The `--only-added-commits` option makes the tool inspect only commits
that have been added in the head version.
+The `--without-deleted-files` option makes the tool omit deleted (non-existent) files in the resulting list.
+
### list-diff-paths
List files that have changed in commits passed on as input
```
echo | dl-git list-diff-paths
-echo > | dl-git list-diff-paths --absolute
+echo | dl-git list-diff-paths --absolute
+echo | dl-git list-diff-paths --without-deleted-files
```
-Option `--absolute` has the same meaning as in `range-diff-paths`.
+Options `--absolute` and `--without-deleted-files` have the same meaning as in `range-diff-paths`.
diff --git a/terrarium/dl_gitmanager/dl_gitmanager/git_manager.py b/terrarium/dl_gitmanager/dl_gitmanager/git_manager.py
index 2199b92db..b1e2b664a 100644
--- a/terrarium/dl_gitmanager/dl_gitmanager/git_manager.py
+++ b/terrarium/dl_gitmanager/dl_gitmanager/git_manager.py
@@ -1,5 +1,6 @@
from __future__ import annotations
+import os
from pathlib import Path
from typing import (
Collection,
@@ -114,23 +115,35 @@ def _iter_list_diffs(
for _, diff_item in submodule_manager._iter_list_diffs(commits=sm_commits_for_all_commits):
yield submodule_base_path, diff_item
- def _collect_paths_from_diffs(self, diff_iterable: Iterable[tuple[Path, Diff]]) -> list[str]:
+ def _collect_paths_from_diffs(
+ self, diff_iterable: Iterable[tuple[Path, Diff]], without_deleted: bool = False
+ ) -> list[str]:
result: set[str] = set()
for base_path, diff_item in diff_iterable:
- if diff_item.a_path:
- result.add(str(base_path / diff_item.a_path))
- if diff_item.b_path:
- result.add(str(base_path / diff_item.b_path))
+ for diff_path in (diff_item.a_path, diff_item.b_path):
+ if not diff_path:
+ continue
+ absolute_path = base_path / diff_path
+ if not without_deleted or absolute_path.exists():
+ result.add(str(absolute_path))
return sorted(result)
- def get_range_diff_paths(self, base: str, head: str, absolute: bool = False) -> list[str]:
+ def get_range_diff_paths(
+ self, base: str, head: str, absolute: bool = False, without_deleted: bool = False
+ ) -> list[str]:
return self._collect_paths_from_diffs(
- diff_iterable=self._iter_range_diffs(base=base, head=head, absolute=absolute)
+ diff_iterable=self._iter_range_diffs(base=base, head=head, absolute=absolute),
+ without_deleted=without_deleted,
)
- def get_list_diff_paths(self, commits: Collection[str], absolute: bool = False) -> list[str]:
- return self._collect_paths_from_diffs(diff_iterable=self._iter_list_diffs(commits=commits, absolute=absolute))
+ def get_list_diff_paths(
+ self, commits: Collection[str], absolute: bool = False, without_deleted: bool = False
+ ) -> list[str]:
+ return self._collect_paths_from_diffs(
+ diff_iterable=self._iter_list_diffs(commits=commits, absolute=absolute),
+ without_deleted=without_deleted,
+ )
def get_all_ancestor_commits(self, commit: str) -> set[str]:
result: set[str] = {commit}
diff --git a/terrarium/dl_gitmanager/dl_gitmanager/scripts/gitmanager_cli.py b/terrarium/dl_gitmanager/dl_gitmanager/scripts/gitmanager_cli.py
index f9e635b7e..8f16b6baa 100644
--- a/terrarium/dl_gitmanager/dl_gitmanager/scripts/gitmanager_cli.py
+++ b/terrarium/dl_gitmanager/dl_gitmanager/scripts/gitmanager_cli.py
@@ -49,6 +49,9 @@ def get_parser(cls) -> argparse.ArgumentParser:
range_diff_paths_parser.add_argument(
"--only-added-commits", action="store_true", help="Inspect only commits that are added in head"
)
+ range_diff_paths_parser.add_argument(
+ "--without-deleted-files", action="store_true", help="Omit deleted files in the resulting list"
+ )
subparsers.add_parser(
"list-diff-paths",
@@ -58,18 +61,26 @@ def get_parser(cls) -> argparse.ArgumentParser:
return parser
- def range_diff_paths(self, base: str, head: Optional[str], absolute: bool, only_added_commits: bool) -> None:
+ def range_diff_paths(
+ self, base: str, head: Optional[str], absolute: bool, only_added_commits: bool, without_deleted: bool = False
+ ) -> None:
diff_name_list: list[str]
if only_added_commits:
commits = self.git_manager.get_missing_commits(base=base, head=head)
- diff_name_list = self.git_manager.get_list_diff_paths(commits=commits, absolute=absolute)
+ diff_name_list = self.git_manager.get_list_diff_paths(
+ commits=commits, absolute=absolute, without_deleted=without_deleted
+ )
else:
- diff_name_list = self.git_manager.get_range_diff_paths(base=base, head=head, absolute=absolute)
+ diff_name_list = self.git_manager.get_range_diff_paths(
+ base=base, head=head, absolute=absolute, without_deleted=without_deleted
+ )
print("\n".join(diff_name_list))
- def list_diff_paths(self, absolute: bool) -> None:
+ def list_diff_paths(self, absolute: bool, without_deleted: bool = False) -> None:
commits = [line.strip() for line in self.input_text_io if line.strip()]
- diff_name_list = self.git_manager.get_list_diff_paths(commits=commits, absolute=absolute)
+ diff_name_list = self.git_manager.get_list_diff_paths(
+ commits=commits, absolute=absolute, without_deleted=without_deleted
+ )
print("\n".join(diff_name_list))
@classmethod
@@ -86,10 +97,14 @@ def run_parsed_args(cls, args: argparse.Namespace) -> None:
match args.command:
case "range-diff-paths":
tool.range_diff_paths(
- base=args.base, head=args.head, absolute=args.absolute, only_added_commits=args.only_added_commits
+ base=args.base,
+ head=args.head,
+ absolute=args.absolute,
+ only_added_commits=args.only_added_commits,
+ without_deleted=args.without_deleted_files,
)
case "list-diff-paths":
- tool.list_diff_paths(absolute=args.absolute)
+ tool.list_diff_paths(absolute=args.absolute, without_deleted=args.without_deleted_files)
case _:
raise RuntimeError(f"Got unknown command: {args.command}")