From c24d8f36a30478807a65b9f56969d5aac593f3b7 Mon Sep 17 00:00:00 2001 From: "http://joeyh.name/" Date: Wed, 28 Nov 2012 18:16:10 +0000 Subject: Added a comment --- .../comment_1_93a86cb03b66e7ab5dd7146e7b86c9e8._comment | 15 +++++++++++++++ 1 file changed, 15 insertions(+) create mode 100644 doc/forum/benefit_of_splitting_a_repository/comment_1_93a86cb03b66e7ab5dd7146e7b86c9e8._comment diff --git a/doc/forum/benefit_of_splitting_a_repository/comment_1_93a86cb03b66e7ab5dd7146e7b86c9e8._comment b/doc/forum/benefit_of_splitting_a_repository/comment_1_93a86cb03b66e7ab5dd7146e7b86c9e8._comment new file mode 100644 index 000000000..72ea4f29b --- /dev/null +++ b/doc/forum/benefit_of_splitting_a_repository/comment_1_93a86cb03b66e7ab5dd7146e7b86c9e8._comment @@ -0,0 +1,15 @@ +[[!comment format=mdwn + username="http://joeyh.name/" + ip="4.154.6.49" + subject="comment 1" + date="2012-11-28T18:16:10Z" + content=""" +`git-annex unused` needs to scan the entire repository. But it uses a bloom filter, so its complexity is O(n) in the number of keys. + +`git annex fsck` scans the entire repository and also reads all available file content. But we have incremental fsck support now. + +The rest of git-annex is designed to have good locality. + +The main problem you are likely to run into is inefficiencies with git's index file. This file records the status of every file in the repository, and commands like `git add` rewrite the whole file. git-annex uses a journal to minimise operations that need to rewrite the git index file, but this won't help you when you're using raw git commands in the repository. + +"""]] -- cgit v1.2.3