Browse Source
If a treewalk walks also over index and the workingtree then the IndexDiffFilter filter can be used which works much faster then the semantically equivalent ANY_DIFF filter. This is because this filter can better avoid computing SHA-1 ids over the content of working-tree files which is very costly. This fix will significantly improve the performance of e.g. EGit's commit dialog. Change-Id: I2a51816f4ed9df2900c6307a54cd09f50004266f Signed-off-by: Christian Halstrick <christian.halstrick@sap.com> Signed-off-by: Philipp Thun <philipp.thun@sap.com>stable-0.10
Christian Halstrick
14 years ago
4 changed files with 301 additions and 3 deletions
@ -0,0 +1,100 @@
|
||||
/* |
||||
* Copyright (C) 2010, Christian Halstrick <christian.halstrick@sap.com>, |
||||
* Copyright (C) 2010, Philipp Thun <philipp.thun@sap.com> |
||||
* and other copyright owners as documented in the project's IP log. |
||||
* |
||||
* This program and the accompanying materials are made available |
||||
* under the terms of the Eclipse Distribution License v1.0 which |
||||
* accompanies this distribution, is reproduced below, and is |
||||
* available at http://www.eclipse.org/org/documents/edl-v10.php
|
||||
* |
||||
* All rights reserved. |
||||
* |
||||
* Redistribution and use in source and binary forms, with or |
||||
* without modification, are permitted provided that the following |
||||
* conditions are met: |
||||
* |
||||
* - Redistributions of source code must retain the above copyright |
||||
* notice, this list of conditions and the following disclaimer. |
||||
* |
||||
* - Redistributions in binary form must reproduce the above |
||||
* copyright notice, this list of conditions and the following |
||||
* disclaimer in the documentation and/or other materials provided |
||||
* with the distribution. |
||||
* |
||||
* - Neither the name of the Eclipse Foundation, Inc. nor the |
||||
* names of its contributors may be used to endorse or promote |
||||
* products derived from this software without specific prior |
||||
* written permission. |
||||
* |
||||
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND |
||||
* CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, |
||||
* INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES |
||||
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
||||
* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR |
||||
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
||||
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT |
||||
* NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |
||||
* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER |
||||
* CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, |
||||
* STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) |
||||
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF |
||||
* ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
||||
*/ |
||||
package org.eclipse.jgit.treewalk.filter; |
||||
|
||||
import org.eclipse.jgit.api.Git; |
||||
import org.eclipse.jgit.dircache.DirCacheIterator; |
||||
import org.eclipse.jgit.lib.RepositoryTestCase; |
||||
import org.eclipse.jgit.revwalk.RevCommit; |
||||
import org.eclipse.jgit.treewalk.FileTreeIterator; |
||||
import org.eclipse.jgit.treewalk.TreeWalk; |
||||
|
||||
public class IndexDiffFilterTest extends RepositoryTestCase { |
||||
private RevCommit commit; |
||||
|
||||
public void setUp() throws Exception { |
||||
super.setUp(); |
||||
|
||||
Git git = new Git(db); |
||||
writeTrashFile("folder/file", "content"); |
||||
git.add().addFilepattern("folder/file").call(); |
||||
commit = git.commit().setMessage("commit").call(); |
||||
|
||||
deleteTrashFile("folder/file"); |
||||
deleteTrashFile("folder"); |
||||
writeTrashFile("folder", "content"); |
||||
} |
||||
|
||||
public void testRecursiveTreeWalk() throws Exception { |
||||
TreeWalk treeWalk = new TreeWalk(db); |
||||
treeWalk.setRecursive(true); |
||||
treeWalk.addTree(commit.getTree()); |
||||
treeWalk.addTree(new DirCacheIterator(db.readDirCache())); |
||||
treeWalk.addTree(new FileTreeIterator(db)); |
||||
treeWalk.setFilter(new IndexDiffFilter(1, 2)); |
||||
assertTrue(treeWalk.next()); |
||||
assertEquals("folder", treeWalk.getPathString()); |
||||
assertTrue(treeWalk.next()); |
||||
assertEquals("folder/file", treeWalk.getPathString()); |
||||
assertFalse(treeWalk.next()); |
||||
} |
||||
|
||||
public void testNonRecursiveTreeWalk() throws Exception { |
||||
TreeWalk treeWalk = new TreeWalk(db); |
||||
treeWalk.setRecursive(false); |
||||
treeWalk.addTree(commit.getTree()); |
||||
treeWalk.addTree(new DirCacheIterator(db.readDirCache())); |
||||
treeWalk.addTree(new FileTreeIterator(db)); |
||||
treeWalk.setFilter(new IndexDiffFilter(1, 2)); |
||||
assertTrue(treeWalk.next()); |
||||
assertEquals("folder", treeWalk.getPathString()); |
||||
assertTrue(treeWalk.next()); |
||||
assertEquals("folder", treeWalk.getPathString()); |
||||
assertTrue(treeWalk.isSubtree()); |
||||
treeWalk.enterSubtree(); |
||||
assertTrue(treeWalk.next()); |
||||
assertEquals("folder/file", treeWalk.getPathString()); |
||||
assertFalse(treeWalk.next()); |
||||
} |
||||
} |
@ -0,0 +1,194 @@
|
||||
/* |
||||
* Copyright (C) 2010, Christian Halstrick <christian.halstrick@sap.com> |
||||
* and other copyright owners as documented in the project's IP log. |
||||
* |
||||
* This program and the accompanying materials are made available |
||||
* under the terms of the Eclipse Distribution License v1.0 which |
||||
* accompanies this distribution, is reproduced below, and is |
||||
* available at http://www.eclipse.org/org/documents/edl-v10.php
|
||||
* |
||||
* All rights reserved. |
||||
* |
||||
* Redistribution and use in source and binary forms, with or |
||||
* without modification, are permitted provided that the following |
||||
* conditions are met: |
||||
* |
||||
* - Redistributions of source code must retain the above copyright |
||||
* notice, this list of conditions and the following disclaimer. |
||||
* |
||||
* - Redistributions in binary form must reproduce the above |
||||
* copyright notice, this list of conditions and the following |
||||
* disclaimer in the documentation and/or other materials provided |
||||
* with the distribution. |
||||
* |
||||
* - Neither the name of the Eclipse Foundation, Inc. nor the |
||||
* names of its contributors may be used to endorse or promote |
||||
* products derived from this software without specific prior |
||||
* written permission. |
||||
* |
||||
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND |
||||
* CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, |
||||
* INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES |
||||
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
||||
* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR |
||||
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
||||
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT |
||||
* NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |
||||
* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER |
||||
* CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, |
||||
* STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) |
||||
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF |
||||
* ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
||||
*/ |
||||
package org.eclipse.jgit.treewalk.filter; |
||||
|
||||
import java.io.IOException; |
||||
|
||||
import org.eclipse.jgit.dircache.DirCacheIterator; |
||||
import org.eclipse.jgit.errors.IncorrectObjectTypeException; |
||||
import org.eclipse.jgit.errors.MissingObjectException; |
||||
import org.eclipse.jgit.treewalk.TreeWalk; |
||||
import org.eclipse.jgit.treewalk.WorkingTreeIterator; |
||||
|
||||
/** |
||||
* A performance optimized variant of {@link TreeFilter#ANY_DIFF} which should |
||||
* be used when among the walked trees there is a {@link DirCacheIterator} and a |
||||
* {@link WorkingTreeIterator}. Please see the documentation of |
||||
* {@link TreeFilter#ANY_DIFF} for a basic description of the semantics. |
||||
* <p> |
||||
* This filter tries to avoid computing content ids of the files in the |
||||
* working-tree. In contrast to {@link TreeFilter#ANY_DIFF} this filter takes |
||||
* care to first compare the entry from the {@link DirCacheIterator} with the |
||||
* entries from all other iterators besides the {@link WorkingTreeIterator}. |
||||
* Since all those entries have fast access to content ids that is very fast. If |
||||
* a difference is detected in this step this filter decides to include that |
||||
* path before even looking at the working-tree entry. |
||||
* <p> |
||||
* If no difference is found then we have to compare index and working-tree as |
||||
* the last step. By making use of |
||||
* {@link WorkingTreeIterator#isModified(org.eclipse.jgit.dircache.DirCacheEntry, boolean)} |
||||
* we can avoid the computation of the content id if the file is not dirty. |
||||
* <p> |
||||
* Instances of this filter should not be used for multiple {@link TreeWalk}s. |
||||
* Always construct a new instance of this filter for each TreeWalk. |
||||
*/ |
||||
public class IndexDiffFilter extends TreeFilter { |
||||
private final int dirCache; |
||||
|
||||
private final int workingTree; |
||||
|
||||
private final boolean honorIgnores; |
||||
|
||||
/** |
||||
* Creates a new instance of this filter. Do not use an instance of this |
||||
* filter in multiple treewalks. |
||||
* |
||||
* @param dirCacheIndex |
||||
* the index of the {@link DirCacheIterator} in the associated |
||||
* treewalk |
||||
* @param workingTreeIndex |
||||
* the index of the {@link WorkingTreeIterator} in the associated |
||||
* treewalk |
||||
*/ |
||||
public IndexDiffFilter(int dirCacheIndex, int workingTreeIndex) { |
||||
this(dirCacheIndex, workingTreeIndex, true /* honor ignores */); |
||||
} |
||||
|
||||
/** |
||||
* Creates a new instance of this filter. Do not use an instance of this |
||||
* filter in multiple treewalks. |
||||
* |
||||
* @param dirCacheIndex |
||||
* the index of the {@link DirCacheIterator} in the associated |
||||
* treewalk |
||||
* @param workingTreeIndex |
||||
* the index of the {@link WorkingTreeIterator} in the associated |
||||
* treewalk |
||||
* @param honorIgnores |
||||
* true if the filter should skip working tree files that are |
||||
* declared as ignored by the standard exclude mechanisms.. |
||||
*/ |
||||
public IndexDiffFilter(int dirCacheIndex, int workingTreeIndex, |
||||
boolean honorIgnores) { |
||||
this.dirCache = dirCacheIndex; |
||||
this.workingTree = workingTreeIndex; |
||||
this.honorIgnores = honorIgnores; |
||||
} |
||||
|
||||
@Override |
||||
public boolean include(TreeWalk tw) throws MissingObjectException, |
||||
IncorrectObjectTypeException, IOException { |
||||
// If the working tree file doesn't exist, it does exist for at least
|
||||
// one other so include this difference.
|
||||
final int wm = tw.getRawMode(workingTree); |
||||
if (wm == 0) |
||||
return true; |
||||
|
||||
// If the path does not appear in the DirCache and its ignored
|
||||
// we can avoid returning a result here, but only if its not in any
|
||||
// other tree.
|
||||
final int cnt = tw.getTreeCount(); |
||||
final int dm = tw.getRawMode(dirCache); |
||||
if (dm == 0) { |
||||
if (honorIgnores && workingTree(tw).isEntryIgnored()) { |
||||
int i = 0; |
||||
for (; i < cnt; i++) { |
||||
if (i == dirCache || i == workingTree) |
||||
continue; |
||||
if (tw.getRawMode(i) != 0) |
||||
break; |
||||
} |
||||
|
||||
// If i is cnt then the path does not appear in any other tree,
|
||||
// and this working tree entry can be safely ignored.
|
||||
return i == cnt ? false : true; |
||||
} else { |
||||
// In working tree and not ignored, and not in DirCache.
|
||||
return true; |
||||
} |
||||
} |
||||
|
||||
// Always include subtrees as WorkingTreeIterator cannot provide
|
||||
// efficient elimination of unmodified subtrees.
|
||||
if (tw.isSubtree()) |
||||
return true; |
||||
|
||||
// Try the inexpensive comparisons between index and all real trees
|
||||
// first. Only if we don't find a diff here we have to bother with
|
||||
// the working tree
|
||||
for (int i = 0; i < cnt; i++) { |
||||
if (i == dirCache || i == workingTree) |
||||
continue; |
||||
if (tw.getRawMode(i) != dm || !tw.idEqual(i, dirCache)) |
||||
return true; |
||||
} |
||||
|
||||
// Only one chance left to detect a diff: between index and working
|
||||
// tree. Make use of the WorkingTreeIterator#isModified() method to
|
||||
// avoid computing SHA1 on filesystem content if not really needed.
|
||||
WorkingTreeIterator wi = workingTree(tw); |
||||
DirCacheIterator di = tw.getTree(dirCache, DirCacheIterator.class); |
||||
return wi.isModified(di.getDirCacheEntry(), true); |
||||
} |
||||
|
||||
private WorkingTreeIterator workingTree(TreeWalk tw) { |
||||
return tw.getTree(workingTree, WorkingTreeIterator.class); |
||||
} |
||||
|
||||
@Override |
||||
public boolean shouldBeRecursive() { |
||||
// We cannot compare subtrees in the working tree, so encourage
|
||||
// use of recursive walks where the subtrees are always dived into.
|
||||
return true; |
||||
} |
||||
|
||||
@Override |
||||
public TreeFilter clone() { |
||||
return this; |
||||
} |
||||
|
||||
@Override |
||||
public String toString() { |
||||
return "INDEX_DIFF_FILTER"; |
||||
} |
||||
} |
Loading…
Reference in new issue