Mercurial > jhg
comparison src/org/tmatesoft/hg/repo/HgBlameFacility.java @ 596:43cfa08ff3fd
HgBlameFacility refactoring: extract code to build file history that spans renames
| author | Artem Tikhomirov <tikhomirov.artem@gmail.com> | 
|---|---|
| date | Thu, 02 May 2013 19:23:53 +0200 | 
| parents | e49f9d9513fa | 
| children | 
   comparison
  equal
  deleted
  inserted
  replaced
| 595:92c3ad9c2a51 | 596:43cfa08ff3fd | 
|---|---|
| 14 * the terms of a license other than GNU General Public License | 14 * the terms of a license other than GNU General Public License | 
| 15 * contact TMate Software at support@hg4j.com | 15 * contact TMate Software at support@hg4j.com | 
| 16 */ | 16 */ | 
| 17 package org.tmatesoft.hg.repo; | 17 package org.tmatesoft.hg.repo; | 
| 18 | 18 | 
| 19 import static org.tmatesoft.hg.core.HgIterateDirection.NewToOld; | |
| 20 import static org.tmatesoft.hg.core.HgIterateDirection.OldToNew; | 19 import static org.tmatesoft.hg.core.HgIterateDirection.OldToNew; | 
| 21 import static org.tmatesoft.hg.repo.HgInternals.wrongRevisionIndex; | 20 import static org.tmatesoft.hg.repo.HgInternals.wrongRevisionIndex; | 
| 22 import static org.tmatesoft.hg.repo.HgRepository.*; | 21 import static org.tmatesoft.hg.repo.HgRepository.NO_REVISION; | 
| 23 | 22 import static org.tmatesoft.hg.repo.HgRepository.TIP; | 
| 24 import java.util.Arrays; | |
| 25 import java.util.BitSet; | |
| 26 import java.util.Collections; | |
| 27 import java.util.LinkedList; | |
| 28 | 23 | 
| 29 import org.tmatesoft.hg.core.HgCallbackTargetException; | 24 import org.tmatesoft.hg.core.HgCallbackTargetException; | 
| 30 import org.tmatesoft.hg.core.HgIterateDirection; | 25 import org.tmatesoft.hg.core.HgIterateDirection; | 
| 31 import org.tmatesoft.hg.core.Nodeid; | 26 import org.tmatesoft.hg.core.Nodeid; | 
| 32 import org.tmatesoft.hg.internal.BlameHelper; | 27 import org.tmatesoft.hg.internal.BlameHelper; | 
| 33 import org.tmatesoft.hg.internal.Callback; | 28 import org.tmatesoft.hg.internal.Callback; | 
| 34 import org.tmatesoft.hg.internal.Experimental; | 29 import org.tmatesoft.hg.internal.Experimental; | 
| 35 import org.tmatesoft.hg.internal.IntVector; | 30 import org.tmatesoft.hg.internal.FileHistory; | 
| 31 import org.tmatesoft.hg.internal.FileRevisionHistoryChunk; | |
| 36 import org.tmatesoft.hg.util.Adaptable; | 32 import org.tmatesoft.hg.util.Adaptable; | 
| 37 | 33 | 
| 38 /** | 34 /** | 
| 39 * Facility with diff/annotate functionality. | 35 * Facility with diff/annotate functionality. | 
| 40 * | 36 * | 
| 87 } | 83 } | 
| 88 HgInternals.checkRevlogRange(changelogRevIndexStart, changelogRevIndexEnd, lastRevision); | 84 HgInternals.checkRevlogRange(changelogRevIndexStart, changelogRevIndexEnd, lastRevision); | 
| 89 if (!df.exists()) { | 85 if (!df.exists()) { | 
| 90 return; | 86 return; | 
| 91 } | 87 } | 
| 88 FileHistory fileHistory = new FileHistory(df, changelogRevIndexStart, changelogRevIndexEnd); | |
| 89 fileHistory.build(); | |
| 92 BlameHelper bh = new BlameHelper(insp, 10); | 90 BlameHelper bh = new BlameHelper(insp, 10); | 
| 93 HgDataFile currentFile = df; | 91 for (FileRevisionHistoryChunk fhc : fileHistory.iterate(OldToNew)) { | 
| 94 int fileLastClogRevIndex = changelogRevIndexEnd; | 92 // iteration order is not important here | 
| 95 FileRevisionHistoryChunk nextChunk = null; | 93 bh.useFileUpTo(fhc.getFile(), fhc.getEndChangeset()); | 
| 96 LinkedList<FileRevisionHistoryChunk> fileCompleteHistory = new LinkedList<FileRevisionHistoryChunk>(); | 94 } | 
| 97 do { | |
| 98 FileRevisionHistoryChunk fileHistory = new FileRevisionHistoryChunk(currentFile); | |
| 99 fileHistory.init(fileLastClogRevIndex); | |
| 100 fileHistory.linkTo(nextChunk); | |
| 101 fileCompleteHistory.addFirst(fileHistory); // to get the list in old-to-new order | |
| 102 nextChunk = fileHistory; | |
| 103 bh.useFileUpTo(currentFile, fileLastClogRevIndex); | |
| 104 if (fileHistory.changeset(0) > changelogRevIndexStart && currentFile.isCopy()) { | |
| 105 // fileHistory.changeset(0) is the earliest revision we know about so far, | |
| 106 // once we get to revisions earlier than the requested start, stop digging. | |
| 107 // The reason there's NO == (i.e. not >=) because: | |
| 108 // (easy): once it's equal, we've reached our intended start | |
| 109 // (hard): if changelogRevIndexStart happens to be exact start of one of renames in the | |
| 110 // chain of renames (test-annotate2 repository, file1->file1a->file1b, i.e. points | |
| 111 // to the very start of file1a or file1 history), presence of == would get us to the next | |
| 112 // chunk and hence changed parents of present chunk's first element. Our annotate alg | |
| 113 // relies on parents only (i.e. knows nothing about 'last iteration element') to find out | |
| 114 // what to compare, and hence won't report all lines of 'last iteration element' (which is the | |
| 115 // first revision of the renamed file) as "added in this revision", leaving gaps in annotate | |
| 116 HgRepository repo = currentFile.getRepo(); | |
| 117 Nodeid originLastRev = currentFile.getCopySourceRevision(); | |
| 118 currentFile = repo.getFileNode(currentFile.getCopySourceName()); | |
| 119 fileLastClogRevIndex = currentFile.getChangesetRevisionIndex(currentFile.getRevisionIndex(originLastRev)); | |
| 120 // XXX perhaps, shall fail with meaningful exception if new file doesn't exist (.i/.d not found for whatever reason) | |
| 121 // or source revision is missing? | |
| 122 } else { | |
| 123 fileHistory.chopAtChangeset(changelogRevIndexStart); | |
| 124 currentFile = null; // stop iterating | |
| 125 } | |
| 126 } while (currentFile != null && fileLastClogRevIndex > changelogRevIndexStart); | |
| 127 // fileCompleteHistory is in (origin, intermediate target, ultimate target) order | |
| 128 | |
| 129 int[] fileClogParentRevs = new int[2]; | 95 int[] fileClogParentRevs = new int[2]; | 
| 130 int[] fileParentRevs = new int[2]; | 96 int[] fileParentRevs = new int[2]; | 
| 131 if (iterateOrder == NewToOld) { | 97 for (FileRevisionHistoryChunk fhc : fileHistory.iterate(iterateOrder)) { | 
| 132 Collections.reverse(fileCompleteHistory); | 98 for (int fri : fhc.fileRevisions(iterateOrder)) { | 
| 133 } | 99 int clogRevIndex = fhc.changeset(fri); | 
| 134 boolean shallFilterStart = changelogRevIndexStart != 0; // no reason if complete history is walked | 100 // the way we built fileHistory ensures we won't walk past [changelogRevIndexStart..changelogRevIndexEnd] | 
| 135 for (FileRevisionHistoryChunk fileHistory : fileCompleteHistory) { | 101 assert clogRevIndex >= changelogRevIndexStart; | 
| 136 for (int fri : fileHistory.fileRevisions(iterateOrder)) { | 102 assert clogRevIndex <= changelogRevIndexEnd; | 
| 137 int clogRevIndex = fileHistory.changeset(fri); | 103 fhc.fillFileParents(fri, fileParentRevs); | 
| 138 if (shallFilterStart) { | 104 fhc.fillCsetParents(fri, fileClogParentRevs); | 
| 139 if (iterateOrder == NewToOld) { | |
| 140 // clogRevIndex decreases | |
| 141 if (clogRevIndex < changelogRevIndexStart) { | |
| 142 break; | |
| 143 } | |
| 144 // fall-through, clogRevIndex is in the [start..end] range | |
| 145 } else { // old to new | |
| 146 // the way we built fileHistory ensures we won't walk past changelogRevIndexEnd | |
| 147 // here we ensure we start from the right one, the one indicated with changelogRevIndexStart | |
| 148 if (clogRevIndex < changelogRevIndexStart) { | |
| 149 continue; | |
| 150 } else { | |
| 151 shallFilterStart = false; // once boundary is crossed, no need to check | |
| 152 // fall-through | |
| 153 } | |
| 154 } | |
| 155 } | |
| 156 fileHistory.fillFileParents(fri, fileParentRevs); | |
| 157 fileHistory.fillCsetParents(fri, fileClogParentRevs); | |
| 158 bh.annotateChange(fri, clogRevIndex, fileParentRevs, fileClogParentRevs); | 105 bh.annotateChange(fri, clogRevIndex, fileParentRevs, fileClogParentRevs); | 
| 159 } | 106 } | 
| 160 } | 107 } | 
| 161 } | 108 } | 
| 162 | 109 | 
| 193 public interface Inspector { | 140 public interface Inspector { | 
| 194 void same(EqualBlock block) throws HgCallbackTargetException; | 141 void same(EqualBlock block) throws HgCallbackTargetException; | 
| 195 void added(AddBlock block) throws HgCallbackTargetException; | 142 void added(AddBlock block) throws HgCallbackTargetException; | 
| 196 void changed(ChangeBlock block) throws HgCallbackTargetException; | 143 void changed(ChangeBlock block) throws HgCallbackTargetException; | 
| 197 void deleted(DeleteBlock block) throws HgCallbackTargetException; | 144 void deleted(DeleteBlock block) throws HgCallbackTargetException; | 
| 198 } | |
| 199 | |
| 200 /** | |
| 201 * No need to keep "Block" prefix as long as there's only one {@link Inspector} | |
| 202 */ | |
| 203 @Deprecated | |
| 204 public interface BlockInspector extends Inspector { | |
| 205 } | 145 } | 
| 206 | 146 | 
| 207 /** | 147 /** | 
| 208 * Represents content of a block, either as a sequence of bytes or a | 148 * Represents content of a block, either as a sequence of bytes or a | 
| 209 * sequence of smaller blocks (lines), if appropriate (according to usage context). | 149 * sequence of smaller blocks (lines), if appropriate (according to usage context). | 
| 351 | 291 | 
| 352 private static int fileRevIndex(HgDataFile df, int csetRevIndex) { | 292 private static int fileRevIndex(HgDataFile df, int csetRevIndex) { | 
| 353 Nodeid fileRev = df.getRepo().getManifest().getFileRevision(csetRevIndex, df.getPath()); | 293 Nodeid fileRev = df.getRepo().getManifest().getFileRevision(csetRevIndex, df.getPath()); | 
| 354 return df.getRevisionIndex(fileRev); | 294 return df.getRevisionIndex(fileRev); | 
| 355 } | 295 } | 
| 356 | |
| 357 private static class FileRevisionHistoryChunk { | |
| 358 private final HgDataFile df; | |
| 359 // change ancestry, sequence of file revisions | |
| 360 private IntVector fileRevsToVisit; | |
| 361 // parent pairs of complete file history | |
| 362 private IntVector fileParentRevs; | |
| 363 // map file revision to changelog revision (sparse array, only file revisions to visit are set) | |
| 364 private int[] file2changelog; | |
| 365 private int originChangelogRev = BAD_REVISION, originFileRev = BAD_REVISION; | |
| 366 | |
| 367 public FileRevisionHistoryChunk(HgDataFile file) { | |
| 368 df = file; | |
| 369 } | |
| 370 | |
| 371 public void init(int changelogRevisionIndex) { | |
| 372 // XXX df.indexWalk(0, fileRevIndex, ) might be more effective | |
| 373 int fileRevIndex = fileRevIndex(df, changelogRevisionIndex); | |
| 374 int[] fileRevParents = new int[2]; | |
| 375 fileParentRevs = new IntVector((fileRevIndex+1) * 2, 0); | |
| 376 fileParentRevs.add(NO_REVISION, NO_REVISION); // parents of fileRevIndex == 0 | |
| 377 for (int i = 1; i <= fileRevIndex; i++) { | |
| 378 df.parents(i, fileRevParents, null, null); | |
| 379 fileParentRevs.add(fileRevParents[0], fileRevParents[1]); | |
| 380 } | |
| 381 // fileRevsToVisit keep file change ancestry from new to old | |
| 382 fileRevsToVisit = new IntVector(fileRevIndex + 1, 0); | |
| 383 // keep map of file revision to changelog revision | |
| 384 file2changelog = new int[fileRevIndex+1]; | |
| 385 // only elements worth visit would get mapped, so there would be unfilled areas in the file2changelog, | |
| 386 // prevent from error (make it explicit) by bad value | |
| 387 Arrays.fill(file2changelog, BAD_REVISION); | |
| 388 LinkedList<Integer> queue = new LinkedList<Integer>(); | |
| 389 BitSet seen = new BitSet(fileRevIndex + 1); | |
| 390 queue.add(fileRevIndex); | |
| 391 do { | |
| 392 int x = queue.removeFirst(); | |
| 393 if (seen.get(x)) { | |
| 394 continue; | |
| 395 } | |
| 396 seen.set(x); | |
| 397 fileRevsToVisit.add(x); | |
| 398 file2changelog[x] = df.getChangesetRevisionIndex(x); | |
| 399 int p1 = fileParentRevs.get(2*x); | |
| 400 int p2 = fileParentRevs.get(2*x + 1); | |
| 401 if (p1 != NO_REVISION) { | |
| 402 queue.addLast(p1); | |
| 403 } | |
| 404 if (p2 != NO_REVISION) { | |
| 405 queue.addLast(p2); | |
| 406 } | |
| 407 } while (!queue.isEmpty()); | |
| 408 // make sure no child is processed before we handled all (grand-)parents of the element | |
| 409 fileRevsToVisit.sort(false); | |
| 410 } | |
| 411 | |
| 412 public void linkTo(FileRevisionHistoryChunk target) { | |
| 413 // assume that target.init() has been called already | |
| 414 if (target == null) { | |
| 415 return; | |
| 416 } | |
| 417 target.originFileRev = fileRevsToVisit.get(0); // files to visit are new to old | |
| 418 target.originChangelogRev = changeset(target.originFileRev); | |
| 419 } | |
| 420 | |
| 421 /** | |
| 422 * Mark revision closest(ceil) to specified as the very first one (no parents) | |
| 423 */ | |
| 424 public void chopAtChangeset(int firstChangelogRevOfInterest) { | |
| 425 if (firstChangelogRevOfInterest == 0) { | |
| 426 return; // nothing to do | |
| 427 } | |
| 428 int i = 0, x = fileRevsToVisit.size(), fileRev = BAD_REVISION; | |
| 429 // fileRevsToVisit is new to old, greater numbers to smaller | |
| 430 while (i < x && changeset(fileRev = fileRevsToVisit.get(i)) >= firstChangelogRevOfInterest) { | |
| 431 i++; | |
| 432 } | |
| 433 assert fileRev != BAD_REVISION; // there's at least 1 revision in fileRevsToVisit | |
| 434 if (i == x && changeset(fileRev) != firstChangelogRevOfInterest) { | |
| 435 assert false : "Requested changeset shall belong to the chunk"; | |
| 436 return; | |
| 437 } | |
| 438 fileRevsToVisit.trimTo(i); // no need to iterate more | |
| 439 // pretend fileRev got no parents | |
| 440 fileParentRevs.set(fileRev * 2, NO_REVISION); | |
| 441 fileParentRevs.set(fileRev, NO_REVISION); | |
| 442 } | |
| 443 | |
| 444 public int[] fileRevisions(HgIterateDirection iterateOrder) { | |
| 445 // fileRevsToVisit is { r10, r7, r6, r5, r0 }, new to old | |
| 446 int[] rv = fileRevsToVisit.toArray(); | |
| 447 if (iterateOrder == OldToNew) { | |
| 448 // reverse return value | |
| 449 for (int a = 0, b = rv.length-1; a < b; a++, b--) { | |
| 450 int t = rv[b]; | |
| 451 rv[b] = rv[a]; | |
| 452 rv[a] = t; | |
| 453 } | |
| 454 } | |
| 455 return rv; | |
| 456 } | |
| 457 | |
| 458 public int changeset(int fileRevIndex) { | |
| 459 return file2changelog[fileRevIndex]; | |
| 460 } | |
| 461 | |
| 462 public void fillFileParents(int fileRevIndex, int[] fileParents) { | |
| 463 if (fileRevIndex == 0 && originFileRev != BAD_REVISION) { | |
| 464 // this chunk continues another file | |
| 465 assert originFileRev != NO_REVISION; | |
| 466 fileParents[0] = originFileRev; | |
| 467 fileParents[1] = NO_REVISION; | |
| 468 return; | |
| 469 } | |
| 470 fileParents[0] = fileParentRevs.get(fileRevIndex * 2); | |
| 471 fileParents[1] = fileParentRevs.get(fileRevIndex * 2 + 1); | |
| 472 } | |
| 473 | |
| 474 public void fillCsetParents(int fileRevIndex, int[] csetParents) { | |
| 475 if (fileRevIndex == 0 && originFileRev != BAD_REVISION) { | |
| 476 assert originFileRev != NO_REVISION; | |
| 477 csetParents[0] = originChangelogRev; | |
| 478 csetParents[1] = NO_REVISION; // I wonder if possible to start a copy with two parents? | |
| 479 return; | |
| 480 } | |
| 481 int fp1 = fileParentRevs.get(fileRevIndex * 2); | |
| 482 int fp2 = fileParentRevs.get(fileRevIndex * 2 + 1); | |
| 483 csetParents[0] = fp1 == NO_REVISION ? NO_REVISION : changeset(fp1); | |
| 484 csetParents[1] = fp2 == NO_REVISION ? NO_REVISION : changeset(fp2); | |
| 485 } | |
| 486 } | |
| 487 } | 296 } | 
