org.spearce.jgit/src/org/spearce/jgit/treewalk/WorkingTreeIterator.java

   1 /*
   2  * Copyright (C) 2008, Shawn O. Pearce <spearce@spearce.org>
   3  *
   4  * All rights reserved.
   5  *
   6  * Redistribution and use in source and binary forms, with or
   7  * without modification, are permitted provided that the following
   8  * conditions are met:
   9  *
  10  * - Redistributions of source code must retain the above copyright
  11  *   notice, this list of conditions and the following disclaimer.
  12  *
  13  * - Redistributions in binary form must reproduce the above
  14  *   copyright notice, this list of conditions and the following
  15  *   disclaimer in the documentation and/or other materials provided
  16  *   with the distribution.
  17  *
  18  * - Neither the name of the Git Development Community nor the
  19  *   names of its contributors may be used to endorse or promote
  20  *   products derived from this software without specific prior
  21  *   written permission.
  22  *
  23  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
  24  * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
  25  * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  26  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  27  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
  28  * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  29  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  30  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  31  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  32  * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
  33  * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  34  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
  35  * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  36  */
  37
  38 package org.spearce.jgit.treewalk;
  39
  40 import java.io.IOException;
  41 import java.io.InputStream;
  42 import java.nio.ByteBuffer;
  43 import java.nio.CharBuffer;
  44 import java.nio.charset.CharacterCodingException;
  45 import java.nio.charset.CharsetEncoder;
  46 import java.security.MessageDigest;
  47 import java.util.Arrays;
  48 import java.util.Comparator;
  49
  50 import org.spearce.jgit.errors.CorruptObjectException;
  51 import org.spearce.jgit.lib.Constants;
  52 import org.spearce.jgit.lib.FileMode;
  53
  54 /**
  55  * Walks a working directory tree as part of a {@link TreeWalk}.
  56  * <p>
  57  * Most applications will want to use the standard implementation of this
  58  * iterator, {@link FileTreeIterator}, as that does all IO through the standard
  59  * <code>java.io</code> package. Plugins for a Java based IDE may however wish
  60  * to create their own implementations of this class to allow traversal of the
  61  * IDE's project space, as well as benefit from any caching the IDE may have.
  62  *
  63  * @see FileTreeIterator
  64  */
  65 public abstract class WorkingTreeIterator extends AbstractTreeIterator {
  66         /** An empty entry array, suitable for {@link #init(Entry[])}. */
  67         protected static final Entry[] EOF = {};
  68
  69         /** Size we perform file IO in if we have to read and hash a file. */
  70         private static final int BUFFER_SIZE = 2048;
  71
  72         /** The {@link #idBuffer()} for the current entry. */
  73         private byte[] contentId;
  74
  75         /** Index within {@link #entries} that {@link #contentId} came from. */
  76         private int contentIdFromPtr;
  77
  78         /** Buffer used to perform {@link #contentId} computations. */
  79         private byte[] contentReadBuffer;
  80
  81         /** Digest computer for {@link #contentId} computations. */
  82         private MessageDigest contentDigest;
  83
  84         /** File name character encoder. */
  85         private final CharsetEncoder nameEncoder;
  86
  87         /** List of entries obtained from the subclass. */
  88         private Entry[] entries;
  89
  90         /** Total number of entries in {@link #entries} that are valid. */
  91         private int entryCnt;
  92
  93         /** Current position within {@link #entries}. */
  94         private int ptr;
  95
  96         /** Create a new iterator with no parent. */
  97         protected WorkingTreeIterator() {
  98                 super();
  99                 nameEncoder = Constants.CHARSET.newEncoder();
 100         }
 101
 102         /**
 103          * Create a new iterator with no parent and a prefix.
 104          * <p>
 105          * The prefix path supplied is inserted in front of all paths generated by
 106          * this iterator. It is intended to be used when an iterator is being
 107          * created for a subsection of an overall repository and needs to be
 108          * combined with other iterators that are created to run over the entire
 109          * repository namespace.
 110          *
 111          * @param prefix
 112          *            position of this iterator in the repository tree. The value
 113          *            may be null or the empty string to indicate the prefix is the
 114          *            root of the repository. A trailing slash ('/') is
 115          *            automatically appended if the prefix does not end in '/'.
 116          */
 117         protected WorkingTreeIterator(final String prefix) {
 118                 super(prefix);
 119                 nameEncoder = Constants.CHARSET.newEncoder();
 120         }
 121
 122         /**
 123          * Create an iterator for a subtree of an existing iterator.
 124          *
 125          * @param p
 126          *            parent tree iterator.
 127          */
 128         protected WorkingTreeIterator(final WorkingTreeIterator p) {
 129                 super(p);
 130                 nameEncoder = p.nameEncoder;
 131         }
 132
 133         @Override
 134         public byte[] idBuffer() {
 135                 if (contentIdFromPtr == ptr)
 136                         return contentId;
 137                 switch (mode & 0170000) {
 138                 case 0100000: /* normal files */
 139                         contentIdFromPtr = ptr;
 140                         return contentId = idBufferBlob(entries[ptr]);
 141                 case 0120000: /* symbolic links */
 142                         // Java does not support symbolic links, so we should not
 143                         // have reached this particular part of the walk code.
 144                         //
 145                         return zeroid;
 146                 case 0160000: /* gitlink */
 147                         // TODO: Support obtaining current HEAD SHA-1 from nested repository
 148                         //
 149                         return zeroid;
 150                 }
 151                 return zeroid;
 152         }
 153
 154         private void initializeDigest() {
 155                 if (contentDigest != null)
 156                         return;
 157
 158                 if (parent == null) {
 159                         contentReadBuffer = new byte[BUFFER_SIZE];
 160                         contentDigest = Constants.newMessageDigest();
 161                 } else {
 162                         final WorkingTreeIterator p = (WorkingTreeIterator) parent;
 163                         p.initializeDigest();
 164                         contentReadBuffer = p.contentReadBuffer;
 165                         contentDigest = p.contentDigest;
 166                 }
 167         }
 168
 169         private static final byte[] digits = { '0', '1', '2', '3', '4', '5', '6',
 170                         '7', '8', '9' };
 171
 172         private static final byte[] hblob = Constants
 173                         .encodedTypeString(Constants.OBJ_BLOB);
 174
 175         private byte[] idBufferBlob(final Entry e) {
 176                 try {
 177                         final InputStream is = e.openInputStream();
 178                         if (is == null)
 179                                 return zeroid;
 180                         try {
 181                                 initializeDigest();
 182
 183                                 contentDigest.reset();
 184                                 contentDigest.update(hblob);
 185                                 contentDigest.update((byte) ' ');
 186
 187                                 final long blobLength = e.getLength();
 188                                 long sz = blobLength;
 189                                 if (sz == 0) {
 190                                         contentDigest.update((byte) '0');
 191                                 } else {
 192                                         final int bufn = contentReadBuffer.length;
 193                                         int p = bufn;
 194                                         do {
 195                                                 contentReadBuffer[--p] = digits[(int) (sz % 10)];
 196                                                 sz /= 10;
 197                                         } while (sz > 0);
 198                                         contentDigest.update(contentReadBuffer, p, bufn - p);
 199                                 }
 200                                 contentDigest.update((byte) 0);
 201
 202                                 for (;;) {
 203                                         final int r = is.read(contentReadBuffer);
 204                                         if (r <= 0)
 205                                                 break;
 206                                         contentDigest.update(contentReadBuffer, 0, r);
 207                                         sz += r;
 208                                 }
 209                                 if (sz != blobLength)
 210                                         return zeroid;
 211                                 return contentDigest.digest();
 212                         } finally {
 213                                 try {
 214                                         is.close();
 215                                 } catch (IOException err2) {
 216                                         // Suppress any error related to closing an input
 217                                         // stream. We don't care, we should not have any
 218                                         // outstanding data to flush or anything like that.
 219                                 }
 220                         }
 221                 } catch (IOException err) {
 222                         // Can't read the file? Don't report the failure either.
 223                         //
 224                         return zeroid;
 225                 }
 226         }
 227
 228         @Override
 229         public int idOffset() {
 230                 return 0;
 231         }
 232
 233         @Override
 234         public boolean eof() {
 235                 return ptr == entryCnt;
 236         }
 237
 238         @Override
 239         public void next(final int delta) throws CorruptObjectException {
 240                 ptr += delta;
 241                 if (!eof())
 242                         parseEntry();
 243         }
 244
 245         @Override
 246         public void back(final int delta) throws CorruptObjectException {
 247                 ptr -= delta;
 248                 parseEntry();
 249         }
 250
 251         private void parseEntry() {
 252                 final Entry e = entries[ptr];
 253                 mode = e.getMode().getBits();
 254
 255                 final int nameLen = e.encodedNameLen;
 256                 while (pathOffset + nameLen > path.length)
 257                         growPath(pathOffset);
 258                 System.arraycopy(e.encodedName, 0, path, pathOffset, nameLen);
 259                 pathLen = pathOffset + nameLen;
 260         }
 261
 262         /**
 263          * Get the byte length of this entry.
 264          *
 265          * @return size of this file, in bytes.
 266          */
 267         public long getEntryLength() {
 268                 return current().getLength();
 269         }
 270
 271         /**
 272          * Get the last modified time of this entry.
 273          *
 274          * @return last modified time of this file, in milliseconds since the epoch
 275          *         (Jan 1, 1970 UTC).
 276          */
 277         public long getEntryLastModified() {
 278                 return current().getLastModified();
 279         }
 280
 281         private static final Comparator<Entry> ENTRY_CMP = new Comparator<Entry>() {
 282                 public int compare(final Entry o1, final Entry o2) {
 283                         final byte[] a = o1.encodedName;
 284                         final byte[] b = o2.encodedName;
 285                         final int aLen = o1.encodedNameLen;
 286                         final int bLen = o2.encodedNameLen;
 287                         int cPos;
 288
 289                         for (cPos = 0; cPos < aLen && cPos < bLen; cPos++) {
 290                                 final int cmp = (a[cPos] & 0xff) - (b[cPos] & 0xff);
 291                                 if (cmp != 0)
 292                                         return cmp;
 293                         }
 294
 295                         if (cPos < aLen) {
 296                                 final int aj = a[cPos] & 0xff;
 297                                 final int lastb = lastPathChar(o2);
 298                                 if (aj < lastb)
 299                                         return -1;
 300                                 else if (aj > lastb)
 301                                         return 1;
 302                                 else if (cPos == aLen - 1)
 303                                         return 0;
 304                                 else
 305                                         return -1;
 306                         }
 307
 308                         if (cPos < bLen) {
 309                                 final int bk = b[cPos] & 0xff;
 310                                 final int lasta = lastPathChar(o1);
 311                                 if (lasta < bk)
 312                                         return -1;
 313                                 else if (lasta > bk)
 314                                         return 1;
 315                                 else if (cPos == bLen - 1)
 316                                         return 0;
 317                                 else
 318                                         return 1;
 319                         }
 320
 321                         final int lasta = lastPathChar(o1);
 322                         final int lastb = lastPathChar(o2);
 323                         if (lasta < lastb)
 324                                 return -1;
 325                         else if (lasta > lastb)
 326                                 return 1;
 327
 328                         if (aLen == bLen)
 329                                 return 0;
 330                         else if (aLen < bLen)
 331                                 return -1;
 332                         else
 333                                 return 1;
 334                 }
 335         };
 336
 337         static int lastPathChar(final Entry e) {
 338                 return e.getMode() == FileMode.TREE ? '/' : '\0';
 339         }
 340
 341         protected void init(final Entry[] list) {
 342                 // Filter out nulls, . and .. as these are not valid tree entries,
 343                 // also cache the encoded forms of the path names for efficient use
 344                 // later on during sorting and iteration.
 345                 //
 346                 entries = list;
 347                 int i, o;
 348
 349                 for (i = 0, o = 0; i < entries.length; i++) {
 350                         final Entry e = entries[i];
 351                         if (e == null)
 352                                 continue;
 353                         final String name = e.getName();
 354                         if (".".equals(name) || "..".equals(name))
 355                                 continue;
 356                         if (parent == null && ".git".equals(name))
 357                                 continue;
 358                         if (i != o)
 359                                 entries[o] = e;
 360                         e.encodeName(nameEncoder);
 361                         o++;
 362                 }
 363                 entryCnt = o;
 364                 Arrays.sort(entries, 0, entryCnt, ENTRY_CMP);
 365
 366                 contentIdFromPtr = -1;
 367                 ptr = 0;
 368                 if (!eof())
 369                         parseEntry();
 370         }
 371
 372         /**
 373          * Obtain the current entry from this iterator.
 374          *
 375          * @return the currently selected entry.
 376          */
 377         protected Entry current() {
 378                 return entries[ptr];
 379         }
 380
 381         /** A single entry within a working directory tree. */
 382         protected static abstract class Entry {
 383                 byte[] encodedName;
 384
 385                 int encodedNameLen;
 386
 387                 void encodeName(final CharsetEncoder enc) {
 388                         final ByteBuffer b;
 389                         try {
 390                                 b = enc.encode(CharBuffer.wrap(getName()));
 391                         } catch (CharacterCodingException e) {
 392                                 // This should so never happen.
 393                                 throw new RuntimeException("Unencodeable file: " + getName());
 394                         }
 395
 396                         encodedNameLen = b.limit();
 397                         if (b.hasArray() && b.arrayOffset() == 0)
 398                                 encodedName = b.array();
 399                         else
 400                                 b.get(encodedName = new byte[encodedNameLen]);
 401                 }
 402
 403                 public String toString() {
 404                         return getMode().toString() + " " + getName();
 405                 }
 406
 407                 /**
 408                  * Get the type of this entry.
 409                  * <p>
 410                  * <b>Note: Efficient implementation required.</b>
 411                  * <p>
 412                  * The implementation of this method must be efficient. If a subclass
 413                  * needs to compute the value they should cache the reference within an
 414                  * instance member instead.
 415                  *
 416                  * @return a file mode constant from {@link FileMode}.
 417                  */
 418                 public abstract FileMode getMode();
 419
 420                 /**
 421                  * Get the byte length of this entry.
 422                  * <p>
 423                  * <b>Note: Efficient implementation required.</b>
 424                  * <p>
 425                  * The implementation of this method must be efficient. If a subclass
 426                  * needs to compute the value they should cache the reference within an
 427                  * instance member instead.
 428                  *
 429                  * @return size of this file, in bytes.
 430                  */
 431                 public abstract long getLength();
 432
 433                 /**
 434                  * Get the last modified time of this entry.
 435                  * <p>
 436                  * <b>Note: Efficient implementation required.</b>
 437                  * <p>
 438                  * The implementation of this method must be efficient. If a subclass
 439                  * needs to compute the value they should cache the reference within an
 440                  * instance member instead.
 441                  *
 442                  * @return time since the epoch (in ms) of the last change.
 443                  */
 444                 public abstract long getLastModified();
 445
 446                 /**
 447                  * Get the name of this entry within its directory.
 448                  * <p>
 449                  * Efficient implementations are not required. The caller will obtain
 450                  * the name only once and cache it once obtained.
 451                  *
 452                  * @return name of the entry.
 453                  */
 454                 public abstract String getName();
 455
 456                 /**
 457                  * Obtain an input stream to read the file content.
 458                  * <p>
 459                  * Efficient implementations are not required. The caller will usually
 460                  * obtain the stream only once per entry, if at all.
 461                  * <p>
 462                  * The input stream should not use buffering if the implementation can
 463                  * avoid it. The caller will buffer as necessary to perform efficient
 464                  * block IO operations.
 465                  * <p>
 466                  * The caller will close the stream once complete.
 467                  *
 468                  * @return a stream to read from the file.
 469                  * @throws IOException
 470                  *             the file could not be opened for reading.
 471                  */
 472                 public abstract InputStream openInputStream() throws IOException;
 473         }
 474 }