org.spearce.jgit/src/org/spearce/jgit/treewalk/WorkingTreeIterator.java

   1 /*
   2  * Copyright (C) 2008, Shawn O. Pearce <spearce@spearce.org>
   3  *
   4  * All rights reserved.
   5  *
   6  * Redistribution and use in source and binary forms, with or
   7  * without modification, are permitted provided that the following
   8  * conditions are met:
   9  *
  10  * - Redistributions of source code must retain the above copyright
  11  *   notice, this list of conditions and the following disclaimer.
  12  *
  13  * - Redistributions in binary form must reproduce the above
  14  *   copyright notice, this list of conditions and the following
  15  *   disclaimer in the documentation and/or other materials provided
  16  *   with the distribution.
  17  *
  18  * - Neither the name of the Git Development Community nor the
  19  *   names of its contributors may be used to endorse or promote
  20  *   products derived from this software without specific prior
  21  *   written permission.
  22  *
  23  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
  24  * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
  25  * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  26  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  27  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
  28  * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  29  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  30  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  31  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  32  * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
  33  * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  34  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
  35  * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  36  */
  37
  38 package org.spearce.jgit.treewalk;
  39
  40 import java.io.IOException;
  41 import java.io.InputStream;
  42 import java.nio.ByteBuffer;
  43 import java.nio.CharBuffer;
  44 import java.nio.charset.CharacterCodingException;
  45 import java.nio.charset.CharsetEncoder;
  46 import java.security.MessageDigest;
  47 import java.util.Arrays;
  48 import java.util.Comparator;
  49
  50 import org.spearce.jgit.errors.CorruptObjectException;
  51 import org.spearce.jgit.lib.Constants;
  52 import org.spearce.jgit.lib.FileMode;
  53
  54 /**
  55  * Walks a working directory tree as part of a {@link TreeWalk}.
  56  * <p>
  57  * Most applications will want to use the standard implementation of this
  58  * iterator, {@link FileTreeIterator}, as that does all IO through the standard
  59  * <code>java.io</code> package. Plugins for a Java based IDE may however wish
  60  * to create their own implementations of this class to allow traversal of the
  61  * IDE's project space, as well as benefit from any caching the IDE may have.
  62  *
  63  * @see FileTreeIterator
  64  */
  65 public abstract class WorkingTreeIterator extends AbstractTreeIterator {
  66         /** An empty entry array, suitable for {@link #init(Entry[])}. */
  67         protected static final Entry[] EOF = {};
  68
  69         /** Size we perform file IO in if we have to read and hash a file. */
  70         private static final int BUFFER_SIZE = 2048;
  71
  72         /** The {@link #idBuffer()} for the current entry. */
  73         private byte[] contentId;
  74
  75         /** Index within {@link #entries} that {@link #contentId} came from. */
  76         private int contentIdFromPtr;
  77
  78         /** Buffer used to perform {@link #contentId} computations. */
  79         private byte[] contentReadBuffer;
  80
  81         /** Digest computer for {@link #contentId} computations. */
  82         private MessageDigest contentDigest;
  83
  84         /** File name character encoder. */
  85         private final CharsetEncoder nameEncoder;
  86
  87         /** List of entries obtained from the subclass. */
  88         private Entry[] entries;
  89
  90         /** Total number of entries in {@link #entries} that are valid. */
  91         private int entryCnt;
  92
  93         /** Current position within {@link #entries}. */
  94         private int ptr;
  95
  96         /** Create a new iterator with no parent. */
  97         protected WorkingTreeIterator() {
  98                 super();
  99                 nameEncoder = Constants.CHARSET.newEncoder();
 100         }
 101
 102         /**
 103          * Create a new iterator with no parent and a prefix.
 104          * <p>
 105          * The prefix path supplied is inserted in front of all paths generated by
 106          * this iterator. It is intended to be used when an iterator is being
 107          * created for a subsection of an overall repository and needs to be
 108          * combined with other iterators that are created to run over the entire
 109          * repository namespace.
 110          *
 111          * @param prefix
 112          *            position of this iterator in the repository tree. The value
 113          *            may be null or the empty string to indicate the prefix is the
 114          *            root of the repository. A trailing slash ('/') is
 115          *            automatically appended if the prefix does not end in '/'.
 116          */
 117         protected WorkingTreeIterator(final String prefix) {
 118                 super(prefix);
 119                 nameEncoder = Constants.CHARSET.newEncoder();
 120         }
 121
 122         /**
 123          * Create an iterator for a subtree of an existing iterator.
 124          *
 125          * @param p
 126          *            parent tree iterator.
 127          */
 128         protected WorkingTreeIterator(final WorkingTreeIterator p) {
 129                 super(p);
 130                 nameEncoder = p.nameEncoder;
 131         }
 132
 133         @Override
 134         public byte[] idBuffer() {
 135                 if (contentIdFromPtr == ptr)
 136                         return contentId;
 137                 switch (mode & 0170000) {
 138                 case 0100000: /* normal files */
 139                         contentIdFromPtr = ptr;
 140                         return contentId = idBufferBlob(entries[ptr]);
 141                 case 0120000: /* symbolic links */
 142                         // Java does not support symbolic links, so we should not
 143                         // have reached this particular part of the walk code.
 144                         //
 145                         return zeroid;
 146                 case 0160000: /* gitlink */
 147                         // TODO: Support obtaining current HEAD SHA-1 from nested repository
 148                         //
 149                         return zeroid;
 150                 }
 151                 return zeroid;
 152         }
 153
 154         private void initializeDigest() {
 155                 if (contentDigest != null)
 156                         return;
 157
 158                 if (parent == null) {
 159                         contentReadBuffer = new byte[BUFFER_SIZE];
 160                         contentDigest = Constants.newMessageDigest();
 161                 } else {
 162                         final WorkingTreeIterator p = (WorkingTreeIterator) parent;
 163                         p.initializeDigest();
 164                         contentReadBuffer = p.contentReadBuffer;
 165                         contentDigest = p.contentDigest;
 166                 }
 167         }
 168
 169         private static final byte[] digits = { '0', '1', '2', '3', '4', '5', '6',
 170                         '7', '8', '9' };
 171
 172         private static final byte[] hblob = Constants
 173                         .encodedTypeString(Constants.OBJ_BLOB);
 174
 175         private byte[] idBufferBlob(final Entry e) {
 176                 try {
 177                         final InputStream is = e.openInputStream();
 178                         if (is == null)
 179                                 return zeroid;
 180                         try {
 181                                 initializeDigest();
 182
 183                                 contentDigest.reset();
 184                                 contentDigest.update(hblob);
 185                                 contentDigest.update((byte) ' ');
 186
 187                                 final long blobLength = e.getLength();
 188                                 long sz = blobLength;
 189                                 if (sz == 0) {
 190                                         contentDigest.update((byte) '0');
 191                                 } else {
 192                                         final int bufn = contentReadBuffer.length;
 193                                         int p = bufn;
 194                                         do {
 195                                                 contentReadBuffer[--p] = digits[(int) (sz % 10)];
 196                                                 sz /= 10;
 197                                         } while (sz > 0);
 198                                         contentDigest.update(contentReadBuffer, p, bufn - p);
 199                                 }
 200                                 contentDigest.update((byte) 0);
 201
 202                                 for (;;) {
 203                                         final int r = is.read(contentReadBuffer);
 204                                         if (r <= 0)
 205                                                 break;
 206                                         contentDigest.update(contentReadBuffer, 0, r);
 207                                         sz += r;
 208                                 }
 209                                 if (sz != blobLength)
 210                                         return zeroid;
 211                                 return contentDigest.digest();
 212                         } finally {
 213                                 try {
 214                                         is.close();
 215                                 } catch (IOException err2) {
 216                                         // Suppress any error related to closing an input
 217                                         // stream. We don't care, we should not have any
 218                                         // outstanding data to flush or anything like that.
 219                                 }
 220                         }
 221                 } catch (IOException err) {
 222                         // Can't read the file? Don't report the failure either.
 223                         //
 224                         return zeroid;
 225                 }
 226         }
 227
 228         @Override
 229         public int idOffset() {
 230                 return 0;
 231         }
 232
 233         @Override
 234         public boolean first() {
 235                 return ptr == 0;
 236         }
 237
 238         @Override
 239         public boolean eof() {
 240                 return ptr == entryCnt;
 241         }
 242
 243         @Override
 244         public void next(final int delta) throws CorruptObjectException {
 245                 ptr += delta;
 246                 if (!eof())
 247                         parseEntry();
 248         }
 249
 250         @Override
 251         public void back(final int delta) throws CorruptObjectException {
 252                 ptr -= delta;
 253                 parseEntry();
 254         }
 255
 256         private void parseEntry() {
 257                 final Entry e = entries[ptr];
 258                 mode = e.getMode().getBits();
 259
 260                 final int nameLen = e.encodedNameLen;
 261                 while (pathOffset + nameLen > path.length)
 262                         growPath(pathOffset);
 263                 System.arraycopy(e.encodedName, 0, path, pathOffset, nameLen);
 264                 pathLen = pathOffset + nameLen;
 265         }
 266
 267         /**
 268          * Get the byte length of this entry.
 269          *
 270          * @return size of this file, in bytes.
 271          */
 272         public long getEntryLength() {
 273                 return current().getLength();
 274         }
 275
 276         /**
 277          * Get the last modified time of this entry.
 278          *
 279          * @return last modified time of this file, in milliseconds since the epoch
 280          *         (Jan 1, 1970 UTC).
 281          */
 282         public long getEntryLastModified() {
 283                 return current().getLastModified();
 284         }
 285
 286         private static final Comparator<Entry> ENTRY_CMP = new Comparator<Entry>() {
 287                 public int compare(final Entry o1, final Entry o2) {
 288                         final byte[] a = o1.encodedName;
 289                         final byte[] b = o2.encodedName;
 290                         final int aLen = o1.encodedNameLen;
 291                         final int bLen = o2.encodedNameLen;
 292                         int cPos;
 293
 294                         for (cPos = 0; cPos < aLen && cPos < bLen; cPos++) {
 295                                 final int cmp = (a[cPos] & 0xff) - (b[cPos] & 0xff);
 296                                 if (cmp != 0)
 297                                         return cmp;
 298                         }
 299
 300                         if (cPos < aLen)
 301                                 return (a[cPos] & 0xff) - lastPathChar(o2);
 302                         if (cPos < bLen)
 303                                 return lastPathChar(o1) - (b[cPos] & 0xff);
 304                         return lastPathChar(o1) - lastPathChar(o2);
 305                 }
 306         };
 307
 308         static int lastPathChar(final Entry e) {
 309                 return e.getMode() == FileMode.TREE ? '/' : '\0';
 310         }
 311
 312         /**
 313          * Constructor helper.
 314          *
 315          * @param list
 316          *            files in the subtree of the work tree this iterator operates
 317          *            on
 318          */
 319         protected void init(final Entry[] list) {
 320                 // Filter out nulls, . and .. as these are not valid tree entries,
 321                 // also cache the encoded forms of the path names for efficient use
 322                 // later on during sorting and iteration.
 323                 //
 324                 entries = list;
 325                 int i, o;
 326
 327                 for (i = 0, o = 0; i < entries.length; i++) {
 328                         final Entry e = entries[i];
 329                         if (e == null)
 330                                 continue;
 331                         final String name = e.getName();
 332                         if (".".equals(name) || "..".equals(name))
 333                                 continue;
 334                         if (".git".equals(name))
 335                                 continue;
 336                         if (i != o)
 337                                 entries[o] = e;
 338                         e.encodeName(nameEncoder);
 339                         o++;
 340                 }
 341                 entryCnt = o;
 342                 Arrays.sort(entries, 0, entryCnt, ENTRY_CMP);
 343
 344                 contentIdFromPtr = -1;
 345                 ptr = 0;
 346                 if (!eof())
 347                         parseEntry();
 348         }
 349
 350         /**
 351          * Obtain the current entry from this iterator.
 352          *
 353          * @return the currently selected entry.
 354          */
 355         protected Entry current() {
 356                 return entries[ptr];
 357         }
 358
 359         /** A single entry within a working directory tree. */
 360         protected static abstract class Entry {
 361                 byte[] encodedName;
 362
 363                 int encodedNameLen;
 364
 365                 void encodeName(final CharsetEncoder enc) {
 366                         final ByteBuffer b;
 367                         try {
 368                                 b = enc.encode(CharBuffer.wrap(getName()));
 369                         } catch (CharacterCodingException e) {
 370                                 // This should so never happen.
 371                                 throw new RuntimeException("Unencodeable file: " + getName());
 372                         }
 373
 374                         encodedNameLen = b.limit();
 375                         if (b.hasArray() && b.arrayOffset() == 0)
 376                                 encodedName = b.array();
 377                         else
 378                                 b.get(encodedName = new byte[encodedNameLen]);
 379                 }
 380
 381                 public String toString() {
 382                         return getMode().toString() + " " + getName();
 383                 }
 384
 385                 /**
 386                  * Get the type of this entry.
 387                  * <p>
 388                  * <b>Note: Efficient implementation required.</b>
 389                  * <p>
 390                  * The implementation of this method must be efficient. If a subclass
 391                  * needs to compute the value they should cache the reference within an
 392                  * instance member instead.
 393                  *
 394                  * @return a file mode constant from {@link FileMode}.
 395                  */
 396                 public abstract FileMode getMode();
 397
 398                 /**
 399                  * Get the byte length of this entry.
 400                  * <p>
 401                  * <b>Note: Efficient implementation required.</b>
 402                  * <p>
 403                  * The implementation of this method must be efficient. If a subclass
 404                  * needs to compute the value they should cache the reference within an
 405                  * instance member instead.
 406                  *
 407                  * @return size of this file, in bytes.
 408                  */
 409                 public abstract long getLength();
 410
 411                 /**
 412                  * Get the last modified time of this entry.
 413                  * <p>
 414                  * <b>Note: Efficient implementation required.</b>
 415                  * <p>
 416                  * The implementation of this method must be efficient. If a subclass
 417                  * needs to compute the value they should cache the reference within an
 418                  * instance member instead.
 419                  *
 420                  * @return time since the epoch (in ms) of the last change.
 421                  */
 422                 public abstract long getLastModified();
 423
 424                 /**
 425                  * Get the name of this entry within its directory.
 426                  * <p>
 427                  * Efficient implementations are not required. The caller will obtain
 428                  * the name only once and cache it once obtained.
 429                  *
 430                  * @return name of the entry.
 431                  */
 432                 public abstract String getName();
 433
 434                 /**
 435                  * Obtain an input stream to read the file content.
 436                  * <p>
 437                  * Efficient implementations are not required. The caller will usually
 438                  * obtain the stream only once per entry, if at all.
 439                  * <p>
 440                  * The input stream should not use buffering if the implementation can
 441                  * avoid it. The caller will buffer as necessary to perform efficient
 442                  * block IO operations.
 443                  * <p>
 444                  * The caller will close the stream once complete.
 445                  *
 446                  * @return a stream to read from the file.
 447                  * @throws IOException
 448                  *             the file could not be opened for reading.
 449                  */
 450                 public abstract InputStream openInputStream() throws IOException;
 451         }
 452 }