org.eclipse.jgit/src/org/eclipse/jgit/lib/ObjectChecker.java - jgit - Git at Google

 /*
  * Copyright (C) 2008-2010, Google Inc.
  * Copyright (C) 2008, Shawn O. Pearce <spearce@spearce.org>
  * and other copyright owners as documented in the project's IP log.
  *
  * This program and the accompanying materials are made available
  * under the terms of the Eclipse Distribution License v1.0 which
  * accompanies this distribution, is reproduced below, and is
  * available at http://www.eclipse.org/org/documents/edl-v10.php
  *
  * All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or
  * without modification, are permitted provided that the following
  * conditions are met:
  *
  * - Redistributions of source code must retain the above copyright
  *   notice, this list of conditions and the following disclaimer.
  *
  * - Redistributions in binary form must reproduce the above
  *   copyright notice, this list of conditions and the following
  *   disclaimer in the documentation and/or other materials provided
  *   with the distribution.
  *
  * - Neither the name of the Eclipse Foundation, Inc. nor the
  *   names of its contributors may be used to endorse or promote
  *   products derived from this software without specific prior
  *   written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
  * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
  * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
  * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
  * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
  * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  */

 package org.eclipse.jgit.lib;

 import static org.eclipse.jgit.util.RawParseUtils.match;
 import static org.eclipse.jgit.util.RawParseUtils.nextLF;
 import static org.eclipse.jgit.util.RawParseUtils.parseBase10;

 import java.lang.reflect.InvocationTargetException;
 import java.lang.reflect.Method;
 import java.text.MessageFormat;
 import java.util.HashSet;
 import java.util.Locale;
 import java.util.Set;

 import org.eclipse.jgit.errors.CorruptObjectException;
 import org.eclipse.jgit.internal.JGitText;
 import org.eclipse.jgit.util.MutableInteger;
 import org.eclipse.jgit.util.RawParseUtils;

 /**
  * Verifies that an object is formatted correctly.
  * <p>
  * Verifications made by this class only check that the fields of an object are
  * formatted correctly. The ObjectId checksum of the object is not verified, and
  * connectivity links between objects are also not verified. Its assumed that
  * the caller can provide both of these validations on its own.
  * <p>
  * Instances of this class are not thread safe, but they may be reused to
  * perform multiple object validations.
  */
 public class ObjectChecker {
 	/** Header "tree " */
 	public static final byte[] tree = Constants.encodeASCII("tree "); //$NON-NLS-1$

 	/** Header "parent " */
 	public static final byte[] parent = Constants.encodeASCII("parent "); //$NON-NLS-1$

 	/** Header "author " */
 	public static final byte[] author = Constants.encodeASCII("author "); //$NON-NLS-1$

 	/** Header "committer " */
 	public static final byte[] committer = Constants.encodeASCII("committer "); //$NON-NLS-1$

 	/** Header "encoding " */
 	public static final byte[] encoding = Constants.encodeASCII("encoding "); //$NON-NLS-1$

 	/** Header "object " */
 	public static final byte[] object = Constants.encodeASCII("object "); //$NON-NLS-1$

 	/** Header "type " */
 	public static final byte[] type = Constants.encodeASCII("type "); //$NON-NLS-1$

 	/** Header "tag " */
 	public static final byte[] tag = Constants.encodeASCII("tag "); //$NON-NLS-1$

 	/** Header "tagger " */
 	public static final byte[] tagger = Constants.encodeASCII("tagger "); //$NON-NLS-1$

 	private final MutableObjectId tempId = new MutableObjectId();

 	private final MutableInteger ptrout = new MutableInteger();

 	private boolean allowZeroMode;

 	private boolean allowInvalidPersonIdent;
 	private boolean windows;
 	private boolean macosx;

 	/**
 	 * Enable accepting leading zero mode in tree entries.
 	 * <p>
 	 * Some broken Git libraries generated leading zeros in the mode part of
 	 * tree entries. This is technically incorrect but gracefully allowed by
 	 * git-core. JGit rejects such trees by default, but may need to accept
 	 * them on broken histories.
 	 *
 	 * @param allow allow leading zero mode.
 	 * @return {@code this}.
 	 * @since 3.4
 	 */
 	public ObjectChecker setAllowLeadingZeroFileMode(boolean allow) {
 		allowZeroMode = allow;
 		return this;
 	}

 	/**
 	 * Enable accepting invalid author, committer and tagger identities.
 	 * <p>
 	 * Some broken Git versions/libraries allowed users to create commits and
 	 * tags with invalid formatting between the name, email and timestamp.
 	 *
 	 * @param allow
 	 *            if true accept invalid person identity strings.
 	 * @return {@code this}.
 	 * @since 4.0
 	 */
 	public ObjectChecker setAllowInvalidPersonIdent(boolean allow) {
 		allowInvalidPersonIdent = allow;
 		return this;
 	}

 	/**
 	 * Restrict trees to only names legal on Windows platforms.
 	 * <p>
 	 * Also rejects any mixed case forms of reserved names ({@code .git}).
 	 *
 	 * @param win true if Windows name checking should be performed.
 	 * @return {@code this}.
 	 * @since 3.4
 	 */
 	public ObjectChecker setSafeForWindows(boolean win) {
 		windows = win;
 		return this;
 	}

 	/**
 	 * Restrict trees to only names legal on Mac OS X platforms.
 	 * <p>
 	 * Rejects any mixed case forms of reserved names ({@code .git})
 	 * for users working on HFS+ in case-insensitive (default) mode.
 	 *
 	 * @param mac true if Mac OS X name checking should be performed.
 	 * @return {@code this}.
 	 * @since 3.4
 	 */
 	public ObjectChecker setSafeForMacOS(boolean mac) {
 		macosx = mac;
 		return this;
 	}

 	/**
 	 * Check an object for parsing errors.
 	 *
 	 * @param objType
 	 *            type of the object. Must be a valid object type code in
 	 *            {@link Constants}.
 	 * @param raw
 	 *            the raw data which comprises the object. This should be in the
 	 *            canonical format (that is the format used to generate the
 	 *            ObjectId of the object). The array is never modified.
 	 * @throws CorruptObjectException
 	 *             if an error is identified.
 	 */
 	public void check(final int objType, final byte[] raw)
 			throws CorruptObjectException {
 		switch (objType) {
 		case Constants.OBJ_COMMIT:
 			checkCommit(raw);
 			break;
 		case Constants.OBJ_TAG:
 			checkTag(raw);
 			break;
 		case Constants.OBJ_TREE:
 			checkTree(raw);
 			break;
 		case Constants.OBJ_BLOB:
 			checkBlob(raw);
 			break;
 		default:
 			throw new CorruptObjectException(MessageFormat.format(
 					JGitText.get().corruptObjectInvalidType2,
 					Integer.valueOf(objType)));
 		}
 	}

 	private int id(final byte[] raw, final int ptr) {
 		try {
 			tempId.fromString(raw, ptr);
 			return ptr + Constants.OBJECT_ID_STRING_LENGTH;
 		} catch (IllegalArgumentException e) {
 			return -1;
 		}
 	}

 	private int personIdent(final byte[] raw, int ptr) {
 		if (allowInvalidPersonIdent)
 			return nextLF(raw, ptr) - 1;

 		final int emailB = nextLF(raw, ptr, '<');
 		if (emailB == ptr || raw[emailB - 1] != '<')
 			return -1;

 		final int emailE = nextLF(raw, emailB, '>');
 		if (emailE == emailB || raw[emailE - 1] != '>')
 			return -1;
 		if (emailE == raw.length || raw[emailE] != ' ')
 			return -1;

 		parseBase10(raw, emailE + 1, ptrout); // when
 		ptr = ptrout.value;
 		if (emailE + 1 == ptr)
 			return -1;
 		if (ptr == raw.length || raw[ptr] != ' ')
 			return -1;

 		parseBase10(raw, ptr + 1, ptrout); // tz offset
 		if (ptr + 1 == ptrout.value)
 			return -1;
 		return ptrout.value;
 	}

 	/**
 	 * Check a commit for errors.
 	 *
 	 * @param raw
 	 *            the commit data. The array is never modified.
 	 * @throws CorruptObjectException
 	 *             if any error was detected.
 	 */
 	public void checkCommit(final byte[] raw) throws CorruptObjectException {
 		int ptr = 0;

 		if ((ptr = match(raw, ptr, tree)) < 0)
 			throw new CorruptObjectException(
 					JGitText.get().corruptObjectNotreeHeader);
 		if ((ptr = id(raw, ptr)) < 0 || raw[ptr++] != '\n')
 			throw new CorruptObjectException(
 					JGitText.get().corruptObjectInvalidTree);

 		while (match(raw, ptr, parent) >= 0) {
 			ptr += parent.length;
 			if ((ptr = id(raw, ptr)) < 0 || raw[ptr++] != '\n')
 				throw new CorruptObjectException(
 						JGitText.get().corruptObjectInvalidParent);
 		}

 		if ((ptr = match(raw, ptr, author)) < 0)
 			throw new CorruptObjectException(
 					JGitText.get().corruptObjectNoAuthor);
 		if ((ptr = personIdent(raw, ptr)) < 0 || raw[ptr++] != '\n')
 			throw new CorruptObjectException(
 					JGitText.get().corruptObjectInvalidAuthor);

 		if ((ptr = match(raw, ptr, committer)) < 0)
 			throw new CorruptObjectException(
 					JGitText.get().corruptObjectNoCommitter);
 		if ((ptr = personIdent(raw, ptr)) < 0 || raw[ptr++] != '\n')
 			throw new CorruptObjectException(
 					JGitText.get().corruptObjectInvalidCommitter);
 	}

 	/**
 	 * Check an annotated tag for errors.
 	 *
 	 * @param raw
 	 *            the tag data. The array is never modified.
 	 * @throws CorruptObjectException
 	 *             if any error was detected.
 	 */
 	public void checkTag(final byte[] raw) throws CorruptObjectException {
 		int ptr = 0;

 		if ((ptr = match(raw, ptr, object)) < 0)
 			throw new CorruptObjectException(
 					JGitText.get().corruptObjectNoObjectHeader);
 		if ((ptr = id(raw, ptr)) < 0 || raw[ptr++] != '\n')
 			throw new CorruptObjectException(
 					JGitText.get().corruptObjectInvalidObject);

 		if ((ptr = match(raw, ptr, type)) < 0)
 			throw new CorruptObjectException(
 					JGitText.get().corruptObjectNoTypeHeader);
 		ptr = nextLF(raw, ptr);

 		if ((ptr = match(raw, ptr, tag)) < 0)
 			throw new CorruptObjectException(
 					JGitText.get().corruptObjectNoTagHeader);
 		ptr = nextLF(raw, ptr);

 		if ((ptr = match(raw, ptr, tagger)) > 0) {
 			if ((ptr = personIdent(raw, ptr)) < 0 || raw[ptr++] != '\n')
 				throw new CorruptObjectException(
 						JGitText.get().corruptObjectInvalidTagger);
 		}
 	}

 	private static int lastPathChar(final int mode) {
 		return FileMode.TREE.equals(mode) ? '/' : '\0';
 	}

 	private static int pathCompare(final byte[] raw, int aPos, final int aEnd,
 			final int aMode, int bPos, final int bEnd, final int bMode) {
 		while (aPos < aEnd && bPos < bEnd) {
 			final int cmp = (raw[aPos++] & 0xff) - (raw[bPos++] & 0xff);
 			if (cmp != 0)
 				return cmp;
 		}

 		if (aPos < aEnd)
 			return (raw[aPos] & 0xff) - lastPathChar(bMode);
 		if (bPos < bEnd)
 			return lastPathChar(aMode) - (raw[bPos] & 0xff);
 		return 0;
 	}

 	private static boolean duplicateName(final byte[] raw,
 			final int thisNamePos, final int thisNameEnd) {
 		final int sz = raw.length;
 		int nextPtr = thisNameEnd + 1 + Constants.OBJECT_ID_LENGTH;
 		for (;;) {
 			int nextMode = 0;
 			for (;;) {
 				if (nextPtr >= sz)
 					return false;
 				final byte c = raw[nextPtr++];
 				if (' ' == c)
 					break;
 				nextMode <<= 3;
 				nextMode += c - '0';
 			}

 			final int nextNamePos = nextPtr;
 			for (;;) {
 				if (nextPtr == sz)
 					return false;
 				final byte c = raw[nextPtr++];
 				if (c == 0)
 					break;
 			}
 			if (nextNamePos + 1 == nextPtr)
 				return false;

 			final int cmp = pathCompare(raw, thisNamePos, thisNameEnd,
 					FileMode.TREE.getBits(), nextNamePos, nextPtr - 1, nextMode);
 			if (cmp < 0)
 				return false;
 			else if (cmp == 0)
 				return true;

 			nextPtr += Constants.OBJECT_ID_LENGTH;
 		}
 	}

 	/**
 	 * Check a canonical formatted tree for errors.
 	 *
 	 * @param raw
 	 *            the raw tree data. The array is never modified.
 	 * @throws CorruptObjectException
 	 *             if any error was detected.
 	 */
 	public void checkTree(final byte[] raw) throws CorruptObjectException {
 		final int sz = raw.length;
 		int ptr = 0;
 		int lastNameB = 0, lastNameE = 0, lastMode = 0;
 		Set<String> normalized = windows || macosx
 				? new HashSet<String>()
 				: null;

 		while (ptr < sz) {
 			int thisMode = 0;
 			for (;;) {
 				if (ptr == sz)
 					throw new CorruptObjectException(
 							JGitText.get().corruptObjectTruncatedInMode);
 				final byte c = raw[ptr++];
 				if (' ' == c)
 					break;
 				if (c < '0' || c > '7')
 					throw new CorruptObjectException(
 							JGitText.get().corruptObjectInvalidModeChar);
 				if (thisMode == 0 && c == '0' && !allowZeroMode)
 					throw new CorruptObjectException(
 							JGitText.get().corruptObjectInvalidModeStartsZero);
 				thisMode <<= 3;
 				thisMode += c - '0';
 			}

 			if (FileMode.fromBits(thisMode).getObjectType() == Constants.OBJ_BAD)
 				throw new CorruptObjectException(MessageFormat.format(
 						JGitText.get().corruptObjectInvalidMode2,
 						Integer.valueOf(thisMode)));

 			final int thisNameB = ptr;
 			ptr = scanPathSegment(raw, ptr, sz);
 			if (ptr == sz || raw[ptr] != 0)
 				throw new CorruptObjectException(
 						JGitText.get().corruptObjectTruncatedInName);
 			checkPathSegment2(raw, thisNameB, ptr);
 			if (normalized != null) {
 				if (!normalized.add(normalize(raw, thisNameB, ptr)))
 					throw new CorruptObjectException(
 							JGitText.get().corruptObjectDuplicateEntryNames);
 			} else if (duplicateName(raw, thisNameB, ptr))
 				throw new CorruptObjectException(
 						JGitText.get().corruptObjectDuplicateEntryNames);

 			if (lastNameB != 0) {
 				final int cmp = pathCompare(raw, lastNameB, lastNameE,
 						lastMode, thisNameB, ptr, thisMode);
 				if (cmp > 0)
 					throw new CorruptObjectException(
 							JGitText.get().corruptObjectIncorrectSorting);
 			}

 			lastNameB = thisNameB;
 			lastNameE = ptr;
 			lastMode = thisMode;

 			ptr += 1 + Constants.OBJECT_ID_LENGTH;
 			if (ptr > sz)
 				throw new CorruptObjectException(
 						JGitText.get().corruptObjectTruncatedInObjectId);
 		}
 	}

 	private int scanPathSegment(byte[] raw, int ptr, int end)
 			throws CorruptObjectException {
 		for (; ptr < end; ptr++) {
 			byte c = raw[ptr];
 			if (c == 0)
 				return ptr;
 			if (c == '/')
 				throw new CorruptObjectException(
 						JGitText.get().corruptObjectNameContainsSlash);
 			if (windows && isInvalidOnWindows(c)) {
 				if (c > 31)
 					throw new CorruptObjectException(String.format(
 							JGitText.get().corruptObjectNameContainsChar,
 							Byte.valueOf(c)));
 				throw new CorruptObjectException(String.format(
 						JGitText.get().corruptObjectNameContainsByte,
 						Integer.valueOf(c & 0xff)));
 			}
 		}
 		return ptr;
 	}

 	/**
 	 * Check tree path entry for validity.
 	 * <p>
 	 * Unlike {@link #checkPathSegment(byte[], int, int)}, this version
 	 * scans a multi-directory path string such as {@code "src/main.c"}.
 	 *
 	 * @param path path string to scan.
 	 * @throws CorruptObjectException path is invalid.
 	 * @since 3.6
 	 */
 	public void checkPath(String path) throws CorruptObjectException {
 		byte[] buf = Constants.encode(path);
 		checkPath(buf, 0, buf.length);
 	}

 	/**
 	 * Check tree path entry for validity.
 	 * <p>
 	 * Unlike {@link #checkPathSegment(byte[], int, int)}, this version
 	 * scans a multi-directory path string such as {@code "src/main.c"}.
 	 *
 	 * @param raw buffer to scan.
 	 * @param ptr offset to first byte of the name.
 	 * @param end offset to one past last byte of name.
 	 * @throws CorruptObjectException path is invalid.
 	 * @since 3.6
 	 */
 	public void checkPath(byte[] raw, int ptr, int end)
 			throws CorruptObjectException {
 		int start = ptr;
 		for (; ptr < end; ptr++) {
 			if (raw[ptr] == '/') {
 				checkPathSegment(raw, start, ptr);
 				start = ptr + 1;
 			}
 		}
 		checkPathSegment(raw, start, end);
 	}

 	/**
 	 * Check tree path entry for validity.
 	 *
 	 * @param raw buffer to scan.
 	 * @param ptr offset to first byte of the name.
 	 * @param end offset to one past last byte of name.
 	 * @throws CorruptObjectException name is invalid.
 	 * @since 3.4
 	 */
 	public void checkPathSegment(byte[] raw, int ptr, int end)
 			throws CorruptObjectException {
 		int e = scanPathSegment(raw, ptr, end);
 		if (e < end && raw[e] == 0)
 			throw new CorruptObjectException(
 					JGitText.get().corruptObjectNameContainsNullByte);
 		checkPathSegment2(raw, ptr, end);
 	}

 	private void checkPathSegment2(byte[] raw, int ptr, int end)
 			throws CorruptObjectException {
 		if (ptr == end)
 			throw new CorruptObjectException(
 					JGitText.get().corruptObjectNameZeroLength);
 		if (raw[ptr] == '.') {
 			switch (end - ptr) {
 			case 1:
 				throw new CorruptObjectException(
 						JGitText.get().corruptObjectNameDot);
 			case 2:
 				if (raw[ptr + 1] == '.')
 					throw new CorruptObjectException(
 							JGitText.get().corruptObjectNameDotDot);
 				break;
 			case 4:
 				if (isGit(raw, ptr + 1))
 					throw new CorruptObjectException(String.format(
 							JGitText.get().corruptObjectInvalidName,
 							RawParseUtils.decode(raw, ptr, end)));
 				break;
 			default:
 				if (end - ptr > 4 && isNormalizedGit(raw, ptr + 1, end))
 					throw new CorruptObjectException(String.format(
 							JGitText.get().corruptObjectInvalidName,
 							RawParseUtils.decode(raw, ptr, end)));
 			}
 		} else if (isGitTilde1(raw, ptr, end)) {
 			throw new CorruptObjectException(String.format(
 					JGitText.get().corruptObjectInvalidName,
 					RawParseUtils.decode(raw, ptr, end)));
 		}

 		if (macosx && isMacHFSGit(raw, ptr, end))
 			throw new CorruptObjectException(String.format(
 					JGitText.get().corruptObjectInvalidNameIgnorableUnicode,
 					RawParseUtils.decode(raw, ptr, end)));

 		if (windows) {
 			// Windows ignores space and dot at end of file name.
 			if (raw[end - 1] == ' ' || raw[end - 1] == '.')
 				throw new CorruptObjectException(String.format(
 						JGitText.get().corruptObjectInvalidNameEnd,
 						Character.valueOf(((char) raw[end - 1]))));
 			if (end - ptr >= 3)
 				checkNotWindowsDevice(raw, ptr, end);
 		}
 	}

 	// Mac's HFS+ folds permutations of ".git" and Unicode ignorable characters
 	// to ".git" therefore we should prevent such names
 	private static boolean isMacHFSGit(byte[] raw, int ptr, int end)
 			throws CorruptObjectException {
 		boolean ignorable = false;
 		byte[] git = new byte[] { '.', 'g', 'i', 't' };
 		int g = 0;
 		while (ptr < end) {
 			switch (raw[ptr]) {
 			case (byte) 0xe2: // http://www.utf8-chartable.de/unicode-utf8-table.pl?start=8192
 				checkTruncatedIgnorableUTF8(raw, ptr, end);
 				switch (raw[ptr + 1]) {
 				case (byte) 0x80:
 					switch (raw[ptr + 2]) {
 					case (byte) 0x8c:	// U+200C 0xe2808c ZERO WIDTH NON-JOINER
 					case (byte) 0x8d:	// U+200D 0xe2808d ZERO WIDTH JOINER
 					case (byte) 0x8e:	// U+200E 0xe2808e LEFT-TO-RIGHT MARK
 					case (byte) 0x8f:	// U+200F 0xe2808f RIGHT-TO-LEFT MARK
 					case (byte) 0xaa:	// U+202A 0xe280aa LEFT-TO-RIGHT EMBEDDING
 					case (byte) 0xab:	// U+202B 0xe280ab RIGHT-TO-LEFT EMBEDDING
 					case (byte) 0xac:	// U+202C 0xe280ac POP DIRECTIONAL FORMATTING
 					case (byte) 0xad:	// U+202D 0xe280ad LEFT-TO-RIGHT OVERRIDE
 					case (byte) 0xae:	// U+202E 0xe280ae RIGHT-TO-LEFT OVERRIDE
 						ignorable = true;
 						ptr += 3;
 						continue;
 					default:
 						return false;
 					}
 				case (byte) 0x81:
 					switch (raw[ptr + 2]) {
 					case (byte) 0xaa:	// U+206A 0xe281aa INHIBIT SYMMETRIC SWAPPING
 					case (byte) 0xab:	// U+206B 0xe281ab ACTIVATE SYMMETRIC SWAPPING
 					case (byte) 0xac:	// U+206C 0xe281ac INHIBIT ARABIC FORM SHAPING
 					case (byte) 0xad:	// U+206D 0xe281ad ACTIVATE ARABIC FORM SHAPING
 					case (byte) 0xae:	// U+206E 0xe281ae NATIONAL DIGIT SHAPES
 					case (byte) 0xaf:	// U+206F 0xe281af NOMINAL DIGIT SHAPES
 						ignorable = true;
 						ptr += 3;
 						continue;
 					default:
 						return false;
 					}
 				}
 				break;
 			case (byte) 0xef: // http://www.utf8-chartable.de/unicode-utf8-table.pl?start=65024
 				checkTruncatedIgnorableUTF8(raw, ptr, end);
 				// U+FEFF 0xefbbbf ZERO WIDTH NO-BREAK SPACE
 				if ((raw[ptr + 1] == (byte) 0xbb)
 						&& (raw[ptr + 2] == (byte) 0xbf)) {
 					ignorable = true;
 					ptr += 3;
 					continue;
 				}
 				return false;
 			default:
 				if (g == 4)
 					return false;
 				if (raw[ptr++] != git[g++])
 					return false;
 			}
 		}
 		if (g == 4 && ignorable)
 			return true;
 		return false;
 	}

 	private static void checkTruncatedIgnorableUTF8(byte[] raw, int ptr, int end)
 			throws CorruptObjectException {
 		if ((ptr + 2) >= end)
 			throw new CorruptObjectException(MessageFormat.format(
 					JGitText.get().corruptObjectInvalidNameInvalidUtf8,
 					toHexString(raw, ptr, end)));
 	}

 	private static String toHexString(byte[] raw, int ptr, int end) {
 		StringBuilder b = new StringBuilder("0x"); //$NON-NLS-1$
 		for (int i = ptr; i < end; i++)
 			b.append(String.format("%02x", Byte.valueOf(raw[i]))); //$NON-NLS-1$
 		return b.toString();
 	}

 	private static void checkNotWindowsDevice(byte[] raw, int ptr, int end)
 			throws CorruptObjectException {
 		switch (toLower(raw[ptr])) {
 		case 'a': // AUX
 			if (end - ptr >= 3
 					&& toLower(raw[ptr + 1]) == 'u'
 					&& toLower(raw[ptr + 2]) == 'x'
 					&& (end - ptr == 3 || raw[ptr + 3] == '.'))
 				throw new CorruptObjectException(
 						JGitText.get().corruptObjectInvalidNameAux);
 			break;

 		case 'c': // CON, COM[1-9]
 			if (end - ptr >= 3
 					&& toLower(raw[ptr + 2]) == 'n'
 					&& toLower(raw[ptr + 1]) == 'o'
 					&& (end - ptr == 3 || raw[ptr + 3] == '.'))
 				throw new CorruptObjectException(
 						JGitText.get().corruptObjectInvalidNameCon);
 			if (end - ptr >= 4
 					&& toLower(raw[ptr + 2]) == 'm'
 					&& toLower(raw[ptr + 1]) == 'o'
 					&& isPositiveDigit(raw[ptr + 3])
 					&& (end - ptr == 4 || raw[ptr + 4] == '.'))
 				throw new CorruptObjectException(String.format(
 						JGitText.get().corruptObjectInvalidNameCom,
 						Character.valueOf(((char) raw[ptr + 3]))));
 			break;

 		case 'l': // LPT[1-9]
 			if (end - ptr >= 4
 					&& toLower(raw[ptr + 1]) == 'p'
 					&& toLower(raw[ptr + 2]) == 't'
 					&& isPositiveDigit(raw[ptr + 3])
 					&& (end - ptr == 4 || raw[ptr + 4] == '.'))
 				throw new CorruptObjectException(String.format(
 						JGitText.get().corruptObjectInvalidNameLpt,
 						Character.valueOf(((char) raw[ptr + 3]))));
 			break;

 		case 'n': // NUL
 			if (end - ptr >= 3
 					&& toLower(raw[ptr + 1]) == 'u'
 					&& toLower(raw[ptr + 2]) == 'l'
 					&& (end - ptr == 3 || raw[ptr + 3] == '.'))
 				throw new CorruptObjectException(
 						JGitText.get().corruptObjectInvalidNameNul);
 			break;

 		case 'p': // PRN
 			if (end - ptr >= 3
 					&& toLower(raw[ptr + 1]) == 'r'
 					&& toLower(raw[ptr + 2]) == 'n'
 					&& (end - ptr == 3 || raw[ptr + 3] == '.'))
 				throw new CorruptObjectException(
 						JGitText.get().corruptObjectInvalidNamePrn);
 			break;
 		}
 	}

 	private static boolean isInvalidOnWindows(byte c) {
 		// Windows disallows "special" characters in a path component.
 		switch (c) {
 		case '"':
 		case '*':
 		case ':':
 		case '<':
 		case '>':
 		case '?':
 		case '\\':
 		case '|':
 			return true;
 		}
 		return 1 <= c && c <= 31;
 	}

 	private static boolean isGit(byte[] buf, int p) {
 		return toLower(buf[p]) == 'g'
 				&& toLower(buf[p + 1]) == 'i'
 				&& toLower(buf[p + 2]) == 't';
 	}

 	private static boolean isGitTilde1(byte[] buf, int p, int end) {
 		if (end - p != 5)
 			return false;
 		return toLower(buf[p]) == 'g' && toLower(buf[p + 1]) == 'i'
 				&& toLower(buf[p + 2]) == 't' && buf[p + 3] == '~'
 				&& buf[p + 4] == '1';
 	}

 	private static boolean isNormalizedGit(byte[] raw, int ptr, int end) {
 		if (isGit(raw, ptr)) {
 			int dots = 0;
 			boolean space = false;
 			int p = end - 1;
 			for (; (ptr + 2) < p; p--) {
 				if (raw[p] == '.')
 					dots++;
 				else if (raw[p] == ' ')
 					space = true;
 				else
 					break;
 			}
 			return p == ptr + 2 && (dots == 1 || space);
 		}
 		return false;
 	}

 	private static char toLower(byte b) {
 		if ('A' <= b && b <= 'Z')
 			return (char) (b + ('a' - 'A'));
 		return (char) b;
 	}

 	private static boolean isPositiveDigit(byte b) {
 		return '1' <= b && b <= '9';
 	}

 	/**
 	 * Check a blob for errors.
 	 *
 	 * @param raw
 	 *            the blob data. The array is never modified.
 	 * @throws CorruptObjectException
 	 *             if any error was detected.
 	 */
 	public void checkBlob(final byte[] raw) throws CorruptObjectException {
 		// We can always assume the blob is valid.
 	}

 	private String normalize(byte[] raw, int ptr, int end) {
 		String n = RawParseUtils.decode(raw, ptr, end).toLowerCase(Locale.US);
 		return macosx ? Normalizer.normalize(n) : n;
 	}

 	private static class Normalizer {
 		// TODO Simplify invocation to Normalizer after dropping Java 5.
 		private static final Method normalize;
 		private static final Object nfc;
 		static {
 			Method method;
 			Object formNfc;
 			try {
 				Class<?> formClazz = Class.forName("java.text.Normalizer$Form"); //$NON-NLS-1$
 				formNfc = formClazz.getField("NFC").get(null); //$NON-NLS-1$
 				method = Class.forName("java.text.Normalizer") //$NON-NLS-1$
 					.getMethod("normalize", CharSequence.class, formClazz); //$NON-NLS-1$
 			} catch (ClassNotFoundException e) {
 				method = null;
 				formNfc = null;
 			} catch (NoSuchFieldException e) {
 				method = null;
 				formNfc = null;
 			} catch (NoSuchMethodException e) {
 				method = null;
 				formNfc = null;
 			} catch (SecurityException e) {
 				method = null;
 				formNfc = null;
 			} catch (IllegalArgumentException e) {
 				method = null;
 				formNfc = null;
 			} catch (IllegalAccessException e) {
 				method = null;
 				formNfc = null;
 			}
 			normalize = method;
 			nfc = formNfc;
 		}

 		static String normalize(String in) {
 			if (normalize == null)
 				return in;
 			try {
 				return (String) normalize.invoke(null, in, nfc);
 			} catch (IllegalAccessException e) {
 				return in;
 			} catch (InvocationTargetException e) {
 				if (e.getCause() instanceof RuntimeException)
 					throw (RuntimeException) e.getCause();
 				if (e.getCause() instanceof Error)
 					throw (Error) e.getCause();
 				return in;
 			}
 		}
 	}
 }