1 /* 2 * Copyright (C) 2016 The Android Open Source Project 3 * 4 * Licensed under the Apache License, Version 2.0 (the "License"); 5 * you may not use this file except in compliance with the License. 6 * You may obtain a copy of the License at 7 * 8 * http://www.apache.org/licenses/LICENSE-2.0 9 * 10 * Unless required by applicable law or agreed to in writing, software 11 * distributed under the License is distributed on an "AS IS" BASIS, 12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 * See the License for the specific language governing permissions and 14 * limitations under the License. 15 */ 16 17 package android.util.apk; 18 19 import android.util.Pair; 20 21 import java.io.IOException; 22 import java.io.RandomAccessFile; 23 import java.nio.ByteBuffer; 24 import java.nio.ByteOrder; 25 26 /** 27 * Assorted ZIP format helpers. 28 * 29 * <p>NOTE: Most helper methods operating on {@code ByteBuffer} instances expect that the byte 30 * order of these buffers is little-endian. 31 */ 32 abstract class ZipUtils { ZipUtils()33 private ZipUtils() {} 34 35 private static final int ZIP_EOCD_REC_MIN_SIZE = 22; 36 private static final int ZIP_EOCD_REC_SIG = 0x06054b50; 37 private static final int ZIP_EOCD_CENTRAL_DIR_SIZE_FIELD_OFFSET = 12; 38 private static final int ZIP_EOCD_CENTRAL_DIR_OFFSET_FIELD_OFFSET = 16; 39 private static final int ZIP_EOCD_COMMENT_LENGTH_FIELD_OFFSET = 20; 40 41 private static final int ZIP64_EOCD_LOCATOR_SIZE = 20; 42 private static final int ZIP64_EOCD_LOCATOR_SIG_REVERSE_BYTE_ORDER = 0x504b0607; 43 44 private static final int UINT16_MAX_VALUE = 0xffff; 45 46 /** 47 * Returns the ZIP End of Central Directory record of the provided ZIP file. 48 * 49 * @return contents of the ZIP End of Central Directory record and the record's offset in the 50 * file or {@code null} if the file does not contain the record. 51 * 52 * @throws IOException if an I/O error occurs while reading the file. 53 */ findZipEndOfCentralDirectoryRecord(RandomAccessFile zip)54 static Pair<ByteBuffer, Long> findZipEndOfCentralDirectoryRecord(RandomAccessFile zip) 55 throws IOException { 56 // ZIP End of Central Directory (EOCD) record is located at the very end of the ZIP archive. 57 // The record can be identified by its 4-byte signature/magic which is located at the very 58 // beginning of the record. A complication is that the record is variable-length because of 59 // the comment field. 60 // The algorithm for locating the ZIP EOCD record is as follows. We search backwards from 61 // end of the buffer for the EOCD record signature. Whenever we find a signature, we check 62 // the candidate record's comment length is such that the remainder of the record takes up 63 // exactly the remaining bytes in the buffer. The search is bounded because the maximum 64 // size of the comment field is 65535 bytes because the field is an unsigned 16-bit number. 65 66 long fileSize = zip.length(); 67 if (fileSize < ZIP_EOCD_REC_MIN_SIZE) { 68 return null; 69 } 70 71 // Optimization: 99.99% of APKs have a zero-length comment field in the EoCD record and thus 72 // the EoCD record offset is known in advance. Try that offset first to avoid unnecessarily 73 // reading more data. 74 Pair<ByteBuffer, Long> result = findZipEndOfCentralDirectoryRecord(zip, 0); 75 if (result != null) { 76 return result; 77 } 78 79 // EoCD does not start where we expected it to. Perhaps it contains a non-empty comment 80 // field. Expand the search. The maximum size of the comment field in EoCD is 65535 because 81 // the comment length field is an unsigned 16-bit number. 82 return findZipEndOfCentralDirectoryRecord(zip, UINT16_MAX_VALUE); 83 } 84 85 /** 86 * Returns the ZIP End of Central Directory record of the provided ZIP file. 87 * 88 * @param maxCommentSize maximum accepted size (in bytes) of EoCD comment field. The permitted 89 * value is from 0 to 65535 inclusive. The smaller the value, the faster this method 90 * locates the record, provided its comment field is no longer than this value. 91 * 92 * @return contents of the ZIP End of Central Directory record and the record's offset in the 93 * file or {@code null} if the file does not contain the record. 94 * 95 * @throws IOException if an I/O error occurs while reading the file. 96 */ findZipEndOfCentralDirectoryRecord( RandomAccessFile zip, int maxCommentSize)97 private static Pair<ByteBuffer, Long> findZipEndOfCentralDirectoryRecord( 98 RandomAccessFile zip, int maxCommentSize) throws IOException { 99 // ZIP End of Central Directory (EOCD) record is located at the very end of the ZIP archive. 100 // The record can be identified by its 4-byte signature/magic which is located at the very 101 // beginning of the record. A complication is that the record is variable-length because of 102 // the comment field. 103 // The algorithm for locating the ZIP EOCD record is as follows. We search backwards from 104 // end of the buffer for the EOCD record signature. Whenever we find a signature, we check 105 // the candidate record's comment length is such that the remainder of the record takes up 106 // exactly the remaining bytes in the buffer. The search is bounded because the maximum 107 // size of the comment field is 65535 bytes because the field is an unsigned 16-bit number. 108 109 if ((maxCommentSize < 0) || (maxCommentSize > UINT16_MAX_VALUE)) { 110 throw new IllegalArgumentException("maxCommentSize: " + maxCommentSize); 111 } 112 113 long fileSize = zip.length(); 114 if (fileSize < ZIP_EOCD_REC_MIN_SIZE) { 115 // No space for EoCD record in the file. 116 return null; 117 } 118 // Lower maxCommentSize if the file is too small. 119 maxCommentSize = (int) Math.min(maxCommentSize, fileSize - ZIP_EOCD_REC_MIN_SIZE); 120 121 ByteBuffer buf = ByteBuffer.allocate(ZIP_EOCD_REC_MIN_SIZE + maxCommentSize); 122 buf.order(ByteOrder.LITTLE_ENDIAN); 123 long bufOffsetInFile = fileSize - buf.capacity(); 124 zip.seek(bufOffsetInFile); 125 zip.readFully(buf.array(), buf.arrayOffset(), buf.capacity()); 126 int eocdOffsetInBuf = findZipEndOfCentralDirectoryRecord(buf); 127 if (eocdOffsetInBuf == -1) { 128 // No EoCD record found in the buffer 129 return null; 130 } 131 // EoCD found 132 buf.position(eocdOffsetInBuf); 133 ByteBuffer eocd = buf.slice(); 134 eocd.order(ByteOrder.LITTLE_ENDIAN); 135 return Pair.create(eocd, bufOffsetInFile + eocdOffsetInBuf); 136 } 137 138 /** 139 * Returns the position at which ZIP End of Central Directory record starts in the provided 140 * buffer or {@code -1} if the record is not present. 141 * 142 * <p>NOTE: Byte order of {@code zipContents} must be little-endian. 143 */ findZipEndOfCentralDirectoryRecord(ByteBuffer zipContents)144 private static int findZipEndOfCentralDirectoryRecord(ByteBuffer zipContents) { 145 assertByteOrderLittleEndian(zipContents); 146 147 // ZIP End of Central Directory (EOCD) record is located at the very end of the ZIP archive. 148 // The record can be identified by its 4-byte signature/magic which is located at the very 149 // beginning of the record. A complication is that the record is variable-length because of 150 // the comment field. 151 // The algorithm for locating the ZIP EOCD record is as follows. We search backwards from 152 // end of the buffer for the EOCD record signature. Whenever we find a signature, we check 153 // the candidate record's comment length is such that the remainder of the record takes up 154 // exactly the remaining bytes in the buffer. The search is bounded because the maximum 155 // size of the comment field is 65535 bytes because the field is an unsigned 16-bit number. 156 157 int archiveSize = zipContents.capacity(); 158 if (archiveSize < ZIP_EOCD_REC_MIN_SIZE) { 159 return -1; 160 } 161 int maxCommentLength = Math.min(archiveSize - ZIP_EOCD_REC_MIN_SIZE, UINT16_MAX_VALUE); 162 int eocdWithEmptyCommentStartPosition = archiveSize - ZIP_EOCD_REC_MIN_SIZE; 163 for (int expectedCommentLength = 0; expectedCommentLength < maxCommentLength; 164 expectedCommentLength++) { 165 int eocdStartPos = eocdWithEmptyCommentStartPosition - expectedCommentLength; 166 if (zipContents.getInt(eocdStartPos) == ZIP_EOCD_REC_SIG) { 167 int actualCommentLength = 168 getUnsignedInt16( 169 zipContents, eocdStartPos + ZIP_EOCD_COMMENT_LENGTH_FIELD_OFFSET); 170 if (actualCommentLength == expectedCommentLength) { 171 return eocdStartPos; 172 } 173 } 174 } 175 176 return -1; 177 } 178 179 /** 180 * Returns {@code true} if the provided file contains a ZIP64 End of Central Directory 181 * Locator. 182 * 183 * @param zipEndOfCentralDirectoryPosition offset of the ZIP End of Central Directory record 184 * in the file. 185 * 186 * @throws IOException if an I/O error occurs while reading the file. 187 */ isZip64EndOfCentralDirectoryLocatorPresent( RandomAccessFile zip, long zipEndOfCentralDirectoryPosition)188 public static final boolean isZip64EndOfCentralDirectoryLocatorPresent( 189 RandomAccessFile zip, long zipEndOfCentralDirectoryPosition) throws IOException { 190 191 // ZIP64 End of Central Directory Locator immediately precedes the ZIP End of Central 192 // Directory Record. 193 long locatorPosition = zipEndOfCentralDirectoryPosition - ZIP64_EOCD_LOCATOR_SIZE; 194 if (locatorPosition < 0) { 195 return false; 196 } 197 198 zip.seek(locatorPosition); 199 // RandomAccessFile.readInt assumes big-endian byte order, but ZIP format uses 200 // little-endian. 201 return zip.readInt() == ZIP64_EOCD_LOCATOR_SIG_REVERSE_BYTE_ORDER; 202 } 203 204 /** 205 * Returns the offset of the start of the ZIP Central Directory in the archive. 206 * 207 * <p>NOTE: Byte order of {@code zipEndOfCentralDirectory} must be little-endian. 208 */ getZipEocdCentralDirectoryOffset(ByteBuffer zipEndOfCentralDirectory)209 public static long getZipEocdCentralDirectoryOffset(ByteBuffer zipEndOfCentralDirectory) { 210 assertByteOrderLittleEndian(zipEndOfCentralDirectory); 211 return getUnsignedInt32( 212 zipEndOfCentralDirectory, 213 zipEndOfCentralDirectory.position() + ZIP_EOCD_CENTRAL_DIR_OFFSET_FIELD_OFFSET); 214 } 215 216 /** 217 * Sets the offset of the start of the ZIP Central Directory in the archive. 218 * 219 * <p>NOTE: Byte order of {@code zipEndOfCentralDirectory} must be little-endian. 220 */ setZipEocdCentralDirectoryOffset( ByteBuffer zipEndOfCentralDirectory, long offset)221 public static void setZipEocdCentralDirectoryOffset( 222 ByteBuffer zipEndOfCentralDirectory, long offset) { 223 assertByteOrderLittleEndian(zipEndOfCentralDirectory); 224 setUnsignedInt32( 225 zipEndOfCentralDirectory, 226 zipEndOfCentralDirectory.position() + ZIP_EOCD_CENTRAL_DIR_OFFSET_FIELD_OFFSET, 227 offset); 228 } 229 230 /** 231 * Returns the size (in bytes) of the ZIP Central Directory. 232 * 233 * <p>NOTE: Byte order of {@code zipEndOfCentralDirectory} must be little-endian. 234 */ getZipEocdCentralDirectorySizeBytes(ByteBuffer zipEndOfCentralDirectory)235 public static long getZipEocdCentralDirectorySizeBytes(ByteBuffer zipEndOfCentralDirectory) { 236 assertByteOrderLittleEndian(zipEndOfCentralDirectory); 237 return getUnsignedInt32( 238 zipEndOfCentralDirectory, 239 zipEndOfCentralDirectory.position() + ZIP_EOCD_CENTRAL_DIR_SIZE_FIELD_OFFSET); 240 } 241 assertByteOrderLittleEndian(ByteBuffer buffer)242 private static void assertByteOrderLittleEndian(ByteBuffer buffer) { 243 if (buffer.order() != ByteOrder.LITTLE_ENDIAN) { 244 throw new IllegalArgumentException("ByteBuffer byte order must be little endian"); 245 } 246 } 247 getUnsignedInt16(ByteBuffer buffer, int offset)248 private static int getUnsignedInt16(ByteBuffer buffer, int offset) { 249 return buffer.getShort(offset) & 0xffff; 250 } 251 getUnsignedInt32(ByteBuffer buffer, int offset)252 private static long getUnsignedInt32(ByteBuffer buffer, int offset) { 253 return buffer.getInt(offset) & 0xffffffffL; 254 } 255 setUnsignedInt32(ByteBuffer buffer, int offset, long value)256 private static void setUnsignedInt32(ByteBuffer buffer, int offset, long value) { 257 if ((value < 0) || (value > 0xffffffffL)) { 258 throw new IllegalArgumentException("uint32 value of out range: " + value); 259 } 260 buffer.putInt(buffer.position() + offset, (int) value); 261 } 262 } 263