1/*
2 * Copyright (c) 1996, 2015, Oracle and/or its affiliates. All rights reserved.
3 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4 *
5 * This code is free software; you can redistribute it and/or modify it
6 * under the terms of the GNU General Public License version 2 only, as
7 * published by the Free Software Foundation.  Oracle designates this
8 * particular file as subject to the "Classpath" exception as provided
9 * by Oracle in the LICENSE file that accompanied this code.
10 *
11 * This code is distributed in the hope that it will be useful, but WITHOUT
12 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
13 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
14 * version 2 for more details (a copy is included in the LICENSE file that
15 * accompanied this code).
16 *
17 * You should have received a copy of the GNU General Public License version
18 * 2 along with this work; if not, write to the Free Software Foundation,
19 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
20 *
21 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
22 * or visit www.oracle.com if you need additional information or have any
23 * questions.
24 */
25
26package java.util.zip;
27
28import java.io.InputStream;
29import java.io.IOException;
30import java.io.EOFException;
31import java.io.PushbackInputStream;
32import java.nio.charset.Charset;
33import java.nio.charset.StandardCharsets;
34import static java.util.zip.ZipConstants64.*;
35import static java.util.zip.ZipUtils.*;
36
37/**
38 * This class implements an input stream filter for reading files in the
39 * ZIP file format. Includes support for both compressed and uncompressed
40 * entries.
41 *
42 * @author      David Connelly
43 * @since 1.1
44 */
45public
46class ZipInputStream extends InflaterInputStream implements ZipConstants {
47    private ZipEntry entry;
48    private int flag;
49    private CRC32 crc = new CRC32();
50    private long remaining;
51    private byte[] tmpbuf = new byte[512];
52
53    private static final int STORED = ZipEntry.STORED;
54    private static final int DEFLATED = ZipEntry.DEFLATED;
55
56    private boolean closed = false;
57    // this flag is set to true after EOF has reached for
58    // one entry
59    private boolean entryEOF = false;
60
61    private ZipCoder zc;
62
63    /**
64     * Check to make sure that this stream has not been closed
65     */
66    private void ensureOpen() throws IOException {
67        if (closed) {
68            throw new IOException("Stream closed");
69        }
70    }
71
72    /**
73     * Creates a new ZIP input stream.
74     *
75     * <p>The UTF-8 {@link java.nio.charset.Charset charset} is used to
76     * decode the entry names.
77     *
78     * @param in the actual input stream
79     */
80    public ZipInputStream(InputStream in) {
81        this(in, StandardCharsets.UTF_8);
82    }
83
84    /**
85     * Creates a new ZIP input stream.
86     *
87     * @param in the actual input stream
88     *
89     * @param charset
90     *        The {@linkplain java.nio.charset.Charset charset} to be
91     *        used to decode the ZIP entry name (ignored if the
92     *        <a href="package-summary.html#lang_encoding"> language
93     *        encoding bit</a> of the ZIP entry's general purpose bit
94     *        flag is set).
95     *
96     * @since 1.7
97     */
98    public ZipInputStream(InputStream in, Charset charset) {
99        super(new PushbackInputStream(in, 512), new Inflater(true), 512);
100        usesDefaultInflater = true;
101        if(in == null) {
102            throw new NullPointerException("in is null");
103        }
104        if (charset == null)
105            throw new NullPointerException("charset is null");
106        this.zc = ZipCoder.get(charset);
107    }
108
109    /**
110     * Reads the next ZIP file entry and positions the stream at the
111     * beginning of the entry data.
112     * @return the next ZIP file entry, or null if there are no more entries
113     * @exception ZipException if a ZIP file error has occurred
114     * @exception IOException if an I/O error has occurred
115     */
116    public ZipEntry getNextEntry() throws IOException {
117        ensureOpen();
118        if (entry != null) {
119            closeEntry();
120        }
121        crc.reset();
122        inf.reset();
123        if ((entry = readLOC()) == null) {
124            return null;
125        }
126        if (entry.method == STORED) {
127            remaining = entry.size;
128        }
129        entryEOF = false;
130        return entry;
131    }
132
133    /**
134     * Closes the current ZIP entry and positions the stream for reading the
135     * next entry.
136     * @exception ZipException if a ZIP file error has occurred
137     * @exception IOException if an I/O error has occurred
138     */
139    public void closeEntry() throws IOException {
140        ensureOpen();
141        while (read(tmpbuf, 0, tmpbuf.length) != -1) ;
142        entryEOF = true;
143    }
144
145    /**
146     * Returns 0 after EOF has reached for the current entry data,
147     * otherwise always return 1.
148     * <p>
149     * Programs should not count on this method to return the actual number
150     * of bytes that could be read without blocking.
151     *
152     * @return     1 before EOF and 0 after EOF has reached for current entry.
153     * @exception  IOException  if an I/O error occurs.
154     *
155     */
156    public int available() throws IOException {
157        ensureOpen();
158        if (entryEOF) {
159            return 0;
160        } else {
161            return 1;
162        }
163    }
164
165    /**
166     * Reads from the current ZIP entry into an array of bytes.
167     * If <code>len</code> is not zero, the method
168     * blocks until some input is available; otherwise, no
169     * bytes are read and <code>0</code> is returned.
170     * @param b the buffer into which the data is read
171     * @param off the start offset in the destination array <code>b</code>
172     * @param len the maximum number of bytes read
173     * @return the actual number of bytes read, or -1 if the end of the
174     *         entry is reached
175     * @exception  NullPointerException if <code>b</code> is <code>null</code>.
176     * @exception  IndexOutOfBoundsException if <code>off</code> is negative,
177     * <code>len</code> is negative, or <code>len</code> is greater than
178     * <code>b.length - off</code>
179     * @exception ZipException if a ZIP file error has occurred
180     * @exception IOException if an I/O error has occurred
181     */
182    public int read(byte[] b, int off, int len) throws IOException {
183        ensureOpen();
184        if (off < 0 || len < 0 || off > b.length - len) {
185            throw new IndexOutOfBoundsException();
186        } else if (len == 0) {
187            return 0;
188        }
189
190        if (entry == null) {
191            return -1;
192        }
193        switch (entry.method) {
194        case DEFLATED:
195            len = super.read(b, off, len);
196            if (len == -1) {
197                readEnd(entry);
198                entryEOF = true;
199                entry = null;
200            } else {
201                crc.update(b, off, len);
202            }
203            return len;
204        case STORED:
205            if (remaining <= 0) {
206                entryEOF = true;
207                entry = null;
208                return -1;
209            }
210            if (len > remaining) {
211                len = (int)remaining;
212            }
213            len = in.read(b, off, len);
214            if (len == -1) {
215                throw new ZipException("unexpected EOF");
216            }
217            crc.update(b, off, len);
218            remaining -= len;
219            if (remaining == 0 && entry.crc != crc.getValue()) {
220                throw new ZipException(
221                    "invalid entry CRC (expected 0x" + Long.toHexString(entry.crc) +
222                    " but got 0x" + Long.toHexString(crc.getValue()) + ")");
223            }
224            return len;
225        default:
226            throw new ZipException("invalid compression method");
227        }
228    }
229
230    /**
231     * Skips specified number of bytes in the current ZIP entry.
232     * @param n the number of bytes to skip
233     * @return the actual number of bytes skipped
234     * @exception ZipException if a ZIP file error has occurred
235     * @exception IOException if an I/O error has occurred
236     * @exception IllegalArgumentException if {@code n < 0}
237     */
238    public long skip(long n) throws IOException {
239        if (n < 0) {
240            throw new IllegalArgumentException("negative skip length");
241        }
242        ensureOpen();
243        int max = (int)Math.min(n, Integer.MAX_VALUE);
244        int total = 0;
245        while (total < max) {
246            int len = max - total;
247            if (len > tmpbuf.length) {
248                len = tmpbuf.length;
249            }
250            len = read(tmpbuf, 0, len);
251            if (len == -1) {
252                entryEOF = true;
253                break;
254            }
255            total += len;
256        }
257        return total;
258    }
259
260    /**
261     * Closes this input stream and releases any system resources associated
262     * with the stream.
263     * @exception IOException if an I/O error has occurred
264     */
265    public void close() throws IOException {
266        if (!closed) {
267            super.close();
268            closed = true;
269        }
270    }
271
272    private byte[] b = new byte[256];
273
274    /*
275     * Reads local file (LOC) header for next entry.
276     */
277    private ZipEntry readLOC() throws IOException {
278        try {
279            readFully(tmpbuf, 0, LOCHDR);
280        } catch (EOFException e) {
281            return null;
282        }
283        if (get32(tmpbuf, 0) != LOCSIG) {
284            return null;
285        }
286        // get flag first, we need check EFS.
287        flag = get16(tmpbuf, LOCFLG);
288        // get the entry name and create the ZipEntry first
289        int len = get16(tmpbuf, LOCNAM);
290        int blen = b.length;
291        if (len > blen) {
292            do {
293                blen = blen * 2;
294            } while (len > blen);
295            b = new byte[blen];
296        }
297        readFully(b, 0, len);
298        // Force to use UTF-8 if the EFS bit is ON, even the cs is NOT UTF-8
299        ZipEntry e = createZipEntry(((flag & EFS) != 0)
300                                    ? zc.toStringUTF8(b, len)
301                                    : zc.toString(b, len));
302        // now get the remaining fields for the entry
303        if ((flag & 1) == 1) {
304            throw new ZipException("encrypted ZIP entry not supported");
305        }
306        e.method = get16(tmpbuf, LOCHOW);
307        e.xdostime = get32(tmpbuf, LOCTIM);
308        if ((flag & 8) == 8) {
309            /* "Data Descriptor" present */
310            if (e.method != DEFLATED) {
311                throw new ZipException(
312                        "only DEFLATED entries can have EXT descriptor");
313            }
314        } else {
315            e.crc = get32(tmpbuf, LOCCRC);
316            e.csize = get32(tmpbuf, LOCSIZ);
317            e.size = get32(tmpbuf, LOCLEN);
318        }
319        len = get16(tmpbuf, LOCEXT);
320        if (len > 0) {
321            byte[] extra = new byte[len];
322            readFully(extra, 0, len);
323            e.setExtra0(extra,
324                        e.csize == ZIP64_MAGICVAL || e.size == ZIP64_MAGICVAL);
325        }
326        return e;
327    }
328
329    /**
330     * Creates a new <code>ZipEntry</code> object for the specified
331     * entry name.
332     *
333     * @param name the ZIP file entry name
334     * @return the ZipEntry just created
335     */
336    protected ZipEntry createZipEntry(String name) {
337        return new ZipEntry(name);
338    }
339
340    /**
341     * Reads end of deflated entry as well as EXT descriptor if present.
342     *
343     * Local headers for DEFLATED entries may optionally be followed by a
344     * data descriptor, and that data descriptor may optionally contain a
345     * leading signature (EXTSIG).
346     *
347     * From the zip spec http://www.pkware.com/documents/casestudies/APPNOTE.TXT
348     *
349     * """Although not originally assigned a signature, the value 0x08074b50
350     * has commonly been adopted as a signature value for the data descriptor
351     * record.  Implementers should be aware that ZIP files may be
352     * encountered with or without this signature marking data descriptors
353     * and should account for either case when reading ZIP files to ensure
354     * compatibility."""
355     */
356    private void readEnd(ZipEntry e) throws IOException {
357        int n = inf.getRemaining();
358        if (n > 0) {
359            ((PushbackInputStream)in).unread(buf, len - n, n);
360        }
361        if ((flag & 8) == 8) {
362            /* "Data Descriptor" present */
363            if (inf.getBytesWritten() > ZIP64_MAGICVAL ||
364                inf.getBytesRead() > ZIP64_MAGICVAL) {
365                // ZIP64 format
366                readFully(tmpbuf, 0, ZIP64_EXTHDR);
367                long sig = get32(tmpbuf, 0);
368                if (sig != EXTSIG) { // no EXTSIG present
369                    e.crc = sig;
370                    e.csize = get64(tmpbuf, ZIP64_EXTSIZ - ZIP64_EXTCRC);
371                    e.size = get64(tmpbuf, ZIP64_EXTLEN - ZIP64_EXTCRC);
372                    ((PushbackInputStream)in).unread(
373                        tmpbuf, ZIP64_EXTHDR - ZIP64_EXTCRC, ZIP64_EXTCRC);
374                } else {
375                    e.crc = get32(tmpbuf, ZIP64_EXTCRC);
376                    e.csize = get64(tmpbuf, ZIP64_EXTSIZ);
377                    e.size = get64(tmpbuf, ZIP64_EXTLEN);
378                }
379            } else {
380                readFully(tmpbuf, 0, EXTHDR);
381                long sig = get32(tmpbuf, 0);
382                if (sig != EXTSIG) { // no EXTSIG present
383                    e.crc = sig;
384                    e.csize = get32(tmpbuf, EXTSIZ - EXTCRC);
385                    e.size = get32(tmpbuf, EXTLEN - EXTCRC);
386                    ((PushbackInputStream)in).unread(
387                                               tmpbuf, EXTHDR - EXTCRC, EXTCRC);
388                } else {
389                    e.crc = get32(tmpbuf, EXTCRC);
390                    e.csize = get32(tmpbuf, EXTSIZ);
391                    e.size = get32(tmpbuf, EXTLEN);
392                }
393            }
394        }
395        if (e.size != inf.getBytesWritten()) {
396            throw new ZipException(
397                "invalid entry size (expected " + e.size +
398                " but got " + inf.getBytesWritten() + " bytes)");
399        }
400        if (e.csize != inf.getBytesRead()) {
401            throw new ZipException(
402                "invalid entry compressed size (expected " + e.csize +
403                " but got " + inf.getBytesRead() + " bytes)");
404        }
405        if (e.crc != crc.getValue()) {
406            throw new ZipException(
407                "invalid entry CRC (expected 0x" + Long.toHexString(e.crc) +
408                " but got 0x" + Long.toHexString(crc.getValue()) + ")");
409        }
410    }
411
412    /*
413     * Reads bytes, blocking until all bytes are read.
414     */
415    private void readFully(byte[] b, int off, int len) throws IOException {
416        while (len > 0) {
417            int n = in.read(b, off, len);
418            if (n == -1) {
419                throw new EOFException();
420            }
421            off += n;
422            len -= n;
423        }
424    }
425
426}
427