001/*
002 * Licensed to the Apache Software Foundation (ASF) under one or more
003 * contributor license agreements.  See the NOTICE file distributed with
004 * this work for additional information regarding copyright ownership.
005 * The ASF licenses this file to You under the Apache License, Version 2.0
006 * (the "License"); you may not use this file except in compliance with
007 * the License.  You may obtain a copy of the License at
008 * 
009 *      http://www.apache.org/licenses/LICENSE-2.0
010 * 
011 * Unless required by applicable law or agreed to in writing, software
012 * distributed under the License is distributed on an "AS IS" BASIS,
013 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
014 * See the License for the specific language governing permissions and
015 * limitations under the License.
016 */
017package org.apache.commons.io.filefilter;
018
019import java.io.File;
020import java.io.IOException;
021import java.io.RandomAccessFile;
022import java.io.Serializable;
023import java.util.Arrays;
024
025import org.apache.commons.io.IOUtils;
026
027/**
028 * <p>
029 * File filter for matching files containing a "magic number". A magic number 
030 * is a unique series of bytes common to all files of a specific file format.
031 * For instance, all Java class files begin with the bytes 
032 * <code>0xCAFEBABE</code>. 
033 * </p>
034 * 
035 * <code><pre>
036 * File dir = new File(".");
037 * MagicNumberFileFilter javaClassFileFilter =
038 *     MagicNumberFileFilter(new byte[] {(byte) 0xCA, (byte) 0xFE, 
039 *       (byte) 0xBA, (byte) 0xBE}); 
040 * String[] javaClassFiles = dir.list(javaClassFileFilter);
041 * for (String javaClassFile : javaClassFiles) {
042 *     System.out.println(javaClassFile);
043 * }
044 * </pre></code>
045 * 
046 * <p>
047 * Sometimes, such as in the case of TAR files, the
048 * magic number will be offset by a certain number of bytes in the file. In the
049 * case of TAR archive files, this offset is 257 bytes.
050 * </p>
051 * 
052 * <code><pre>
053 * File dir = new File(".");
054 * MagicNumberFileFilter tarFileFilter = 
055 *     MagicNumberFileFilter("ustar", 257); 
056 * String[] tarFiles = dir.list(tarFileFilter);
057 * for (String tarFile : tarFiles) {
058 *     System.out.println(tarFile);
059 * }
060 * </pre></code>
061 * @since 2.0
062 * @see FileFilterUtils#magicNumberFileFilter(byte[])
063 * @see FileFilterUtils#magicNumberFileFilter(String)
064 * @see FileFilterUtils#magicNumberFileFilter(byte[], long)
065 * @see FileFilterUtils#magicNumberFileFilter(String, long)
066 */
067public class MagicNumberFileFilter extends AbstractFileFilter implements
068        Serializable {
069    
070    /**
071     * The serialization version unique identifier.
072     */
073    private static final long serialVersionUID = -547733176983104172L;
074
075    /**
076     * The magic number to compare against the file's bytes at the provided 
077     * offset.
078     */
079    private final byte[] magicNumbers;
080    
081    /**
082     * The offset (in bytes) within the files that the magic number's bytes 
083     * should appear.
084     */
085    private final long byteOffset;
086    
087    /**
088     * <p>
089     * Constructs a new MagicNumberFileFilter and associates it with the magic
090     * number to test for in files. This constructor assumes a starting offset
091     * of <code>0</code>.
092     * </p>
093     * 
094     * <p>
095     * It is important to note that <em>the array is not cloned</em> and that
096     * any changes to the magic number array after construction will affect the
097     * behavior of this file filter.
098     * </p>
099     * 
100     * <code><pre>
101     * MagicNumberFileFilter javaClassFileFilter =
102     *     MagicNumberFileFilter(new byte[] {(byte) 0xCA, (byte) 0xFE, 
103     *       (byte) 0xBA, (byte) 0xBE}); 
104     * </pre></code>
105     * 
106     * @param magicNumber the magic number to look for in the file.
107     * 
108     * @throws IllegalArgumentException if <code>magicNumber</code> is 
109     *         {@code null}, or contains no bytes.
110     */
111    public MagicNumberFileFilter(byte[] magicNumber) {
112        this(magicNumber, 0);
113    }
114    
115    /**
116     * <p>
117     * Constructs a new MagicNumberFileFilter and associates it with the magic
118     * number to test for in files. This constructor assumes a starting offset
119     * of <code>0</code>.
120     * </p>
121     * 
122     * Example usage:
123     * <pre>
124     * {@code
125     * MagicNumberFileFilter xmlFileFilter = 
126     *     MagicNumberFileFilter("<?xml"); 
127     * }
128     * </pre>
129     * 
130     * @param magicNumber the magic number to look for in the file.
131     *        The string is converted to bytes using the platform default charset.
132     *
133     * @throws IllegalArgumentException if <code>magicNumber</code> is 
134     *         {@code null} or the empty String.
135     */
136    public MagicNumberFileFilter(String magicNumber) {
137        this(magicNumber, 0);
138    }
139    
140    /**
141     * <p>
142     * Constructs a new MagicNumberFileFilter and associates it with the magic
143     * number to test for in files and the byte offset location in the file to
144     * to look for that magic number.
145     * </p>
146     * 
147     * <code><pre>
148     * MagicNumberFileFilter tarFileFilter = 
149     *     MagicNumberFileFilter("ustar", 257); 
150     * </pre></code>
151     * 
152     * @param magicNumber the magic number to look for in the file. 
153     *        The string is converted to bytes using the platform default charset.
154     * @param offset the byte offset in the file to start comparing bytes.
155     * 
156     * @throws IllegalArgumentException if <code>magicNumber</code> is 
157     *         {@code null} or the empty String, or <code>offset</code> is 
158     *         a negative number.
159     */
160    public MagicNumberFileFilter(String magicNumber, long offset) {
161        if (magicNumber == null) {
162            throw new IllegalArgumentException("The magic number cannot be null");
163        }
164        if (magicNumber.length() == 0) {
165            throw new IllegalArgumentException("The magic number must contain at least one byte");
166        }
167        if (offset < 0) {
168            throw new IllegalArgumentException("The offset cannot be negative");
169        }
170        
171        this.magicNumbers = magicNumber.getBytes(); // uses the platform default charset
172        this.byteOffset = offset;
173    }
174    
175    /**
176     * <p>
177     * Constructs a new MagicNumberFileFilter and associates it with the magic
178     * number to test for in files and the byte offset location in the file to
179     * to look for that magic number.
180     * </p>
181     * 
182     * <p>
183     * It is important to note that <em>the array is not cloned</em> and that
184     * any changes to the magic number array after construction will affect the
185     * behavior of this file filter.
186     * </p>
187     * 
188     * <code><pre>
189     * MagicNumberFileFilter tarFileFilter =
190     *     MagicNumberFileFilter(new byte[] {0x75, 0x73, 0x74, 0x61, 0x72}, 257); 
191     * </pre></code>
192     * 
193     * <code><pre>
194     * MagicNumberFileFilter javaClassFileFilter =
195     *     MagicNumberFileFilter(new byte[] {0xCA, 0xFE, 0xBA, 0xBE}, 0); 
196     * </pre></code>
197     * 
198     * @param magicNumber the magic number to look for in the file.
199     * @param offset the byte offset in the file to start comparing bytes.
200     * 
201     * @throws IllegalArgumentException if <code>magicNumber</code> is 
202     *         {@code null}, or contains no bytes, or <code>offset</code> 
203     *         is a negative number.
204     */
205    public MagicNumberFileFilter(byte[] magicNumber, long offset) {
206        if (magicNumber == null) {
207            throw new IllegalArgumentException("The magic number cannot be null");
208        }
209        if (magicNumber.length == 0) {
210            throw new IllegalArgumentException("The magic number must contain at least one byte");
211        }
212        if (offset < 0) {
213            throw new IllegalArgumentException("The offset cannot be negative");
214        }
215        
216        this.magicNumbers = new byte[magicNumber.length];
217        System.arraycopy(magicNumber, 0, this.magicNumbers, 0, magicNumber.length);
218        this.byteOffset = offset;
219    }
220    
221    /**
222     * <p>
223     * Accepts the provided file if the file contains the file filter's magic
224     * number at the specified offset.
225     * </p>
226     * 
227     * <p>
228     * If any {@link IOException}s occur while reading the file, the file will
229     * be rejected.
230     * </p>
231     * 
232     * @param file the file to accept or reject.
233     * 
234     * @return {@code true} if the file contains the filter's magic number 
235     *         at the specified offset, {@code false} otherwise.
236     */
237    @Override
238    public boolean accept(File file) {
239        if (file != null && file.isFile() && file.canRead()) {
240            RandomAccessFile randomAccessFile = null;
241            try {
242                byte[] fileBytes = new byte[this.magicNumbers.length]; 
243                randomAccessFile = new RandomAccessFile(file, "r");
244                randomAccessFile.seek(byteOffset);
245                int read = randomAccessFile.read(fileBytes);
246                if (read != magicNumbers.length) {
247                    return false;
248                }
249                return Arrays.equals(this.magicNumbers, fileBytes);
250            } catch (IOException ioe) {
251                // Do nothing, fall through and do not accept file
252            } finally {
253                IOUtils.closeQuietly(randomAccessFile);
254            }
255        }
256        
257        return false;
258    }
259
260    /**
261     * Returns a String representation of the file filter, which includes the 
262     * magic number bytes and byte offset.
263     * 
264     * @return a String representation of the file filter.
265     */
266    @Override
267    public String toString() {
268        StringBuilder builder = new StringBuilder(super.toString());
269        builder.append("(");
270        builder.append(new String(magicNumbers));// TODO perhaps use hex if value is not printable
271        builder.append(",");
272        builder.append(this.byteOffset);
273        builder.append(")");
274        return builder.toString();
275    }
276}