/* * Copyright 2005,2009 Ivan SZKIBA * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.ini4j.spi; import java.io.IOException; import java.io.InputStream; import java.io.InputStreamReader; import java.io.PushbackInputStream; import java.io.Reader; import java.nio.charset.Charset; class UnicodeInputStreamReader extends Reader { private static final int BOM_SIZE = 4; private static enum Bom { UTF32BE("UTF-32BE", new byte[] { (byte) 0x00, (byte) 0x00, (byte) 0xFE, (byte) 0xFF }), UTF32LE("UTF-32LE", new byte[] { (byte) 0xFF, (byte) 0xFE, (byte) 0x00, (byte) 0x00 }), UTF16BE("UTF-16BE", new byte[] { (byte) 0xFE, (byte) 0xFF }), UTF16LE("UTF-16LE", new byte[] { (byte) 0xFF, (byte) 0xFE }), UTF8("UTF-8", new byte[] { (byte) 0xEF, (byte) 0xBB, (byte) 0xBF }); private final byte[] _bytes; private Charset _charset; @SuppressWarnings("PMD.ArrayIsStoredDirectly") private Bom(String charsetName, byte[] bytes) { try { _charset = Charset.forName(charsetName); } catch (Exception x) { _charset = null; } _bytes = bytes; } private static Bom find(byte[] data) { Bom ret = null; for (Bom bom : values()) { if (bom.supported() && bom.match(data)) { ret = bom; break; } } return ret; } private boolean match(byte[] data) { boolean ok = true; for (int i = 0; i < _bytes.length; i++) { if (data[i] != _bytes[i]) { ok = false; break; } } return ok; } private boolean supported() { return _charset != null; } } private final Charset _defaultEncoding; private InputStreamReader _reader; private final 
PushbackInputStream _stream; UnicodeInputStreamReader(InputStream in, Charset defaultEnc) { _stream = new PushbackInputStream(in, BOM_SIZE); _defaultEncoding = defaultEnc; } public void close() throws IOException { init(); _reader.close(); } public int read(char[] cbuf, int off, int len) throws IOException { init(); return _reader.read(cbuf, off, len); } /** * Read-ahead four bytes and check for BOM marks. Extra bytes are * unread back to the stream, only BOM bytes are skipped. */ protected void init() throws IOException { if (_reader != null) { return; } Charset encoding; byte[] data = new byte[BOM_SIZE]; int n; int unread; n = _stream.read(data, 0, data.length); Bom bom = Bom.find(data); if (bom == null) { encoding = _defaultEncoding; unread = n; } else { encoding = bom._charset; unread = data.length - bom._bytes.length; } if (unread > 0) { _stream.unread(data, (n - unread), unread); } _reader = new InputStreamReader(_stream, encoding); } }
# | Change | User | Description | Committed | |
---|---|---|---|---|---|
#1 | 8023 | Sven Erik Knop |
Complete rewrite of the configuration file, now based on an ini-file format. The ini file has a general [reader] section for settings like verbose, outputFile, case-sensitivity and so on. It also allows you to set up a range of Actions and Filters. The section name here is the fully qualified class name, followed by settings for the particular actions. An example will make this clearer: ================================================================ [reader] verbose=true [journal.action.UserRenamer] fileName=user.txt patch=True outputFile=user.out [journal.action.ClientRenamer] fileName=client.txt outputFile=client.out patch=true ================================================================ I will provide more example setups in the near future. Filters are classes implementing journal.action.Filter (soon to be journal.filter.Filter) which can be chained together and are all executed before the actions. Actions are applied in the order in which they are given in the config file. |