/*
* Copyright (C) 2007 Steve Ratcliffe
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License version 2 as
* published by the Free Software Foundation.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
*
* Author: Steve Ratcliffe
* Create date: Feb 19, 2008
*/
package uk.me.parabola.imgfmt.app.labelenc;
import java.io.ByteArrayOutputStream;
import java.nio.charset.Charset;
/**
* Decoder for labels in utf-8, note that I am not actually sure that any
* map uses utf-8.
*
* @author Steve Ratcliffe
*/
public class Utf8Decoder implements CharacterDecoder {
private final ByteArrayOutputStream out = new ByteArrayOutputStream();
private boolean needreset;
private final Charset charset = Charset.forName("utf-8");
/**
* Add a byte to this decoder. This will be saved until a complete
* label string has been detected.
*
* @param b The byte read from the lbl file.
* @return True if a label string is finished and is ready to be retrieved
* via the {@link #getText} method.
*/
public boolean addByte(int b) {
if (b == 0) {
needreset = true;
return true;
}
if (needreset) {
out.reset();
needreset = false;
}
out.write(b);
return false;
}
/**
* Get the valid text. This is guaranteed to be encoded as utf-8.
*
* @return The byte array and length as an EncodedText struct.
*/
public DecodedText getText() {
byte[] ba = out.toByteArray();
return new DecodedText(ba, charset);
}
/**
* Resets the state. This should be called for example if the reader is
* jumping to a new place in the file and cannot guarantee that the previous
* label was fully read.
*/
public void reset() {
needreset = false;
out.reset();
}
}