// Utf8_Enumeration.java example
//
// Explorer
// bugvm-master
/* Soot - a J*va Optimization Framework
 * Copyright (C) 1997 Clark Verbrugge
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the
 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
 * Boston, MA 02111-1307, USA.
 */

/*
 * Modified by the Sable Research Group and others 1997-1999.  
 * See the 'credits' file distributed with Soot for the complete list of
 * contributors.  (Soot is distributed at http://www.sable.mcgill.ca/soot)
 */







package soot.coffi;

import java.util.Enumeration;

/** An enumeration of a Utf8 allows one to run through the characters in a
 * unicode string; used primarily for comparing unicode strings.  Note that
 * unlike regular enumerations, and to be efficient (ie to avoid allocating
 * an object in each call to nextElement), the return value is accessed by
 * this object's 'c' field, and nextElement merely returns this.
 * <p>
 * The byte array handed to this class starts with a two-byte, big-endian,
 * unsigned length, followed by that many bytes of encoded characters.  Each
 * character occupies one, two or three bytes.
 * @see CONSTANT_Utf8_info
 * @see Utf8_Enumeration#c
 * @see Utf8_Enumeration#nextElement
 * @author Clark Verbrugge
 */
public class Utf8_Enumeration implements Enumeration {

   /** The latest character, as determined by nextElement.
    * @see Utf8_Enumeration#nextElement
    */
   public int c;            // latest character

   // Both indices are ints: the encoded length is an unsigned 16-bit value,
   // so "length + 2" can reach 65537 and would wrap around in a short.
   private int curindex;    // index of the next byte to decode
   private int length;      // index one past the last encoded byte
   private byte bytes[];

   /** For creating an empty enumeration; you must use reset() after this
    * to initialize the enumeration.
    * @see Utf8_Enumeration#reset
    */
   public Utf8_Enumeration() {}

   /** For creating a normal enumeration of the given Utf8 string.
    * @param b array of bytes in Utf8 format.
    */
   public Utf8_Enumeration(byte b[]) {
      start(b);
   }

   /** Resets this object to be an enumeration of the given Utf8 string.
    * @param b array of bytes in Utf8 format.
    */
   public void reset(byte b[]) {
      start(b);
   }

   /** Points this enumeration at the first encoded byte of b and computes
    * the end index from the two-byte big-endian length prefix.  Kept private
    * so that the constructor never calls an overridable method.
    */
   private void start(byte b[]) {
      bytes = b;
      curindex = 2;         // skip the length prefix
      length = ((b[0] & 0xff) << 8) + (b[1] & 0xff) + 2;
   }

   /** <i>true</i> if the entire string hasn't been enumerated yet. */
   public boolean hasMoreElements() {
      return curindex < length;
   }

   /** Determines the next Utf8 character, and stores it in c.  No bounds
    * check is made here; callers are expected to consult hasMoreElements
    * first.
    * @return <i>this</i>
    * @see Utf8_Enumeration#c
    */
   public Object nextElement() {
      // Work on the unsigned value of each byte.  Masking a sign-extended
      // byte with a (byte) constant such as (byte)0xe0 yields a negative int
      // that can never equal 0xc0, which is why the lead byte is widened
      // with "& 0xff" before it is classified.
      int lead = bytes[curindex++] & 0xff;
      if ((lead & 0x80) == 0) {            // 0xxxxxxx: one-byte character
         c = lead;
      } else if ((lead & 0xe0) == 0xc0) {  // 110xxxxx: two-byte character
         c = (lead & 0x1f) << 6;
         c |= bytes[curindex++] & 0x3f;
      } else {                             // anything else: three-byte character
         c = (lead & 0x0f) << 12;
         c |= (bytes[curindex++] & 0x3f) << 6;
         c |= bytes[curindex++] & 0x3f;
      }
      return this;
   }
}