// ReplaceableUCharacterIterator.java
// © 2016 and later: Unicode, Inc. and others.
// License & terms of use: http://www.unicode.org/copyright.html
/*
*******************************************************************************
* Copyright (C) 1996-2015, International Business Machines Corporation and
* others. All Rights Reserved.
*******************************************************************************
*/
package com.ibm.icu.impl;
import com.ibm.icu.text.Replaceable;
import com.ibm.icu.text.ReplaceableString;
import com.ibm.icu.text.UCharacterIterator;
import com.ibm.icu.text.UTF16;
/**
 * A {@link UCharacterIterator} that walks the UTF-16 code units of a {@link Replaceable}.
 *
 * <p>The iterator holds a reference to the text plus a single index into it. {@link #clone()}
 * copies the index but shares the text object.
 *
 * <p>DLF docs must define behavior when Replaceable is mutated underneath the iterator.
 *
 * <p>This and ICUCharacterIterator share some code, maybe they should share an implementation, or
 * the common state and implementation should be moved up into UCharacterIterator.
 *
 * <p>What are first, last, and getBeginIndex doing here?!?!?!
 */
public class ReplaceableUCharacterIterator extends UCharacterIterator implements Cloneable {

    // public constructor ------------------------------------------------------

    /**
     * Creates an iterator positioned at index 0 of the given text. The text object is referenced,
     * not copied.
     *
     * @param replaceable text which the iterator will be based on
     * @throws IllegalArgumentException if {@code replaceable} is null
     */
    public ReplaceableUCharacterIterator(Replaceable replaceable) {
        if (replaceable == null) {
            throw new IllegalArgumentException("replaceable must not be null");
        }
        this.replaceable = replaceable;
        this.currentIndex = 0;
    }

    /**
     * Creates an iterator positioned at index 0 of the given string, which is wrapped in a new
     * {@link ReplaceableString}.
     *
     * @param str text which the iterator will be based on
     * @throws IllegalArgumentException if {@code str} is null
     */
    public ReplaceableUCharacterIterator(String str) {
        if (str == null) {
            throw new IllegalArgumentException("str must not be null");
        }
        this.replaceable = new ReplaceableString(str);
        this.currentIndex = 0;
    }

    /**
     * Creates an iterator positioned at index 0 of the given buffer, which is handed to a new
     * {@link ReplaceableString}.
     *
     * @param buf buffer of text on which the iterator will be based
     * @throws IllegalArgumentException if {@code buf} is null
     */
    public ReplaceableUCharacterIterator(StringBuffer buf) {
        if (buf == null) {
            throw new IllegalArgumentException("buf must not be null");
        }
        this.replaceable = new ReplaceableString(buf);
        this.currentIndex = 0;
    }

    // public methods ----------------------------------------------------------

    /**
     * Creates a copy of this iterator. The underlying <code>Replaceable</code> object is not
     * cloned; the copy shares it with this iterator.
     *
     * @return copy of this iterator
     */
    @Override
    public ReplaceableUCharacterIterator clone() {
        try {
            return (ReplaceableUCharacterIterator) super.clone();
        } catch (CloneNotSupportedException e) {
            // This class implements Cloneable, so this is not expected to happen. Fail loudly
            // instead of handing the caller a null that would surface later as an NPE.
            throw new IllegalStateException("clone() failed on a Cloneable iterator", e);
        }
    }

    /**
     * Returns the UTF-16 code unit at the current index without moving the iterator.
     *
     * @return the current UTF-16 code unit, or DONE if the current index is at or past the end of
     *     the text
     */
    @Override
    public int current() {
        if (currentIndex < replaceable.length()) {
            return replaceable.charAt(currentIndex);
        }
        return DONE;
    }

    /**
     * Returns the code point at the current index without moving the iterator.
     *
     * <p>If the current code unit is a lead surrogate that is immediately followed by a trail
     * surrogate, the two are combined into one code point. Otherwise the single code unit at the
     * current index is returned unchanged.
     *
     * @return the current code point, or DONE if the current index is at or past the end of the
     *     text
     */
    @Override
    public int currentCodePoint() {
        int lead = current();
        if (UTF16.isLeadSurrogate(lead)) {
            // Peek at the following code unit directly rather than stepping the iterator
            // forward and back, so the index is never modified by this query.
            int trailIndex = currentIndex + 1;
            if (trailIndex < replaceable.length()) {
                int trail = replaceable.charAt(trailIndex);
                if (UTF16.isTrailSurrogate(trail)) {
                    // we found a surrogate pair
                    return Character.toCodePoint((char) lead, (char) trail);
                }
            }
        }
        return lead;
    }

    /**
     * Returns the length of the text
     *
     * @return length of the text, in UTF-16 code units
     */
    @Override
    public int getLength() {
        return replaceable.length();
    }

    /**
     * Gets the current index in the text.
     *
     * @return current index in the text
     */
    @Override
    public int getIndex() {
        return currentIndex;
    }

    /**
     * Returns the UTF-16 code unit at the current index and then advances the index by 1. If the
     * current index is already at or past the end of the text, the index is left unchanged and
     * DONE is returned.
     *
     * @return the UTF-16 code unit at the index before the increment, or DONE if the iterator is
     *     at the end of the text
     */
    @Override
    public int next() {
        if (currentIndex < replaceable.length()) {
            return replaceable.charAt(currentIndex++);
        }
        return DONE;
    }

    /**
     * Moves the index back by 1 and returns the UTF-16 code unit at the new index. If the current
     * index is already 0 (or less), the index is left unchanged and DONE is returned.
     *
     * @return the UTF-16 code unit at the index after the decrement, or DONE if the iterator is at
     *     the start of the text
     */
    @Override
    public int previous() {
        if (currentIndex > 0) {
            return replaceable.charAt(--currentIndex);
        }
        return DONE;
    }

    /**
     * Sets the current index to the specified position in the text. The position is counted in
     * 16-bit code units; a value equal to the text length (one past the last code unit) is
     * accepted.
     *
     * @param currentIndex the new index within the text
     * @throws IndexOutOfBoundsException if {@code currentIndex} is negative or greater than the
     *     text length
     */
    @Override
    public void setIndex(int currentIndex) throws IndexOutOfBoundsException {
        int length = replaceable.length();
        if (currentIndex < 0 || currentIndex > length) {
            throw new IndexOutOfBoundsException(
                    "index " + currentIndex + " is outside [0, " + length + "]");
        }
        this.currentIndex = currentIndex;
    }

    /**
     * Copies the whole text into {@code fillIn}, starting at {@code offset}.
     *
     * @param fillIn destination array
     * @param offset index in {@code fillIn} at which the first code unit is stored
     * @return the number of code units copied, i.e. the length of the text
     * @throws IndexOutOfBoundsException if {@code offset} is negative or the text does not fit
     *     into {@code fillIn} starting at {@code offset}; the exception message is the text
     *     length as a decimal string
     */
    @Override
    public int getText(char[] fillIn, int offset) {
        int length = replaceable.length();
        // Compare against the remaining capacity instead of computing offset + length, which
        // can overflow int for a very large offset and let the check pass by mistake.
        if (offset < 0 || offset > fillIn.length - length) {
            throw new IndexOutOfBoundsException(Integer.toString(length));
        }
        replaceable.getChars(0, length, fillIn, offset);
        return length;
    }

    // private data members ----------------------------------------------------

    /** Replaceable object holding the text being iterated; shared by clones. */
    private final Replaceable replaceable;

    /** Current index into the text, in UTF-16 code units. */
    private int currentIndex;
}