dev.cel.common.internal.CelCodePointArray Maven / Gradle / Ivy
// Copyright 2022 Google LLC
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// https://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package dev.cel.common.internal;
import static com.google.common.base.Strings.isNullOrEmpty;
import com.google.errorprone.annotations.Immutable;
import dev.cel.common.annotations.Internal;
import java.util.PrimitiveIterator;
/**
* Represents an in-memory read-only contiguous source of Unicode code points.
*
* CEL Library Internals. Do Not Use.
*/
@Immutable
@Internal
public abstract class CelCodePointArray {
// Package-private default constructor to prevent extensions outside of the codebase.
CelCodePointArray() {}
/** Returns a new {@link CelCodePointArray} that is a subview of this between [i, j). */
public abstract CelCodePointArray slice(int i, int j);
/** Get the code point at the given index. */
public abstract int get(int index);
/** Returns the number of code points. */
public abstract int size();
public final int length() {
return size();
}
/** Returns true if empty, false otherwise. */
public boolean isEmpty() {
return length() == 0;
}
@Override
public abstract String toString();
public static CelCodePointArray fromString(String text) {
if (isNullOrEmpty(text)) {
return EmptyCodePointArray.INSTANCE;
}
PrimitiveIterator.OfInt codePoints = text.codePoints().iterator();
byte[] byteArray = new byte[text.length()];
int byteIndex = 0;
while (codePoints.hasNext()) {
int codePoint = codePoints.nextInt();
if (codePoint <= 0xff) {
byteArray[byteIndex++] = (byte) codePoint;
continue;
}
if (codePoint <= 0xffff) {
char[] charArray = new char[text.length()];
int charIndex = 0;
for (; charIndex < byteIndex; charIndex++) {
charArray[charIndex] = (char) (byteArray[charIndex] & 0xff);
}
byteArray = null;
charArray[charIndex++] = (char) codePoint;
while (codePoints.hasNext()) {
codePoint = codePoints.nextInt();
if (codePoint <= 0xffff) {
charArray[charIndex++] = (char) codePoint;
continue;
}
int[] intArray = new int[text.length()];
int intIndex = 0;
for (; intIndex < charIndex; intIndex++) {
intArray[intIndex] = charArray[intIndex] & 0xffff;
}
charArray = null;
intArray[intIndex++] = codePoint;
while (codePoints.hasNext()) {
codePoint = codePoints.nextInt();
intArray[intIndex++] = codePoint;
}
return new SupplementalCodePointArray(intArray, intIndex);
}
return new BasicCodePointArray(charArray, charIndex);
}
int[] intArray = new int[text.length()];
int intIndex = 0;
for (; intIndex < byteIndex; intIndex++) {
intArray[intIndex] = byteArray[intIndex] & 0xff;
}
byteArray = null;
intArray[intIndex++] = codePoint;
while (codePoints.hasNext()) {
codePoint = codePoints.nextInt();
intArray[intIndex++] = codePoint;
}
return new SupplementalCodePointArray(intArray, intIndex);
}
return new Latin1CodePointArray(byteArray, byteIndex);
}
}