/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.lucene.store;

import java.io.IOException;

import org.apache.lucene.util.ArrayUtil;
import org.apache.lucene.util.UnicodeUtil;

A DataOutput that can be used to build a byte[].
@lucene.internal
/** * A {@link DataOutput} that can be used to build a byte[]. * * @lucene.internal */
public final class GrowableByteArrayDataOutput extends DataOutput {
Minimum utf8 byte size of a string over which double pass over string is to save memory during encode
/** Minimum utf8 byte size of a string over which double pass over string is to save memory during encode */
static final int MIN_UTF8_SIZE_TO_ENABLE_DOUBLE_PASS_ENCODING = 65536;
The bytes
/** The bytes */
private byte[] bytes;
The length
/** The length */
private int length; // scratch for utf8 encoding of small strings private byte[] scratchBytes;
Create a GrowableByteArrayDataOutput with the given initial capacity.
/** Create a {@link GrowableByteArrayDataOutput} with the given initial capacity. */
public GrowableByteArrayDataOutput(int cp) { this.bytes = new byte[ArrayUtil.oversize(cp, 1)]; this.length = 0; } @Override public void writeByte(byte b) { if (length >= bytes.length) { bytes = ArrayUtil.grow(bytes); } bytes[length++] = b; } @Override public void writeBytes(byte[] b, int off, int len) { final int newLength = length + len; if (newLength > bytes.length) { bytes = ArrayUtil.grow(bytes, newLength); } System.arraycopy(b, off, bytes, length, len); length = newLength; } @Override public void writeString(String string) throws IOException { int maxLen = UnicodeUtil.maxUTF8Length(string.length()); if (maxLen <= MIN_UTF8_SIZE_TO_ENABLE_DOUBLE_PASS_ENCODING) { // string is small enough that we don't need to save memory by falling back to double-pass approach // this is just an optimized writeString() that re-uses scratchBytes. if (scratchBytes == null) { scratchBytes = new byte[ArrayUtil.oversize(maxLen, Character.BYTES)]; } else { scratchBytes = ArrayUtil.grow(scratchBytes, maxLen); } int len = UnicodeUtil.UTF16toUTF8(string, 0, string.length(), scratchBytes); writeVInt(len); writeBytes(scratchBytes, len); } else { // use a double pass approach to avoid allocating a large intermediate buffer for string encoding int numBytes = UnicodeUtil.calcUTF16toUTF8Length(string, 0, string.length()); writeVInt(numBytes); bytes = ArrayUtil.grow(bytes, length + numBytes); length = UnicodeUtil.UTF16toUTF8(string, 0, string.length(), bytes, length); } } public byte[] getBytes() { return bytes; } public int getPosition() { return length; } public void reset() { length = 0; } }