FrequencyTrieBuilders.java
/*******************************************************************************
* Copyright (C) 2026, Leo Galambos
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are met:
*
* 1. Redistributions of source code must retain the above copyright notice,
* this list of conditions and the following disclaimer.
*
* 2. Redistributions in binary form must reproduce the above copyright notice,
* this list of conditions and the following disclaimer in the documentation
* and/or other materials provided with the distribution.
*
* 3. All advertising materials mentioning features or use of this software must
* display the following acknowledgement:
* This product includes software developed by the Egothor project.
*
* 4. Neither the name of the copyright holder nor the names of its contributors
* may be used to endorse or promote products derived from this software
* without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
* AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
* POSSIBILITY OF SUCH DAMAGE.
******************************************************************************/
package org.egothor.stemmer;
import java.util.Objects;
import java.util.function.IntFunction;
import java.util.logging.Level;
import java.util.logging.Logger;
import org.egothor.stemmer.trie.CompiledNode;
/**
* Factory utilities related to {@link FrequencyTrie.Builder}.
*
* <p>
* This helper reconstructs writable builders from compiled read-only tries. The
* reconstruction preserves the semantics and local counts of the compiled trie
* as currently stored, which makes it suitable for subsequent modifications
* followed by recompilation.
*
* <p>
* Reconstruction operates on the compiled form. Therefore, if the compiled trie
* was produced using a reduction mode that merged semantically equivalent
* subtrees, the recreated builder reflects that reduced compiled state rather
* than the exact original unreduced insertion history.
*/
public final class FrequencyTrieBuilders {

    /**
     * Logger of this class.
     */
    private static final Logger LOGGER = Logger.getLogger(FrequencyTrieBuilders.class.getName());

    /**
     * Prevents instantiation; this class only exposes static factory methods.
     *
     * @throws AssertionError always
     */
    private FrequencyTrieBuilders() {
        throw new AssertionError("No instances.");
    }

    /**
     * Reconstructs a new writable builder from a compiled read-only trie.
     *
     * <p>
     * The compiled trie is walked from its root and every value stored at a node
     * is re-inserted into a fresh builder under the key spelled by the edge labels
     * on the path to that node, together with the count stored alongside it.
     * Callers may continue modifying the returned builder and then compile a new
     * {@link FrequencyTrie} instance.
     *
     * <p>
     * A {@link Level#FINE} log record is emitted once the copy has completed.
     *
     * @param source            source compiled trie
     * @param arrayFactory      array factory for the reconstructed builder
     * @param reductionSettings reduction settings to associate with the new builder
     * @param <V>               value type
     * @return reconstructed writable builder
     * @throws NullPointerException if any argument is {@code null}
     */
    public static <V> FrequencyTrie.Builder<V> copyOf(final FrequencyTrie<V> source,
            final IntFunction<V[]> arrayFactory, final ReductionSettings reductionSettings) {
        Objects.requireNonNull(source, "source");
        Objects.requireNonNull(arrayFactory, "arrayFactory");
        Objects.requireNonNull(reductionSettings, "reductionSettings");

        final FrequencyTrie.Builder<V> builder = new FrequencyTrie.Builder<>(arrayFactory, reductionSettings);

        // One shared buffer holds the key of the node currently being visited;
        // copyNode appends and removes one character per edge as it descends.
        final StringBuilder keyBuilder = new StringBuilder(64);
        copyNode(source.root(), keyBuilder, builder);

        LOGGER.log(Level.FINE, "Reconstructed writable builder from compiled trie.");
        return builder;
    }

    /**
     * Reconstructs a new writable builder from a compiled read-only trie using
     * default settings for the supplied reduction mode.
     *
     * <p>
     * This is a convenience overload that derives the settings through
     * {@link ReductionSettings#withDefaults(ReductionMode)} and delegates to
     * {@link #copyOf(FrequencyTrie, IntFunction, ReductionSettings)}.
     *
     * @param source        source compiled trie
     * @param arrayFactory  array factory for the reconstructed builder
     * @param reductionMode reduction mode to associate with the new builder
     * @param <V>           value type
     * @return reconstructed writable builder
     * @throws NullPointerException if any argument is {@code null}
     */
    public static <V> FrequencyTrie.Builder<V> copyOf(final FrequencyTrie<V> source,
            final IntFunction<V[]> arrayFactory, final ReductionMode reductionMode) {
        // Checked here so the failure names the caller's argument; the remaining
        // arguments are validated by the delegate.
        Objects.requireNonNull(reductionMode, "reductionMode");
        return copyOf(source, arrayFactory, ReductionSettings.withDefaults(reductionMode));
    }

    /**
     * Copies one compiled node and all reachable descendants into the target
     * builder.
     *
     * <p>
     * Values stored at {@code node} are inserted first, in their stored order,
     * under the key currently held in {@code keyBuilder}. Children are then
     * visited in edge order, depth first. The method recurses once per edge, so
     * the recursion depth equals the length of the longest key path below
     * {@code node}. On return {@code keyBuilder} holds the same content as on
     * entry.
     *
     * @param node       current compiled node
     * @param keyBuilder buffer holding the key of {@code node}; extended by one
     *                   character while each child is visited and restored
     *                   afterwards
     * @param builder    target mutable builder
     * @param <V>        value type
     */
    private static <V> void copyNode(final CompiledNode<V> node, final StringBuilder keyBuilder,
            final FrequencyTrie.Builder<V> builder) {
        final V[] values = node.orderedValues();
        if (values.length > 0) {
            final int[] counts = node.orderedCounts();
            // Every value at this node shares the same key, so materialize the
            // string once instead of once per value. Nodes without values skip
            // the allocation entirely.
            final String key = keyBuilder.toString();
            for (int valueIndex = 0; valueIndex < values.length; valueIndex++) {
                builder.put(key, values[valueIndex], counts[valueIndex]);
            }
        }

        final char[] edgeLabels = node.edgeLabels();
        final CompiledNode<V>[] children = node.children();
        for (int childIndex = 0; childIndex < edgeLabels.length; childIndex++) {
            keyBuilder.append(edgeLabels[childIndex]);
            copyNode(children[childIndex], keyBuilder, builder);
            // Drop the edge character again so the buffer is back at this node's key.
            keyBuilder.setLength(keyBuilder.length() - 1);
        }
    }
}