// FrequencyTrieBuilders.java

/*******************************************************************************
 * Copyright (C) 2026, Leo Galambos
 * All rights reserved.
 * 
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 * 
 * 1. Redistributions of source code must retain the above copyright notice,
 *    this list of conditions and the following disclaimer.
 * 
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 *    this list of conditions and the following disclaimer in the documentation
 *    and/or other materials provided with the distribution.
 * 
 * 3. All advertising materials mentioning features or use of this software must
 *    display the following acknowledgement:
 *    This product includes software developed by the Egothor project.
 * 
 * 4. Neither the name of the copyright holder nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 * 
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 ******************************************************************************/
package org.egothor.stemmer;

import java.util.Objects;
import java.util.function.IntFunction;
import java.util.logging.Level;
import java.util.logging.Logger;

import org.egothor.stemmer.trie.CompiledNode;

/**
 * Factory utilities related to {@link FrequencyTrie.Builder}.
 *
 * <p>
 * This helper reconstructs writable builders from compiled read-only tries. The
 * reconstruction preserves the semantics and local counts of the compiled trie
 * as currently stored, which makes it suitable for subsequent modifications
 * followed by recompilation.
 *
 * <p>
 * Reconstruction operates on the compiled form. Therefore, if the compiled trie
 * was produced using a reduction mode that merged semantically equivalent
 * subtrees, the recreated builder reflects that reduced compiled state rather
 * than the exact original unreduced insertion history.
 *
 * <p>
 * The class is a static-only utility and cannot be instantiated.
 */
public final class FrequencyTrieBuilders {

    /**
     * Logger of this class.
     */
    private static final Logger LOGGER = Logger.getLogger(FrequencyTrieBuilders.class.getName());

    /**
     * Utility class; always throws to reject instantiation, including reflective
     * attempts.
     */
    private FrequencyTrieBuilders() {
        throw new AssertionError("No instances.");
    }

    /**
     * Reconstructs a new writable builder from a compiled read-only trie.
     *
     * <p>
     * The returned builder contains the same key-local value counts as the supplied
     * compiled trie. Callers may continue modifying the returned builder and then
     * compile a new {@link FrequencyTrie} instance.
     *
     * <p>
     * The compiled trie is walked depth-first from its root; every value stored at
     * a node is re-inserted into the new builder under the key spelled by the edge
     * labels on the path to that node, together with its stored count.
     *
     * @param source            source compiled trie
     * @param arrayFactory      array factory for the reconstructed builder
     * @param reductionSettings reduction settings to associate with the new builder
     * @param <V>               value type
     * @return reconstructed writable builder
     * @throws NullPointerException if any argument is {@code null}
     */
    public static <V> FrequencyTrie.Builder<V> copyOf(final FrequencyTrie<V> source,
            final IntFunction<V[]> arrayFactory, final ReductionSettings reductionSettings) {
        Objects.requireNonNull(source, "source");
        Objects.requireNonNull(arrayFactory, "arrayFactory");
        Objects.requireNonNull(reductionSettings, "reductionSettings");

        final FrequencyTrie.Builder<V> builder = new FrequencyTrie.Builder<>(arrayFactory, reductionSettings);
        // One shared buffer holds the key prefix of the node currently being visited.
        final StringBuilder keyBuilder = new StringBuilder(64);

        copyNode(source.root(), keyBuilder, builder);

        LOGGER.log(Level.FINE, "Reconstructed writable builder from compiled trie.");
        return builder;
    }

    /**
     * Reconstructs a new writable builder from a compiled read-only trie using
     * default settings for the supplied reduction mode.
     *
     * <p>
     * This overload derives the settings via
     * {@code ReductionSettings.withDefaults(reductionMode)} and delegates to
     * {@link #copyOf(FrequencyTrie, IntFunction, ReductionSettings)}.
     *
     * @param source        source compiled trie
     * @param arrayFactory  array factory for the reconstructed builder
     * @param reductionMode reduction mode to associate with the new builder
     * @param <V>           value type
     * @return reconstructed writable builder
     * @throws NullPointerException if any argument is {@code null}
     */
    public static <V> FrequencyTrie.Builder<V> copyOf(final FrequencyTrie<V> source,
            final IntFunction<V[]> arrayFactory, final ReductionMode reductionMode) {
        Objects.requireNonNull(reductionMode, "reductionMode");
        return copyOf(source, arrayFactory, ReductionSettings.withDefaults(reductionMode));
    }

    /**
     * Copies one compiled node and all reachable descendants into the target
     * builder.
     *
     * <p>
     * On entry {@code keyBuilder} holds the key of {@code node}. The buffer is
     * extended while descending into each child and restored afterwards, so it
     * holds the same content on return as on entry.
     *
     * @param node       current compiled node
     * @param keyBuilder current key builder; holds the key prefix leading to
     *                   {@code node}
     * @param builder    target mutable builder
     * @param <V>        value type
     */
    private static <V> void copyNode(final CompiledNode<V> node, final StringBuilder keyBuilder,
            final FrequencyTrie.Builder<V> builder) {
        final V[] values = node.orderedValues();
        if (values.length > 0) {
            // Materialize the key once per node rather than once per stored value.
            final String key = keyBuilder.toString();
            for (int valueIndex = 0; valueIndex < values.length; valueIndex++) {
                builder.put(key, values[valueIndex], node.orderedCounts()[valueIndex]);
            }
        }

        final int childCount = node.edgeLabels().length;
        // Remember the prefix length so the buffer is restored exactly, regardless of
        // how many characters an edge label contributes.
        final int prefixLength = keyBuilder.length();
        for (int childIndex = 0; childIndex < childCount; childIndex++) {
            keyBuilder.append(node.edgeLabels()[childIndex]);
            copyNode(node.children()[childIndex], keyBuilder, builder);
            keyBuilder.setLength(prefixLength);
        }
    }
}