src/Atn/PredictionMode.php

*37748cd8SNickeau<?php
*37748cd8SNickeau
*37748cd8SNickeaudeclare(strict_types=1);
*37748cd8SNickeau
*37748cd8SNickeaunamespace Antlr\Antlr4\Runtime\Atn;
*37748cd8SNickeau
*37748cd8SNickeauuse Antlr\Antlr4\Runtime\Atn\SemanticContexts\SemanticContext;
*37748cd8SNickeauuse Antlr\Antlr4\Runtime\Atn\States\RuleStopState;
*37748cd8SNickeauuse Antlr\Antlr4\Runtime\Comparison\Equality;
*37748cd8SNickeauuse Antlr\Antlr4\Runtime\Comparison\Equivalence;
*37748cd8SNickeauuse Antlr\Antlr4\Runtime\Comparison\Hashable;
*37748cd8SNickeauuse Antlr\Antlr4\Runtime\Comparison\Hasher;
*37748cd8SNickeauuse Antlr\Antlr4\Runtime\Utils\BitSet;
*37748cd8SNickeauuse Antlr\Antlr4\Runtime\Utils\Map;
*37748cd8SNickeau
/**
 * This class enumerates the prediction modes available in ANTLR 4 and provides
 * utility methods for analyzing configuration sets for conflicts and/or
 * ambiguities.
 */
final class PredictionMode
{
    /**
     * The SLL(*) prediction mode. This prediction mode ignores the current
     * parser context when making predictions. This is the fastest prediction
     * mode, and provides correct results for many grammars. This prediction
     * mode is more powerful than the prediction mode provided by ANTLR 3, but
     * may result in syntax errors for grammar and input combinations which are
     * not SLL.
     *
     * When using this prediction mode, the parser will either return a correct
     * parse tree (i.e. the same parse tree that would be returned with the
     * {@see PredictionMode::LL} prediction mode), or it will report a syntax
     * error. If a syntax error is encountered when using the
     * {@see PredictionMode::SLL} prediction mode, it may be due to either
     * an actual syntax error in the input or indicate that the particular
     * combination of grammar and input requires the more powerful
     * {@see PredictionMode::LL} prediction abilities to complete successfully.
     *
     * This prediction mode does not provide any guarantees for prediction
     * behavior for syntactically-incorrect inputs.
     */
    public const SLL = 0;

    /**
     * The LL(*) prediction mode. This prediction mode allows the current parser
     * context to be used for resolving SLL conflicts that occur during
     * prediction. This is the fastest prediction mode that guarantees correct
     * parse results for all combinations of grammars with syntactically correct
     * inputs.
     *
     * When using this prediction mode, the parser will make correct decisions
     * for all syntactically-correct grammar and input combinations. However, in
     * cases where the grammar is truly ambiguous this prediction mode might not
     * report a precise answer for exactly which alternatives are ambiguous.
     *
     * This prediction mode does not provide any guarantees for prediction
     * behavior for syntactically-incorrect inputs.
     */
    public const LL = 1;

    /**
     * The LL(*) prediction mode with exact ambiguity detection. In addition to
     * the correctness guarantees provided by the {@see PredictionMode::LL}
     * prediction mode, this prediction mode instructs the prediction algorithm
     * to determine the complete and exact set of ambiguous alternatives for
     * every ambiguous decision encountered while parsing.
     *
     * This prediction mode may be used for diagnosing ambiguities during
     * grammar development. Due to the performance overhead of calculating sets
     * of ambiguous alternatives, this prediction mode should be avoided when
     * the exact results are not necessary.
     *
     * This prediction mode does not provide any guarantees for prediction
     * behavior for syntactically-incorrect inputs.
     */
    public const LL_EXACT_AMBIG_DETECTION = 2;

    /**
     * Computes the SLL prediction termination condition.
     *
     * This method computes the SLL prediction termination condition for both of
     * the following cases.
     *
     * - The usual SLL+LL fallback upon SLL conflict
     * - Pure SLL without LL fallback
     *
     * COMBINED SLL+LL PARSING
     *
     * When LL-fallback is enabled upon SLL conflict, correct predictions are
     * ensured regardless of how the termination condition is computed by this
     * method. Due to the substantially higher cost of LL prediction, the
     * prediction should only fall back to LL when the additional lookahead
     * cannot lead to a unique SLL prediction.
     *
     * Assuming combined SLL+LL parsing, an SLL configuration set with only
     * conflicting subsets should fall back to full LL, even if the
     * configuration sets don't resolve to the same alternative (e.g.
     * `{1,2}` and `{3,4}`). If there is at least one non-conflicting
     * configuration, SLL could continue with the hopes that more lookahead will
     * resolve via one of those non-conflicting configurations.
     *
     * Here's the prediction termination rule then: SLL (for SLL+LL parsing)
     * stops when it sees only conflicting configuration subsets. In contrast,
     * full LL keeps going when there is uncertainty.
     *
     * HEURISTIC
     *
     * As a heuristic, we stop prediction when we see any conflicting subset
     * unless we see a state that only has one alternative associated with it.
     * The single-alt-state thing lets prediction continue upon rules like
     * (otherwise, it would admit defeat too soon):
     *
     * `[12|1|[], 6|2|[], 12|2|[]]. s : (ID | ID ID?) ';' ;`
     *
     * When the ATN simulation reaches the state before `';'`, it has a
     * DFA state that looks like: `[12|1|[], 6|2|[], 12|2|[]]`. Naturally
     * `12|1|[]` and `12|2|[]` conflict, but we cannot stop processing this
     * node because alternative two has another way to continue, via `[6|2|[]]`.
     *
     * It also lets us continue for this rule:
     * `[1|1|[], 1|2|[], 8|3|[]] a : A | A | A B ;`
     *
     * After matching input A, we reach the stop state for rule `a`, state 1.
     * State 8 is the state right before B. Clearly alternatives 1 and 2
     * conflict and no amount of further lookahead will separate the two.
     * However, alternative 3 will be able to continue and so we do not stop
     * working on this state. In the previous example, we're concerned with
     * states associated with the conflicting alternatives. Here alt 3 is not
     * associated with the conflicting configs, but since we can continue
     * looking for input reasonably, don't declare the state done.
     *
     * PURE SLL PARSING
     *
     * To handle pure SLL parsing, all we have to do is make sure that we
     * combine stack contexts for configurations that differ only by semantic
     * predicate. From there, we can do the usual SLL termination heuristic.
     *
     * PREDICATES IN SLL+LL PARSING
     *
     * SLL decisions don't evaluate predicates until after they reach DFA stop
     * states because they need to create the DFA cache that works in all
     * semantic situations. In contrast, full LL evaluates predicates collected
     * during start state computation so it can ignore predicates thereafter.
     * This means that SLL termination detection can totally ignore semantic
     * predicates.
     *
     * Implementation-wise, {@see ATNConfigSet} combines stack contexts but not
     * semantic predicate contexts so we might see two configurations like the
     * following.
     *
     * `(s, 1, x, {}), (s, 1, x', {p})`
     *
     * Before testing these configurations against others, we have to merge
     * `x` and `x'` (without modifying the existing configurations).
     * For example, we test `(x+x') === x''` when looking for conflicts in
     * the following configurations.
     *
     * `(s, 1, x, {}), (s, 1, x', {p}), (s, 2, x'', {})`
     *
     * If the configuration set has predicates (as indicated by
     * {@see ATNConfigSet::$hasSemanticContext}), this algorithm makes a copy of
     * the configurations to strip out all of the predicates so that a standard
     * {@see ATNConfigSet} will merge everything ignoring predicates.
     *
     * @param int          $mode    One of the prediction mode constants of
     *                              this class.
     * @param ATNConfigSet $configs The configuration set to test.
     *
     * @return bool `true` if SLL prediction should stop for `configs`,
     *              otherwise `false`.
     */
    public static function hasSLLConflictTerminatingPrediction(int $mode, ATNConfigSet $configs) : bool
    {
        /* Configs in rule stop states indicate reaching the end of the decision
         * rule (local context) or end of start rule (full context). If all
         * configs meet this condition, then none of the configurations is able
         * to match additional input so we terminate prediction.
         */
        if (self::allConfigsInRuleStopStates($configs)) {
            return true;
        }

        // Pure SLL mode parsing. In combined SLL+LL mode we don't bother with
        // combining configs from different semantic contexts because we can
        // fail over to full LL; it costs more time since we'll often fail
        // over anyway.
        if ($mode === self::SLL && $configs->hasSemanticContext) {
            // Duplicate the configs, tossing out semantic predicates. The
            // original configurations are left untouched.
            $withoutPredicates = new ATNConfigSet();

            foreach ($configs->elements() as $config) {
                $withoutPredicates->add(new ATNConfig($config, null, null, SemanticContext::none()));
            }

            // Now we have combined contexts for configs with dissimilar preds.
            $configs = $withoutPredicates;
        }

        // Pure SLL or combined SLL+LL mode parsing.
        $altsets = self::getConflictingAltSubsets($configs);

        return self::hasConflictingAltSet($altsets) && !self::hasStateAssociatedWithOneAlt($configs);
    }

    /**
     * Checks if any configuration in `configs` is in a {@see RuleStopState}.
     * Configurations meeting this condition have reached the end of the decision
     * rule (local context) or end of start rule (full context).
     *
     * @param ATNConfigSet $configs The configuration set to test.
     *
     * @return bool `true` if any configuration in `configs` is in a
     *              {@see RuleStopState}, otherwise `false`.
     */
    public static function hasConfigInRuleStopState(ATNConfigSet $configs) : bool
    {
        foreach ($configs->elements() as $config) {
            if ($config->state instanceof RuleStopState) {
                return true;
            }
        }

        return false;
    }

    /**
     * Checks if all configurations in `configs` are in a {@see RuleStopState}.
     * Configurations meeting this condition have reached the end of the decision
     * rule (local context) or end of start rule (full context).
     *
     * @param ATNConfigSet $configs The configuration set to test.
     *
     * @return bool `true` if all configurations in `configs` are in a
     *              {@see RuleStopState} (including when `configs` yields no
     *              elements), otherwise `false`.
     */
    public static function allConfigsInRuleStopStates(ATNConfigSet $configs) : bool
    {
        foreach ($configs->elements() as $config) {
            if (!$config->state instanceof RuleStopState) {
                return false;
            }
        }

        return true;
    }

    /**
     * Full LL prediction termination.
     *
     * Can we stop looking ahead during ATN simulation or is there some
     * uncertainty as to which alternative we will ultimately pick, after
     * consuming more input? Even if there are partial conflicts, we might know
     * that everything is going to resolve to the same minimum alternative. That
     * means we can stop since no more lookahead will change that fact. On the
     * other hand, there might be multiple conflicts that resolve to different
     * minimums. That means we need more look ahead to decide which of those
     * alternatives we should predict.
     *
     * The basic idea is to split the set of configurations `C`, into
     * conflicting subsets `(s, _, ctx, _)` and singleton subsets with
     * non-conflicting configurations. Two configurations conflict if they have
     * identical {@see ATNConfig::$state} and {@see ATNConfig::$context} values
     * but different {@see ATNConfig::$alt} value, e.g. `(s, i, ctx, _)` and
     * `(s, j, ctx, _)` for `i!=j`.
     *
     * Reduce these configuration subsets to the set of possible alternatives.
     * You can compute the alternative subsets in one pass as follows:
     *
     * `A_s,ctx = {i | (s, i, ctx, _)}` for each configuration in `C` holding
     * `s` and `ctx` fixed.
     *
     * Or in pseudo-code, for each configuration `c` in `C`:
     *
     *     map[c] U= c.{@see ATNConfig::$alt} # map hash/equals uses s and x,
     *     not alt and not pred
     *
     * The values in `map` are the set of `A_s,ctx` sets.
     *
     * If `|A_s,ctx|=1` then there is no conflict associated with `s` and `ctx`.
     *
     * Reduce the subsets to singletons by choosing a minimum of each subset. If
     * the union of these alternative subsets is a singleton, then no amount of
     * more lookahead will help us. We will always pick that alternative. If,
     * however, there is more than one alternative, then we are uncertain which
     * alternative to predict and must continue looking for resolution. We may
     * or may not discover an ambiguity in the future, even if there are no
     * conflicting subsets this round.
     *
     * The biggest sin is to terminate early because it means we've made a
     * decision but were uncertain as to the eventual outcome. We haven't used
     * enough lookahead. On the other hand, announcing a conflict too late is no
     * big deal; you will still have the conflict. It's just inefficient. It
     * might even look until the end of file.
     *
     * No special consideration for semantic predicates is required because
     * predicates are evaluated on-the-fly for full LL prediction, ensuring that
     * no configuration contains a semantic context during the termination
     * check.
     *
     * CONFLICTING CONFIGS
     *
     * Two configurations `(s, i, x)` and `(s, j, x')`, conflict when `i!=j`
     * but `x=x'`. Because we merge all `(s, i, _)` configurations together,
     * that means that there are at most `n` configurations associated with
     * state `s` for `n` possible alternatives in the decision. The merged stacks
     * complicate the comparison of configuration contexts `x` and `x'`.
     * Sam checks to see if one is a subset of the other by calling merge and
     * checking to see if the merged result is either `x` or `x'`. If the `x`
     * associated with lowest alternative `i` is the superset, then `i` is the
     * only possible prediction since the others resolve to `min(i)` as well.
     * However, if `x` is associated with `j>i` then at least one stack
     * configuration for `j` is not in conflict with alternative `i`. The algorithm
     * should keep going, looking for more lookahead due to the uncertainty.
     *
     * For simplicity, I'm doing an equality check between `x` and `x'` that lets
     * the algorithm continue to consume lookahead longer than necessary. The
     * reason I like the equality is of course the simplicity but also because
     * that is the test you need to detect the alternatives that are actually
     * in conflict.
     *
     * CONTINUE/STOP RULE
     *
     * Continue if union of resolved alternative sets from non-conflicting and
     * conflicting alternative subsets has more than one alternative. We are
     * uncertain about which alternative to predict.
     *
     * The complete set of alternatives, `[i for (_,i,_)]`, tells us which
     * alternatives are still in the running for the amount of input we've
     * consumed at this point. The conflicting sets let us strip away
     * configurations that won't lead to more states because we resolve
     * conflicts to the configuration with a minimum alternate for the
     * conflicting set.
     *
     * CASES
     *
     * - no conflicts and more than 1 alternative in set => continue
     * - `(s, 1, x)`, `(s, 2, x)`, `(s, 3, z)`, `(s', 1, y)`, `(s', 2, y)`
     *   yields non-conflicting set `{3}` U conflicting sets `min({1,2})` U
     *   `min({1,2})` = `{1,3}` => continue
     * - `(s, 1, x)`, `(s, 2, x)`, `(s', 1, y)`, `(s', 2, y)`, `(s'', 1, z)`
     *   yields non-conflicting set `{1}` U conflicting sets `min({1,2})` U
     *   `min({1,2})` = `{1}` => stop and predict 1
     * - `(s, 1, x)`, `(s, 2, x)`, `(s', 1, y)`, `(s', 2, y)` yields conflicting,
     *   reduced sets `{1}` U `{1}` = `{1}` => stop and predict 1, can announce
     *   ambiguity `{1,2}`
     * - `(s, 1, x)`, `(s, 2, x)`, `(s', 2, y)`, `(s', 3, y)` yields conflicting,
     *   reduced sets `{1}` U `{2}` = `{1,2}` => continue
     * - `(s, 1, x)`, `(s, 2, x)`, `(s', 3, y)`, `(s', 4, y)` yields conflicting,
     *   reduced sets `{1}` U `{3}` = `{1,3}` => continue
     *
     * EXACT AMBIGUITY DETECTION
     *
     * If all states report the same conflicting set of alternatives, then we
     * know we have the exact ambiguity set.
     *
     * `|A_i|>1` and `A_i = A_j` for all i, j.
     *
     * In other words, we continue examining lookahead until all `A_i`
     * have more than one alternative and all `A_i` are the same. If
     * `A={{1,2}, {1,3}}`, then regular LL prediction would terminate
     * because the resolved set is `{1}`. To determine what the real
     * ambiguity is, we have to know whether the ambiguity is between one and
     * two or one and three so we keep going. We can only stop prediction when
     * we need exact ambiguity detection when the sets look like
     * `A={{1,2}}` or `{{1,2},{1,2}}`, etc...
     *
     * @param array<BitSet> $altsets a collection of alternative subsets
     *
     * @return int The single alternative every subset resolves to, as computed
     *             by {@see PredictionMode::getSingleViableAlt()}, or
     *             {@see ATN::INVALID_ALT_NUMBER} if the subsets resolve to
     *             different alternatives.
     */
    public static function resolvesToJustOneViableAlt(array $altsets) : int
    {
        return self::getSingleViableAlt($altsets);
    }

    /**
     * Determines if every alternative subset in `altsets` contains more
     * than one alternative.
     *
     * Note: this is implemented as the negation of
     * {@see PredictionMode::hasNonConflictingAltSet()}, i.e. it reports `true`
     * when no subset has a length of exactly 1.
     *
     * @param array<BitSet> $altsets a collection of alternative subsets
     *
     * @return bool `true` if every {@see BitSet} in `altsets` has
     *              {@see BitSet::length()} > 1, otherwise `false`.
     */
    public static function allSubsetsConflict(array $altsets) : bool
    {
        return !self::hasNonConflictingAltSet($altsets);
    }

    /**
     * Determines if any single alternative subset in `altsets` contains
     * exactly one alternative.
     *
     * @param array<BitSet> $altsets a collection of alternative subsets
     *
     * @return bool `true` if `altsets` contains a {@see BitSet} with
     *              {@see BitSet::length()} 1, otherwise `false`.
     */
    public static function hasNonConflictingAltSet(array $altsets) : bool
    {
        foreach ($altsets as $alts) {
            if ($alts->length() === 1) {
                return true;
            }
        }

        return false;
    }

    /**
     * Determines if any single alternative subset in `altsets` contains
     * more than one alternative.
     *
     * @param array<BitSet> $altsets a collection of alternative subsets
     *
     * @return bool `true` if `altsets` contains a {@see BitSet} with
     *              {@see BitSet::length()} > 1, otherwise `false`.
     */
    public static function hasConflictingAltSet(array $altsets) : bool
    {
        foreach ($altsets as $alts) {
            if ($alts->length() > 1) {
                return true;
            }
        }

        return false;
    }

    /**
     * Determines if every alternative subset in `altsets` is equivalent.
     *
     * Subsets are compared through {@see Equality::equals()} rather than with
     * the identity operator: the subsets produced by
     * {@see PredictionMode::getConflictingAltSubsets()} are always distinct
     * object instances, so an identity comparison could never report two of
     * them as equal.
     *
     * NOTE(review): this relies on {@see Equality::equals()} comparing
     * {@see BitSet} instances by their contents - confirm against the
     * `Comparison\Equality` and `Utils\BitSet` implementations.
     *
     * @param array<BitSet> $altsets a collection of alternative subsets
     *
     * @return bool `true` if every member of `altsets` is equal to
     *              the others (including when `altsets` has fewer than two
     *              members), otherwise `false`.
     */
    public static function allSubsetsEqual(array $altsets) : bool
    {
        $first = null;

        foreach ($altsets as $alts) {
            if ($first === null) {
                $first = $alts;

                continue;
            }

            if (!Equality::equals($alts, $first)) {
                return false;
            }
        }

        return true;
    }

    /**
     * Returns the unique alternative predicted by all alternative subsets in
     * `altsets`. If no such alternative exists, this method returns
     * {@see ATN::INVALID_ALT_NUMBER}.
     *
     * @param array<BitSet> $altsets a collection of alternative subsets
     *
     * @return int The only alternative present in the union of `altsets`, or
     *             {@see ATN::INVALID_ALT_NUMBER} when the union does not
     *             contain exactly one alternative.
     */
    public static function getUniqueAlt(array $altsets) : int
    {
        $all = self::getAlts($altsets);

        if ($all->length() === 1) {
            return $all->minValue();
        }

        return ATN::INVALID_ALT_NUMBER;
    }

    /**
     * Gets the complete set of represented alternatives for a collection of
     * alternative subsets. This method returns the union of each {@see BitSet}
     * in `altsets`.
     *
     * @param array<BitSet> $altsets a collection of alternative subsets.
     *
     * @return BitSet the set of represented alternatives in `altsets`.
     */
    public static function getAlts(array $altsets) : BitSet
    {
        $all = new BitSet();

        foreach ($altsets as $alts) {
            $all->or($alts);
        }

        return $all;
    }

    /**
     * This function gets the conflicting alt subsets from a configuration set.
     * For each configuration `c` in `configs`:
     *
     *     map[c] U= c.{@see ATNConfig::$alt} # map hash/equals uses s and x,
     *     not alt and not pred
     *
     * @param ATNConfigSet $configs The configuration set to partition.
     *
     * @return array<BitSet> One set of alternatives per distinct
     *                       (state number, context) pair found in `configs`.
     */
    public static function getConflictingAltSubsets(ATNConfigSet $configs) : array
    {
        // Custom equivalence: two configurations map to the same key when they
        // share the state number and the context; alternative and semantic
        // context are deliberately ignored.
        $configToAlts = new Map(new class implements Equivalence {
            public function equals(object $other) : bool
            {
                // Two equivalence relations are interchangeable only when the
                // *other* one is of this very same anonymous class.
                return $other instanceof self;
            }

            public function equivalent(Hashable $left, Hashable $right) : bool
            {
                return $left instanceof ATNConfig
                    && $right instanceof ATNConfig
                    && $left->state->stateNumber === $right->state->stateNumber
                    && Equality::equals($left->context, $right->context);
            }

            public function hash(Hashable $value) : int
            {
                if (!$value instanceof ATNConfig) {
                    throw new \InvalidArgumentException('Unsupported value.');
                }

                // Hash exactly the fields equivalent() compares.
                return Hasher::hash($value->state->stateNumber, $value->context);
            }
        });

        foreach ($configs->elements() as $config) {
            $alts = $configToAlts->get($config);

            if ($alts === null) {
                $alts = new BitSet();
                $configToAlts->put($config, $alts);
            }

            $alts->add($config->alt);
        }

        return $configToAlts->getValues();
    }

    /**
     * Get a map from state to alt subset from a configuration set. For each
     * configuration `c` in `configs`:
     *
     *     map[c.{@see ATNConfig::$state}] U= c.{@see ATNConfig::$alt}
     *
     * @param ATNConfigSet $configs The configuration set to index.
     *
     * @return Map A map whose keys are the states found in `configs` and whose
     *             values are {@see BitSet} instances holding the alternatives
     *             seen for each state.
     */
    public static function getStateToAltMap(ATNConfigSet $configs) : Map
    {
        $stateToAlts = new Map();

        foreach ($configs->elements() as $config) {
            $alts = $stateToAlts->get($config->state);

            if ($alts === null) {
                $alts = new BitSet();
                $stateToAlts->put($config->state, $alts);
            }

            $alts->add($config->alt);
        }

        return $stateToAlts;
    }

    /**
     * Determines if at least one state in `configs` is associated with exactly
     * one alternative, based on {@see PredictionMode::getStateToAltMap()}.
     *
     * @param ATNConfigSet $configs The configuration set to test.
     *
     * @return bool `true` if some state maps to a {@see BitSet} with
     *              {@see BitSet::length()} 1, otherwise `false`.
     */
    public static function hasStateAssociatedWithOneAlt(ATNConfigSet $configs) : bool
    {
        foreach (self::getStateToAltMap($configs)->getValues() as $alts) {
            if ($alts instanceof BitSet && $alts->length() === 1) {
                return true;
            }
        }

        return false;
    }

    /**
     * Reduces every alternative subset to its minimum alternative and reports
     * that minimum when it is the same for all subsets.
     *
     * @param array<BitSet> $altsets a collection of alternative subsets
     *
     * @return int The minimum alternative shared by all subsets,
     *             {@see ATN::INVALID_ALT_NUMBER} when two subsets have
     *             different minimums, or `0` when `altsets` is empty.
     */
    public static function getSingleViableAlt(array $altsets) : int
    {
        // 0 doubles as the "nothing seen yet" marker.
        $result = 0;

        foreach ($altsets as $alts) {
            // Normalise once so the strict comparison below operates on the
            // same integer value that is stored in $result.
            $minAlt = (int) $alts->minValue();

            if ($result === 0) {
                $result = $minAlt;
            } elseif ($result !== $minAlt) {
                // more than 1 viable alt
                return ATN::INVALID_ALT_NUMBER;
            }
        }

        return $result;
    }
}