rust/src/librustdoc/html/static/js/search.js

/* global addClass, getNakedUrl, getSettingValue */
/* global onEachLazy, removeClass, searchState, browserSupportsHistoryApi, exports */

"use strict";

// polyfill
// https://developer.mozilla.org/en-US/docs/Web/JavaScript/Reference/Global_Objects/Array/toSpliced
if (!Array.prototype.toSpliced) {
    // A regular `function` (not an arrow) is needed so that `this` is the receiver array.
    Array.prototype.toSpliced = function(...spliceArgs) {
        // Splice a shallow copy so the receiver itself is left untouched.
        const copy = this.slice();
        Array.prototype.splice.call(copy, ...spliceArgs);
        return copy;
    };
}

(function() {
// This mapping table should match the discriminants of
// `rustdoc::formats::item_type::ItemType` type in Rust.
//
// The position of a name in this array is its numeric item type (see
// `TY_GENERIC`, which is looked up by index), so entries must not be
// reordered. The trailing `// N` comments mark every fifth index.
const itemTypes = [
    "keyword",
    "primitive",
    "mod",
    "externcrate",
    "import",
    "struct", // 5
    "enum",
    "fn",
    "type",
    "static",
    "trait", // 10
    "impl",
    "tymethod",
    "method",
    "structfield",
    "variant", // 15
    "macro",
    "associatedtype",
    "constant",
    "associatedconstant",
    "union", // 20
    "foreigntype",
    "existential",
    "attr",
    "derive",
    "traitalias", // 25
    "generic", // 26
];

// Human-readable names for item types, laid out in parallel with `itemTypes`
// (for example index 7 is "fn" there and "function" here).
//
// The entry paired with "impl" (index 11) is the empty string, and there is no
// entry for "generic" (index 26): indexing with that type yields `undefined`.
const longItemTypes = [
    "keyword",
    "primitive type",
    "module",
    "extern crate",
    "re-export",
    "struct", // 5
    "enum",
    "function",
    "type alias",
    "static",
    "trait", // 10
    "",
    "trait method",
    "method",
    "struct field",
    "enum variant", // 15
    "macro",
    "assoc type",
    "constant",
    "assoc const",
    "union", // 20
    "foreign type",
    "existential type",
    "attribute macro",
    "derive macro",
    "trait alias", // 25
];

// Numeric item type of "generic"; used for special search precedence.
const TY_GENERIC = itemTypes.indexOf("generic");
// Falls back to "../" when there is no `window` global to read `rootPath` from.
const ROOT_PATH = typeof window === "undefined" ? "../" : window.rootPath;

/**
 * Reports whether `property` is an own (non-inherited) property of `obj`.
 *
 * The check goes through `Object.prototype.hasOwnProperty` directly, so it also
 * works for objects that shadow `hasOwnProperty` or have no prototype at all.
 *
 * @param {Object} obj
 * @param {string} property
 *
 * @return {boolean}
 */
function hasOwnPropertyRustdoc(obj, property) {
    const ownPropertyCheck = Object.prototype.hasOwnProperty;
    return ownPropertyCheck.call(obj, property);
}

/**
 * Switches the search display to tab number `nb`.
 *
 * The `nb`-th child of `#search-tabs` gets the "selected" class and the `nb`-th child of
 * `#results` gets the "active" class; every other child loses that class. When both
 * exist, `searchState.currentTab` is updated and the first `.search-corrections` element
 * is shown for type-based searches (any tab after the first, or when there is only one
 * tab) and hidden otherwise. When either is missing and `nb` is not 0, tab 0 is selected
 * instead.
 *
 * @param {number} nb - Zero-based index of the tab to show.
 */
function printTab(nb) {
    // Puts `className` on the `nb`-th child of the container and strips it from the rest.
    // Returns how many children were visited and whether the `nb`-th one was among them.
    const highlightNth = (containerId, className) => {
        let visited = 0;
        let hit = false;
        onEachLazy(document.getElementById(containerId).childNodes, node => {
            if (visited === nb) {
                addClass(node, className);
                hit = true;
            } else {
                removeClass(node, className);
            }
            visited += 1;
        });
        return {visited, hit};
    };

    const tabs = highlightNth("search-tabs", "selected");
    const isTypeSearch = (nb > 0 || tabs.visited === 1);
    const resultSets = highlightNth("results", "active");

    if (!(tabs.hit && resultSets.hit)) {
        // The requested tab does not exist: fall back to the first one.
        if (nb !== 0) {
            printTab(0);
        }
        return;
    }

    searchState.currentTab = nb;
    // Corrections only kick in on type-based searches.
    const corrections = document.getElementsByClassName("search-corrections");
    if (isTypeSearch) {
        removeClass(corrections[0], "hidden");
    } else {
        addClass(corrections[0], "hidden");
    }
}

/**
 * The [edit distance] is a metric for measuring the difference between two strings.
 *
 * [edit distance]: https://en.wikipedia.org/wiki/Edit_distance
 */

/*
 * This function was translated, mostly line-for-line, from
 * https://github.com/rust-lang/rust/blob/ff4b772f805ec1e/compiler/rustc_span/src/edit_distance.rs
 *
 * The current implementation is the restricted Damerau-Levenshtein algorithm. It is restricted
 * because it does not permit modifying characters that have already been transposed. The specific
 * algorithm should not matter to the caller of the methods, which is why it is not noted in the
 * documentation.
 */
const editDistanceState = {
    // Three row buffers of the dynamic-programming table. They are kept on the object so
    // that repeated calls reuse the same arrays instead of allocating new ones.
    current: [],
    prev: [],
    prevPrev: [],
    /**
     * Computes the restricted Damerau-Levenshtein distance between `a` and `b`.
     *
     * @param {string} a
     * @param {string} b
     * @param {number} limit - Largest distance the caller cares about.
     *
     * @return {number} - The distance, or `limit + 1` when it exceeds `limit`.
     */
    calculate: function calculate(a, b, limit) {
        // `shorter` sizes the row buffers, which keeps memory use minimal.
        let longer = a;
        let shorter = b;
        if (longer.length < shorter.length) {
            longer = b;
            shorter = a;
        }

        // The length difference is a lower bound on the distance.
        const lengthGap = longer.length - shorter.length;
        if (lengthGap > limit) {
            return limit + 1;
        }

        // Measure the common prefix and suffix; only `shorter` needs bounds checks.
        let head = 0;
        while (head < shorter.length && shorter[head] === longer[head]) {
            head += 1;
        }
        let shortEnd = shorter.length;
        let longEnd = longer.length;
        while (shortEnd > head && shorter[shortEnd - 1] === longer[longEnd - 1]) {
            shortEnd -= 1;
            longEnd -= 1;
        }

        // Nothing left of the shorter string: the distance is what remains of the longer.
        if (shortEnd === head) {
            return lengthGap;
        }

        longer = longer.substring(head, longEnd);
        shorter = shorter.substring(head, shortEnd);
        const rowCount = longer.length;
        const colCount = shorter.length;

        for (let col = 0; col <= colCount; col += 1) {
            this.current[col] = 0;
            this.prev[col] = col;
            this.prevPrev[col] = Number.MAX_VALUE;
        }

        for (let row = 1; row <= rowCount; row += 1) {
            const {current, prev, prevPrev} = this;
            const longChar = longer[row - 1];
            current[0] = row;

            for (let col = 1; col <= colCount; col += 1) {
                const shortChar = shorter[col - 1];
                // There is no cost to substitute a character with itself.
                const substitutionCost = longChar === shortChar ? 0 : 1;

                let best = Math.min(
                    // deletion
                    prev[col] + 1,
                    // insertion
                    current[col - 1] + 1,
                    // substitution
                    prev[col - 1] + substitutionCost
                );

                const isTransposition = row > 1 && col > 1 &&
                    longChar === shorter[col - 2] &&
                    longer[row - 2] === shortChar;
                if (isTransposition) {
                    best = Math.min(best, prevPrev[col - 2] + 1);
                }
                current[col] = best;
            }

            // Rotate the buffers, reusing the memory.
            this.prevPrev = prev;
            this.prev = current;
            this.current = prevPrev;
        }

        // The finished row is in `prev` because the buffers were rotated after it.
        const distance = this.prev[colCount];
        return distance <= limit ? distance : (limit + 1);
    },
};

/**
 * Convenience wrapper around `editDistanceState.calculate`.
 *
 * @param {string} a
 * @param {string} b
 * @param {number} limit
 *
 * @return {number} - The edit distance, or `limit + 1` when it exceeds `limit`.
 */
function editDistance(a, b, limit) {
    return editDistanceState.calculate(a, b, limit);
}

function initSearch(rawSearchIndex) {
    // NOTE(review): presumably the maximum number of results kept per search; the code
    // reading this constant is outside the visible excerpt — confirm.
    const MAX_RESULTS = 200;
    // NOTE(review): presumably the sentinel for "no type filter requested"; confirm
    // against the code that resolves type filters.
    const NO_TYPE_FILTER = -1;
    /**
     *  @type {Array<Row>}
     */
    let searchIndex;
    /**
     *  @type {Uint32Array}
     */
    let functionTypeFingerprint;
    // NOTE(review): not assigned or read in the visible excerpt; presumably holds the
    // most recent search results — confirm.
    let currentResults;
    /**
     * Map from normalized type names to integers. Used to make type search
     * more efficient.
     *
     * Entries are added and updated by `buildTypeMapIndex`.
     *
     * @type {Map<string, {id: integer, assocOnly: boolean}>}
     */
    let typeNameIdMap;
    // NOTE(review): populated outside the visible excerpt; presumably maps alias names
    // to the items they refer to — confirm.
    const ALIASES = new Map();

    /**
     * Special type name IDs for searching by array.
     */
    let typeNameIdOfArray;
    /**
     * Special type name IDs for searching by slice.
     */
    let typeNameIdOfSlice;
    /**
     * Special type name IDs for searching by both array and slice (`[]` syntax).
     */
    let typeNameIdOfArrayOrSlice;

    /**
     * Interns a type name: returns the integer ID stored for `name` in `typeNameIdMap`,
     * registering a new entry first when the name has not been seen yet. A new entry's ID
     * is the size of the map at the time it is added.
     *
     * Interning is keyed on the name alone, so two types with the same name but different
     * item kinds share one ID. An entry's `assocOnly` flag stays true only as long as
     * every registration of that name was for an assoc type.
     *
     * @param {string|null} name
     * @param {boolean} isAssocType - True if this is an assoc type
     *
     * @returns {integer|null} - The ID, or null if `name` is "" or null (pure generic).
     */
    function buildTypeMapIndex(name, isAssocType) {
        if (name === null || name === "") {
            return null;
        }

        if (!typeNameIdMap.has(name)) {
            const freshId = typeNameIdMap.size;
            typeNameIdMap.set(name, {id: freshId, assocOnly: isAssocType});
            return freshId;
        }

        const known = typeNameIdMap.get(name);
        known.assocOnly = isAssocType && known.assocOnly;
        return known.id;
    }

    /**
     * Returns `true` if `c` is `<` or `"`.
     *
     * @param {string} c
     *
     * @return {boolean}
     */
    function isSpecialStartCharacter(c) {
        const specialStarts = "<\"";
        return specialStarts.includes(c);
    }

    /**
     * Returns `true` if `c` is one of `=`, `,`, `>`, `-` or `]`.
     *
     * @param {string} c
     *
     * @return {boolean}
     */
    function isEndCharacter(c) {
        const endCharacters = "=,>-]";
        return endCharacters.includes(c);
    }

    /**
     * Returns `true` if `c` is a parenthesis (`(` or `)`).
     *
     * @param {string} c
     *
     * @return {boolean}
     */
    function isErrorCharacter(c) {
        const errorCharacters = "()";
        return errorCharacters.includes(c);
    }

    /**
     * Converts an item type name into its numeric item type, i.e. its index in
     * `itemTypes`.
     *
     * Throws `["Unknown type filter ", typename]` if the name is not in `itemTypes`.
     *
     * @param {string} typename
     *
     * @return {integer}
     */
    function itemTypeFromName(typename) {
        const position = itemTypes.indexOf(typename);
        if (position >= 0) {
            return position;
        }
        throw ["Unknown type filter ", typename];
    }

    /**
     * Parses a quoted (`"..."`) element. `parserState.pos` must be on the opening `"`;
     * on success it ends up just past the closing `"` and `query.literalSearch` is set.
     *
     * This function will throw an error in the following cases:
     * * We are parsing a generic argument.
     * * There is already another string element.
     * * There is more than one element.
     * * There is no closing `"`.
     * * The string contains a character that stops ident parsing before the closing `"`.
     * * The string is empty.
     *
     * @param {ParsedQuery} query
     * @param {ParserState} parserState
     * @param {boolean} isInGenerics
     */
    function getStringElem(query, parserState, isInGenerics) {
        if (isInGenerics) {
            throw ["Unexpected ", "\"", " in generics"];
        }
        if (query.literalSearch) {
            throw ["Cannot have more than one literal search element"];
        }
        const elemsOutsideGenerics = parserState.totalElems - parserState.genericsElems;
        if (elemsOutsideGenerics > 0) {
            throw ["Cannot use literal search when there is more than one element"];
        }

        // Step over the opening quote before scanning the content.
        const start = parserState.pos + 1;
        parserState.pos = start;
        const end = getIdentEndPosition(parserState);

        if (parserState.pos >= parserState.length) {
            throw ["Unclosed ", "\""];
        }
        const stoppedOn = parserState.userQuery[end];
        if (stoppedOn !== "\"") {
            throw ["Unexpected ", stoppedOn, " in a string element"];
        }
        if (start === end) {
            throw ["Cannot have empty string element"];
        }

        // To skip the quote at the end.
        parserState.pos += 1;
        query.literalSearch = true;
    }

    /**
     * Tells whether the two characters at the current parser position are "::".
     *
     * @param {ParserState} parserState
     *
     * @return {boolean}
     */
    function isPathStart(parserState) {
        const {userQuery, pos} = parserState;
        return userQuery.startsWith("::", pos);
    }

    /**
     * Tells whether the two characters at the current parser position are "->".
     *
     * @param {ParserState} parserState
     *
     * @return {boolean}
     */
    function isReturnArrow(parserState) {
        const {userQuery, pos} = parserState;
        return userQuery.startsWith("->", pos);
    }

    /**
     * Tells whether `c` may appear in an ident: an underscore, an ASCII digit or an
     * ASCII letter.
     *
     * @param {string} c
     *
     * @return {boolean}
     */
    function isIdentCharacter(c) {
        const between = (low, high) => c >= low && c <= high;
        return c === "_" || between("0", "9") || between("a", "z") || between("A", "Z");
    }

    /**
     * Tells whether `c` is a separator, i.e. `,` or `=`.
     *
     * @param {string} c
     *
     * @return {boolean}
     */
    function isSeparatorCharacter(c) {
        switch (c) {
            case ",":
            case "=":
                return true;
            default:
                return false;
        }
    }

    /**
     * Returns `true` if the given `c` character is a path separator. For example
     * `:` in `a::b` or a whitespace in `a b`.
     *
     * @param {string} c
     *
     * @return {boolean}
     */
    function isPathSeparator(c) {
        // Both a colon and a space can separate path segments.
        const pathSeparators = [":", " "];
        return pathSeparators.includes(c);
    }

    /**
     * Tells whether the closest character before the current parser position, ignoring
     * any spaces in between, is `lookingFor`.
     *
     * @param {ParserState} parserState
     * @param {String} lookingFor
     *
     * @return {boolean}
     */
    function prevIs(parserState, lookingFor) {
        for (let idx = parserState.pos - 1; idx >= 0; idx -= 1) {
            const ch = parserState.userQuery[idx];
            if (ch === lookingFor) {
                return true;
            }
            if (ch !== " ") {
                // A different non-space character sits in between.
                return false;
            }
        }
        return false;
    }

    /**
     * Tells whether the last element of `elems` has generics or, failing that, whether
     * the character preceding the current parser position (ignoring spaces) is `>`.
     *
     * @param {Array<QueryElement>} elems
     * @param {ParserState} parserState
     *
     * @return {boolean}
     */
    function isLastElemGeneric(elems, parserState) {
        if (elems.length > 0 && elems[elems.length - 1].generics.length > 0) {
            return true;
        }
        return prevIs(parserState, ">");
    }

    /**
     * Moves the parser position forward past any run of spaces, stopping on the first
     * non-space character or at the end of the query.
     *
     * @param {ParserState} parserState
     */
    function skipWhitespace(parserState) {
        const text = parserState.userQuery;
        while (parserState.pos < text.length && text[parserState.pos] === " ") {
            parserState.pos += 1;
        }
    }

    /**
     * Builds a `QueryElement` from a parsed name and its generics.
     *
     * The pending `parserState.typeFilter` and `parserState.isInBinding` are consumed
     * (read into the new element and reset to `null`). For regular paths,
     * `parserState.totalElems` (and `parserState.genericsElems` when `isInGenerics` is
     * set) is incremented; the never type `!` leaves those counters untouched.
     *
     * Entries of `generics` that carry a `bindingName` are moved into the element's
     * `bindings` map instead of its `generics` list.
     *
     * Throws an array of message fragments when the name is empty without generics, when
     * a literal search already has an element, when `!` is combined with a non-primitive
     * type filter or with generics, when the path starts or ends with `::` or contains
     * `:: ::`, when generics are given without a path, or when `!` appears after the
     * first path segment.
     *
     * @param {ParsedQuery} query
     * @param {ParserState} parserState
     * @param {string} name                  - Name of the query element.
     * @param {Array<QueryElement>} generics - List of generics of this query element.
     * @param {boolean} isInGenerics         - Whether the element is inside a generics list.
     *
     * @return {QueryElement}                - The newly created `QueryElement`.
     */
    function createQueryElement(query, parserState, name, generics, isInGenerics) {
        const path = name.trim();
        if (path.length === 0 && generics.length === 0) {
            throw ["Unexpected ", parserState.userQuery[parserState.pos]];
        }
        if (query.literalSearch && parserState.totalElems - parserState.genericsElems > 0) {
            throw ["Cannot have more than one element if you use quotes"];
        }
        const typeFilter = parserState.typeFilter;
        parserState.typeFilter = null;
        // Compare the trimmed name: the ident scanner keeps trailing spaces in `name`, and
        // "! " must be handled as the never type exactly like "!".
        if (path === "!") {
            if (typeFilter !== null && typeFilter !== "primitive") {
                throw [
                    "Invalid search type: primitive never type ",
                    "!",
                    " and ",
                    typeFilter,
                    " both specified",
                ];
            }
            if (generics.length !== 0) {
                throw [
                    "Never type ",
                    "!",
                    " does not accept generic parameters",
                ];
            }
            const bindingName = parserState.isInBinding;
            parserState.isInBinding = null;
            return {
                name: "never",
                id: null,
                fullPath: ["never"],
                pathWithoutLast: [],
                pathLast: "never",
                generics: [],
                bindings: new Map(),
                typeFilter: "primitive",
                bindingName,
            };
        }
        const quadcolon = /::\s*::/.exec(path);
        if (path.startsWith("::")) {
            throw ["Paths cannot start with ", "::"];
        } else if (path.endsWith("::")) {
            throw ["Paths cannot end with ", "::"];
        } else if (quadcolon !== null) {
            throw ["Unexpected ", quadcolon[0]];
        }
        // Segments are separated by `::`, by whitespace, or by a mix of both.
        const pathSegments = path.split(/(?:::\s*)|(?:\s+(?:::\s*)?)/);
        // In case we only have something like `<p>`, there is no name.
        if (pathSegments.length === 0 || (pathSegments.length === 1 && pathSegments[0] === "")) {
            if (generics.length > 0 || prevIs(parserState, ">")) {
                throw ["Found generics without a path"];
            } else {
                throw ["Unexpected ", parserState.userQuery[parserState.pos]];
            }
        }
        for (const [i, pathSegment] of pathSegments.entries()) {
            if (pathSegment === "!") {
                // `!` is only meaningful as the first segment, where it is the never type.
                if (i !== 0) {
                    throw ["Never type ", "!", " is not associated item"];
                }
                pathSegments[i] = "never";
            }
        }
        parserState.totalElems += 1;
        if (isInGenerics) {
            parserState.genericsElems += 1;
        }
        const bindingName = parserState.isInBinding;
        parserState.isInBinding = null;
        // Syntactically, bindings are parsed as generics,
        // but the query engine treats them differently.
        const bindings = new Map();
        const plainGenerics = [];
        for (const gen of generics) {
            if (gen.bindingName !== null) {
                bindings.set(gen.bindingName.name, [gen, ...gen.bindingName.generics]);
            } else {
                plainGenerics.push(gen);
            }
        }
        return {
            name: path,
            id: null,
            fullPath: pathSegments,
            pathWithoutLast: pathSegments.slice(0, pathSegments.length - 1),
            pathLast: pathSegments[pathSegments.length - 1],
            generics: plainGenerics,
            bindings,
            typeFilter,
            bindingName,
        };
    }

    /**
     * Scans forward from `parserState.pos` over one ident or path, advancing
     * `parserState.pos` as it goes, until it reaches a character that ends the ident or
     * the end of the query.
     *
     * Path separators (`::` and runs of spaces) are consumed as part of the ident. When
     * the ident contains a `!` directly after an ident character (`foo!`), the `!` is
     * excluded from the returned range and `parserState.typeFilter` is set to `"macro"`.
     *
     * Throws an array of message fragments on a character that cannot appear in an ident,
     * on a repeated or misplaced `!`, on a path that continues after a macro `!`, or when
     * a macro `!` conflicts with a type filter that is already set.
     *
     * @param {ParserState} parserState
     *
     * @return {integer} - Index just past the last character of the ident, i.e. an
     *                     exclusive end as expected by `slice(start, end)`.
     */
    function getIdentEndPosition(parserState) {
        const start = parserState.pos;
        let end = parserState.pos;
        // Index of the `!` seen so far, or -1 if there is none.
        let foundExclamation = -1;
        while (parserState.pos < parserState.length) {
            const c = parserState.userQuery[parserState.pos];
            if (!isIdentCharacter(c)) {
                if (c === "!") {
                    if (foundExclamation !== -1) {
                        throw ["Cannot have more than one ", "!", " in an ident"];
                    } else if (parserState.pos + 1 < parserState.length &&
                        isIdentCharacter(parserState.userQuery[parserState.pos + 1])
                    ) {
                        throw ["Unexpected ", "!", ": it can only be at the end of an ident"];
                    }
                    foundExclamation = parserState.pos;
                } else if (isErrorCharacter(c)) {
                    throw ["Unexpected ", c];
                } else if (isPathSeparator(c)) {
                    if (c === ":") {
                        // A lone `:` is not part of a path: stop here and leave it to
                        // the caller.
                        if (!isPathStart(parserState)) {
                            break;
                        }
                        // Skip current ":".
                        parserState.pos += 1;
                    } else {
                        // Collapse a run of spaces: stop on the last one so that the
                        // shared `pos += 1` below steps past it.
                        while (parserState.pos + 1 < parserState.length) {
                            const next_c = parserState.userQuery[parserState.pos + 1];
                            if (next_c !== " ") {
                                break;
                            }
                            parserState.pos += 1;
                        }
                    }
                    if (foundExclamation !== -1) {
                        if (foundExclamation !== start &&
                            isIdentCharacter(parserState.userQuery[foundExclamation - 1])
                        ) {
                            throw ["Cannot have associated items in macros"];
                        } else {
                            // while the never type has no associated macros, we still
                            // can parse a path like that
                            foundExclamation = -1;
                        }
                    }
                } else if (
                    c === "[" ||
                    isEndCharacter(c) ||
                    isSpecialStartCharacter(c) ||
                    isSeparatorCharacter(c)
                ) {
                    break;
                } else {
                    throw ["Unexpected ", c];
                }
            }
            parserState.pos += 1;
            end = parserState.pos;
        }
        // A `!` that directly follows an ident character marks a macro (`foo!`). A `!`
        // at `start` is not treated as a macro and stays inside the returned range.
        if (foundExclamation !== -1 &&
            foundExclamation !== start &&
            isIdentCharacter(parserState.userQuery[foundExclamation - 1])
        ) {
            if (parserState.typeFilter === null) {
                parserState.typeFilter = "macro";
            } else if (parserState.typeFilter !== "macro") {
                throw [
                    "Invalid search type: macro ",
                    "!",
                    " and ",
                    parserState.typeFilter,
                    " both specified",
                ];
            }
            // Exclude the `!` from the ident.
            end = foundExclamation;
        }
        return end;
    }

    /**
     * Parses the next query element starting at `parserState.pos` (after skipping
     * spaces) and appends it to `elems`.
     *
     * Three shapes are handled:
     * * `[...]`: the bracket content is parsed with `getItemsBefore` and a primitive
     *   `[]` element holding it as generics is pushed.
     * * an ident/path or a quoted string, optionally followed by `<...>` generics: an
     *   element built by `createQueryElement` is pushed.
     * * the same, but followed by `=`: nothing is pushed; instead the name and generics
     *   are stored in `parserState.isInBinding` as the key of a binding.
     *
     * If nothing could be parsed (no name and no generics), the function returns without
     * pushing anything. Errors are thrown as arrays of message fragments.
     *
     * @param {ParsedQuery} query
     * @param {ParserState} parserState
     * @param {Array<QueryElement>} elems - This is where the new {QueryElement} will be added.
     * @param {boolean} isInGenerics
     */
    function getNextElem(query, parserState, elems, isInGenerics) {
        const generics = [];

        skipWhitespace(parserState);
        let start = parserState.pos;
        let end;
        if (parserState.userQuery[parserState.pos] === "[") {
            parserState.pos += 1;
            getItemsBefore(query, parserState, generics, "]");
            // `getItemsBefore` restores the outer type filter and binding before
            // returning, so these are the values that apply to the `[]` element itself.
            const typeFilter = parserState.typeFilter;
            const isInBinding = parserState.isInBinding;
            if (typeFilter !== null && typeFilter !== "primitive") {
                throw [
                    "Invalid search type: primitive ",
                    "[]",
                    " and ",
                    typeFilter,
                    " both specified",
                ];
            }
            parserState.typeFilter = null;
            parserState.isInBinding = null;
            parserState.totalElems += 1;
            if (isInGenerics) {
                parserState.genericsElems += 1;
            }
            for (const gen of generics) {
                if (gen.bindingName !== null) {
                    throw ["Type parameter ", "=", " cannot be within slice ", "[]"];
                }
            }
            elems.push({
                name: "[]",
                id: null,
                fullPath: ["[]"],
                pathWithoutLast: [],
                pathLast: "[]",
                generics,
                typeFilter: "primitive",
                bindingName: isInBinding,
                bindings: new Map(),
            });
        } else {
            const isStringElem = parserState.userQuery[start] === "\"";
            // We handle the strings on their own mostly to make code easier to follow.
            if (isStringElem) {
                // Exclude both quotes from the `[start, end)` range of the name.
                start += 1;
                getStringElem(query, parserState, isInGenerics);
                end = parserState.pos - 1;
            } else {
                end = getIdentEndPosition(parserState);
            }
            if (parserState.pos < parserState.length &&
                parserState.userQuery[parserState.pos] === "<"
            ) {
                if (start >= end) {
                    throw ["Found generics without a path"];
                }
                parserState.pos += 1;
                getItemsBefore(query, parserState, generics, ">");
            }
            if (isStringElem) {
                skipWhitespace(parserState);
            }
            // Nothing was parsed: leave `elems` untouched.
            if (start >= end && generics.length === 0) {
                return;
            }
            if (parserState.userQuery[parserState.pos] === "=") {
                if (parserState.isInBinding) {
                    throw ["Cannot write ", "=", " twice in a binding"];
                }
                if (!isInGenerics) {
                    throw ["Type parameter ", "=", " must be within generics list"];
                }
                const name = parserState.userQuery.slice(start, end).trim();
                if (name === "!") {
                    throw ["Type parameter ", "=", " key cannot be ", "!", " never type"];
                }
                if (name.includes("!")) {
                    throw ["Type parameter ", "=", " key cannot be ", "!", " macro"];
                }
                if (name.includes("::")) {
                    throw ["Type parameter ", "=", " key cannot contain ", "::", " path"];
                }
                if (name.includes(":")) {
                    throw ["Type parameter ", "=", " key cannot contain ", ":", " type"];
                }
                // Remember the key; the next element created picks it up as its
                // `bindingName`.
                parserState.isInBinding = { name, generics };
            } else {
                elems.push(
                    createQueryElement(
                        query,
                        parserState,
                        parserState.userQuery.slice(start, end),
                        generics,
                        isInGenerics
                    )
                );
            }
        }
    }

    /**
     * This function parses the next query element until it finds `endChar`, calling `getNextElem`
     * to collect each element.
     *
     * If there is no `endChar`, this function will implicitly stop at the end without raising an
     * error.
     *
     * While parsing, `parserState.typeFilter` and `parserState.isInBinding` are cleared;
     * the values they had on entry are restored before returning. On return,
     * `parserState.pos` is one past the `endChar` (or one past the end of the query).
     *
     * Errors are thrown as arrays of message fragments, e.g. when the query ends before
     * `endChar` is found or when two elements are not separated by `,` or `=`.
     *
     * @param {ParsedQuery} query
     * @param {ParserState} parserState
     * @param {Array<QueryElement>} elems - This is where the new {QueryElement} will be added.
     * @param {string} endChar            - This function will stop when it'll encounter this
     *                                      character.
     */
    function getItemsBefore(query, parserState, elems, endChar) {
        // True when a new element may start here: at the beginning and after a separator
        // or a type filter.
        let foundStopChar = true;
        let start = parserState.pos;

        // If this is a generic, keep the outer item's type filter around.
        const oldTypeFilter = parserState.typeFilter;
        parserState.typeFilter = null;
        const oldIsInBinding = parserState.isInBinding;
        parserState.isInBinding = null;

        // Opening token matching `endChar`, used in error messages.
        let extra = "";
        if (endChar === ">") {
            extra = "<";
        } else if (endChar === "]") {
            extra = "[";
        } else if (endChar === "") {
            extra = "->";
        } else {
            extra = endChar;
        }

        while (parserState.pos < parserState.length) {
            const c = parserState.userQuery[parserState.pos];
            if (c === endChar) {
                if (parserState.isInBinding) {
                    throw ["Unexpected ", endChar, " after ", "="];
                }
                break;
            } else if (isSeparatorCharacter(c)) {
                parserState.pos += 1;
                foundStopChar = true;
                continue;
            } else if (c === ":" && isPathStart(parserState)) {
                throw ["Unexpected ", "::", ": paths cannot start with ", "::"];
            }  else if (c === ":") {
                // A single `:` turns the element parsed just before it into a type filter.
                if (parserState.typeFilter !== null) {
                    throw ["Unexpected ", ":"];
                }
                if (elems.length === 0) {
                    throw ["Expected type filter before ", ":"];
                } else if (query.literalSearch) {
                    throw ["Cannot use quotes on type filter"];
                }
                // The type filter doesn't count as an element since it's a modifier.
                const typeFilterElem = elems.pop();
                checkExtraTypeFilterCharacters(start, parserState);
                parserState.typeFilter = typeFilterElem.name;
                parserState.pos += 1;
                parserState.totalElems -= 1;
                query.literalSearch = false;
                foundStopChar = true;
                continue;
            } else if (isEndCharacter(c)) {
                throw ["Unexpected ", c, " after ", extra];
            }
            if (!foundStopChar) {
                // NOTE: this block-scoped `extra` (an array of message fragments)
                // shadows the outer string `extra`; the "Unclosed" errors further down
                // still use the outer one.
                let extra = [];
                if (isLastElemGeneric(query.elems, parserState)) {
                    extra = [" after ", ">"];
                } else if (prevIs(parserState, "\"")) {
                    throw ["Cannot have more than one element if you use quotes"];
                }
                if (endChar !== "") {
                    throw [
                        "Expected ",
                        ",",
                        ", ",
                        "=",
                        ", or ",
                        endChar,
                        ...extra,
                        ", found ",
                        c,
                    ];
                }
                throw [
                    "Expected ",
                    ",",
                    " or ",
                    "=",
                    ...extra,
                    ", found ",
                    c,
                ];
            }
            const posBefore = parserState.pos;
            start = parserState.pos;
            // Elements are parsed as generics whenever an `endChar` was given.
            getNextElem(query, parserState, elems, endChar !== "");
            if (endChar !== "" && parserState.pos >= parserState.length) {
                throw ["Unclosed ", extra];
            }
            // This case can be encountered if `getNextElem` encountered a "stop character" right
            // from the start. For example if you have `,,` or `<>`. In this case, we simply move up
            // the current position to continue the parsing.
            if (posBefore === parserState.pos) {
                parserState.pos += 1;
            }
            foundStopChar = false;
        }
        if (parserState.pos >= parserState.length && endChar !== "") {
            throw ["Unclosed ", extra];
        }
        // We are either at the end of the string or on the `endChar` character, let's move forward
        // in any case.
        parserState.pos += 1;

        parserState.typeFilter = oldTypeFilter;
        parserState.isInBinding = oldIsInBinding;
    }

    /**
     * Checks that the type filter doesn't have unwanted characters like `<>` (which are ignored
     * if empty).
     *
     * The text checked is `parserState.userQuery` from `start` up to (not including)
     * `parserState.pos`, with surrounding whitespace trimmed. An array of message
     * fragments is thrown for the first character that is not an ident character.
     *
     * @param {integer} start - Index in the user query where the type filter begins.
     * @param {ParserState} parserState
     */
    function checkExtraTypeFilterCharacters(start, parserState) {
        const query = parserState.userQuery.slice(start, parserState.pos).trim();

        // Iterate over the characters themselves. `for...in` would also visit any
        // enumerable property inherited from the prototype chain and report it as an
        // unexpected character.
        for (const c of query) {
            if (!isIdentCharacter(c)) {
                throw [
                    "Unexpected ",
                    c,
                    " in type filter (before ",
                    ":",
                    ")",
                ];
            }
        }
    }

    /**
     * Parses the user query held in `parserState.userQuery`, starting at `parserState.pos`,
     * and fills `query.elems` and `query.returned` with what it finds. `parserState.pos` is
     * advanced as the input is consumed.
     *
     * If it encounters an error while parsing, it throws an array of message fragments (not an
     * `Error` object).
     *
     * @param {ParsedQuery} query
     * @param {ParserState} parserState
     */
    function parseInput(query, parserState) {
        // `true` when a new element is allowed to start: at the very beginning, after an end
        // character, or after a type filter. Reset to `false` once an element has been read.
        let foundStopChar = true;
        // Position at which the most recently parsed element began. It is used to re-check the
        // raw text of that element if it turns out to be a type filter.
        let start = parserState.pos;

        // First pass: everything before the return arrow (if any).
        while (parserState.pos < parserState.length) {
            const c = parserState.userQuery[parserState.pos];
            if (isEndCharacter(c)) {
                foundStopChar = true;
                if (isSeparatorCharacter(c)) {
                    parserState.pos += 1;
                    continue;
                } else if (c === "-" || c === ">") {
                    // A real `->` ends the first pass; the second loop below handles it.
                    if (isReturnArrow(parserState)) {
                        break;
                    }
                    throw ["Unexpected ", c, " (did you mean ", "->", "?)"];
                }
                throw ["Unexpected ", c];
            } else if (c === ":" && !isPathStart(parserState)) {
                // A lone `:` (not the start of a path): the element parsed just before it is
                // a type filter for the element that follows.
                if (parserState.typeFilter !== null) {
                    throw [
                        "Unexpected ",
                        ":",
                        " (expected path after type filter ",
                        parserState.typeFilter + ":",
                        ")",
                    ];
                } else if (query.elems.length === 0) {
                    throw ["Expected type filter before ", ":"];
                } else if (query.literalSearch) {
                    throw ["Cannot use quotes on type filter"];
                }
                // The type filter doesn't count as an element since it's a modifier.
                const typeFilterElem = query.elems.pop();
                checkExtraTypeFilterCharacters(start, parserState);
                parserState.typeFilter = typeFilterElem.name;
                parserState.pos += 1;
                parserState.totalElems -= 1;
                query.literalSearch = false;
                foundStopChar = true;
                continue;
            } else if (c === " ") {
                skipWhitespace(parserState);
                continue;
            }
            // Any other character starts a new element, which is only legal right after a
            // stop character.
            if (!foundStopChar) {
                // Optional extra message fragments. The empty string spreads to nothing.
                let extra = "";
                if (isLastElemGeneric(query.elems, parserState)) {
                    extra = [" after ", ">"];
                } else if (prevIs(parserState, "\"")) {
                    throw ["Cannot have more than one element if you use quotes"];
                }
                // With a pending type filter, `:` is not offered as a valid continuation.
                if (parserState.typeFilter !== null) {
                    throw [
                        "Expected ",
                        ",",
                        " or ",
                        "->",
                        ...extra,
                        ", found ",
                        c,
                    ];
                }
                throw [
                    "Expected ",
                    ",",
                    ", ",
                    ":",
                    " or ",
                    "->",
                    ...extra,
                    ", found ",
                    c,
                ];
            }
            const before = query.elems.length;
            start = parserState.pos;
            getNextElem(query, parserState, query.elems, false);
            if (query.elems.length === before) {
                // Nothing was added, weird... Let's increase the position to not remain stuck.
                parserState.pos += 1;
            }
            foundStopChar = false;
        }
        // A type filter that is still pending here was never followed by an element.
        if (parserState.typeFilter !== null) {
            throw [
                "Unexpected ",
                ":",
                " (expected path after type filter ",
                parserState.typeFilter + ":",
                ")",
            ];
        }
        // Second pass: look for the return arrow and parse what follows into `query.returned`.
        while (parserState.pos < parserState.length) {
            if (isReturnArrow(parserState)) {
                parserState.pos += 2;
                skipWhitespace(parserState);
                // Get returned elements.
                getItemsBefore(query, parserState, query.returned, "");
                // Nothing can come afterward!
                if (query.returned.length === 0) {
                    throw ["Expected at least one item after ", "->"];
                }
                break;
            } else {
                parserState.pos += 1;
            }
        }
    }

    /**
     * Builds a blank `ParsedQuery` for the given user input: no elements, no error, no
     * correction, and all counters at zero.
     *
     * @param {string} userQuery
     *
     * @return {ParsedQuery}
     */
    function newParsedQuery(userQuery) {
        const lowered = userQuery.toLowerCase();
        // bloom filter build from type ids
        const fingerprint = new Uint32Array(4);

        const blank = {
            original: userQuery,
            userQuery: lowered,
            elems: [],
            returned: [],
        };
        // `foundElems`: total number of "top" elements (does not include generics).
        // `totalElems`: total number of elements (includes generics).
        blank.foundElems = 0;
        blank.totalElems = 0;
        blank.literalSearch = false;
        blank.error = null;
        blank.correction = null;
        blank.proposeCorrectionFrom = null;
        blank.proposeCorrectionTo = null;
        blank.typeFingerprint = fingerprint;
        return blank;
    }

    /**
     * Builds the URL of the current page with search parameters appended, followed by the
     * current location hash.
     *
     * @param {string} search            - The current search being performed.
     * @param {string|null} filterCrates - The current filtering crate (if any).
     *
     * @return {string}
     */
    function buildUrl(search, filterCrates) {
        const queryParts = ["?search=", encodeURIComponent(search)];

        // Only `null` means "no crate filter".
        if (filterCrates !== null) {
            queryParts.push("&filter-crate=", encodeURIComponent(filterCrates));
        }
        return getNakedUrl() + queryParts.join("") + window.location.hash;
    }

    /**
     * Reads the crate selected in the `#crate-search` element.
     *
     * @return {string|null} - The selected crate, or `null` when the element is missing, when
     *                         "all crates" is selected, or when the selected value is not an
     *                         own property of `rawSearchIndex`.
     */
    function getFilterCrates() {
        const selector = document.getElementById("crate-search");
        if (!selector) {
            return null;
        }

        const isSpecificCrate = selector.value !== "all crates";
        if (isSpecificCrate && hasOwnPropertyRustdoc(rawSearchIndex, selector.value)) {
            return selector.value;
        }
        return null;
    }

    /**
     * Parses the query.
     *
     * The supported syntax by this parser is given in the rustdoc book chapter
     * /src/doc/rustdoc/src/read-documentation/search.md
     *
     * When adding new things to the parser, add them there, too!
     *
     * If parsing throws, the returned query is a fresh, empty one whose `error` field holds
     * the thrown value.
     *
     * @param  {string} userQuery - The user query
     *
     * @return {ParsedQuery}      - The parsed query
     */
    function parseQuery(userQuery) {
        /**
         * Replaces the textual type filter of `elem` (and, recursively, of its generics and
         * binding constraints) with the value returned by `itemTypeFromName`, or with
         * `NO_TYPE_FILTER` when the element has no filter.
         */
        function convertTypeFilterOnElem(elem) {
            if (elem.typeFilter !== null) {
                let typeFilter = elem.typeFilter;
                // `const` is accepted as a shorthand for the `constant` item type.
                if (typeFilter === "const") {
                    typeFilter = "constant";
                }
                elem.typeFilter = itemTypeFromName(typeFilter);
            } else {
                elem.typeFilter = NO_TYPE_FILTER;
            }
            for (const elem2 of elem.generics) {
                convertTypeFilterOnElem(elem2);
            }
            for (const constraints of elem.bindings.values()) {
                for (const constraint of constraints) {
                    convertTypeFilterOnElem(constraint);
                }
            }
        }
        const normalizedQuery = userQuery.trim().replace(/\r|\n|\t/g, " ");
        // The parser scans the lowercased text, so its length must come from that same string:
        // lowercasing can change the number of UTF-16 code units (`İ` becomes `i` followed by
        // a combining dot), and a mismatched bound would make the parser stop short of, or
        // run past, the end of the text.
        const loweredQuery = normalizedQuery.toLowerCase();
        const parserState = {
            length: loweredQuery.length,
            pos: 0,
            // Total number of elements (includes generics).
            totalElems: 0,
            genericsElems: 0,
            typeFilter: null,
            isInBinding: null,
            userQuery: loweredQuery,
        };
        let query = newParsedQuery(normalizedQuery);

        try {
            parseInput(query, parserState);
            for (const elem of query.elems) {
                convertTypeFilterOnElem(elem);
            }
            for (const elem of query.returned) {
                convertTypeFilterOnElem(elem);
            }
        } catch (err) {
            // Discard whatever was parsed so far and report the error on an empty query.
            query = newParsedQuery(normalizedQuery);
            query.error = err;
            return query;
        }
        if (!query.literalSearch) {
            // If there is more than one element in the query, we switch to literalSearch in any
            // case.
            query.literalSearch = parserState.totalElems > 1;
        }
        query.foundElems = query.elems.length + query.returned.length;
        query.totalElems = parserState.totalElems;
        return query;
    }

    /**
     * Bundles the three result lists and the parsed query into a single results table.
     *
     * @param {Array<Result>} results_in_args
     * @param {Array<Result>} results_returned
     * @param {Array<Result>} results_others
     * @param {ParsedQuery} parsedQuery
     *
     * @return {ResultsTable}
     */
    function createQueryResults(results_in_args, results_returned, results_others, parsedQuery) {
        const table = {};
        table.in_args = results_in_args;
        table.returned = results_returned;
        table.others = results_others;
        table.query = parsedQuery;
        return table;
    }

    /**
     * Executes the parsed query and builds a {ResultsTable}.
     *
     * @param  {ParsedQuery} parsedQuery - The parsed user query
     * @param  {Object} searchWords      - The list of search words to query against
     * @param  {Object} [filterCrates]   - Crate to search in if defined
     * @param  {Object} [currentCrate]   - Current crate, to rank results from this crate higher
     *
     * @return {ResultsTable}
     */
    function execQuery(parsedQuery, searchWords, filterCrates, currentCrate) {
        const results_others = new Map(), results_in_args = new Map(),
            results_returned = new Map();

        /**
         * Turns ranked results into the matching `searchIndex` rows, decorated with display
         * data (`dist`, `displayPath`, `fullPath`, `href`).
         *
         * Results whose `id` is `-1` are dropped, rows that share a `fullPath` with an earlier
         * row are dropped, and the output is capped at `MAX_RESULTS` rows.
         *
         * @param {[ResultObject]} results
         * @returns {[ResultObject]}
         */
        function transformResults(results) {
            const seenPaths = new Set();
            const kept = [];

            for (const entry of results) {
                // `-1` marks a result that must be removed.
                if (entry.id === -1) {
                    continue;
                }

                const row = searchIndex[entry.id];
                row.dist = entry.dist;
                const hrefAndPath = buildHrefAndPath(row);
                row.displayPath = pathSplitter(hrefAndPath[0]);
                // The item type is part of the key so that items of different kinds sharing
                // a path and a name aren't considered duplicates.
                row.fullPath = row.displayPath + row.name + "|" + row.ty;

                if (!seenPaths.has(row.fullPath)) {
                    seenPaths.add(row.fullPath);
                    row.href = hrefAndPath[1];
                    kept.push(row);
                    if (kept.length >= MAX_RESULTS) {
                        break;
                    }
                }
            }
            return kept;
        }

        /**
         * Orders a result map from best to worst match and passes the ordered list through
         * `transformResults`.
         *
         * Each result is first annotated with `word` (its entry in `searchWords`) and `item`
         * (its entry in `searchIndex`, or an empty object when there is none). The ordering
         * criteria include exact match, edit distance, substring position and the crate the
         * item comes from; they are listed in priority order in the body.
         *
         * @param {Results} results
         * @param {boolean} isType - Not read by this function.
         * @param {string} preferredCrate
         * @returns {[ResultObject]}
         */
        function sortResults(results, isType, preferredCrate) {
            // Nothing to rank.
            if (results.size === 0) {
                return [];
            }

            const userQuery = parsedQuery.userQuery;
            const ranked = Array.from(results.values(), entry => {
                entry.word = searchWords[entry.id];
                entry.item = searchIndex[entry.id] || {};
                return entry;
            });

            const NUMERIC = false;
            const LEXICAL = true;
            // Ranking criteria, most significant first. Each one extracts a key from a result;
            // the first criterion whose keys differ decides the order. Numeric keys (booleans
            // included) are compared by subtraction, lexical keys with `>`.
            const criteria = [
                // exact match with regard to the last word (mismatch goes later)
                [r => r.word !== userQuery, NUMERIC],
                // index of keyword in item name (no literal occurrence goes later)
                [r => r.index < 0, NUMERIC],
                // distance in the path part, if specified
                // (less changes required to match means higher rankings)
                [r => r.path_dist, NUMERIC],
                // (later literal occurrence, if any, goes later)
                [r => r.index, NUMERIC],
                // distance in the name part, the last part of the path
                // (less changes required to match means higher rankings)
                [r => r.dist, NUMERIC],
                // deprecated items go later
                [r => r.item.deprecated, NUMERIC],
                // crate (current crate comes first)
                [r => r.item.crate !== preferredCrate, NUMERIC],
                // item name length (longer goes later)
                [r => r.word.length, NUMERIC],
                // item name (lexicographically larger goes later)
                [r => r.word, LEXICAL],
                // description (no description goes later)
                [r => r.item.desc === "", NUMERIC],
                // type (later occurrence in `itemTypes` goes later)
                [r => r.item.ty, NUMERIC],
                // path (lexicographically larger goes later)
                [r => r.item.path, LEXICAL],
            ];

            ranked.sort((lhs, rhs) => {
                for (const [keyOf, lexical] of criteria) {
                    const left = keyOf(lhs);
                    const right = keyOf(rhs);
                    if (left !== right) {
                        if (lexical) {
                            return (left > right ? +1 : -1);
                        }
                        return left - right;
                    }
                }
                // que sera, sera
                return 0;
            });

            return transformResults(ranked);
        }

        /**
         * This function checks if a list of search query `queryElems` can all be found in the
         * search index (`fnTypes`).
         *
         * This function returns `true` on a match, or `false` if none. If `solutionCb` is
         * supplied, it will call that function with mgens, and that callback can accept or
         * reject the result by returning `true` or `false`. If the callback returns false,
         * then this function will try with a different solution, or bail with false if it
         * runs out of candidates.
         *
         * @param {Array<FunctionType>} fnTypesIn - The objects to check.
         * @param {Array<QueryElement>} queryElems - The elements from the parsed query.
         * @param {[FunctionType]} whereClause - Trait bounds for generic items.
         * @param {Map<number,number>|null} mgensIn
         *     - Map functions generics to query generics (never modified).
         * @param {null|Map<number,number> -> bool} solutionCb - Called for each `mgens` solution.
         *
         * @return {boolean} - Returns true if a match, false otherwise.
         */
        function unifyFunctionTypes(fnTypesIn, queryElems, whereClause, mgensIn, solutionCb) {
            /**
             * Private copy of `mgensIn`, so the caller's map is never modified.
             *
             * @type Map<integer, integer>|null
             */
            const mgens = mgensIn === null ? null : new Map(mgensIn);
            // An empty query matches anything; only the callback can still reject it.
            if (queryElems.length === 0) {
                return !solutionCb || solutionCb(mgens);
            }
            // A non-empty query can't be matched against nothing.
            if (!fnTypesIn || fnTypesIn.length === 0) {
                return false;
            }
            const ql = queryElems.length;
            const fl = fnTypesIn.length;

            // One element fast path / base case
            if (ql === 1 && queryElems[0].generics.length === 0
                && queryElems[0].bindings.size === 0) {
                const queryElem = queryElems[0];
                // First, try every function type as a direct match for the query element.
                for (const fnType of fnTypesIn) {
                    if (!unifyFunctionTypeIsMatchCandidate(fnType, queryElem, whereClause, mgens)) {
                        continue;
                    }
                    if (fnType.id < 0 && queryElem.id < 0) {
                        // Both are generics: the function generic may only be bound to this
                        // query generic if it isn't already bound to a different one.
                        if (mgens && mgens.has(fnType.id) &&
                            mgens.get(fnType.id) !== queryElem.id) {
                            continue;
                        }
                        const mgensScratch = new Map(mgens);
                        mgensScratch.set(fnType.id, queryElem.id);
                        if (!solutionCb || solutionCb(mgensScratch)) {
                            return true;
                        }
                    } else if (!solutionCb || solutionCb(mgens ? new Map(mgens) : null)) {
                        // unifyFunctionTypeIsMatchCandidate already checks that ids match
                        return true;
                    }
                }
                // Then, try to find the query element inside each function type ("unboxing").
                for (const fnType of fnTypesIn) {
                    if (!unifyFunctionTypeIsUnboxCandidate(fnType, queryElem, whereClause, mgens)) {
                        continue;
                    }
                    if (fnType.id < 0) {
                        // A generic is unboxed through its where clause. `0` records that this
                        // generic has been committed to unboxing.
                        if (mgens && mgens.has(fnType.id) &&
                            mgens.get(fnType.id) !== 0) {
                            continue;
                        }
                        const mgensScratch = new Map(mgens);
                        mgensScratch.set(fnType.id, 0);
                        if (unifyFunctionTypes(
                            whereClause[(-fnType.id) - 1],
                            queryElems,
                            whereClause,
                            mgensScratch,
                            solutionCb
                        )) {
                            return true;
                        }
                    } else if (unifyFunctionTypes(
                        // A concrete type is unboxed into its generics and binding constraints.
                        [...fnType.generics, ...Array.from(fnType.bindings.values()).flat() ],
                        queryElems,
                        whereClause,
                        mgens ? new Map(mgens) : null,
                        solutionCb
                    )) {
                        return true;
                    }
                }
                return false;
            }

            // Multiple element recursive case
            /**
             * Working copy of `fnTypesIn`; it is mutated in place below.
             *
             * @type Array<FunctionType>
             */
            const fnTypes = fnTypesIn.slice();
            /**
             * Algorithm works by building up a solution set in the working arrays
             * fnTypes gets mutated in place to make this work, while queryElems
             * is left alone.
             *
             * It works backwards, because arrays can be cheaply truncated that way.
             *
             *                         vvvvvvv `queryElem`
             * queryElems = [ unknown, unknown, good, good, good ]
             * fnTypes    = [ unknown, unknown, good, good, good ]
             *                ^^^^^^^^^^^^^^^^ loop over these elements to find candidates
             *
             * Everything in the current working solution is known to be a good
             * match, but it might not be the match we wind up going with, because
             * there might be more than one candidate match, and we need to try them all
             * before giving up. So, to handle this, it backtracks on failure.
             */
            const flast = fl - 1;
            const qlast = ql - 1;
            const queryElem = queryElems[qlast];
            // `queryElems` without its last element; created lazily on the first candidate.
            let queryElemsTmp = null;
            for (let i = flast; i >= 0; i -= 1) {
                const fnType = fnTypes[i];
                if (!unifyFunctionTypeIsMatchCandidate(fnType, queryElem, whereClause, mgens)) {
                    continue;
                }
                let mgensScratch;
                if (fnType.id < 0) {
                    // Bind this function generic to the query generic, unless it is already
                    // bound to a different one.
                    mgensScratch = new Map(mgens);
                    if (mgensScratch.has(fnType.id)
                        && mgensScratch.get(fnType.id) !== queryElem.id) {
                        continue;
                    }
                    mgensScratch.set(fnType.id, queryElem.id);
                } else {
                    mgensScratch = mgens;
                }
                // fnTypes[i] is a potential match
                // fnTypes[flast] is the last item in the list
                // swap them, and drop the potential match from the list
                // check if the remaining function types also match
                fnTypes[i] = fnTypes[flast];
                fnTypes.length = flast;
                if (!queryElemsTmp) {
                    queryElemsTmp = queryElems.slice(0, qlast);
                }
                const passesUnification = unifyFunctionTypes(
                    fnTypes,
                    queryElemsTmp,
                    whereClause,
                    mgensScratch,
                    // Called for each way of matching the remaining query elements. It then
                    // checks the generics and bindings of the current pair.
                    mgensScratch => {
                        if (fnType.generics.length === 0 && queryElem.generics.length === 0
                            && fnType.bindings.size === 0 && queryElem.bindings.size === 0) {
                            return !solutionCb || solutionCb(mgensScratch);
                        }
                        const solution = unifyFunctionTypeCheckBindings(
                            fnType,
                            queryElem,
                            whereClause,
                            mgensScratch
                        );
                        if (!solution) {
                            return false;
                        }
                        const simplifiedGenerics = solution.simplifiedGenerics;
                        for (const simplifiedMgens of solution.mgens) {
                            const passesUnification = unifyFunctionTypes(
                                simplifiedGenerics,
                                queryElem.generics,
                                whereClause,
                                simplifiedMgens,
                                solutionCb
                            );
                            if (passesUnification) {
                                return true;
                            }
                        }
                        return false;
                    }
                );
                if (passesUnification) {
                    return true;
                }
                // backtrack
                fnTypes[flast] = fnTypes[i];
                fnTypes[i] = fnType;
                fnTypes.length = fl;
            }
            // No direct match worked: try replacing each function type with what it contains
            // (where clause for generics, generics otherwise, plus binding constraints) and
            // match the whole query against that expanded list.
            for (let i = flast; i >= 0; i -= 1) {
                const fnType = fnTypes[i];
                if (!unifyFunctionTypeIsUnboxCandidate(fnType, queryElem, whereClause, mgens)) {
                    continue;
                }
                let mgensScratch;
                if (fnType.id < 0) {
                    mgensScratch = new Map(mgens);
                    if (mgensScratch.has(fnType.id) && mgensScratch.get(fnType.id) !== 0) {
                        continue;
                    }
                    mgensScratch.set(fnType.id, 0);
                } else {
                    mgensScratch = mgens;
                }
                const generics = fnType.id < 0 ?
                    whereClause[(-fnType.id) - 1] :
                    fnType.generics;
                const bindings = fnType.bindings ?
                    Array.from(fnType.bindings.values()).flat() :
                    [];
                const passesUnification = unifyFunctionTypes(
                    // `toSpliced` returns a copy, so `fnTypes` itself is left untouched here.
                    fnTypes.toSpliced(i, 1, ...generics, ...bindings),
                    queryElems,
                    whereClause,
                    mgensScratch,
                    solutionCb
                );
                if (passesUnification) {
                    return true;
                }
            }
            return false;
        }
        /**
         * Cheap pre-check telling whether `fnType` could be matched directly with `queryElem`.
         *
         * Only tests that need no backtracking live here. The name/id comparison is
         * load-bearing: nothing else rejects differently-named items. The generics and
         * bindings count checks are not load-bearing; they just avoid pointless backtracking
         * later.
         *
         * @param {FunctionType} fnType
         * @param {QueryElement} queryElem
         * @param {[FunctionSearchType]} whereClause - Trait bounds for generic items (not read
         *                                             by this function).
         * @param {Map<number,number>|null} mgensIn - Map functions generics to query generics.
         * @returns {boolean}
         */
        function unifyFunctionTypeIsMatchCandidate(fnType, queryElem, whereClause, mgensIn) {
            // type filters look like `trait:Read` or `enum:Result`
            if (!typePassesFilter(queryElem.typeFilter, fnType.ty)) {
                return false;
            }

            // A negative id means "generic", on either side.
            // mgensIn[fnType.id] = queryElem.id records an existing pairing; a value of 0 means
            // the generic was matched with a bare trait, and that decision must hold everywhere.
            const bothGeneric = fnType.id < 0 && queryElem.id < 0;
            if (bothGeneric) {
                if (!mgensIn) {
                    return true;
                }
                if (mgensIn.has(fnType.id) && mgensIn.get(fnType.id) !== queryElem.id) {
                    return false;
                }
                for (const [fid, qid] of mgensIn.entries()) {
                    // An existing pairing must agree on both sides or on neither: the same
                    // function generic can't map to another query generic, and vice versa.
                    const sameFnGeneric = fnType.id === fid;
                    const sameQueryGeneric = queryElem.id === qid;
                    if (sameFnGeneric !== sameQueryGeneric) {
                        return false;
                    }
                }
                return true;
            }

            // [] matches primitive:array or primitive:slice
            const arrayOrSliceMatch = queryElem.id === typeNameIdOfArrayOrSlice &&
                (fnType.id === typeNameIdOfSlice || fnType.id === typeNameIdOfArray);
            if (!arrayOrSliceMatch && (fnType.id !== queryElem.id || queryElem.id === null)) {
                return false;
            }

            // A query element with generics can't match a function type that has neither
            // generics nor bindings.
            const fnParamCount = fnType.generics.length + fnType.bindings.size;
            if (fnParamCount === 0 && queryElem.generics.length !== 0) {
                return false;
            }
            if (fnType.bindings.size < queryElem.bindings.size) {
                return false;
            }

            // If the query element is a path (it contains `::`), its leading segments must
            // appear, in order, among the segments of the function type's path.
            const wantedPath = queryElem.pathWithoutLast;
            const wantedLength = wantedPath.length;
            if (wantedLength === 0) {
                return true;
            }
            const hasPath = fnType.path !== undefined && fnType.path !== null;
            const actualPath = hasPath ? fnType.path.split("::") : [];
            // A query path longer than the type's path can't possibly fit.
            if (wantedLength > actualPath.length) {
                return false;
            }
            let matched = 0;
            for (let k = 0; k < actualPath.length && matched < wantedLength; k += 1) {
                if (actualPath[k] === wantedPath[matched]) {
                    matched += 1;
                }
            }
            // Every segment of the query path must have been found.
            return matched >= wantedLength;
        }
        /**
         * Checks the associated type bindings of `fnType` against those of `queryElem`.
         *
         * Bindings named by the query are unified with the function's bindings of the same
         * name. Bindings the query doesn't mention are converted to generics and appended to
         * the function's own generics. For example, given
         *
         *     Iterator<Item=u32>
         *
         * if queryElem itself has an `Item=` in it, nothing is appended. If queryElem has no
         * `Item=`, the ID of u32 is appended, and the rest of the matching engine acts as if
         * `Iterator<u32>` were the type instead.
         *
         * @param {FunctionType} fnType
         * @param {QueryElement} queryElem
         * @param {[FunctionType]} whereClause - Trait bounds for generic items.
         * @param {Map<number,number>} mgensIn - Map functions generics to query generics.
         *                                            Never modified.
         * @returns {false|{mgens: [Map<number,number>], simplifiedGenerics: [FunctionType]}}
         */
        function unifyFunctionTypeCheckBindings(fnType, queryElem, whereClause, mgensIn) {
            // The query can't ask for more bindings than the function type has.
            if (fnType.bindings.size < queryElem.bindings.size) {
                return false;
            }
            const ownGenerics = fnType.generics || [];
            // No bindings at all: the generics are already as simple as they get.
            if (!(fnType.bindings.size > 0)) {
                return { simplifiedGenerics: ownGenerics, mgens: [mgensIn] };
            }

            // Every generics mapping that is still viable after the bindings checked so far.
            let viableMgens = [mgensIn];
            for (const [name, constraints] of queryElem.bindings.entries()) {
                if (viableMgens.length === 0 || !fnType.bindings.has(name)) {
                    return false;
                }
                const fnConstraints = fnType.bindings.get(name);
                const nextViable = [];
                for (const mgens of viableMgens) {
                    unifyFunctionTypes(
                        fnConstraints,
                        constraints,
                        whereClause,
                        mgens,
                        candidate => {
                            nextViable.push(candidate);
                            // Rejecting every candidate makes unifyFunctionTypes keep going,
                            // so the full set of possible solutions gets collected.
                            return false;
                        }
                    );
                }
                viableMgens = nextViable;
            }
            if (viableMgens.length === 0) {
                return false;
            }

            // Constraints of the bindings that the query did not name.
            const unclaimed = Array.from(fnType.bindings.entries())
                .filter(([name]) => !queryElem.bindings.has(name))
                .flatMap(([, constraints]) => constraints);
            const simplifiedGenerics = ownGenerics.length > 0 ?
                [...ownGenerics, ...unclaimed] :
                unclaimed;
            return { simplifiedGenerics, mgens: viableMgens };
        }
        /**
         * Tells whether `queryElem` might be found by looking inside `fnType` instead of
         * matching `fnType` itself: inside its where clause when `fnType` is a generic and
         * the query element is not, inside its generics and binding constraints otherwise.
         *
         * @param {FunctionType} fnType
         * @param {QueryElement} queryElem
         * @param {[FunctionType]} whereClause - Trait bounds for generic items.
         * @param {Map<number,number>|null} mgens - Map functions generics to query generics.
         * @returns {boolean}
         */
        function unifyFunctionTypeIsUnboxCandidate(fnType, queryElem, whereClause, mgens) {
            const genericVersusConcrete = fnType.id < 0 && queryElem.id >= 0;

            if (!genericVersusConcrete) {
                if (fnType.generics.length > 0 || fnType.bindings.size > 0) {
                    const constraintTypes = Array.from(fnType.bindings.values()).flat();
                    const inner = [...fnType.generics, ...constraintTypes];
                    return checkIfInList(inner, queryElem, whereClause, mgens);
                }
                return false;
            }

            if (!whereClause) {
                return false;
            }
            // mgens[fnType.id] === 0 indicates that we committed to unboxing this generic
            // mgens[fnType.id] === null indicates that we haven't decided yet
            // Any other value means the generic is already matched with a query generic.
            const boundElsewhere = mgens && mgens.has(fnType.id) && mgens.get(fnType.id) !== 0;
            if (boundElsewhere) {
                return false;
            }
            // Where clauses can represent cyclical data.
            // `null` prevents it from trying to unbox in an infinite loop
            const guardedMgens = new Map(mgens);
            guardedMgens.set(fnType.id, null);
            // This is only a potential unbox if the search query appears in the where clause
            // for example, searching `Read -> usize` should find
            // `fn read_all<R: Read>(R) -> Result<usize>`
            // generic `R` is considered "unboxed"
            const bounds = whereClause[(-fnType.id) - 1];
            return checkIfInList(bounds, queryElem, whereClause, guardedMgens);
        }

        /**
         * Checks whether at least one entry of `list` matches the query element `elem`,
         * as decided by `checkType`. Stops at the first entry that matches.
         *
         * @param {Array<FunctionType>} list
         * @param {QueryElement} elem          - The element from the parsed query.
         * @param {[FunctionType]} whereClause - Trait bounds for generic items.
         * @param {Map<number,number>|null} mgens - Map functions generics to query generics.
         *
         * @return {boolean} - Returns true if found, false otherwise.
         */
        function checkIfInList(list, elem, whereClause, mgens) {
            return list.some(entry => checkType(entry, elem, whereClause, mgens));
        }

        /**
         * Checks whether `row` matches the query element `elem`, looking into the generics
         * of `row` as well.
         *
         * When neither side has bindings, two shortcuts avoid the full unification:
         *
         * * `elem` has a negative id: it matches a `row` with a negative id, or anything
         *   found in the generics of `row`.
         * * `elem` is a plain name (positive id, no path, no generics, passes the type
         *   filter, and is not the array-or-slice special case) and `row` has a positive id:
         *   it matches on equal ids, or on anything found in the generics of `row`.
         *
         * Everything else is handed to `unifyFunctionTypes`.
         *
         * @param {Row} row
         * @param {QueryElement} elem          - The element from the parsed query.
         * @param {[FunctionType]} whereClause - Trait bounds for generic items.
         * @param {Map<number,number>|null} mgens - Map functions generics to query generics.
         *
         * @return {boolean} - Returns true if the type matches, false otherwise.
         */
        function checkType(row, elem, whereClause, mgens) {
            if (row.bindings.size !== 0 || elem.bindings.size !== 0) {
                return unifyFunctionTypes([row], [elem], whereClause, mgens);
            }
            if (elem.id < 0) {
                return row.id < 0 || checkIfInList(row.generics, elem, whereClause, mgens);
            }
            const isPlainAtom = row.id > 0 && elem.id > 0 &&
                elem.pathWithoutLast.length === 0 &&
                typePassesFilter(elem.typeFilter, row.ty) &&
                elem.generics.length === 0 &&
                // special case
                elem.id !== typeNameIdOfArrayOrSlice;
            if (!isPlainAtom) {
                return unifyFunctionTypes([row], [elem], whereClause, mgens);
            }
            return row.id === elem.id || checkIfInList(row.generics, elem, whereClause, mgens);
        }

        /**
         * Computes how far the path of `ty` is from the path segments in `contains`.
         *
         * The path of `ty` (split on `::`, followed by the lower-cased parent name when there
         * is one) is scanned from the end for a run of consecutive segments where every
         * segment is within `maxEditDistance` of the matching entry of `contains`. The score
         * of a run is the rounded average of its segment distances.
         *
         * @param {Array<string>} contains - Path segments to look for.
         * @param {Row} ty
         * @param {integer} maxEditDistance
         *
         * @return {integer} - 0 if `contains` is empty, the best score found, or
         *                     `maxEditDistance + 1` when no run qualifies.
         */
        function checkPath(contains, ty, maxEditDistance) {
            const wanted = contains.length;
            if (wanted === 0) {
                return 0;
            }

            const segments = ty.path.split("::");
            if (ty.parent && ty.parent.name) {
                segments.push(ty.parent.name.toLowerCase());
            }

            let best = maxEditDistance + 1;
            for (let start = segments.length - wanted; start >= 0; start -= 1) {
                let sum = 0;
                let withinBudget = true;
                for (let offset = 0; offset < wanted && withinBudget; ++offset) {
                    const dist = editDistance(
                        segments[start + offset],
                        contains[offset],
                        maxEditDistance
                    );
                    if (dist > maxEditDistance) {
                        // One segment is too far off: give up on this starting position.
                        withinBudget = false;
                    } else {
                        sum += dist;
                    }
                }
                if (withinBudget) {
                    best = Math.min(best, Math.round(sum / wanted));
                }
            }
            return best;
        }

        /**
         * Tells whether an item of kind `type` is acceptable for the type filter `filter`.
         *
         * Besides "no filter" and an exact match, a few filters also accept related kinds:
         * `constant` accepts associated constants, `fn` accepts methods and trait methods,
         * `type` accepts primitives and associated types, `trait` accepts trait aliases.
         *
         * @param {integer} filter - Index into `itemTypes`, or a value `<= NO_TYPE_FILTER`.
         * @param {integer} type   - Index into `itemTypes`.
         *
         * @return {boolean}
         */
        function typePassesFilter(filter, type) {
            // No filter
            if (filter <= NO_TYPE_FILTER) {
                return true;
            }
            // Exact match
            if (filter === type) {
                return true;
            }

            // Match related items
            const wanted = itemTypes[filter];
            const actual = itemTypes[type];
            if (wanted === "constant") {
                return actual === "associatedconstant";
            }
            if (wanted === "fn") {
                return actual === "method" || actual === "tymethod";
            }
            if (wanted === "type") {
                return actual === "primitive" || actual === "associatedtype";
            }
            if (wanted === "trait") {
                return actual === "traitalias";
            }

            // No match
            return false;
        }

        /**
         * Builds a new result object for a doc alias from a search index item: the listed
         * fields are copied over and `is_alias` is set, leaving `item` itself untouched.
         *
         * @param {Row} item
         *
         * @return {Object}
         */
        function createAliasFromItem(item) {
            const {
                crate,
                name,
                path,
                desc,
                ty,
                parent,
                type,
                deprecated,
                implDisambiguator,
            } = item;
            return {
                crate,
                name,
                path,
                desc,
                ty,
                parent,
                type,
                is_alias: true,
                deprecated,
                implDisambiguator,
            };
        }

        /**
         * Looks up `query` (case-insensitively) among the doc aliases and puts every match at
         * the front of `ret.others`, keeping `ret.others` at `MAX_RESULTS` entries at most.
         *
         * With a crate filter only that crate's aliases are considered. Without one, every
         * crate is considered and the aliases of `currentCrate` end up ahead of the others.
         *
         * @param {ResultsTable} ret
         * @param {string} query
         * @param {string|null} filterCrates
         * @param {string} currentCrate
         */
        function handleAliases(ret, query, filterCrates, currentCrate) {
            const needle = query.toLowerCase();
            // Current-crate aliases are kept apart because they have to be displayed before
            // the other ones.
            const otherAliases = [];
            const currentCrateAliases = [];
            const collect = (crateIndex, target) => {
                for (const pos of crateIndex.get(needle)) {
                    target.push(createAliasFromItem(searchIndex[pos]));
                }
            };

            if (filterCrates === null) {
                for (const [crate, crateIndex] of ALIASES) {
                    if (!crateIndex.has(needle)) {
                        continue;
                    }
                    collect(crateIndex, crate === currentCrate ? currentCrateAliases : otherAliases);
                }
            } else if (ALIASES.has(filterCrates) && ALIASES.get(filterCrates).has(needle)) {
                collect(ALIASES.get(filterCrates), otherAliases);
            }

            // Descending order: each alias is inserted at the front below, which reverses it.
            const byPathDescending = (left, right) => {
                if (left.path === right.path) {
                    return 0;
                }
                return left.path < right.path ? 1 : -1;
            };
            otherAliases.sort(byPathDescending);
            currentCrateAliases.sort(byPathDescending);

            // Current-crate aliases are inserted last so that they come out first.
            for (const alias of [...otherAliases, ...currentCrateAliases]) {
                alias.alias = query;
                const [displayPath, href] = buildHrefAndPath(alias);
                alias.displayPath = pathSplitter(displayPath);
                alias.fullPath = alias.displayPath + alias.name;
                alias.href = href;

                ret.others.unshift(alias);
                if (ret.others.length > MAX_RESULTS) {
                    ret.others.pop();
                }
            }
        }

        /**
         * Records a candidate in the `results` map, unless it is rejected.
         *
         * A candidate is rejected when:
         *
         * * `dist` is not `<= maxEditDistance` and `index` is -1, or
         * * `results` already has an entry for `fullId` which either was stored during a
         *   literal search (`dontValidate`) or has a `dist` that is not worse.
         *
         * The stored entry contains information which will be used to sort the search results:
         *
         * * `id` is the index in both `searchWords` and `searchIndex` arrays for this element.
         * * `index` is an `integer` used to sort by the position of the word in the item's name.
         * * `dist` is the main metric used to sort the search results.
         * * `path_dist` is zero if a single-component search query is used, otherwise it's the
         *   distance computed for everything other than the last path component.
         * * `dontValidate` is the current value of `parsedQuery.literalSearch`.
         *
         * @param {Results} results
         * @param {string} fullId          - Key used in the `results` map.
         * @param {integer} id
         * @param {integer} index
         * @param {integer} dist
         * @param {integer} path_dist
         * @param {integer} maxEditDistance
         */
        function addIntoResults(results, fullId, id, index, dist, path_dist, maxEditDistance) {
            const withinBudget = dist <= maxEditDistance;
            if (!withinBudget && index === -1) {
                return;
            }
            if (results.has(fullId)) {
                const existing = results.get(fullId);
                if (existing.dontValidate || existing.dist <= dist) {
                    // What we already have is at least as good.
                    return;
                }
            }
            const dontValidate = parsedQuery.literalSearch;
            results.set(fullId, { id, index, dontValidate, dist, path_dist });
        }

        /**
         * This function is called in case the query is only one element (with or without generics).
         * This element will be compared to arguments' and returned values' items and also to items.
         *
         * Other important thing to note: since there is only one element, we use edit
         * distance for name comparisons.
         *
         * The argument and return-type checks only run when the type fingerprint comparison
         * yields a distance (i.e. not `null`), the same convention `handleArgs` follows. The
         * name check always runs.
         *
         * @param {Row} row
         * @param {integer} pos              - Position in the `searchIndex`.
         * @param {QueryElement} elem        - The element from the parsed query.
         * @param {Results} results_others   - Unqualified results (not in arguments nor in
         *                                     returned values).
         * @param {Results} results_in_args  - Matching arguments results.
         * @param {Results} results_returned - Matching returned arguments results.
         * @param {integer} maxEditDistance  - Largest edit distance accepted for name and path
         *                                     comparisons.
         */
        function handleSingleArg(
            row,
            pos,
            elem,
            results_others,
            results_in_args,
            results_returned,
            maxEditDistance
        ) {
            if (!row || (filterCrates !== null && row.crate !== filterCrates)) {
                return;
            }
            let index = -1, path_dist = 0;
            const fullId = row.id;
            const searchWord = searchWords[pos];

            // tfpDist is a minimum possible type distance, where "type distance" is the number of
            // atoms in the function not present in the query
            const tfpDist = compareTypeFingerprints(
                fullId,
                parsedQuery.typeFingerprint
            );
            // A `null` distance means there is nothing to find in the signature: skip both
            // the argument and the return-type checks. Otherwise each check is still skipped
            // when its result set is full and this row cannot beat the worst entry in it.
            if (tfpDist !== null) {
                if (!(results_in_args.size >= MAX_RESULTS && tfpDist > results_in_args.max_dist)) {
                    const in_args = row.type && row.type.inputs
                        && checkIfInList(row.type.inputs, elem, row.type.where_clause);
                    if (in_args) {
                        results_in_args.max_dist = Math.max(
                            results_in_args.max_dist || 0,
                            tfpDist
                        );
                        const maxDist = results_in_args.size < MAX_RESULTS ?
                            (tfpDist + 1) :
                            results_in_args.max_dist;
                        addIntoResults(results_in_args, fullId, pos, -1, tfpDist, 0, maxDist);
                    }
                }
                if (!(results_returned.size >= MAX_RESULTS &&
                    tfpDist > results_returned.max_dist)
                ) {
                    const returned = row.type && row.type.output
                        && checkIfInList(row.type.output, elem, row.type.where_clause);
                    if (returned) {
                        results_returned.max_dist = Math.max(
                            results_returned.max_dist || 0,
                            tfpDist
                        );
                        const maxDist = results_returned.size < MAX_RESULTS ?
                            (tfpDist + 1) :
                            results_returned.max_dist;
                        addIntoResults(results_returned, fullId, pos, -1, tfpDist, 0, maxDist);
                    }
                }
            }

            if (!typePassesFilter(elem.typeFilter, row.ty)) {
                return;
            }

            const row_index = row.normalizedName.indexOf(elem.pathLast);
            const word_index = searchWord.indexOf(elem.pathLast);

            // lower indexes are "better" matches
            // rank based on the "best" match
            if (row_index === -1) {
                index = word_index;
            } else if (word_index === -1) {
                index = row_index;
            } else if (word_index < row_index) {
                index = word_index;
            } else {
                index = row_index;
            }

            if (elem.fullPath.length > 1) {
                path_dist = checkPath(elem.pathWithoutLast, row, maxEditDistance);
                if (path_dist > maxEditDistance) {
                    return;
                }
            }

            if (parsedQuery.literalSearch) {
                // Literal search: only an exact name is accepted, recorded with distance 0.
                if (searchWord === elem.name) {
                    addIntoResults(
                        results_others,
                        fullId,
                        pos,
                        index,
                        0,
                        path_dist,
                        maxEditDistance
                    );
                }
                return;
            }

            const dist = editDistance(searchWord, elem.pathLast, maxEditDistance);

            if (index === -1 && dist + path_dist > maxEditDistance) {
                return;
            }

            addIntoResults(results_others, fullId, pos, index, dist, path_dist, maxEditDistance);
        }

        /**
         * This function is called in case the query has more than one element. In this case,
         * it'll try to match the items which validate all the elements. For `aa -> bb` it will
         * look for functions which have a parameter `aa` and have `bb` in their returned values.
         *
         * A row is skipped early when it has no type information, is outside the crate filter,
         * has no type fingerprint distance, or when `results` is already full and the row's
         * distance is worse than everything recorded so far.
         *
         * @param {Row} row
         * @param {integer} pos      - Position in the `searchIndex`.
         * @param {Object} results
         */
        function handleArgs(row, pos, results) {
            if (!row) {
                return;
            }
            if (filterCrates !== null && row.crate !== filterCrates) {
                return;
            }
            if (!row.type) {
                return;
            }

            const tfpDist = compareTypeFingerprints(row.id, parsedQuery.typeFingerprint);
            if (tfpDist === null) {
                return;
            }
            const isFull = results.size >= MAX_RESULTS;
            if (isFull && tfpDist > results.max_dist) {
                return;
            }

            const { inputs, output, where_clause } = row.type;
            // Once the inputs unify, the outputs have to unify under the same generic mapping.
            const outputsUnify = mgens => {
                return unifyFunctionTypes(output, parsedQuery.returned, where_clause, mgens);
            };
            const signatureMatches = unifyFunctionTypes(
                inputs,
                parsedQuery.elems,
                where_clause,
                null,
                outputsUnify
            );
            if (!signatureMatches) {
                return;
            }

            results.max_dist = Math.max(results.max_dist || 0, tfpDist);
            addIntoResults(results, row.id, pos, 0, tfpDist, 0, Number.MAX_VALUE);
        }

        /**
         * Runs the parsed query against the whole search index.
         *
         * It derives the edit-distance budget from the query length, converts every query
         * element name to an id (see `convertNameToId` below), adds each element to
         * `parsedQuery.typeFingerprint`, and then feeds every row of `searchIndex` to either
         * `handleSingleArg` (exactly one element and no return type) or `handleArgs`
         * (anything else with at least one element).
         */
        function innerRunQuery() {
            // The budget is a third of the combined name lengths of all top-level elements.
            let queryLen = 0;
            for (const elem of parsedQuery.elems) {
                queryLen += elem.name.length;
            }
            for (const elem of parsedQuery.returned) {
                queryLen += elem.name.length;
            }
            const maxEditDistance = Math.floor(queryLen / 3);

            /**
             * Ids handed out to generic type variables of the query, keyed by name.
             *
             * @type {Map<string, integer>}
             */
            const genericSymbols = new Map();

            /**
             * Convert names to ids in parsed query elements.
             * This is not used for the "In Names" tab, but is used for the
             * "In Params", "In Returns", and "In Function Signature" tabs.
             *
             * If there is no matching item, but a close-enough match, this
             * function also records that correction in `parsedQuery.correction`.
             *
             * The conversion recurses into the generics and the binding constraints of
             * `elem`, and replaces the keys of `elem.bindings` (names) with ids.
             *
             * See `buildTypeMapIndex` for more information.
             *
             * @param {QueryElement} elem
             * @param {boolean} isAssocType
             */
            function convertNameToId(elem, isAssocType) {
                // Exact name match. Names flagged `assocOnly` only count when `isAssocType`
                // is set.
                if (typeNameIdMap.has(elem.pathLast) &&
                    (isAssocType || !typeNameIdMap.get(elem.pathLast).assocOnly)) {
                    elem.id = typeNameIdMap.get(elem.pathLast).id;
                } else if (!parsedQuery.literalSearch) {
                    // No exact match: look for the closest name within the edit-distance budget.
                    let match = null;
                    let matchDist = maxEditDistance + 1;
                    let matchName = "";
                    for (const [name, {id, assocOnly}] of typeNameIdMap) {
                        const dist = editDistance(name, elem.pathLast, maxEditDistance);
                        if (dist <= matchDist && dist <= maxEditDistance &&
                            (isAssocType || !assocOnly)) {
                            // On a tie, the current match is kept if its name compares greater.
                            if (dist === matchDist && matchName > name) {
                                continue;
                            }
                            match = id;
                            matchDist = dist;
                            matchName = name;
                        }
                    }
                    if (match !== null) {
                        parsedQuery.correction = matchName;
                    }
                    // `null` when nothing was close enough.
                    elem.id = match;
                }
                // Treat the element as a generic type variable when it could not be resolved,
                // is part of a multi-element query and has no type filter, generics or
                // bindings -- or when it was explicitly filtered as a generic.
                if ((elem.id === null && parsedQuery.totalElems > 1 && elem.typeFilter === -1
                     && elem.generics.length === 0 && elem.bindings.size === 0)
                    || elem.typeFilter === TY_GENERIC) {
                    // Generic ids are negative (-1, -2, ...) in order of first appearance;
                    // the same name always gets the same id.
                    if (genericSymbols.has(elem.name)) {
                        elem.id = genericSymbols.get(elem.name);
                    } else {
                        elem.id = -(genericSymbols.size + 1);
                        genericSymbols.set(elem.name, elem.id);
                    }
                    if (elem.typeFilter === -1 && elem.name.length >= 3) {
                        // Silly heuristic to catch if the user probably meant
                        // to not write a generic parameter. We don't use it,
                        // just bring it up.
                        const maxPartDistance = Math.floor(elem.name.length / 3);
                        let matchDist = maxPartDistance + 1;
                        let matchName = "";
                        for (const name of typeNameIdMap.keys()) {
                            const dist = editDistance(name, elem.name, maxPartDistance);
                            if (dist <= matchDist && dist <= maxPartDistance) {
                                if (dist === matchDist && matchName > name) {
                                    continue;
                                }
                                matchDist = dist;
                                matchName = name;
                            }
                        }
                        if (matchName !== "") {
                            parsedQuery.proposeCorrectionFrom = elem.name;
                            parsedQuery.proposeCorrectionTo = matchName;
                        }
                    }
                    elem.typeFilter = TY_GENERIC;
                }
                if (elem.generics.length > 0 && elem.typeFilter === TY_GENERIC) {
                    // Rust does not have HKT
                    parsedQuery.error = [
                        "Generic type parameter ",
                        elem.name,
                        " does not accept generic parameters",
                    ];
                }
                // Nested elements are converted without `isAssocType`, so `assocOnly` names
                // are not considered for them.
                for (const elem2 of elem.generics) {
                    convertNameToId(elem2);
                }
                // Rebuild the bindings map with ids as keys. An unknown name sets
                // `parsedQuery.error` and is replaced by a `null` key with no constraints.
                elem.bindings = new Map(Array.from(elem.bindings.entries())
                    .map(entry => {
                        const [name, constraints] = entry;
                        if (!typeNameIdMap.has(name)) {
                            parsedQuery.error = [
                                "Type parameter ",
                                name,
                                " does not exist",
                            ];
                            return [null, []];
                        }
                        for (const elem2 of constraints) {
                            convertNameToId(elem2);
                        }

                        return [typeNameIdMap.get(name).id, constraints];
                    })
                );
            }

            // Resolve every top-level element and add it to the query's type fingerprint.
            // `fps` is shared by all `buildFunctionTypeFingerprint` calls.
            const fps = new Set();
            for (const elem of parsedQuery.elems) {
                convertNameToId(elem);
                buildFunctionTypeFingerprint(elem, parsedQuery.typeFingerprint, fps);
            }
            for (const elem of parsedQuery.returned) {
                convertNameToId(elem);
                buildFunctionTypeFingerprint(elem, parsedQuery.typeFingerprint, fps);
            }

            if (parsedQuery.foundElems === 1 && parsedQuery.returned.length === 0) {
                if (parsedQuery.elems.length === 1) {
                    const elem = parsedQuery.elems[0];
                    for (let i = 0, nSearchWords = searchWords.length; i < nSearchWords; ++i) {
                        // It means we want to check for this element everywhere (in names, args and
                        // returned).
                        handleSingleArg(
                            searchIndex[i],
                            i,
                            elem,
                            results_others,
                            results_in_args,
                            results_returned,
                            maxEditDistance
                        );
                    }
                }
            } else if (parsedQuery.foundElems > 0) {
                // Sort input and output so that elements with generics or bindings go first,
                // then elements whose id is not positive (generic type variables have
                // negative ids), and elements with a positive id and nothing nested go last.
                // That's because of the way unification is structured: it eats off
                // the end, and hits a fast path if the last item is a simple atom.
                const sortQ = (a, b) => {
                    const ag = a.generics.length === 0 && a.bindings.size === 0;
                    const bg = b.generics.length === 0 && b.bindings.size === 0;
                    if (ag !== bg) {
                        return ag - bg;
                    }
                    const ai = a.id > 0;
                    const bi = b.id > 0;
                    return ai - bi;
                };
                parsedQuery.elems.sort(sortQ);
                parsedQuery.returned.sort(sortQ);
                for (let i = 0, nSearchWords = searchWords.length; i < nSearchWords; ++i) {
                    handleArgs(searchIndex[i], i, results_others);
                }
            }
        }

        if (parsedQuery.error === null) {
            innerRunQuery();
        }

        const ret = createQueryResults(
            sortResults(results_in_args, true, currentCrate),
            sortResults(results_returned, true, currentCrate),
            sortResults(results_others, false, currentCrate),
            parsedQuery);
        handleAliases(ret, parsedQuery.original.replace(/"/g, ""), filterCrates, currentCrate);
        if (parsedQuery.error !== null && ret.others.length !== 0) {
            // It means some doc aliases were found so let's "remove" the error!
            ret.query.error = null;
        }
        return ret;
    }

    /**
     * Switches to the tab `direction` steps away from the current one, wrapping around at
     * both ends. The element focused right now is remembered for the tab being left.
     *
     * @param {number} direction - Number of tabs to move by; negative values move backwards.
     */
    function nextTab(direction) {
        // Wrap with the real number of tabs instead of a hard-coded count, and normalize
        // the remainder so that any negative step still yields a valid tab number.
        const tabCount = searchState.focusedByTab.length;
        const next = (((searchState.currentTab + direction) % tabCount) + tabCount) % tabCount;
        searchState.focusedByTab[searchState.currentTab] = document.activeElement;
        printTab(next);
        focusSearchResult();
    }

    // Move keyboard focus into the active tab. In order of preference: the result that was
    // focused the last time this tab was active, the first result of the active tab, the
    // tab's own button. The remembered element is cleared once it has been used.
    function focusSearchResult() {
        const tab = searchState.currentTab;
        let target = searchState.focusedByTab[tab];
        if (!target) {
            target = document.querySelectorAll(".search-results.active a").item(0);
        }
        if (!target) {
            target = document.querySelectorAll("#search-tabs button").item(tab);
        }
        searchState.focusedByTab[tab] = null;
        if (target) {
            target.focus();
        }
    }

    /**
     * Computes, for a search result, the path shown next to its name and the URL of its
     * documentation.
     *
     * The URL layout depends on the kind of item: modules get their own `index.html`,
     * re-exports are anchors in the parent module's index, extern crates link to the crate
     * root, items with a parent are anchors on the parent's page, and everything else gets
     * a `<kind>.<name>.html` page.
     *
     * @param {Row} item
     *
     * @return {[string, string]} - `[displayPath, href]`
     */
    function buildHrefAndPath(item) {
        const type = itemTypes[item.ty];
        const name = item.name;
        let path = item.path;
        let displayPath;
        let href;

        if (type === "mod") {
            displayPath = path + "::";
            href = ROOT_PATH + path.replace(/::/g, "/") + "/" +
                name + "/index.html";
        } else if (type === "import") {
            displayPath = path + "::";
            href = ROOT_PATH + path.replace(/::/g, "/") + "/index.html#reexport." + name;
        } else if (type === "primitive" || type === "keyword") {
            displayPath = "";
            href = ROOT_PATH + path.replace(/::/g, "/") +
                "/" + type + "." + name + ".html";
        } else if (type === "externcrate") {
            displayPath = "";
            href = ROOT_PATH + name + "/index.html";
        } else if (item.parent !== undefined) {
            const myparent = item.parent;
            let anchor = type + "." + name;
            const parentType = itemTypes[myparent.ty];
            let pageType = parentType;
            let pageName = myparent.name;

            if (parentType === "primitive") {
                displayPath = myparent.name + "::";
            } else if (type === "structfield" && parentType === "variant") {
                // Structfields belonging to variants are special: the
                // final path element is the enum name.
                const enumNameIdx = path.lastIndexOf("::");
                // `substring` clamps a negative index to 0, which is what is wanted here
                // when the path has no `::` at all.
                const enumName = path.substring(enumNameIdx + 2);
                path = path.substring(0, enumNameIdx);
                displayPath = path + "::" + enumName + "::" + myparent.name + "::";
                anchor = "variant." + myparent.name + ".field." + name;
                pageType = "enum";
                pageName = enumName;
            } else {
                displayPath = path + "::" + myparent.name + "::";
            }
            // Only prefix the anchor when there really is a disambiguator: an item without
            // the field must not end up with an "undefined/" prefix.
            if (item.implDisambiguator !== null && item.implDisambiguator !== undefined) {
                anchor = item.implDisambiguator + "/" + anchor;
            }
            href = ROOT_PATH + path.replace(/::/g, "/") +
                "/" + pageType +
                "." + pageName +
                ".html#" + anchor;
        } else {
            displayPath = path + "::";
            href = ROOT_PATH + path.replace(/::/g, "/") +
                "/" + type + "." + name + ".html";
        }
        return [displayPath, href];
    }

    /**
     * Wraps every `::`-terminated component of `path` in its own `<span>`.
     *
     * A new `<span>` is opened after each `::`; when the path ends with `::` (or is empty)
     * the dangling opening tag is dropped again. A trailing component without `::` is left
     * in an unclosed `<span>`.
     *
     * @param {string} path
     *
     * @return {string}
     */
    function pathSplitter(path) {
        const openTag = "<span>";
        const wrapped = openTag + path.split("::").join("::</span>" + openTag);
        if (!wrapped.endsWith(openTag)) {
            return wrapped;
        }
        return wrapped.slice(0, -openTag.length);
    }

    /**
     * Render a set of search results for a single tab.
     *
     * With results, the returned element holds one link per result (kind, optional alias
     * notice, path, name and description). Without results and without a query error it
     * holds a "No results" message pointing to other places to look. With a query error and
     * no results it is left empty.
     *
     * @param {Array<?>}    array   - The search results for this tab
     * @param {ParsedQuery} query
     * @param {boolean}     display - True if this is the active tab
     *
     * @return {[HTMLElement, number]} - The rendered element and the number of results.
     */
    function addTab(array, query, display) {
        const extraClass = display ? " active" : "";
        // The alias shown for a doc-alias hit is the text typed by the user (see
        // `handleAliases`), so it has to be escaped before it is inserted as HTML.
        const escapeHtml = text => String(text)
            .replace(/&/g, "&amp;")
            .replace(/</g, "&lt;")
            .replace(/>/g, "&gt;");

        const output = document.createElement("div");
        if (array.length > 0) {
            output.className = "search-results " + extraClass;

            array.forEach(item => {
                const name = item.name;
                const type = itemTypes[item.ty];
                const longType = longItemTypes[item.ty];
                // Kinds without a long name are displayed as "?".
                const typeName = longType.length !== 0 ? longType : "?";

                const link = document.createElement("a");
                link.className = "result-" + type;
                link.href = item.href;

                const resultName = document.createElement("div");
                resultName.className = "result-name";

                resultName.insertAdjacentHTML(
                    "beforeend",
                    `<span class="typename">${typeName}</span>`);
                link.appendChild(resultName);

                let alias = " ";
                if (item.is_alias) {
                    alias = " <div class=\"alias\">" +
                        "<b>" + escapeHtml(item.alias) + "</b>" +
                        "<i class=\"grey\">&nbsp;- see&nbsp;</i>" +
                        "</div>";
                }
                // `displayPath` is markup on purpose (see `pathSplitter`).
                resultName.insertAdjacentHTML(
                    "beforeend",
                    "<div class=\"path\">" + alias +
                    item.displayPath + `<span class="${type}">${name}</span>` +
                    "</div>");

                const description = document.createElement("div");
                description.className = "desc";
                description.insertAdjacentHTML("beforeend", item.desc);

                link.appendChild(description);
                output.appendChild(link);
            });
        } else if (query.error === null) {
            output.className = "search-failed" + extraClass;
            output.innerHTML = "No results :(<br/>" +
                "Try on <a href=\"https://duckduckgo.com/?q=" +
                encodeURIComponent("rust " + query.userQuery) +
                "\">DuckDuckGo</a>?<br/><br/>" +
                "Or try looking in one of these:<ul><li>The <a " +
                "href=\"https://doc.rust-lang.org/reference/index.html\">Rust Reference</a> " +
                " for technical details about the language.</li><li><a " +
                "href=\"https://doc.rust-lang.org/rust-by-example/index.html\">Rust By " +
                "Example</a> for expository code examples.</li><li>The <a " +
                "href=\"https://doc.rust-lang.org/book/index.html\">Rust Book</a> for " +
                "introductions to language features and the language itself.</li><li><a " +
                "href=\"https://docs.rs\">Docs.rs</a> for documentation of crates released on" +
                " <a href=\"https://crates.io/\">crates.io</a>.</li></ul>";
        }
        return [output, array.length];
    }

    /**
     * Builds the HTML of one tab button: its label followed by the number of results.
     * The button of the current tab gets the `selected` class.
     *
     * @param {number} tabNb   - Number of the tab this header is for.
     * @param {string} text    - Label of the tab.
     * @param {number} nbElems - Number of results in the tab.
     *
     * @return {string}
     */
    function makeTabHeader(tabNb, text, nbElems) {
        // https://blog.horizon-eda.org/misc/2020/02/19/ui.html
        //
        // CSS runs with `font-variant-numeric: tabular-nums` to ensure all
        // digits are the same width. \u{2007} is a Unicode space character
        // that is defined to be the same width as a digit. Counts below 100 are
        // followed by enough of them to take up the width of a three-digit count.
        const figureSpace = "\u{2007}";
        let padding = 0;
        if (nbElems < 10) {
            padding = 2;
        } else if (nbElems < 100) {
            padding = 1;
        }
        const fmtNbElems = `${figureSpace}(${nbElems})` + figureSpace.repeat(padding);
        const selected = searchState.currentTab === tabNb ? " class=\"selected\"" : "";
        return "<button" + selected + ">" + text +
            "<span class=\"count\">" + fmtNbElems + "</span></button>";
    }

    /**
     * Display the results of a search, or navigate straight to the first result.
     *
     * If there is at least one entry in `results.others` and either `go_to_first` is
     * set or that entry is the only one while the "go-to-only-result" setting is
     * "true", a temporary link to `results.others[0].href` is created and clicked.
     *
     * Otherwise the title (with a crate selector when more than one crate is indexed),
     * the tab headers, any query parser error or type-correction notice and the three
     * result lists are written into the search output element, and the relevant tab
     * is shown.
     *
     * @param {ResultsTable} results
     * @param {boolean} go_to_first
     * @param {string} filterCrates
     */
    function showResults(results, go_to_first, filterCrates) {
        const search = searchState.outputElement();
        // Redirecting needs an actual first result: when `others` is empty there is no
        // `href` to follow, so fall through and render the (empty) results page instead
        // of failing on `results.others[0]`.
        const shouldRedirect = results.others.length > 0 && (go_to_first ||
            (results.others.length === 1 && getSettingValue("go-to-only-result") === "true"));
        if (shouldRedirect) {
            // Needed to force re-execution of JS when coming back to a page. Let's take this
            // scenario as example:
            //
            // 1. You have the "Directly go to item in search if there is only one result" option
            //    enabled.
            // 2. You make a search which results only one result, leading you automatically to
            //    this result.
            // 3. You go back to previous page.
            //
            // Now, without the call below, the JS will not be re-executed and the previous state
            // will be used, starting search again since the search input is not empty, leading you
            // back to the previous page again.
            window.onunload = () => {};
            searchState.removeQueryParameters();
            const elem = document.createElement("a");
            elem.href = results.others[0].href;
            removeClass(elem, "active");
            // For firefox, we need the element to be in the DOM so it can be clicked.
            document.body.appendChild(elem);
            elem.click();
            return;
        }
        if (results.query === undefined) {
            results.query = parseQuery(searchState.input.value);
        }

        currentResults = results.query.userQuery;

        const ret_others = addTab(results.others, results.query, true);
        const ret_in_args = addTab(results.in_args, results.query, false);
        const ret_returned = addTab(results.returned, results.query, false);

        // Navigate to the relevant tab if the current tab is empty, like in case users search
        // for "-> String". If they had selected another tab previously, they have to click on
        // it again.
        let currentTab = searchState.currentTab;
        if ((currentTab === 0 && ret_others[1] === 0) ||
                (currentTab === 1 && ret_in_args[1] === 0) ||
                (currentTab === 2 && ret_returned[1] === 0)) {
            if (ret_others[1] !== 0) {
                currentTab = 0;
            } else if (ret_in_args[1] !== 0) {
                currentTab = 1;
            } else if (ret_returned[1] !== 0) {
                currentTab = 2;
            }
        }

        // The crate selector is only offered when there is more than one crate to pick from.
        let crates = "";
        const crates_list = Object.keys(rawSearchIndex);
        if (crates_list.length > 1) {
            crates = " in&nbsp;<div id=\"crate-search-div\"><select id=\"crate-search\">" +
                "<option value=\"all crates\">all crates</option>";
            for (const c of crates_list) {
                // Emit the `selected` attribute only on the active filter. Interpolating
                // the boolean expression directly would write a stray `false` attribute
                // on every other option.
                const selected = c === filterCrates ? " selected" : "";
                crates += `<option value="${c}"${selected}>${c}</option>`;
            }
            crates += "</select></div>";
        }

        let output = `<h1 class="search-results-title">Results${crates}</h1>`;
        if (results.query.error !== null) {
            // The error is a list of text fragments; odd-indexed fragments are rendered
            // as code. Build the HTML from a copy so that the caller's `query.error`
            // array is left untouched, and escape `&` (first), `<` and `>` so that the
            // fragments are always displayed as literal text.
            const errorHtml = results.query.error.map((value, index) => {
                const escaped = value
                    .split("&").join("&amp;")
                    .split("<").join("&lt;")
                    .split(">").join("&gt;");
                if (index % 2 !== 0) {
                    return `<code>${escaped.replaceAll(" ", "&nbsp;")}</code>`;
                }
                return escaped;
            }).join("");
            output += `<h3 class="error">Query parser error: "${errorHtml}".</h3>`;
            output += "<div id=\"search-tabs\">" +
                makeTabHeader(0, "In Names", ret_others[1]) +
                "</div>";
            currentTab = 0;
        } else if (results.query.foundElems <= 1 && results.query.returned.length === 0) {
            output += "<div id=\"search-tabs\">" +
                makeTabHeader(0, "In Names", ret_others[1]) +
                makeTabHeader(1, "In Parameters", ret_in_args[1]) +
                makeTabHeader(2, "In Return Types", ret_returned[1]) +
                "</div>";
        } else {
            const signatureTabTitle =
                results.query.elems.length === 0 ? "In Function Return Types" :
                results.query.returned.length === 0 ? "In Function Parameters" :
                "In Function Signatures";
            output += "<div id=\"search-tabs\">" +
                makeTabHeader(0, signatureTabTitle, ret_others[1]) +
                "</div>";
            currentTab = 0;
        }

        if (results.query.correction !== null) {
            const orig = results.query.returned.length > 0
                ? results.query.returned[0].name
                : results.query.elems[0].name;
            output += "<h3 class=\"search-corrections\">" +
                `Type "${orig}" not found. ` +
                "Showing results for closest type name " +
                `"${results.query.correction}" instead.</h3>`;
        }
        if (results.query.proposeCorrectionFrom !== null) {
            const orig = results.query.proposeCorrectionFrom;
            const targ = results.query.proposeCorrectionTo;
            output += "<h3 class=\"search-corrections\">" +
                `Type "${orig}" not found and used as generic parameter. ` +
                `Consider searching for "${targ}" instead.</h3>`;
        }

        const resultsElem = document.createElement("div");
        resultsElem.id = "results";
        resultsElem.appendChild(ret_others[0]);
        resultsElem.appendChild(ret_in_args[0]);
        resultsElem.appendChild(ret_returned[0]);

        search.innerHTML = output;
        // The selector only exists when it was written into `output` above.
        const crateSearch = document.getElementById("crate-search");
        if (crateSearch) {
            crateSearch.addEventListener("input", updateCrate);
        }
        search.appendChild(resultsElem);
        // Reset focused elements.
        searchState.showResults(search);
        const elems = document.getElementById("search-tabs").childNodes;
        searchState.focusedByTab = [];
        let i = 0;
        for (const elem of elems) {
            // Capture the current index: `i` keeps changing while the loop runs.
            const j = i;
            elem.onclick = () => printTab(j);
            searchState.focusedByTab.push(null);
            i += 1;
        }
        printTab(currentTab);
    }

    /**
     * Store `url` in the browser history, when the history API is available.
     *
     * A new entry is pushed only when there is neither a history state nor a
     * `search` query string parameter; in every other case the current entry is
     * replaced.
     *
     * @param {string} url
     */
    function updateSearchHistory(url) {
        if (browserSupportsHistoryApi()) {
            const params = searchState.getQueryStringParams();
            const hasSearchEntry = history.state || params.search;
            if (hasSearchEntry) {
                history.replaceState(null, "", url);
            } else {
                history.pushState(null, "", url);
            }
        }
    }

    /**
     * Run a search for the (trimmed) content of the search input and display
     * the results.
     *
     * Unless `forced` is set, nothing is computed when the parsed query is the
     * one whose results are already current; in that case the existing results
     * are only put back on screen (and only for a non-empty query).
     *
     * @param {boolean} [forced]
     */
    function search(forced) {
        const query = parseQuery(searchState.input.value.trim());
        const savedFilter = getFilterCrates();

        const isSameQuery = query.userQuery === currentResults;
        if (isSameQuery && !forced) {
            if (query.userQuery.length > 0) {
                putBackSearch();
            }
            return;
        }

        searchState.setLoadingSearch();

        const params = searchState.getQueryStringParams();

        // The crate filter from the URL is only a fallback: it applies when there is
        // no saved crate filter.
        const urlFilter = params["filter-crate"];
        const filterCrates = (savedFilter === null && urlFilter !== undefined) ?
            urlFilter :
            savedFilter;

        // Update document title to maintain a meaningful browser history
        searchState.title = `Results for ${query.original} - Rust`;

        // Because searching is incremental by character, only the most
        // recent search query is added to the browser history.
        const url = buildUrl(query.original, filterCrates);
        updateSearchHistory(url);

        const results = execQuery(query, searchWords, filterCrates, window.currentCrate);
        showResults(results, params.go_to_first, filterCrates);
    }

    /**
     * Convert a list of RawFunctionType / ID to object-based FunctionType.
     *
     * The search index stores function parameter and return types compactly, as
     * indexes into an array of names: crates tend to have many functions working
     * on a small set of types. This is a win even when a general-purpose
     * compression algorithm is applied on top, see
     * https://github.com/rust-lang/rust/pull/98475#issue-1284395985
     *
     * The format for individual function types is encoded in
     * librustdoc/html/render/mod.rs: impl Serialize for RenderType
     *
     * Each entry is converted with `buildItemSearchType`, in order.
     *
     * @param {Array<RawFunctionType>} types
     * @param {Array<{name: string, ty: number}>} lowercasePaths
     *
     * @return {Array<FunctionSearchType>}
     */
    function buildItemSearchTypeAll(types, lowercasePaths) {
        const converted = [];
        for (const rawType of types) {
            converted.push(buildItemSearchType(rawType, lowercasePaths));
        }
        return converted;
    }

    /**
     * Converts a single type.
     *
     * A raw type is either a bare number (a path index without generics or
     * bindings) or an array `[pathIndex, generics, bindings?]`.
     *
     * The path index selects what is produced:
     * - negative: a generic parameter; the index itself is the id,
     * - `0`: a sentinel (fewer bytes than `null`); id and ty are `null`,
     * - positive: entry `pathIndex - 1` of `lowercasePaths`.
     *
     * @param {RawFunctionType} type
     * @param {Array<{name: string, ty: number}>} lowercasePaths
     * @param {boolean} [isAssocType] - forwarded to `buildTypeMapIndex`
     */
    function buildItemSearchType(type, lowercasePaths, isAssocType) {
        const isBareIndex = typeof type === "number";
        const pathIndex = isBareIndex ? type : type[0];
        const generics = isBareIndex ? [] : buildItemSearchTypeAll(type[1], lowercasePaths);
        const bindings = new Map();
        if (!isBareIndex && type.length > 2) {
            for (const [assocType, constraints] of type[2]) {
                // Associated type constructors are represented sloppily in rustdoc's
                // type search, to make the engine simpler.
                //
                // MyType<Output<T>=Result<T>> is equivalent to MyType<Output<Result<T>>=T>
                // and both are, essentially
                // MyType<Output=(T, Result<T>)>, except the tuple isn't actually there.
                // It's more like the value of a type binding is naturally an array,
                // which rustdoc calls "constraints".
                //
                // As a result, the key should never have generics on it: only the id
                // of the converted associated type is kept.
                const key = buildItemSearchType(assocType, lowercasePaths, true).id;
                bindings.set(key, buildItemSearchTypeAll(constraints, lowercasePaths));
            }
        }

        let id = null;
        let ty = null;
        let path = null;
        if (pathIndex < 0) {
            // types less than 0 are generic parameters
            // the actual names of generic parameters aren't stored, since they aren't API
            id = pathIndex;
            ty = TY_GENERIC;
        } else if (pathIndex !== 0) {
            // Path indexes are 1-based because `0` is taken by the sentinel.
            const item = lowercasePaths[pathIndex - 1];
            id = buildTypeMapIndex(item.name, isAssocType);
            ty = item.ty;
            path = item.path;
        }
        return {
            id,
            ty,
            path,
            generics,
            bindings,
        };
    }

    /**
     * Convert from RawFunctionSearchType to FunctionSearchType.
     *
     * rustdoc stores function signatures in a tight encoding, because crates
     * often contain many functions with sometimes complex signatures. This turns
     * that encoding into plain objects, which keeps the search code readable and
     * easier to debug.
     *
     * The raw function search type format is generated using serde in
     * librustdoc/html/render/mod.rs: impl Serialize for IndexItemFunctionType
     *
     * Raw layout: `[inputs, output?, ...where_clauses]`. Each slot is either a
     * single number (one type) or a list of raw types.
     *
     * @param {RawFunctionSearchType} functionSearchType
     * @param {Array<{name: string, ty: number}>} lowercasePaths
     *
     * @return {null|FunctionSearchType}
     */
    function buildFunctionSearchType(functionSearchType, lowercasePaths) {
        // `0` is used as a sentinel because it's fewer bytes than `null`
        if (functionSearchType === 0) {
            return null;
        }
        // A slot holding a bare number is one type; anything else is a list of types.
        const convertSlot = rawSlot => {
            if (typeof rawSlot === "number") {
                return [buildItemSearchType(rawSlot, lowercasePaths)];
            }
            return buildItemSearchTypeAll(rawSlot, lowercasePaths);
        };
        const inputs = convertSlot(functionSearchType[0]);
        // The output slot may be absent altogether.
        const output = functionSearchType.length > 1 ? convertSlot(functionSearchType[1]) : [];
        // Every slot after the output is one where clause.
        const where_clause = functionSearchType.slice(2).map(rawSlot => convertSlot(rawSlot));
        return {
            inputs, output, where_clause,
        };
    }

    /**
     * Type fingerprints allow fast, approximate matching of types.
     *
     * This adds one type, then recursively its generics and its bindings, to a
     * compact representation of a type set:
     *
     * - `output[0]`, `output[1]` and `output[2]` form a Bloom filter. Every
     *   non-null type id sets up to two bits in each of these three words.
     *
     * - `output[3]` is set to the size of `fps`, i.e. the number of distinct ids
     *   added so far.
     *
     * @param {FunctionType|QueryElement} type - a single type
     * @param {Uint32Array} output - write the fingerprint to this data structure: uses 128 bits
     * @param {Set<number>} fps - Set of distinct items
     */
    function buildFunctionTypeFingerprint(type, output, fps) {
        const rawId = type.id;
        // All forms of `[]` get collapsed down to one thing in the bloom filter.
        // Differentiating between arrays and slices, if the user asks for it, is
        // still done in the matching algorithm.
        const isListType = rawId === typeNameIdOfArray || rawId === typeNameIdOfSlice;
        const input = isListType ? typeNameIdOfArrayOrSlice : rawId;

        if (input !== null) {
            // http://burtleburtle.net/bob/hash/integer.html
            // ~~ is toInt32. It's used before adding, so
            // the number stays in safe integer range.
            const hashint1 = k => {
                k = (~~k + 0x7ed55d16) + (k << 12);
                k = (k ^ 0xc761c23c) ^ (k >>> 19);
                k = (~~k + 0x165667b1) + (k << 5);
                k = (~~k + 0xd3a2646c) ^ (k << 9);
                k = (~~k + 0xfd7046c5) + (k << 3);
                return (k ^ 0xb55a4f09) ^ (k >>> 16);
            };
            const hashint2 = k => {
                k = ~k + (k << 15);
                k ^= k >>> 12;
                k += k << 2;
                k ^= k >>> 4;
                k = Math.imul(k, 2057);
                return k ^ (k >> 16);
            };
            const h0a = hashint1(input);
            const h0b = hashint2(input);
            // Less Hashing, Same Performance: Building a Better Bloom Filter
            // doi=10.1.1.72.2442
            // The other four hashes are derived from the two base hashes.
            const h1a = ~~(h0a + Math.imul(h0b, 2));
            const h1b = ~~(h0a + Math.imul(h0b, 3));
            const h2a = ~~(h0a + Math.imul(h0b, 4));
            const h2b = ~~(h0a + Math.imul(h0b, 5));
            output[0] |= (1 << (h0a % 32)) | (1 << (h1b % 32));
            output[1] |= (1 << (h1a % 32)) | (1 << (h2b % 32));
            output[2] |= (1 << (h2a % 32)) | (1 << (h0b % 32));
            fps.add(input);
        }

        for (const generic of type.generics) {
            buildFunctionTypeFingerprint(generic, output, fps);
        }
        // A binding is fingerprinted like a type whose id is the binding key and
        // whose generics are the binding's constraints.
        for (const [assocId, constraints] of type.bindings.entries()) {
            const bindingAsType = {
                id: assocId,
                ty: 0,
                generics: constraints,
                bindings: new Map(),
            };
            buildFunctionTypeFingerprint(bindingAsType, output, fps);
        }
        output[3] = fps.size;
    }

    /**
     * Compare the query fingerprint with the function fingerprint.
     *
     * The function's fingerprint is read from `functionTypeFingerprint`, where
     * every item owns four consecutive words starting at `fullId * 4`: three
     * Bloom filter words followed by one word that is returned on a match.
     *
     * @param {number} fullId - The function
     * @param {Uint32Array} queryFingerprint - The query
     * @returns {number|null} - Null if non-match, number if distance
     *                          This function might return 0!
     */
    function compareTypeFingerprints(fullId, queryFingerprint) {
        const base = fullId * 4;
        // Bloom filters have false positives but no false negatives: a bit that is
        // set in the query and clear in the function proves that the query contains
        // something the function does not, so it cannot match. The reverse is not
        // true: when every query bit is also set in the function, the match is only
        // probable.
        //
        // `q & ~f` keeps exactly the query bits missing from the function; it is the
        // same value as `(f & q) ^ q`.
        for (let word = 0; word < 3; ++word) {
            const missing = queryFingerprint[word] & ~functionTypeFingerprint[base + word];
            if (missing !== 0) {
                return null;
            }
        }
        return functionTypeFingerprint[base + 3];
    }

    /**
     * Build the search index from the raw, per-crate search data.
     *
     * This resets and fills `searchIndex`, `typeNameIdMap`, the three list type ids
     * and `functionTypeFingerprint`, and registers the aliases of every crate that
     * has some in `ALIASES`.
     *
     * Every crate contributes one row for the crate itself, followed by one row per
     * item. The `id` of a row is also its position in `searchIndex`.
     *
     * @param {Object} rawSearchIndex - maps each crate name to its raw search data
     *
     * @return {Array<string>} one search word per row: the crate name for a crate
     *                         row, the ASCII lowercased item name for an item row
     */
    function buildIndex(rawSearchIndex) {
        // Normalized names have their underscores removed.
        const stripUnderscores = s => (s.indexOf("_") === -1 ? s : s.replace(/_/g, ""));
        // Item types are stored as characters counted from "A".
        const codeOfA = "A".charCodeAt(0);

        searchIndex = [];
        /**
         * @type {Array<string>}
         */
        const searchWords = [];
        typeNameIdMap = new Map();

        // Initialize type map indexes for primitive list types
        // that can be searched using `[]` syntax.
        typeNameIdOfArray = buildTypeMapIndex("array");
        typeNameIdOfSlice = buildTypeMapIndex("slice");
        typeNameIdOfArrayOrSlice = buildTypeMapIndex("[]");

        // Function type fingerprints are 128-bit bloom filters that are used to
        // estimate the distance between function and query.
        // Count the rows first, to allocate a fingerprint for each of them: every
        // item gets an entry in the fingerprint array, and the crate does, too.
        let rowCount = 0;
        for (const crate in rawSearchIndex) {
            if (hasOwnPropertyRustdoc(rawSearchIndex, crate)) {
                rowCount += rawSearchIndex[crate].t.length + 1;
            }
        }
        functionTypeFingerprint = new Uint32Array((rowCount + 1) * 4);

        // Now generate the search item indexes, including normalized names, type
        // signature objects and fingerprints, and aliases.
        let id = 0;
        for (const crate in rawSearchIndex) {
            if (!hasOwnPropertyRustdoc(rawSearchIndex, crate)) {
                continue;
            }

            /**
             * The raw search data for a given crate. `n`, `t`, `d`, `i`, and `f`
             * are arrays with the same length. `q`, `a`, and `c` use a sparse
             * representation for compactness.
             *
             * `n[i]` contains the name of an item.
             *
             * `t[i]` contains the type of that item
             * (as a string of characters that represent an offset in `itemTypes`).
             *
             * `d[i]` contains the description of that item.
             *
             * `q` contains the full paths of the items. For compactness, it is a set of
             * (index, path) pairs used to create a map. If a given index `i` is
             * not present, this indicates "same as the last index present".
             *
             * `i[i]` contains an item's parent, usually a module. For compactness,
             * it is a set of indexes into the `p` array.
             *
             * `f[i]` contains function signatures, or `0` if the item isn't a function.
             * Functions are themselves encoded as arrays. The first item is a list of
             * types representing the function's inputs, and the second list item is a list
             * of types representing the function's output. Tuples are flattened.
             * Types are also represented as arrays; the first item is an index into the `p`
             * array, while the second is a list of types representing any generic parameters.
             *
             * `b[i]` contains an item's impl disambiguator. This is only present if an item
             * is defined in an impl block and the impl block's type has more than one
             * associated item with the same name.
             *
             * `a` defines aliases with an Array of pairs: [name, offset], where `offset`
             * points into the n/t/d/q/i/f arrays.
             *
             * `doc` contains the description of the crate.
             *
             * `p` is a list of path/type pairs. It is used for parents and function parameters.
             *
             * `c` is an array of item indices that are deprecated.
             *
             * @type {{
             *   doc: string,
             *   a: Object,
             *   n: Array<string>,
             *   t: String,
             *   d: Array<string>,
             *   q: Array<[Number, string]>,
             *   i: Array<Number>,
             *   f: Array<RawFunctionSearchType>,
             *   p: Array<Object>,
             *   b: Array<[Number, String]>,
             *   c: Array<Number>
             * }}
             */
            const crateCorpus = rawSearchIndex[crate];

            searchWords.push(crate);
            // The crate row and the item rows built below should have exactly the
            // same set of fields. Your JavaScript runtime will thank you.
            // https://mathiasbynens.be/notes/shapes-ics
            searchIndex.push({
                crate: crate,
                ty: 3, // == ExternCrate
                name: crate,
                path: "",
                desc: crateCorpus.doc,
                parent: undefined,
                type: null,
                id: id,
                normalizedName: stripUnderscores(crate),
                deprecated: null,
                implDisambiguator: null,
            });
            id += 1;
            // Row index of this crate's first item. Aliases are stored relative to
            // the crate's own items and are shifted by this amount.
            const firstItemIndex = id;

            // a String of one character item type codes
            const typeCodes = crateCorpus.t;
            // an array of (String) item names
            const itemNames = crateCorpus.n;
            // built from an array of [(Number) item index, (String) full path]
            // an item whose index is not present will fall back to the previous present path
            // i.e. if indices 4 and 11 are present, but 5-10 and 12-13 are not present,
            // 5-10 will fall back to the path for 4 and 12-13 will fall back to the path for 11
            const itemPaths = new Map(crateCorpus.q);
            // an array of (String) descriptions
            const itemDescs = crateCorpus.d;
            // an array of (Number) the parent path index + 1 to `paths`, or 0 if none
            const itemParentIdxs = crateCorpus.i;
            // an array of (Object | null) the type of the function, if any
            const itemFunctionSearchTypes = crateCorpus.f;
            // built from an array of (Number) indices for the deprecated items
            const deprecatedItems = new Set(crateCorpus.c);
            // built from an array of [(Number) item index, (String) impl disambiguator]
            const implDisambiguator = new Map(crateCorpus.b);
            // an array of [(Number) item type,
            //              (String) name]
            const paths = crateCorpus.p;
            // maps an alias name to the (Number) indices of the aliased items
            const aliases = crateCorpus.a;

            // an array of [{name: String, ty: Number}]
            const lowercasePaths = [];

            // Convert the raw path entries into object form, in place, and
            // generate their lowercased counterparts for function search mode.
            let lastParentPath = itemPaths.get(0);
            paths.forEach((rawPath, idx) => {
                const [ty, name] = rawPath;
                let path = null;
                if (rawPath.length > 2) {
                    // The third slot is an index into `itemPaths`, with the same
                    // "fall back to the last one" rule as the items.
                    path = itemPaths.has(rawPath[2]) ? itemPaths.get(rawPath[2]) : lastParentPath;
                    lastParentPath = path;
                }

                lowercasePaths.push({ty: ty, name: name.toLowerCase(), path: path});
                paths[idx] = {ty: ty, name: name, path: path};
            });

            // Convert the items into object form, and construct word indices.
            //
            // The search terms are gathered up front, apart from the rest of the
            // data: this is quick, and it is cached for the life of the page state
            // so that every later search has access to it.
            let lastItemPath = "";
            const itemCount = typeCodes.length;
            for (let i = 0; i < itemCount; ++i) {
                const rawName = itemNames[i];
                const word = typeof rawName === "string" ? rawName.toLowerCase() : "";
                searchWords.push(word);

                const path = itemPaths.has(i) ? itemPaths.get(i) : lastItemPath;

                let type = null;
                const rawSignature = itemFunctionSearchTypes[i];
                if (rawSignature !== 0) {
                    type = buildFunctionSearchType(rawSignature, lowercasePaths);
                    if (type) {
                        // This row's own four words of the fingerprint array.
                        const fp = functionTypeFingerprint.subarray(id * 4, (id + 1) * 4);
                        const fps = new Set();
                        const fingerprintAll = types => {
                            for (const t of types) {
                                buildFunctionTypeFingerprint(t, fp, fps);
                            }
                        };
                        fingerprintAll(type.inputs);
                        fingerprintAll(type.output);
                        for (const clause of type.where_clause) {
                            fingerprintAll(clause);
                        }
                    }
                }

                const parentIdx = itemParentIdxs[i];
                searchIndex.push({
                    crate: crate,
                    ty: typeCodes.charCodeAt(i) - codeOfA,
                    name: rawName,
                    path: path,
                    desc: itemDescs[i],
                    parent: parentIdx > 0 ? paths[parentIdx - 1] : undefined,
                    type,
                    id: id,
                    normalizedName: stripUnderscores(word),
                    deprecated: deprecatedItems.has(i),
                    implDisambiguator: implDisambiguator.has(i) ? implDisambiguator.get(i) : null,
                });
                id += 1;
                lastItemPath = path;
            }

            if (aliases) {
                const crateAliases = new Map();
                ALIASES.set(crate, crateAliases);
                for (const aliasName in aliases) {
                    if (!hasOwnPropertyRustdoc(aliases, aliasName)) {
                        continue;
                    }

                    let targets = crateAliases.get(aliasName);
                    if (targets === undefined) {
                        targets = [];
                        crateAliases.set(aliasName, targets);
                    }
                    for (const localIndex of aliases[aliasName]) {
                        targets.push(localIndex + firstItemIndex);
                    }
                }
            }
        }
        return searchWords;
    }

    /**
     * Callback for when the search form is submitted: cancels any pending
     * delayed search and runs the search right away.
     *
     * @param {Event} [e] - The event that triggered this call, if any
     */
    function onSearchSubmit(e) {
        // `e` is documented as optional, so only cancel the default action (the
        // form submission) when an event was actually passed.
        if (e) {
            e.preventDefault();
        }
        searchState.clearInputTimeout();
        search();
    }

    /**
     * Show the search results again when the search input is not empty and the
     * results are not currently displayed. The URL (when the history API is
     * available) and the document title are updated to match the search.
     *
     * Does nothing when there is no search input.
     */
    function putBackSearch() {
        const input = searchState.input;
        if (!input || input.value === "" || searchState.isDisplayed()) {
            return;
        }
        searchState.showResults();
        if (browserSupportsHistoryApi()) {
            const url = buildUrl(input.value, getFilterCrates());
            history.replaceState(null, "", url);
        }
        document.title = searchState.title;
    }

    /**
     * Attach every search-related event handler: search-as-you-type on the
     * input, form submission, change/paste handling, arrow-key navigation in
     * the results, focus/blur behaviour of the input, and synchronization with
     * the browser history (`popstate`, `pageshow`).
     */
    function registerSearchEvents() {
        const initialParams = searchState.getQueryStringParams();
        const input = searchState.input;

        // Seed the search bar from the `search` query-string parameter, but
        // only while the bar is still empty. This avoids the obnoxious issue
        // where you start typing a search, the index finishes loading, and
        // suddenly your search is gone!
        if (input.value === "") {
            input.value = initialParams.search || "";
        }

        // Restart the 500ms timer on every edit; hide the results right away
        // once the input has been emptied.
        function scheduleSearch() {
            searchState.clearInputTimeout();
            if (searchState.input.value.length > 0) {
                searchState.timeout = setTimeout(search, 500);
            } else {
                searchState.hideResults();
            }
        }
        input.onkeyup = scheduleSearch;
        input.oninput = scheduleSearch;
        document.getElementsByClassName("search-form")[0].onsubmit = onSearchSubmit;

        // Shared by "change" and "paste".
        const searchOnChangeOrPaste = e => {
            // When the target is not the focused element the event comes from
            // a blur, and there is nothing to do.
            if (e.target === document.activeElement) {
                // Do NOT e.preventDefault() here. It will prevent pasting.
                searchState.clearInputTimeout();
                // A zero timeout is needed because, while this handler runs,
                // the pasted content is not in the input field yet. It should
                // make no difference for "change".
                setTimeout(search, 0);
            }
        };
        input.onchange = searchOnChangeOrPaste;
        input.onpaste = searchOnChangeOrPaste;

        searchState.outputElement().addEventListener("keydown", e => {
            // Only unmodified keystrokes are handled, so that shortcuts such as
            // alt-left / alt-right (history navigation) keep working.
            if (e.altKey || e.ctrlKey || e.shiftKey || e.metaKey) {
                return;
            }
            switch (e.which) {
                case 38: { // up: previous result, or the search box from the top
                    const above = document.activeElement.previousElementSibling;
                    if (above) {
                        above.focus();
                    } else {
                        searchState.focus();
                    }
                    break;
                }
                case 40: { // down: next result, scrolling it into view if needed
                    const below = document.activeElement.nextElementSibling;
                    if (below) {
                        below.focus();
                    }
                    const box = document.activeElement.getBoundingClientRect();
                    if (window.innerHeight - box.bottom < box.height) {
                        window.scrollBy(0, box.height);
                    }
                    break;
                }
                case 37: // left
                    nextTab(-1);
                    break;
                case 39: // right
                    nextTab(1);
                    break;
                default:
                    // Any other key is left to the browser.
                    return;
            }
            e.preventDefault();
        });

        // Pressing "down" in the search box jumps into the results.
        input.addEventListener("keydown", e => {
            if (e.which !== 40) {
                return;
            }
            focusSearchResult();
            e.preventDefault();
        });

        input.addEventListener("focus", () => putBackSearch());

        input.addEventListener("blur", () => {
            const field = searchState.input;
            field.placeholder = field.origPlaceholder;
        });

        // Push and pop states are used to add search results to the browser
        // history.
        if (browserSupportsHistoryApi()) {
            // Remember the current <title> so it can be restored later.
            const previousTitle = document.title;

            window.addEventListener("popstate", e => {
                const urlParams = searchState.getQueryStringParams();
                // The History API ignores the title parameter, so the title
                // has to be reverted by hand.
                document.title = previousTitle;
                // Browsing forward to search results repeats the previous
                // search; drop the cached results so that search really runs.
                currentResults = null;

                // Mirror the query string into the search bar. An absent or
                // empty term empties the bar, which lets you really go back to
                // a previous state with nothing in it.
                const query = urlParams.search;
                const hasQuery = query && query.length > 0;
                if (!hasQuery) {
                    searchState.input.value = "";
                    // Coming back from search results: the main page
                    // visibility must be reset.
                    searchState.hideResults();
                    return;
                }
                searchState.input.value = query;
                // Some browsers fire "onpopstate" for every page load
                // (Chrome), while others fire the event only when actually
                // popping a state (Firefox), which is why search() is
                // called both here and at the end of the startSearch()
                // function.
                e.preventDefault();
                search();
            });
        }

        // Firefox workaround: navigating to a search result with the keyboard,
        // hitting enter, and then hitting back would land on the doc page
        // instead of the search that should overlay it. The cause was an
        // interaction between the back-forward cache and the handlers that keep
        // the URL and the search input in sync, so a small amount of re-init is
        // done on page show.
        window.onpageshow = () => {
            const termFromUrl = searchState.getQueryStringParams().search;
            if (searchState.input.value === "" && termFromUrl) {
                searchState.input.value = termFromUrl;
            }
            search();
        };
    }

    /**
     * Handler for a change of the crate filter: drops any cached results and
     * re-runs the search with `search(true)`.
     *
     * @param {Event} ev - The event; `ev.target.value` is the selected entry.
     */
    function updateCrate(ev) {
        const allCratesSelected = ev.target.value === "all crates";
        if (allCratesSelected) {
            // The filter has to be removed from the URL as well, otherwise the
            // search would pick it up again from there.
            const trimmedQuery = searchState.input.value.trim();
            const unfilteredUrl = buildUrl(trimmedQuery, null);
            updateSearchHistory(unfilteredUrl);
        }
        // If you "cut" the text from the search input, change the crate filter,
        // and then paste the text back, the old results would be reused without
        // the new filter. Discarding the previous results prevents that.
        currentResults = null;
        search(true);
    }

    /**
     * Result of `buildIndex(rawSearchIndex)`; this is also the value returned
     * to the caller at the end of this function.
     *
     *  @type {Array<string>}
     */
    const searchWords = buildIndex(rawSearchIndex);
    // Event wiring needs the DOM, so it only happens when a `window` exists.
    if (typeof window !== "undefined") {
        registerSearchEvents();
        // If there's a search term in the URL, execute the search now.
        if (window.searchState.getQueryStringParams().search) {
            search();
        }
    }

    // When an `exports` object exists, publish the entry points on it.
    // NOTE(review): presumably this is the Node-based test harness path; confirm.
    if (typeof exports !== "undefined") {
        exports.initSearch = initSearch;
        exports.execQuery = execQuery;
        exports.parseQuery = parseQuery;
    }
    return searchWords;
}

// Bootstrap: decide how `initSearch` gets run depending on the environment.
if (typeof window === "undefined") {
    // No `window`: running in Node, not a browser. Call initSearch with an
    // empty index just to produce the exports.
    initSearch({});
} else {
    // Browser: expose initSearch on `window`, and run it immediately when
    // `window.searchIndex` has already been defined.
    window.initSearch = initSearch;
    const loadedIndex = window.searchIndex;
    if (loadedIndex !== undefined) {
        initSearch(loadedIndex);
    }
}


})();
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								/* global addClass, getNakedUrl, getSettingValue */
 								/* global onEachLazy, removeClass, searchState, browserSupportsHistoryApi, exports */
-												Fix eslint errors

											
										
										
											2021-05-14 13:56:15 +02:00
-												Use "strict" mode in JS scripts

											
										
										
											2022-05-02 14:32:56 +02:00
+								"use strict";
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								// polyfill
 								// https://developer.mozilla.org/en-US/docs/Web/JavaScript/Reference/Global_Objects/Array/toSpliced
 								if (!Array.prototype.toSpliced) {
 								    // Can't use arrow functions, because we want `this`
 								    Array.prototype.toSpliced = function() {
 								        const me = this.slice();
 								        Array.prototype.splice.apply(me, arguments);
 								        return me;
 								    };
 								}
-												Use "strict" mode in JS scripts

											
										
										
											2022-05-02 14:32:56 +02:00
+								(function() {
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								// This mapping table should match the discriminants of
-												rustdoc: discr. required+provided assoc consts+tys

											
										
										
											2022-03-29 19:30:54 +02:00
+								// `rustdoc::formats::item_type::ItemType` type in Rust.
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								const itemTypes = [
-												rustdoc-search: make primitives and keywords less special

The search sorting code already sorts by item type discriminant,
putting things with smaller discriminants first. There was
also a special case for sorting keywords and primitives earlier,
and this commit removes it by giving them lower discriminants.

The sorting code has another criteria where items with descriptions
appear earlier than items without, and that criteria has higher
priority than the item type. This shouldn't matter, though,
because primitives and keywords normally only appear in the
standard library, and it always gives them descriptions.

											
										
										
											2023-11-20 13:37:57 -07:00
+								    "keyword",
 								    "primitive",
-												Fix indent of itemTypes in search.js

											
										
										
											2021-12-08 17:31:56 +01:00
+								    "mod",
 								    "externcrate",
 								    "import",
-												rustdoc-search: make primitives and keywords less special

The search sorting code already sorts by item type discriminant,
putting things with smaller discriminants first. There was
also a special case for sorting keywords and primitives earlier,
and this commit removes it by giving them lower discriminants.

The sorting code has another criteria where items with descriptions
appear earlier than items without, and that criteria has higher
priority than the item type. This shouldn't matter, though,
because primitives and keywords normally only appear in the
standard library, and it always gives them descriptions.

											
										
										
											2023-11-20 13:37:57 -07:00
+								    "struct", // 5
-												Fix indent of itemTypes in search.js

											
										
										
											2021-12-08 17:31:56 +01:00
+								    "enum",
-												rustdoc-search: make primitives and keywords less special

The search sorting code already sorts by item type discriminant,
putting things with smaller discriminants first. There was
also a special case for sorting keywords and primitives earlier,
and this commit removes it by giving them lower discriminants.

The sorting code has another criteria where items with descriptions
appear earlier than items without, and that criteria has higher
priority than the item type. This shouldn't matter, though,
because primitives and keywords normally only appear in the
standard library, and it always gives them descriptions.

											
										
										
											2023-11-20 13:37:57 -07:00
+								    "fn",
-												Fix indent of itemTypes in search.js

											
										
										
											2021-12-08 17:31:56 +01:00
+								    "type",
 								    "static",
-												rustdoc-search: make primitives and keywords less special

The search sorting code already sorts by item type discriminant,
putting things with smaller discriminants first. There was
also a special case for sorting keywords and primitives earlier,
and this commit removes it by giving them lower discriminants.

The sorting code has another criteria where items with descriptions
appear earlier than items without, and that criteria has higher
priority than the item type. This shouldn't matter, though,
because primitives and keywords normally only appear in the
standard library, and it always gives them descriptions.

											
										
										
											2023-11-20 13:37:57 -07:00
+								    "trait", // 10
-												Fix indent of itemTypes in search.js

											
										
										
											2021-12-08 17:31:56 +01:00
+								    "impl",
-												rustdoc-search: make primitives and keywords less special

The search sorting code already sorts by item type discriminant,
putting things with smaller discriminants first. There was
also a special case for sorting keywords and primitives earlier,
and this commit removes it by giving them lower discriminants.

The sorting code has another criteria where items with descriptions
appear earlier than items without, and that criteria has higher
priority than the item type. This shouldn't matter, though,
because primitives and keywords normally only appear in the
standard library, and it always gives them descriptions.

											
										
										
											2023-11-20 13:37:57 -07:00
+								    "tymethod",
-												Fix indent of itemTypes in search.js

											
										
										
											2021-12-08 17:31:56 +01:00
+								    "method",
 								    "structfield",
-												rustdoc-search: make primitives and keywords less special

The search sorting code already sorts by item type discriminant,
putting things with smaller discriminants first. There was
also a special case for sorting keywords and primitives earlier,
and this commit removes it by giving them lower discriminants.

The sorting code has another criteria where items with descriptions
appear earlier than items without, and that criteria has higher
priority than the item type. This shouldn't matter, though,
because primitives and keywords normally only appear in the
standard library, and it always gives them descriptions.

											
										
										
											2023-11-20 13:37:57 -07:00
+								    "variant", // 15
-												Fix indent of itemTypes in search.js

											
										
										
											2021-12-08 17:31:56 +01:00
+								    "macro",
 								    "associatedtype",
 								    "constant",
 								    "associatedconstant",
-												rustdoc-search: make primitives and keywords less special

The search sorting code already sorts by item type discriminant,
putting things with smaller discriminants first. There was
also a special case for sorting keywords and primitives earlier,
and this commit removes it by giving them lower discriminants.

The sorting code has another criteria where items with descriptions
appear earlier than items without, and that criteria has higher
priority than the item type. This shouldn't matter, though,
because primitives and keywords normally only appear in the
standard library, and it always gives them descriptions.

											
										
										
											2023-11-20 13:37:57 -07:00
+								    "union", // 20
 								    "foreigntype",
-												Fix indent of itemTypes in search.js

											
										
										
											2021-12-08 17:31:56 +01:00
+								    "existential",
 								    "attr",
 								    "derive",
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								    "traitalias", // 25
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								    "generic",
-												Fix indent of itemTypes in search.js

											
										
										
											2021-12-08 17:31:56 +01:00
+								];
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												Add search result item types after their name

											
										
										
											2023-04-22 16:00:20 +02:00
+								const longItemTypes = [
-												rustdoc-search: make primitives and keywords less special

The search sorting code already sorts by item type discriminant,
putting things with smaller discriminants first. There was
also a special case for sorting keywords and primitives earlier,
and this commit removes it by giving them lower discriminants.

The sorting code has another criteria where items with descriptions
appear earlier than items without, and that criteria has higher
priority than the item type. This shouldn't matter, though,
because primitives and keywords normally only appear in the
standard library, and it always gives them descriptions.

											
										
										
											2023-11-20 13:37:57 -07:00
+								    "keyword",
 								    "primitive type",
-												Add search result item types after their name

											
										
										
											2023-04-22 16:00:20 +02:00
+								    "module",
 								    "extern crate",
 								    "re-export",
 								    "struct",
 								    "enum",
 								    "function",
 								    "type alias",
 								    "static",
 								    "trait",
 								    "",
 								    "trait method",
 								    "method",
 								    "struct field",
 								    "enum variant",
 								    "macro",
-												Abbreviate long typenames so they don't get wrapped in results

											
										
										
											2023-06-23 09:51:53 -07:00
+								    "assoc type",
-												Add search result item types after their name

											
										
										
											2023-04-22 16:00:20 +02:00
+								    "constant",
-												Abbreviate long typenames so they don't get wrapped in results

											
										
										
											2023-06-23 09:51:53 -07:00
+								    "assoc const",
-												Add search result item types after their name

											
										
										
											2023-04-22 16:00:20 +02:00
+								    "union",
 								    "foreign type",
 								    "existential type",
 								    "attribute macro",
 								    "derive macro",
 								    "trait alias",
 								];
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								// used for special search precedence
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								const TY_GENERIC = itemTypes.indexOf("generic");
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								const ROOT_PATH = typeof window !== "undefined" ? window.rootPath : "../";
 								function hasOwnPropertyRustdoc(obj, property) {
 								    return Object.prototype.hasOwnProperty.call(obj, property);
 								}
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								// In the search display, allows to switch between tabs.
 								function printTab(nb) {
-												rustdoc: fix keyboard shortcuts and console log on search page

											
										
										
											2022-05-02 15:50:01 -07:00
+								    let iter = 0;
 								    let foundCurrentTab = false;
 								    let foundCurrentResultSet = false;
-												rustdoc: use a more evocative name for CSS/JS `#titles`

This renames the ID, which is only used in search results, to
`#search-tabs`. Also changes the `.count` to a span, so it doesn't need its
display mode to be overridden.

											
										
										
											2022-12-22 15:52:34 -07:00
+								    onEachLazy(document.getElementById("search-tabs").childNodes, elem => {
-												rustdoc: fix keyboard shortcuts and console log on search page

											
										
										
											2022-05-02 15:50:01 -07:00
+								        if (nb === iter) {
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            addClass(elem, "selected");
-												rustdoc: fix keyboard shortcuts and console log on search page

											
										
										
											2022-05-02 15:50:01 -07:00
+								            foundCurrentTab = true;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        } else {
 								            removeClass(elem, "selected");
 								        }
-												rustdoc: fix keyboard shortcuts and console log on search page

											
										
										
											2022-05-02 15:50:01 -07:00
+								        iter += 1;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								    });
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								    const isTypeSearch = (nb > 0 || iter === 1);
-												rustdoc: fix keyboard shortcuts and console log on search page

											
										
										
											2022-05-02 15:50:01 -07:00
+								    iter = 0;
-												Move callback to the () => {} syntax.

Fix lint

Fix main.js

Restore anonymous functions

Fix

Fix more

											
										
										
											2022-05-03 12:03:17 +08:00
+								    onEachLazy(document.getElementById("results").childNodes, elem => {
-												rustdoc: fix keyboard shortcuts and console log on search page

											
										
										
											2022-05-02 15:50:01 -07:00
+								        if (nb === iter) {
-												rustdoc: use focus for search navigation

Rather than keeping track of highlighted element inside the JS, take
advantage of `.focus()` and the :focus CSS pseudo-class.

This required wrapping each row of results in one big <a> tag (because
anchors can be focused, but table rows cannot). That in turn required
moving from a table layout to a div layout with float.

This makes it so Ctrl+Enter opens links in new tabs, and using the arrow
keys to navigate off the bottom of the page scrolls the rest of the page
into view. It also simplifies the keyboard event handling. It eliminates
the need for click handlers on the search results, and for tracking
mouse movements.

This changes the UI treatment of mouse hovering. A hovered element now
gets a light grey background, but does not change the focused element.
It's possible to have two highlighted search results: one that is
focused (via keyboard) and one that is hovered (via mouse). Pressing
enter will activate the focused link; clicking will activate the hovered
link. This matches up with how Firefox and Chrome handle suggestions in
their URL bar, and avoids stray mouse movements changing the focus.

Selecting tabs is now done with left/right arrows while any search
result is focused. The visibility of results on each search tab is
controlled with the "active" class, rather than by setting display: none
directly. Note that the old code kept track of highlighted search
element when tabbing back and forth. The new code doesn't.

											
										
										
											2021-05-09 12:56:21 -07:00
+								            addClass(elem, "active");
-												rustdoc: fix keyboard shortcuts and console log on search page

											
										
										
											2022-05-02 15:50:01 -07:00
+								            foundCurrentResultSet = true;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        } else {
-												rustdoc: use focus for search navigation

Rather than keeping track of highlighted element inside the JS, take
advantage of `.focus()` and the :focus CSS pseudo-class.

This required wrapping each row of results in one big <a> tag (because
anchors can be focused, but table rows cannot). That in turn required
moving from a table layout to a div layout with float.

This makes it so Ctrl+Enter opens links in new tabs, and using the arrow
keys to navigate off the bottom of the page scrolls the rest of the page
into view. It also simplifies the keyboard event handling. It eliminates
the need for click handlers on the search results, and for tracking
mouse movements.

This changes the UI treatment of mouse hovering. A hovered element now
gets a light grey background, but does not change the focused element.
It's possible to have two highlighted search results: one that is
focused (via keyboard) and one that is hovered (via mouse). Pressing
enter will activate the focused link; clicking will activate the hovered
link. This matches up with how Firefox and Chrome handle suggestions in
their URL bar, and avoids stray mouse movements changing the focus.

Selecting tabs is now done with left/right arrows while any search
result is focused. The visibility of results on each search tab is
controlled with the "active" class, rather than by setting display: none
directly. Note that the old code kept track of highlighted search
element when tabbing back and forth. The new code doesn't.

											
										
										
											2021-05-09 12:56:21 -07:00
+								            removeClass(elem, "active");
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        }
-												rustdoc: fix keyboard shortcuts and console log on search page

											
										
										
											2022-05-02 15:50:01 -07:00
+								        iter += 1;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								    });
-												rustdoc: fix keyboard shortcuts and console log on search page

											
										
										
											2022-05-02 15:50:01 -07:00
+								    if (foundCurrentTab && foundCurrentResultSet) {
 								        searchState.currentTab = nb;
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								        // Corrections only kick in on type-based searches.
 								        const correctionsElem = document.getElementsByClassName("search-corrections");
 								        if (isTypeSearch) {
 								            removeClass(correctionsElem[0], "hidden");
 								        } else {
 								            addClass(correctionsElem[0], "hidden");
 								        }
-												Add "eqeqeq" eslint rule

											
										
										
											2022-05-27 22:30:19 +02:00
+								    } else if (nb !== 0) {
-												rustdoc: fix keyboard shortcuts and console log on search page

											
										
										
											2022-05-02 15:50:01 -07:00
+								        printTab(0);
 								    }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								}
 								/**
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								 * The [edit distance] is a metric for measuring the difference between two strings.
 								 *
 								 * [edit distance]: https://en.wikipedia.org/wiki/Edit_distance
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								 */
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
 								/*
 								 * This function was translated, mostly line-for-line, from
 								 * https://github.com/rust-lang/rust/blob/ff4b772f805ec1e/compiler/rustc_span/src/edit_distance.rs
 								 *
 								 * The current implementation is the restricted Damerau-Levenshtein algorithm. It is restricted
 								 * because it does not permit modifying characters that have already been transposed. The specific
 								 * algorithm should not matter to the caller of the methods, which is why it is not noted in the
 								 * documentation.
 								 */
-												rustdoc: collapse edit distance state into an object

											
										
										
											2023-03-11 20:36:43 -07:00
+								const editDistanceState = {
 								    current: [],
 								    prev: [],
 								    prevPrev: [],
 								    calculate: function calculate(a, b, limit) {
 								        // Ensure that `b` is the shorter string, minimizing memory use.
 								        if (a.length < b.length) {
 								            const aTmp = a;
 								            a = b;
 								            b = aTmp;
 								        }
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
-												rustdoc: collapse edit distance state into an object

											
										
										
											2023-03-11 20:36:43 -07:00
+								        const minDist = a.length - b.length;
 								        // If we know the limit will be exceeded, we can return early.
 								        if (minDist > limit) {
 								            return limit + 1;
 								        }
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
-												rustdoc: collapse edit distance state into an object

											
										
										
											2023-03-11 20:36:43 -07:00
+								        // Strip common prefix.
 								        // We know that `b` is the shorter string, so we don't need to check
 								        // `a.length`.
 								        while (b.length > 0 && b[0] === a[0]) {
 								            a = a.substring(1);
 								            b = b.substring(1);
 								        }
 								        // Strip common suffix.
 								        while (b.length > 0 && b[b.length - 1] === a[a.length - 1]) {
 								            a = a.substring(0, a.length - 1);
 								            b = b.substring(0, b.length - 1);
 								        }
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
-												rustdoc: collapse edit distance state into an object

											
										
										
											2023-03-11 20:36:43 -07:00
+								        // If either string is empty, the distance is the length of the other.
 								        // We know that `b` is the shorter string, so we don't need to check `a`.
 								        if (b.length === 0) {
 								            return minDist;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        }
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
-												rustdoc: collapse edit distance state into an object

											
										
										
											2023-03-11 20:36:43 -07:00
+								        const aLength = a.length;
 								        const bLength = b.length;
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
-												rustdoc: collapse edit distance state into an object

											
										
										
											2023-03-11 20:36:43 -07:00
+								        for (let i = 0; i <= bLength; ++i) {
 								            this.current[i] = 0;
 								            this.prev[i] = i;
 								            this.prevPrev[i] = Number.MAX_VALUE;
 								        }
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
-												rustdoc: collapse edit distance state into an object

											
										
										
											2023-03-11 20:36:43 -07:00
+								        // row by row
 								        for (let i = 1; i <= aLength; ++i) {
 								            this.current[0] = i;
 								            const aIdx = i - 1;
 								            // column by column
 								            for (let j = 1; j <= bLength; ++j) {
 								                const bIdx = j - 1;
 								                // There is no cost to substitute a character with itself.
 								                const substitutionCost = a[aIdx] === b[bIdx] ? 0 : 1;
 								                this.current[j] = Math.min(
 								                    // deletion
 								                    this.prev[j] + 1,
 								                    // insertion
 								                    this.current[j - 1] + 1,
 								                    // substitution
 								                    this.prev[j - 1] + substitutionCost
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								                );
-												rustdoc: collapse edit distance state into an object

											
										
										
											2023-03-11 20:36:43 -07:00
 								                if ((i > 1) && (j > 1) && (a[aIdx] === b[bIdx - 1]) && (a[aIdx - 1] === b[bIdx])) {
 								                    // transposition
 								                    this.current[j] = Math.min(
 								                        this.current[j],
 								                        this.prevPrev[j - 2] + 1
 								                    );
 								                }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            }
-												rustdoc: collapse edit distance state into an object

											
										
										
											2023-03-11 20:36:43 -07:00
 								            // Rotate the buffers, reusing the memory
 								            const prevPrevTmp = this.prevPrev;
 								            this.prevPrev = this.prev;
 								            this.prev = this.current;
 								            this.current = prevPrevTmp;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        }
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
-												rustdoc: collapse edit distance state into an object

											
										
										
											2023-03-11 20:36:43 -07:00
+								        // `prev` because we already rotated the buffers.
 								        const distance = this.prev[bLength];
 								        return distance <= limit ? distance : (limit + 1);
 								    },
 								};
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
-												rustdoc: collapse edit distance state into an object

											
										
										
											2023-03-11 20:36:43 -07:00
+								function editDistance(a, b, limit) {
 								    return editDistanceState.calculate(a, b, limit);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								}
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								function initSearch(rawSearchIndex) {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								    const MAX_RESULTS = 200;
 								    const NO_TYPE_FILTER = -1;
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								    /**
 								     *  @type {Array<Row>}
 								     */
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								    let searchIndex;
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the functions name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Function signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|}{|F|}-\frac{1}{|F|} = \frac{|F|-1}{|F|}$, which grows with $|F|$. And,
  since the values are only being compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature).

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								    /**
 								     *  @type {Uint32Array}
 								     */
 								    let functionTypeFingerprint;
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								    let currentResults;
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								    /**
 								     * Map from normalized type names to integers. Used to make type search
 								     * more efficient.
 								     *
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								     * @type {Map<string, {id: integer, assocOnly: boolean}>}
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								     */
 								    let typeNameIdMap;
-												rustdoc-search: use ES6 `Map` for aliases instead of `Object`

											
										
										
											2023-04-13 16:30:02 -07:00
+								    const ALIASES = new Map();
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								    /**
 								     * Special type name IDs for searching by array.
 								     */
 								    let typeNameIdOfArray;
 								    /**
 								     * Special type name IDs for searching by slice.
 								     */
 								    let typeNameIdOfSlice;
 								    /**
 								     * Special type name IDs for searching by both array and slice (`[]` syntax).
 								     */
 								    let typeNameIdOfArrayOrSlice;
 								    /**
 								     * Add an item to the type Name->ID map, or, if one already exists, use it.
-												rustdoc-search: `null`, not `-1`, for missing id

This allows us to use negative numbers for other purposes.

											
										
										
											2023-06-15 13:55:45 -07:00
+								     * Returns the number. If name is "" or null, return null (pure generic).
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								     *
 								     * This is effectively string interning, so that function matching can be
 								     * done more quickly. Two types with the same name but different item kinds
 								     * get the same ID.
 								     *
 								     * @param {string} name
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								     * @param {boolean} isAssocType - True if this is an assoc type
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								     *
 								     * @returns {integer|null}
 								     */
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								    function buildTypeMapIndex(name, isAssocType) {
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								        if (name === "" || name === null) {
-												rustdoc-search: `null`, not `-1`, for missing id

This allows us to use negative numbers for other purposes.

											
										
										
											2023-06-15 13:55:45 -07:00
+								            return null;
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								        }
 								        if (typeNameIdMap.has(name)) {
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								            const obj = typeNameIdMap.get(name);
 								            obj.assocOnly = isAssocType && obj.assocOnly;
 								            return obj.id;
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								        } else {
 								            const id = typeNameIdMap.size;
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								            typeNameIdMap.set(name, {id, assocOnly: isAssocType});
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								            return id;
 								        }
 								    }
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    function isSpecialStartCharacter(c) {
-												Simplify parser syntax

											
										
										
											2022-02-09 20:56:37 +01:00
+								        return "<\"".indexOf(c) !== -1;
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    }
-												Make query parser more strict and improve display of errors

											
										
										
											2022-01-09 15:12:46 +01:00
+								    function isEndCharacter(c) {
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								        return "=,>-]".indexOf(c) !== -1;
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    }
-												Simplify parser syntax

											
										
										
											2022-02-09 20:56:37 +01:00
+								    function isErrorCharacter(c) {
 								        return "()".indexOf(c) !== -1;
 								    }
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    function itemTypeFromName(typename) {
-												Improve JS function itemTypeFromName code a bit

											
										
										
											2023-02-11 18:03:06 +01:00
+								        const index = itemTypes.findIndex(i => i === typename);
 								        if (index < 0) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								            throw ["Unknown type filter ", typename];
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        }
-												Improve JS function itemTypeFromName code a bit

											
										
										
											2023-02-11 18:03:06 +01:00
+								        return index;
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    }
 								    /**
 								     * If we encounter a `"`, then we try to extract the string from it until we find another `"`.
 								     *
 								     * This function will throw an error in the following cases:
 								     * * There is already another string element.
 								     * * We are parsing a generic argument.
 								     * * There is more than one element.
 								     * * There is no closing `"`.
 								     *
 								     * @param {ParsedQuery} query
 								     * @param {ParserState} parserState
 								     * @param {boolean} isInGenerics
 								     */
 								    function getStringElem(query, parserState, isInGenerics) {
 								        if (isInGenerics) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								            throw ["Unexpected ", "\"", " in generics"];
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        } else if (query.literalSearch) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								            throw ["Cannot have more than one literal search element"];
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								        } else if (parserState.totalElems - parserState.genericsElems > 0) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								            throw ["Cannot use literal search when there is more than one element"];
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        }
 								        parserState.pos += 1;
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const start = parserState.pos;
 								        const end = getIdentEndPosition(parserState);
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        if (parserState.pos >= parserState.length) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								            throw ["Unclosed ", "\""];
-												Parse idents the same way in both quote string elements and "normal" elements

											
										
										
											2022-04-16 16:33:42 +02:00
+								        } else if (parserState.userQuery[end] !== "\"") {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								            throw ["Unexpected ", parserState.userQuery[end], " in a string element"];
-												Fix some corner cases

											
										
										
											2022-04-17 01:43:26 +02:00
+								        } else if (start === end) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								            throw ["Cannot have empty string element"];
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        }
 								        // To skip the quote at the end.
 								        parserState.pos += 1;
 								        query.literalSearch = true;
 								    }
 								    /**
 								     * Returns `true` if the current parser position is starting with "::".
 								     *
 								     * @param {ParserState} parserState
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								     *
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     * @return {boolean}
 								     */
 								    function isPathStart(parserState) {
-												Add "eqeqeq" eslint rule

											
										
										
											2022-05-27 22:30:19 +02:00
+								        return parserState.userQuery.slice(parserState.pos, parserState.pos + 2) === "::";
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    }
 								    /**
 								     * Returns `true` if the current parser position is starting with "->".
 								     *
 								     * @param {ParserState} parserState
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								     *
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     * @return {boolean}
 								     */
 								    function isReturnArrow(parserState) {
-												Add "eqeqeq" eslint rule

											
										
										
											2022-05-27 22:30:19 +02:00
+								        return parserState.userQuery.slice(parserState.pos, parserState.pos + 2) === "->";
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    }
-												Add isIdentCharacter function to ensure that unexpected characters are handled correctly

											
										
										
											2022-03-23 17:26:32 +01:00
+								    /**
 								     * Returns `true` if the given `c` character is valid for an ident.
 								     *
 								     * @param {string} c
 								     *
 								     * @return {boolean}
 								     */
 								    function isIdentCharacter(c) {
 								        return (
-												Enforce quote rule for JS source code

											
										
										
											2022-05-07 20:18:23 +02:00
+								            c === "_" ||
 								            (c >= "0" && c <= "9") ||
 								            (c >= "a" && c <= "z") ||
 								            (c >= "A" && c <= "Z"));
-												Add isIdentCharacter function to ensure that unexpected characters are handled correctly

											
										
										
											2022-03-23 17:26:32 +01:00
+								    }
-												Handle separators in their own functions and fix missing handling of tabs

											
										
										
											2022-03-30 11:32:03 +02:00
+								    /**
 								     * Returns `true` if the given `c` character is a separator.
 								     *
 								     * @param {string} c
 								     *
 								     * @return {boolean}
 								     */
 								    function isSeparatorCharacter(c) {
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								        return c === "," || c === "=";
-												Add an extra check over filter type

											
										
										
											2022-04-17 12:05:31 +02:00
+								    }
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								/**
 								     * Returns `true` if the given `c` character is a path separator. For example
 								     * `:` in `a::b` or a whitespace in `a b`.
-												Add an extra check over filter type

											
										
										
											2022-04-17 12:05:31 +02:00
+								     *
 								     * @param {string} c
 								     *
 								     * @return {boolean}
 								     */
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								    function isPathSeparator(c) {
-												rustdoc-search: replace TAB/NL/LF with SP first

This way, most of the parsing code doesn't need to be designed to handle
it, since they should always be treated exactly the same anyhow.

											
										
										
											2023-11-29 10:54:49 -07:00
+								        return c === ":" || c === " ";
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								    }
 								    /**
 								     * Returns `true` if the previous character is `lookingFor`.
 								     *
 								     * @param {ParserState} parserState
 								     * @param {String} lookingFor
 								     *
 								     * @return {boolean}
 								     */
 								    function prevIs(parserState, lookingFor) {
 								        let pos = parserState.pos;
 								        while (pos > 0) {
 								            const c = parserState.userQuery[pos - 1];
 								            if (c === lookingFor) {
 								                return true;
-												rustdoc-search: replace TAB/NL/LF with SP first

This way, most of the parsing code doesn't need to be designed to handle
it, since they should always be treated exactly the same anyhow.

											
										
										
											2023-11-29 10:54:49 -07:00
+								            } else if (c !== " ") {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                break;
 								            }
 								            pos -= 1;
 								        }
 								        return false;
 								    }
 								    /**
 								     * Tells whether the element parsed most recently carries generics.
 								     *
 								     * This is the case when the final entry of `elems` has a non-empty `generics`
 								     * list, or when the character preceding the current parser position
 								     * (as determined by `prevIs`) is `>`.
 								     *
 								     * @param {Array<QueryElement>} elems
 								     * @param {ParserState} parserState
 								     *
 								     * @return {boolean}
 								     */
 								    function isLastElemGeneric(elems, parserState) {
 								        if (elems.length > 0) {
 								            const lastElem = elems[elems.length - 1];
 								            if (lastElem.generics.length > 0) {
 								                return true;
 								            }
 								        }
 								        return prevIs(parserState, ">");
 								    }
 								    /**
 								     * Increase current parser position until it doesn't find a whitespace anymore.
 								     *
 								     * @param {ParserState} parserState
 								     */
 								    function skipWhitespace(parserState) {
 								        while (parserState.pos < parserState.userQuery.length) {
 								            const c = parserState.userQuery[parserState.pos];
-												rustdoc-search: replace TAB/NL/LF with SP first

This way, most of the parsing code doesn't need to be designed to handle
it, since they should always be treated exactly the same anyhow.

											
										
										
											2023-11-29 10:54:49 -07:00
+								            if (c !== " ") {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                break;
 								            }
 								            parserState.pos += 1;
 								        }
-												Handle separators in their own functions and fix missing handling of tabs

											
										
										
											2022-03-30 11:32:03 +02:00
+								    }
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    /**
 								     * @param {ParsedQuery} query
 								     * @param {ParserState} parserState
 								     * @param {string} name                  - Name of the query element.
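 								     * @param {Array<QueryElement>} generics - List of generics of this query element.
 								     * @param {boolean} isInGenerics         - Whether the element is being created while
 								     *                                         parsing generics (it is then also counted
 								     *                                         in `parserState.genericsElems`).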
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								     *
 								     * @return {QueryElement}                - The newly created `QueryElement`.
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     */
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								    function createQueryElement(query, parserState, name, generics, isInGenerics) {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								        const path = name.trim();
 								        if (path.length === 0 && generics.length === 0) {
 								            throw ["Unexpected ", parserState.userQuery[parserState.pos]];
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        }
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								        if (query.literalSearch && parserState.totalElems - parserState.genericsElems > 0) {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								            throw ["Cannot have more than one element if you use quotes"];
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        }
-												rustdoc-search: search never type with `!`

This feature extends rustdoc to support the syntax that most users will
naturally attempt to use to search for diverging functions.
Part of #60485

It's already possible to do this search with `primitive:never`, but
that's not what the Rust language itself uses, so nobody will try it if
they aren't told or helped along.

											
										
										
											2023-06-12 14:56:54 -07:00
+								        const typeFilter = parserState.typeFilter;
 								        parserState.typeFilter = null;
 								        if (name === "!") {
 								            if (typeFilter !== null && typeFilter !== "primitive") {
 								                throw [
 								                    "Invalid search type: primitive never type ",
 								                    "!",
 								                    " and ",
 								                    typeFilter,
 								                    " both specified",
 								                ];
 								            }
 								            if (generics.length !== 0) {
 								                throw [
 								                    "Never type ",
 								                    "!",
 								                    " does not accept generic parameters",
 								                ];
 								            }
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            const bindingName = parserState.isInBinding;
 								            parserState.isInBinding = null;
-												rustdoc-search: search never type with `!`

This feature extends rustdoc to support the syntax that most users will
naturally attempt to use to search for diverging functions.
Part of #60485

It's already possible to do this search with `primitive:never`, but
that's not what the Rust language itself uses, so nobody will try it if
they aren't told or helped along.

											
										
										
											2023-06-12 14:56:54 -07:00
+								            return {
 								                name: "never",
-												rustdoc-search: `null`, not `-1`, for missing id

This allows us to use negative numbers for other purposes.

											
										
										
											2023-06-15 13:55:45 -07:00
+								                id: null,
-												rustdoc-search: search never type with `!`

This feature extends rustdoc to support the syntax that most users will
naturally attempt to use to search for diverging functions.
Part of #60485

It's already possible to do this search with `primitive:never`, but
that's not what the Rust language itself uses, so nobody will try it if
they aren't told or helped along.

											
										
										
											2023-06-12 14:56:54 -07:00
+								                fullPath: ["never"],
 								                pathWithoutLast: [],
 								                pathLast: "never",
 								                generics: [],
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                bindings: new Map(),
-												rustdoc-search: search never type with `!`

This feature extends rustdoc to support the syntax that most users will
naturally attempt to use to search for diverging functions.
Part of #60485

It's already possible to do this search with `primitive:never`, but
that's not what the Rust language itself uses, so nobody will try it if
they aren't told or helped along.

											
										
										
											2023-06-12 14:56:54 -07:00
+								                typeFilter: "primitive",
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                bindingName,
-												rustdoc-search: search never type with `!`

This feature extends rustdoc to support the syntax that most users will
naturally attempt to use to search for diverging functions.
Part of #60485

It's already possible to do this search with `primitive:never`, but
that's not what the Rust language itself uses, so nobody will try it if
they aren't told or helped along.

											
										
										
											2023-06-12 14:56:54 -07:00
+								            };
 								        }
-												rustdoc-search: allow `:: ` and ` ::`

This restriction made sense back when spaces separated function
parameters, but now that they separate path components, there's
no real ambiguity any more.

Additionally, the Rust language allows it.

											
										
										
											2023-11-29 10:11:37 -07:00
+								        const quadcolon = /::\s*::/.exec(path);
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								        if (path.startsWith("::")) {
 								            throw ["Paths cannot start with ", "::"];
 								        } else if (path.endsWith("::")) {
 								            throw ["Paths cannot end with ", "::"];
-												rustdoc-search: allow `:: ` and ` ::`

This restriction made sense back when spaces separated function
parameters, but now that they separate path components, there's
no real ambiguity any more.

Additionally, the Rust language allows it.

											
										
										
											2023-11-29 10:11:37 -07:00
+								        } else if (quadcolon !== null) {
 								            throw ["Unexpected ", quadcolon[0]];
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								        }
-												rustdoc-search: allow `:: ` and ` ::`

This restriction made sense back when spaces separated function
parameters, but now that they separate path components, there's
no real ambiguity any more.

Additionally, the Rust language allows it.

											
										
										
											2023-11-29 10:11:37 -07:00
+								        const pathSegments = path.split(/(?:::\s*)|(?:\s+(?:::\s*)?)/);
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								        // In case we only have something like `<p>`, there is no name.
 								        if (pathSegments.length === 0 || (pathSegments.length === 1 && pathSegments[0] === "")) {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								            if (generics.length > 0 || prevIs(parserState, ">")) {
 								                throw ["Found generics without a path"];
 								            } else {
 								                throw ["Unexpected ", parserState.userQuery[parserState.pos]];
 								            }
 								        }
 								        for (const [i, pathSegment] of pathSegments.entries()) {
 								            if (pathSegment === "!") {
 								                if (i !== 0) {
 								                    throw ["Never type ", "!", " is not associated item"];
 								                }
 								                pathSegments[i] = "never";
 								            }
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        }
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								        parserState.totalElems += 1;
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								        if (isInGenerics) {
 								            parserState.genericsElems += 1;
 								        }
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								        const bindingName = parserState.isInBinding;
 								        parserState.isInBinding = null;
 								        const bindings = new Map();
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								        return {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								            name: name.trim(),
-												rustdoc-search: `null`, not `-1`, for missing id

This allows us to use negative numbers for other purposes.

											
										
										
											2023-06-15 13:55:45 -07:00
+								            id: null,
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            fullPath: pathSegments,
 								            pathWithoutLast: pathSegments.slice(0, pathSegments.length - 1),
 								            pathLast: pathSegments[pathSegments.length - 1],
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            generics: generics.filter(gen => {
 								                // Syntactically, bindings are parsed as generics,
 								                // but the query engine treats them differently.
 								                if (gen.bindingName !== null) {
 								                    bindings.set(gen.bindingName.name, [gen, ...gen.bindingName.generics]);
 								                    return false;
 								                }
 								                return true;
 								            }),
 								            bindings,
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								            typeFilter,
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            bindingName,
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								        };
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    }
-												Parse idents the same way in both quote string elements and "normal" elements

											
										
										
											2022-04-16 16:33:42 +02:00
+								    /**
 								     * This function goes through all characters until it reaches an invalid ident character or the
 								     * end of the query. It returns the position of the last character of the ident.
 								     *
 								     * @param {ParserState} parserState
 								     *
 								     * @return {integer}
 								     */
 								    function getIdentEndPosition(parserState) {
-												rustdoc: search by macro when query ends with `!`

Related to #96399

											
										
										
											2023-02-16 15:32:38 -07:00
+								        const start = parserState.pos;
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        let end = parserState.pos;
-												rustdoc: search by macro when query ends with `!`

Related to #96399

											
										
										
											2023-02-16 15:32:38 -07:00
+								        let foundExclamation = -1;
-												Parse idents the same way in both quote string elements and "normal" elements

											
										
										
											2022-04-16 16:33:42 +02:00
+								        while (parserState.pos < parserState.length) {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const c = parserState.userQuery[parserState.pos];
-												Parse idents the same way in both quote string elements and "normal" elements

											
										
										
											2022-04-16 16:33:42 +02:00
+								            if (!isIdentCharacter(c)) {
-												Update rustdoc search parser to handle `!` correctly

											
										
										
											2022-04-26 13:58:23 +02:00
+								                if (c === "!") {
-												rustdoc: search by macro when query ends with `!`

Related to #96399

											
										
										
											2023-02-16 15:32:38 -07:00
+								                    if (foundExclamation !== -1) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                        throw ["Cannot have more than one ", "!", " in an ident"];
-												Update rustdoc search parser to handle `!` correctly

											
										
										
											2022-04-26 13:58:23 +02:00
+								                    } else if (parserState.pos + 1 < parserState.length &&
-												Add new eslint rule about brace style

											
										
										
											2022-05-14 13:50:52 +02:00
+								                        isIdentCharacter(parserState.userQuery[parserState.pos + 1])
 								                    ) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                        throw ["Unexpected ", "!", ": it can only be at the end of an ident"];
-												Update rustdoc search parser to handle `!` correctly

											
										
										
											2022-04-26 13:58:23 +02:00
+								                    }
-												rustdoc: search by macro when query ends with `!`

Related to #96399

											
										
										
											2023-02-16 15:32:38 -07:00
+								                    foundExclamation = parserState.pos;
-												Update rustdoc search parser to handle `!` correctly

											
										
										
											2022-04-26 13:58:23 +02:00
+								                } else if (isErrorCharacter(c)) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                    throw ["Unexpected ", c];
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                } else if (isPathSeparator(c)) {
 								                    if (c === ":") {
 								                        if (!isPathStart(parserState)) {
 								                            break;
 								                        }
 								                        // Skip current ":".
 								                        parserState.pos += 1;
 								                    } else {
 								                        while (parserState.pos + 1 < parserState.length) {
 								                            const next_c = parserState.userQuery[parserState.pos + 1];
-												rustdoc-search: replace TAB/NL/LF with SP first

This way, most of the parsing code doesn't need to be designed to handle
it, since they should always be treated exactly the same anyhow.

											
										
										
											2023-11-29 10:54:49 -07:00
+								                            if (next_c !== " ") {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                                break;
 								                            }
 								                            parserState.pos += 1;
 								                        }
-												Parse idents the same way in both quote string elements and "normal" elements

											
										
										
											2022-04-16 16:33:42 +02:00
+								                    }
-												rustdoc: search by macro when query ends with `!`

Related to #96399

											
										
										
											2023-02-16 15:32:38 -07:00
+								                    if (foundExclamation !== -1) {
-												rustdoc-search: search never type with `!`

This feature extends rustdoc to support the syntax that most users will
naturally attempt to use to search for diverging functions.
Part of #60485

It's already possible to do this search with `primitive:never`, but
that's not what the Rust language itself uses, so nobody will try it if
they aren't told or helped along.

											
										
										
											2023-06-12 14:56:54 -07:00
+								                        if (foundExclamation !== start &&
 								                            isIdentCharacter(parserState.userQuery[foundExclamation - 1])
 								                        ) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                            throw ["Cannot have associated items in macros"];
-												rustdoc: search by macro when query ends with `!`

Related to #96399

											
										
										
											2023-02-16 15:32:38 -07:00
+								                        } else {
 								                            // while the never type has no associated macros, we still
 								                            // can parse a path like that
 								                            foundExclamation = -1;
 								                        }
 								                    }
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                } else if (
 								                    c === "[" ||
-												rustdoc-search: clean up parser

The `c === "="` was redundant when `isSeparatorCharacter` already
checks that.

The `isStopCharacter` and `isEndCharacter` functions
did exactly the same thing and have synonymous names.
There doesn't seem much point in having both.

											
										
										
											2023-12-11 22:24:44 -07:00
+								                    isEndCharacter(c) ||
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                    isSpecialStartCharacter(c) ||
 								                    isSeparatorCharacter(c)
 								                ) {
 								                    break;
-												Parse idents the same way in both quote string elements and "normal" elements

											
										
										
											2022-04-16 16:33:42 +02:00
+								                } else {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                    throw ["Unexpected ", c];
-												Parse idents the same way in both quote string elements and "normal" elements

											
										
										
											2022-04-16 16:33:42 +02:00
+								                }
 								            }
 								            parserState.pos += 1;
 								            end = parserState.pos;
 								        }
-												rustdoc: search by macro when query ends with `!`

Related to #96399

											
										
										
											2023-02-16 15:32:38 -07:00
+								        // if start == end - 1, we got the never type
-												rustdoc-search: search never type with `!`

This feature extends rustdoc to support the syntax that most users will
naturally attempt to use to search for diverging functions.
Part of #60485

It's already possible to do this search with `primitive:never`, but
that's not what the Rust language itself uses, so nobody will try it if
they aren't told or helped along.

											
										
										
											2023-06-12 14:56:54 -07:00
+								        if (foundExclamation !== -1 &&
 								            foundExclamation !== start &&
 								            isIdentCharacter(parserState.userQuery[foundExclamation - 1])
 								        ) {
-												rustdoc: search by macro when query ends with `!`

Related to #96399

											
										
										
											2023-02-16 15:32:38 -07:00
+								            if (parserState.typeFilter === null) {
 								                parserState.typeFilter = "macro";
 								            } else if (parserState.typeFilter !== "macro") {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                throw [
 								                    "Invalid search type: macro ",
 								                    "!",
 								                    " and ",
 								                    parserState.typeFilter,
 								                    " both specified",
 								                ];
-												rustdoc: search by macro when query ends with `!`

Related to #96399

											
										
										
											2023-02-16 15:32:38 -07:00
+								            }
 								            end = foundExclamation;
 								        }
-												Parse idents the same way in both quote string elements and "normal" elements

											
										
										
											2022-04-16 16:33:42 +02:00
+								        return end;
 								    }
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    /**
 								     * @param {ParsedQuery} query
 								     * @param {ParserState} parserState
 								     * @param {Array<QueryElement>} elems - This is where the new {QueryElement} will be added.
 								     * @param {boolean} isInGenerics
 								     */
 								    function getNextElem(query, parserState, elems, isInGenerics) {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const generics = [];
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								        skipWhitespace(parserState);
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        let start = parserState.pos;
 								        let end;
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								        if (parserState.userQuery[parserState.pos] === "[") {
 								            parserState.pos += 1;
 								            getItemsBefore(query, parserState, generics, "]");
 								            const typeFilter = parserState.typeFilter;
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            const isInBinding = parserState.isInBinding;
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								            if (typeFilter !== null && typeFilter !== "primitive") {
 								                throw [
 								                    "Invalid search type: primitive ",
 								                    "[]",
 								                    " and ",
 								                    typeFilter,
 								                    " both specified",
 								                ];
 								            }
 								            parserState.typeFilter = null;
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            parserState.isInBinding = null;
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								            parserState.totalElems += 1;
 								            if (isInGenerics) {
 								                parserState.genericsElems += 1;
 								            }
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            for (const gen of generics) {
 								                if (gen.bindingName !== null) {
 								                    throw ["Type parameter ", "=", " cannot be within slice ", "[]"];
 								                }
 								            }
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								            elems.push({
 								                name: "[]",
-												rustdoc-search: `null`, not `-1`, for missing id

This allows us to use negative numbers for other purposes.

											
										
										
											2023-06-15 13:55:45 -07:00
+								                id: null,
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								                fullPath: ["[]"],
 								                pathWithoutLast: [],
 								                pathLast: "[]",
 								                generics,
 								                typeFilter: "primitive",
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                bindingName: isInBinding,
 								                bindings: new Map(),
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								            });
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        } else {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								            const isStringElem = parserState.userQuery[start] === "\"";
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								            // We handle the strings on their own mostly to make code easier to follow.
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								            if (isStringElem) {
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								                start += 1;
 								                getStringElem(query, parserState, isInGenerics);
 								                end = parserState.pos - 1;
 								            } else {
 								                end = getIdentEndPosition(parserState);
-												Simplify parser syntax

											
										
										
											2022-02-09 20:56:37 +01:00
+								            }
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								            if (parserState.pos < parserState.length &&
 								                parserState.userQuery[parserState.pos] === "<"
 								            ) {
 								                if (start >= end) {
 								                    throw ["Found generics without a path"];
 								                }
 								                parserState.pos += 1;
 								                getItemsBefore(query, parserState, generics, ">");
 								            }
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								            if (isStringElem) {
 								                skipWhitespace(parserState);
 								            }
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								            if (start >= end && generics.length === 0) {
 								                return;
 								            }
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            if (parserState.userQuery[parserState.pos] === "=") {
 								                if (parserState.isInBinding) {
 								                    throw ["Cannot write ", "=", " twice in a binding"];
 								                }
 								                if (!isInGenerics) {
 								                    throw ["Type parameter ", "=", " must be within generics list"];
 								                }
 								                const name = parserState.userQuery.slice(start, end).trim();
 								                if (name === "!") {
 								                    throw ["Type parameter ", "=", " key cannot be ", "!", " never type"];
 								                }
 								                if (name.includes("!")) {
 								                    throw ["Type parameter ", "=", " key cannot be ", "!", " macro"];
 								                }
 								                if (name.includes("::")) {
 								                    throw ["Type parameter ", "=", " key cannot contain ", "::", " path"];
 								                }
 								                if (name.includes(":")) {
 								                    throw ["Type parameter ", "=", " key cannot contain ", ":", " type"];
 								                }
 								                parserState.isInBinding = { name, generics };
 								            } else {
 								                elems.push(
 								                    createQueryElement(
 								                        query,
 								                        parserState,
 								                        parserState.userQuery.slice(start, end),
 								                        generics,
 								                        isInGenerics
 								                    )
 								                );
 								            }
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        }
 								    }
 								    /**
-												Improve documentation and add some explanations in the code

											
										
										
											2022-02-11 15:48:57 +01:00
+								     * This function parses the next query element until it finds `endChar`, calling `getNextElem`
 								     * to collect each element.
 								     *
 								     * If there is no `endChar`, this function will implicitly stop at the end without raising an
 								     * error.
 								     *
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     * @param {ParsedQuery} query
 								     * @param {ParserState} parserState
 								     * @param {Array<QueryElement>} elems - This is where the new {QueryElement} will be added.
-												Improve documentation and add some explanations in the code

											
										
										
											2022-02-11 15:48:57 +01:00
+								     * @param {string} endChar            - This function will stop when it'll encounter this
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     *                                      character.
 								     */
-												Improve documentation and add some explanations in the code

											
										
										
											2022-02-11 15:48:57 +01:00
+								    function getItemsBefore(query, parserState, elems, endChar) {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        let foundStopChar = true;
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								        let start = parserState.pos;
 								        // If this is a generic, keep the outer item's type filter around.
 								        const oldTypeFilter = parserState.typeFilter;
 								        parserState.typeFilter = null;
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								        const oldIsInBinding = parserState.isInBinding;
 								        parserState.isInBinding = null;
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								        let extra = "";
 								        if (endChar === ">") {
 								            extra = "<";
 								        } else if (endChar === "]") {
 								            extra = "[";
 								        } else if (endChar === "") {
 								            extra = "->";
 								        } else {
 								            extra = endChar;
 								        }
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        while (parserState.pos < parserState.length) {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const c = parserState.userQuery[parserState.pos];
-												Improve documentation and add some explanations in the code

											
										
										
											2022-02-11 15:48:57 +01:00
+								            if (c === endChar) {
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                if (parserState.isInBinding) {
 								                    throw ["Unexpected ", endChar, " after ", "="];
 								                }
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                break;
-												Handle separators in their own functions and fix missing handling of tabs

											
										
										
											2022-03-30 11:32:03 +02:00
+								            } else if (isSeparatorCharacter(c)) {
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                parserState.pos += 1;
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								                foundStopChar = true;
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                continue;
-												Make query parser more strict and improve display of errors

											
										
										
											2022-01-09 15:12:46 +01:00
+								            } else if (c === ":" && isPathStart(parserState)) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                throw ["Unexpected ", "::", ": paths cannot start with ", "::"];
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								            }  else if (c === ":") {
 								                if (parserState.typeFilter !== null) {
 								                    throw ["Unexpected ", ":"];
 								                }
 								                if (elems.length === 0) {
 								                    throw ["Expected type filter before ", ":"];
 								                } else if (query.literalSearch) {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                    throw ["Cannot use quotes on type filter"];
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								                }
 								                // The type filter doesn't count as an element since it's a modifier.
 								                const typeFilterElem = elems.pop();
 								                checkExtraTypeFilterCharacters(start, parserState);
 								                parserState.typeFilter = typeFilterElem.name;
 								                parserState.pos += 1;
 								                parserState.totalElems -= 1;
 								                query.literalSearch = false;
 								                foundStopChar = true;
 								                continue;
 								            } else if (isEndCharacter(c)) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                throw ["Unexpected ", c, " after ", extra];
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            }
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								            if (!foundStopChar) {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                let extra = [];
 								                if (isLastElemGeneric(query.elems, parserState)) {
 								                    extra = [" after ", ">"];
 								                } else if (prevIs(parserState, "\"")) {
 								                    throw ["Cannot have more than one element if you use quotes"];
 								                }
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								                if (endChar !== "") {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                    throw [
 								                        "Expected ",
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                        ",",
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                        ", ",
 								                        "=",
 								                        ", or ",
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                        endChar,
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                        ...extra,
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                        ", found ",
 								                        c,
 								                    ];
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								                }
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                throw [
 								                    "Expected ",
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                    ",",
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                    " or ",
 								                    "=",
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                    ...extra,
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                    ", found ",
 								                    c,
 								                ];
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								            }
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const posBefore = parserState.pos;
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								            start = parserState.pos;
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								            getNextElem(query, parserState, elems, endChar !== "");
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								            if (endChar !== "" && parserState.pos >= parserState.length) {
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								                throw ["Unclosed ", extra];
-												Emit an error for unclosed generic

											
										
										
											2023-03-02 14:28:06 +01:00
+								            }
-												Improve crate selection on rustdoc search results page

Resolves all of issue #93240

Reproduces a similar change as #99086, but with improvements

In particular, this PR includes:
* redesigning the crate-search selector so the background color matches its surroundings
* decrease the font of the dropdown menu to a reasonable size
* add a hover effect
* make the color of the arrow theme-dependent, using a surrounding div, with :after pseudo-element
  that can then be transformed using CSS filters to approximate the desired color
* fix the text "in" to match the title font
* remove the "for xyz" in the "Results for xyz in [All crates]" title when
  searching for search term "xyz"; you can already see what you're searching for
  as it's typed in the search bar!
* in line with #99086, handle super-long crate names appropriately without a long <select>
  element escaping the screen area; the improvement is that we also keep the title
  within a single line now; uses some flex layout shenanigans...
* the margins / paddings are adjusted so the selected label of the <select> fits within
  the rest of that title nicely; also some inconsistency in the way that Firefox renders
  a <select> with "appearance: none" (roughly 4px more padding left and right of the text
  than e.g. Chrome) is worked around, and it now produces a result that looks (essentially)
  identical to Chrome
* the color of the help menu and settings menu border in light theme is made to match with
  the color of the corresponding buttons, like they do (match) in the ayu theme
* the casing of "All crates" changes to "all crates"
* the new tests from #99086 are temporarily disabled, until they can be adapted later

											
										
										
											2022-07-03 20:10:19 +02:00
+								            // This case can be encountered if `getNextElem` encountered a "stop character" right
 								            // from the start. For example if you have `,,` or `<>`. In this case, we simply move up
 								            // the current position to continue the parsing.
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            if (posBefore === parserState.pos) {
 								                parserState.pos += 1;
 								            }
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								            foundStopChar = false;
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        }
-												Emit an error for unclosed generic

											
										
										
											2023-03-02 14:28:06 +01:00
+								        if (parserState.pos >= parserState.length && endChar !== "") {
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								            throw ["Unclosed ", extra];
-												Emit an error for unclosed generic

											
										
										
											2023-03-02 14:28:06 +01:00
+								        }
 								        // We are either at the end of the string or on the `endChar` character, let's move forward
-												Make query parser more strict and improve display of errors

											
										
										
											2022-01-09 15:12:46 +01:00
+								        // in any case.
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        parserState.pos += 1;
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
 								        parserState.typeFilter = oldTypeFilter;
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								        parserState.isInBinding = oldIsInBinding;
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    }
-												Add an extra check over filter type

											
										
										
											2022-04-17 12:05:31 +02:00
+								    /**
 								     * Checks that the type filter doesn't have unwanted characters like `<>` (which are ignored
 								     * if empty).
 								     *
 								     * @param {ParserState} parserState
 								     */
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								    function checkExtraTypeFilterCharacters(start, parserState) {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								        const query = parserState.userQuery.slice(start, parserState.pos).trim();
-												Add an extra check over filter type

											
										
										
											2022-04-17 12:05:31 +02:00
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								        for (const c in query) {
 								            if (!isIdentCharacter(query[c])) {
 								                throw [
 								                    "Unexpected ",
 								                    query[c],
 								                    " in type filter (before ",
 								                    ":",
 								                    ")",
 								                ];
-												Add an extra check over filter type

											
										
										
											2022-04-17 12:05:31 +02:00
+								            }
 								        }
 								    }
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    /**
-												Improve documentation and add some explanations in the code

											
										
										
											2022-02-11 15:48:57 +01:00
+								     * Parses the provided `query` input to fill `parserState`. If it encounters an error while
 								     * parsing `query`, it'll throw an error.
 								     *
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     * @param {ParsedQuery} query
 								     * @param {ParserState} parserState
 								     */
 								    function parseInput(query, parserState) {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        let foundStopChar = true;
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								        let start = parserState.pos;
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
 								        while (parserState.pos < parserState.length) {
-												Clean up JS files code a bit

											
										
										
											2023-02-26 16:26:59 +01:00
+								            const c = parserState.userQuery[parserState.pos];
-												rustdoc-search: clean up parser

The `c === "="` was redundant when `isSeparatorCharacter` already
checks that.

The `isStopCharacter` and `isEndCharacter` functions
did exactly the same thing and have synonymous names.
There doesn't seem to be much point in having both.

											
										
										
											2023-12-11 22:24:44 -07:00
+								            if (isEndCharacter(c)) {
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								                foundStopChar = true;
-												Handle separators in their own functions and fix missing handling of tabs

											
										
										
											2022-03-30 11:32:03 +02:00
+								                if (isSeparatorCharacter(c)) {
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                    parserState.pos += 1;
 								                    continue;
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								                } else if (c === "-" || c === ">") {
 								                    if (isReturnArrow(parserState)) {
 								                        break;
 								                    }
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                    throw ["Unexpected ", c, " (did you mean ", "->", "?)"];
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                }
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                throw ["Unexpected ", c];
-												Correctly handle single `:`

											
										
										
											2022-04-18 23:11:42 +02:00
+								            } else if (c === ":" && !isPathStart(parserState)) {
 								                if (parserState.typeFilter !== null) {
-												Fix eBNF and handling of whitespace characters when not in a path

											
										
										
											2023-06-13 14:01:01 +02:00
+								                    throw [
 								                        "Unexpected ",
 								                        ":",
 								                        " (expected path after type filter ",
 								                        parserState.typeFilter + ":",
 								                        ")",
 								                    ];
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                } else if (query.elems.length === 0) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                    throw ["Expected type filter before ", ":"];
-												Add an extra check over filter type

											
										
										
											2022-04-17 12:05:31 +02:00
+								                } else if (query.literalSearch) {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                    throw ["Cannot use quotes on type filter"];
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                }
 								                // The type filter doesn't count as an element since it's a modifier.
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								                const typeFilterElem = query.elems.pop();
 								                checkExtraTypeFilterCharacters(start, parserState);
 								                parserState.typeFilter = typeFilterElem.name;
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                parserState.pos += 1;
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								                parserState.totalElems -= 1;
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                query.literalSearch = false;
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								                foundStopChar = true;
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                continue;
-												rustdoc-search: replace TAB/NL/LF with SP first

This way, most of the parsing code doesn't need to be designed to handle
it, since they should always be treated exactly the same anyhow.

											
										
										
											2023-11-29 10:54:49 -07:00
+								            } else if (c === " ") {
-												Fix eBNF and handling of whitespace characters when not in a path

											
										
										
											2023-06-13 14:01:01 +02:00
+								                skipWhitespace(parserState);
 								                continue;
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            }
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								            if (!foundStopChar) {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                let extra = "";
 								                if (isLastElemGeneric(query.elems, parserState)) {
 								                    extra = [" after ", ">"];
 								                } else if (prevIs(parserState, "\"")) {
 								                    throw ["Cannot have more than one element if you use quotes"];
 								                }
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								                if (parserState.typeFilter !== null) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                    throw [
 								                        "Expected ",
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                        ",",
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                        " or ",
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                        "->",
 								                        ...extra,
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                        ", found ",
 								                        c,
 								                    ];
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								                }
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                throw [
 								                    "Expected ",
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                    ",",
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                    ", ",
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                    ":",
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                    " or ",
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                    "->",
 								                    ...extra,
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                    ", found ",
 								                    c,
 								                ];
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								            }
-												Clean up JS files code a bit

											
										
										
											2023-02-26 16:26:59 +01:00
+								            const before = query.elems.length;
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								            start = parserState.pos;
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            getNextElem(query, parserState, query.elems, false);
 								            if (query.elems.length === before) {
-												Correctly handle single `:`

											
										
										
											2022-04-18 23:11:42 +02:00
+								                // Nothing was added, weird... Let's increase the position to not remain stuck.
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                parserState.pos += 1;
 								            }
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								            foundStopChar = false;
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        }
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								        if (parserState.typeFilter !== null) {
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								            throw [
 								                "Unexpected ",
 								                ":",
 								                " (expected path after type filter ",
 								                parserState.typeFilter + ":",
 								                ")",
 								            ];
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								        }
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        while (parserState.pos < parserState.length) {
-												Simplify parser syntax

											
										
										
											2022-02-09 20:56:37 +01:00
+								            if (isReturnArrow(parserState)) {
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                parserState.pos += 2;
-												Use whitespace as path separator like double colon

											
										
										
											2023-06-12 13:23:38 +02:00
+								                skipWhitespace(parserState);
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                // Get returned elements.
 								                getItemsBefore(query, parserState, query.returned, "");
 								                // Nothing can come afterward!
-												Forbid rustdoc search query to end with ->

											
										
										
											2022-03-28 15:08:47 +02:00
+								                if (query.returned.length === 0) {
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                    throw ["Expected at least one item after ", "->"];
-												Forbid rustdoc search query to end with ->

											
										
										
											2022-03-28 15:08:47 +02:00
+								                }
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                break;
 								            } else {
 								                parserState.pos += 1;
 								            }
 								        }
 								    }
 								    /**
 								     * Takes the user search input and returns an empty `ParsedQuery`.
 								     *
 								     * @param {string} userQuery
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								     *
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     * @return {ParsedQuery}
 								     */
 								    function newParsedQuery(userQuery) {
 								        return {
 								            original: userQuery,
 								            userQuery: userQuery.toLowerCase(),
 								            elems: [],
 								            returned: [],
 								            // Total number of "top" elements (does not include generics).
 								            foundElems: 0,
-												rustdoc: bug fix for `-> option<t>`

											
										
										
											2023-08-05 11:22:21 -07:00
+								            // Total number of elements (includes generics).
 								            totalElems: 0,
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            literalSearch: false,
 								            error: null,
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								            correction: null,
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								            proposeCorrectionFrom: null,
 								            proposeCorrectionTo: null,
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the function's name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Function signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|}{|F|}-\frac{1}{|F|} = \frac{|F|-1}{|F|}$,
  which grows monotonically with $|F|$. And, since the values are only being
  compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature).

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								            // bloom filter build from type ids
 								            typeFingerprint: new Uint32Array(4),
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        };
 								    }
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
+								    /**
 								     * Build an URL with search parameters.
 								     *
 								     * @param {string} search            - The current search being performed.
 								     * @param {string|null} filterCrates - The current filtering crate (if any).
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								     *
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
+								     * @return {string}
 								     */
 								    function buildUrl(search, filterCrates) {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        let extra = "?search=" + encodeURIComponent(search);
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
 								        if (filterCrates !== null) {
 								            extra += "&filter-crate=" + encodeURIComponent(filterCrates);
 								        }
 								        return getNakedUrl() + extra + window.location.hash;
 								    }
 								    /**
 								     * Return the filtering crate or `null` if there is none.
 								     *
 								     * @return {string|null}
 								     */
 								    function getFilterCrates() {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const elem = document.getElementById("crate-search");
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
 								        if (elem &&
-												Improve crate selection on rustdoc search results page

Resolves all of issue #93240

Reproduces a similar change as #99086, but with improvements

In particular, this PR includes:
* redesigning the crate-search selector so the background color matches its surroundings
* decrease the font of the dropdown menu to a reasonable size
* add a hover effect
* make the color of the arrow theme-dependent, using a surrounding div, with :after pseudo-element
  that can then be transformed using CSS filters to approximate the desired color
* fix the text "in" to match the title font
* remove the "for xyz" in the "Results for xyz in [All crates]" title when
  searching for search term "xyz"; you can already see what you're searching for
  as it's typed in the search bar!
* in line with #99086, handle super-long crate names appropriately without a long <select>
  element escaping the screen area; the improvement is that we also keep the title
  within a single line now; uses some flex layout shenanigans...
* the margins / paddings are adjusted so the selected label of the <select> fits within
  the rest of that title nicely; also some inconsistency in the way that Firefox renders
  a <select> with "appearance: none" (roughly 4px more padding left and right of the text
  than e.g. Chrome) is worked around, and it now produces a result that looks (essentially)
  identical to Chrome
* the color of the help menu and settings menu border in light theme is made to match with
  the color of the corresponding buttons, like they do (match) in the ayu theme
* the casing of "All crates" changes to "all crates"
* the new tests from #99086 are temporarily disabled, until they can be adapted later

											
										
										
											2022-07-03 20:10:19 +02:00
+								            elem.value !== "all crates" &&
-												Add new eslint rule about brace style

											
										
										
											2022-05-14 13:50:52 +02:00
+								            hasOwnPropertyRustdoc(rawSearchIndex, elem.value)
 								        ) {
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
+								            return elem.value;
 								        }
 								        return null;
 								    }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								    /**
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     * Parses the query.
-												Add query syntax for the parser

											
										
										
											2022-01-02 19:12:28 +01:00
+								     *
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								     * The supported syntax by this parser is given in the rustdoc book chapter
 								     * /src/doc/rustdoc/src/read-documentation/search.md
-												Add query syntax for the parser

											
										
										
											2022-01-02 19:12:28 +01:00
+								     *
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								     * When adding new things to the parser, add them there, too!
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								     *
 								     * @param  {string} val     - The user query
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								     *
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								     * @return {ParsedQuery}    - The parsed query
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								     */
-												Improve naming of "val" field

											
										
										
											2022-01-03 16:43:30 +01:00
+								    function parseQuery(userQuery) {
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								        function convertTypeFilterOnElem(elem) {
 								            if (elem.typeFilter !== null) {
 								                let typeFilter = elem.typeFilter;
 								                if (typeFilter === "const") {
 								                    typeFilter = "constant";
 								                }
 								                elem.typeFilter = itemTypeFromName(typeFilter);
 								            } else {
 								                elem.typeFilter = NO_TYPE_FILTER;
 								            }
 								            for (const elem2 of elem.generics) {
 								                convertTypeFilterOnElem(elem2);
 								            }
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            for (const constraints of elem.bindings.values()) {
 								                for (const constraint of constraints) {
 								                    convertTypeFilterOnElem(constraint);
 								                }
 								            }
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								        }
-												rustdoc-search: replace TAB/NL/LF with SP first

This way, most of the parsing code doesn't need to be designed to handle
it, since they should always be treated exactly the same anyhow.

											
										
										
											2023-11-29 10:54:49 -07:00
+								        userQuery = userQuery.trim().replace(/\r|\n|\t/g, " ");
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const parserState = {
-												Improve naming of "val" field

											
										
										
											2022-01-03 16:43:30 +01:00
+								            length: userQuery.length,
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								            pos: 0,
-												Update search engine and parser to error when quotes are used on queries with more than one element.

											
										
										
											2022-01-03 14:11:54 +01:00
+								            // Total number of elements (includes generics).
 								            totalElems: 0,
-												Improve the BNF description a bit and fix some issues

											
										
										
											2022-03-28 16:14:00 +02:00
+								            genericsElems: 0,
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            typeFilter: null,
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            isInBinding: null,
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            userQuery: userQuery.toLowerCase(),
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								        };
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        let query = newParsedQuery(userQuery);
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
-												Update search engine and parser to error when quotes are used on queries with more than one element.

											
										
										
											2022-01-03 14:11:54 +01:00
+								        try {
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            parseInput(query, parserState);
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								            for (const elem of query.elems) {
 								                convertTypeFilterOnElem(elem);
 								            }
 								            for (const elem of query.returned) {
 								                convertTypeFilterOnElem(elem);
-												Make query parser more strict and improve display of errors

											
										
										
											2022-01-09 15:12:46 +01:00
+								            }
-												Update search engine and parser to error when quotes are used on queries with more than one element.

											
										
										
											2022-01-03 14:11:54 +01:00
+								        } catch (err) {
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            query = newParsedQuery(userQuery);
-												Put backtick content from rustdoc search errors into a <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								            query.error = err;
-												Update search engine and parser to error when quotes are used on queries with more than one element.

											
										
										
											2022-01-03 14:11:54 +01:00
+								            return query;
 								        }
 								        if (!query.literalSearch) {
 								            // If there is more than one element in the query, we switch to literalSearch in any
 								            // case.
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            query.literalSearch = parserState.totalElems > 1;
-												Update search engine and parser to error when quotes are used on queries with more than one element.

											
										
										
											2022-01-03 14:11:54 +01:00
+								        }
-												Simplify parser syntax

											
										
										
											2022-02-09 20:56:37 +01:00
+								        query.foundElems = query.elems.length + query.returned.length;
-												rustdoc: bug fix for `-> option<t>`

											
										
										
											2023-08-05 11:22:21 -07:00
+								        query.totalElems = parserState.totalElems;
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								        return query;
 								    }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												Update search engine and parser to error when quotes are used on queries with more than one element.

											
										
										
											2022-01-03 14:11:54 +01:00
+								    /**
 								     * Creates the query results.
 								     *
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     * @param {Array<Result>} results_in_args
 								     * @param {Array<Result>} results_returned
-												rustdoc-search: fix incorrect doc comment

											
										
										
											2023-04-14 13:32:44 -07:00
+								     * @param {Array<Result>} results_others
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     * @param {ParsedQuery} parsedQuery
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								     *
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     * @return {ResultsTable}
-												Update search engine and parser to error when quotes are used on queries with more than one element.

											
										
										
											2022-01-03 14:11:54 +01:00
+								     */
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    function createQueryResults(results_in_args, results_returned, results_others, parsedQuery) {
-												Update search engine and parser to error when quotes are used on queries with more than one element.

											
										
										
											2022-01-03 14:11:54 +01:00
+								        return {
 								            "in_args": results_in_args,
 								            "returned": results_returned,
 								            "others": results_others,
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            "query": parsedQuery,
-												Update search engine and parser to error when quotes are used on queries with more than one element.

											
										
										
											2022-01-03 14:11:54 +01:00
+								        };
 								    }
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								    /**
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     * Executes the parsed query and builds a {ResultsTable}.
-												Update search engine and parser to error when quotes are used on queries with more than one element.

											
										
										
											2022-01-03 14:11:54 +01:00
+								     *
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     * @param  {ParsedQuery} parsedQuery - The parsed user query
 								     * @param  {Object} searchWords      - The list of search words to query against
 								     * @param  {Object} [filterCrates]   - Crate to search in if defined
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								     * @param  {Object} [currentCrate]   - Current crate, to rank results from this crate higher
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								     *
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								     * @return {ResultsTable}
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								     */
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								    function execQuery(parsedQuery, searchWords, filterCrates, currentCrate) {
-												rustdoc-search: use ES6 Map for `Result` instead of Object

											
										
										
											2023-04-13 17:05:12 -07:00
+								        const results_others = new Map(), results_in_args = new Map(),
 								            results_returned = new Map();
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												rustdoc-search: use ES6 Map for `Result` instead of Object

											
										
										
											2023-04-13 17:05:12 -07:00
+								        /**
 								         * Add extra data to result objects, and filter items that have been
 								         * marked for removal.
 								         *
 								         * @param {[ResultObject]} results
 								         * @returns {[ResultObject]}
 								         */
-												rustdoc: remove explicit boolean comparisons.

For boolean variables it's shorter and more readable to check the value
directly, or negate it with `!`.

In a couple of cases I reordered an if/else pair because it made the
initial `if` statement simpler.

Removed unused isType parameter from two functions.

											
										
										
											2021-05-09 13:49:22 -07:00
+								        function transformResults(results) {
-												rustdoc-search: use ES6 `Set` for deduplication instead of `Object`

											
										
										
											2023-04-13 16:51:01 -07:00
+								            const duplicates = new Set();
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const out = [];
-												Move duplicates removal when generating results instead of when displaying them

											
										
										
											2021-12-20 18:01:04 +01:00
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            for (const result of results) {
-												rustdoc-search: `null`, not `-1`, for missing id

This allows us to use negative numbers for others purposes.

											
										
										
											2023-06-15 13:55:45 -07:00
+								                if (result.id !== -1) {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                    const obj = searchIndex[result.id];
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								                    obj.dist = result.dist;
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                    const res = buildHrefAndPath(obj);
-												rustdoc: remove explicit boolean comparisons.

For boolean variables it's shorter and more readable to check the value
directly, or negate it with `!`.

In a couple of cases I reordered an if/else pair because it made the
initial `if` statement simpler.

Removed unused isType parameter from two functions.

											
										
										
											2021-05-09 13:49:22 -07:00
+								                    obj.displayPath = pathSplitter(res[0]);
 								                    obj.fullPath = obj.displayPath + obj.name;
 								                    // To be sure that some items aren't considered as duplicates.
 								                    obj.fullPath += "|" + obj.ty;
-												Move duplicates removal when generating results instead of when displaying them

											
										
										
											2021-12-20 18:01:04 +01:00
-												rustdoc-search: use ES6 `Set` for deduplication instead of `Object`

											
										
										
											2023-04-13 16:51:01 -07:00
+								                    if (duplicates.has(obj.fullPath)) {
-												Move duplicates removal when generating results instead of when displaying them

											
										
										
											2021-12-20 18:01:04 +01:00
+								                        continue;
 								                    }
-												rustdoc-search: use ES6 `Set` for deduplication instead of `Object`

											
										
										
											2023-04-13 16:51:01 -07:00
+								                    duplicates.add(obj.fullPath);
-												Move duplicates removal when generating results instead of when displaying them

											
										
										
											2021-12-20 18:01:04 +01:00
-												rustdoc: remove explicit boolean comparisons.

For boolean variables it's shorter and more readable to check the value
directly, or negate it with `!`.

In a couple of cases I reordered an if/else pair because it made the
initial `if` statement simpler.

Removed unused isType parameter from two functions.

											
										
										
											2021-05-09 13:49:22 -07:00
+								                    obj.href = res[1];
 								                    out.push(obj);
 								                    if (out.length >= MAX_RESULTS) {
 								                        break;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                    }
 								                }
 								            }
 								            return out;
 								        }
-												rustdoc-search: use ES6 Map for `Result` instead of Object

											
										
										
											2023-04-13 17:05:12 -07:00
+								        /**
 								         * This function takes a result map, and sorts it by various criteria, including edit
 								         * distance, substring match, and the crate it comes from.
 								         *
 								         * @param {Results} results
 								         * @param {boolean} isType
 								         * @param {string} preferredCrate
 								         * @returns {[ResultObject]}
 								         */
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								        function sortResults(results, isType, preferredCrate) {
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            // if there are no results then return to default and fail
-												rustdoc-search: use ES6 Map for `Result` instead of Object

											
										
										
											2023-04-13 17:05:12 -07:00
+								            if (results.size === 0) {
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                return [];
 								            }
-												rustdoc-search: use ES6 Map for `Result` instead of Object

											
										
										
											2023-04-13 17:05:12 -07:00
+								            const userQuery = parsedQuery.userQuery;
 								            const result_list = [];
 								            for (const result of results.values()) {
 								                result.word = searchWords[result.id];
 								                result.item = searchIndex[result.id] || {};
 								                result_list.push(result);
 								            }
 								            result_list.sort((aaa, bbb) => {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                let a, b;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								                // sort by exact match with regard to the last word (mismatch goes later)
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								                a = (aaa.word !== userQuery);
 								                b = (bbb.word !== userQuery);
-												Add new eslint rule about brace style

											
										
										
											2022-05-14 13:50:52 +02:00
+								                if (a !== b) {
 								                    return a - b;
 								                }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												rustdoc: simplify JS search routine by not messing with lev distance

Since the sorting function accounts for an `index` field, there's not much
reason to also be applying changes to the levenshtein distance. Instead,
we can just not treat `lev` as a filter if there's already a non-sentinel
value for `index`.

This change gives slightly more weight to the index and path part, as
search criteria, than it used to. This changes some of the test cases,
but not in any obviously-"worse" way, and, in particular, substring matches
are a bigger deal than levenshtein distances (we're assuming that a typo
is less likely than someone just not typing the entire name).

Based on
https://github.com/rust-lang/rust/pull/103710#issuecomment-1296894296

											
										
										
											2022-12-16 11:12:59 -07:00
+								                // sort by index of keyword in item name (no literal occurrence goes later)
 								                a = (aaa.index < 0);
 								                b = (bbb.index < 0);
 								                if (a !== b) {
 								                    return a - b;
 								                }
 								                // Sort by distance in the path part, if specified
 								                // (less changes required to match means higher rankings)
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								                a = aaa.path_dist;
 								                b = bbb.path_dist;
-												rustdoc: simplify JS search routine by not messing with lev distance

Since the sorting function accounts for an `index` field, there's not much
reason to also be applying changes to the levenshtein distance. Instead,
we can just not treat `lev` as a filter if there's already a non-sentinel
value for `index`.

This change gives slightly more weight to the index and path part, as
search criteria, than it used to. This changes some of the test cases,
but not in any obviously-"worse" way, and, in particular, substring matches
are a bigger deal than levenshtein distances (we're assuming that a typo
is less likely than someone just not typing the entire name).

Based on
https://github.com/rust-lang/rust/pull/103710#issuecomment-1296894296

											
										
										
											2022-12-16 11:12:59 -07:00
+								                if (a !== b) {
 								                    return a - b;
 								                }
 								                // (later literal occurrence, if any, goes later)
 								                a = aaa.index;
 								                b = bbb.index;
 								                if (a !== b) {
 								                    return a - b;
 								                }
 								                // Sort by distance in the name part, the last part of the path
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                // (less changes required to match means higher rankings)
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								                a = (aaa.dist);
 								                b = (bbb.dist);
-												Add new eslint rule about brace style

											
										
										
											2022-05-14 13:50:52 +02:00
+								                if (a !== b) {
 								                    return a - b;
 								                }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												rustdoc: sort deprecated items lower in search

serialize `q` (`itemPaths`) sparsely
overall 4% reduction in search index size

											
										
										
											2023-02-03 00:08:57 -07:00
+								                // sort deprecated items later
 								                a = aaa.item.deprecated;
 								                b = bbb.item.deprecated;
 								                if (a !== b) {
 								                    return a - b;
 								                }
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								                // sort by crate (current crate comes first)
 								                a = (aaa.item.crate !== preferredCrate);
 								                b = (bbb.item.crate !== preferredCrate);
-												Add new eslint rule about brace style

											
										
										
											2022-05-14 13:50:52 +02:00
+								                if (a !== b) {
 								                    return a - b;
 								                }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								                // sort by item name length (longer goes later)
 								                a = aaa.word.length;
 								                b = bbb.word.length;
-												Add new eslint rule about brace style

											
										
										
											2022-05-14 13:50:52 +02:00
+								                if (a !== b) {
 								                    return a - b;
 								                }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								                // sort by item name (lexicographically larger goes later)
 								                a = aaa.word;
 								                b = bbb.word;
-												Add new eslint rule about brace style

											
										
										
											2022-05-14 13:50:52 +02:00
+								                if (a !== b) {
 								                    return (a > b ? +1 : -1);
 								                }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								                // sort by description (no description goes later)
 								                a = (aaa.item.desc === "");
 								                b = (bbb.item.desc === "");
-												Add new eslint rule about brace style

											
										
										
											2022-05-14 13:50:52 +02:00
+								                if (a !== b) {
 								                    return a - b;
 								                }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								                // sort by type (later occurrence in `itemTypes` goes later)
 								                a = aaa.item.ty;
 								                b = bbb.item.ty;
-												Add new eslint rule about brace style

											
										
										
											2022-05-14 13:50:52 +02:00
+								                if (a !== b) {
 								                    return a - b;
 								                }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								                // sort by path (lexicographically larger goes later)
 								                a = aaa.item.path;
 								                b = bbb.item.path;
-												Add new eslint rule about brace style

											
										
										
											2022-05-14 13:50:52 +02:00
+								                if (a !== b) {
 								                    return (a > b ? +1 : -1);
 								                }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								                // que sera, sera
 								                return 0;
 								            });
-												rustdoc-search: use ES6 Map for `Result` instead of Object

											
										
										
											2023-04-13 17:05:12 -07:00
+								            return transformResults(result_list);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        }
-												rustdoc-search: build args, return, and generics on one unifier

This enhances generics with the "unboxing" behavior where A<T>
matches T. It makes this unboxing transitive over generics.

											
										
										
											2023-06-02 19:58:44 -07:00
+								        /**
 								         * This function checks if a list of search query `queryElems` can all be found in the
 								         * search index (`fnTypes`).
 								         *
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								         * This function returns `true` on a match, or `false` if none. If `solutionCb` is
 								         * supplied, it will call that function with mgens, and that callback can accept or
 								         * reject the result by returning `true` or `false`. If the callback returns false,
 								         * then this function will try with a different solution, or bail with false if it
 								         * runs out of candidates.
 								         *
-												rustdoc-search: fast path for 1-query unification

Short queries, in addition to being common, are also the base
case for a lot of more complicated queries. We can avoid
most of the backtracking data structures, and use simple
recursive matching instead, by special casing them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-3/index.html

											
										
										
											2023-11-17 14:44:53 -07:00
+								         * @param {Array<FunctionType>} fnTypesIn - The objects to check.
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								         * @param {Array<QueryElement>} queryElems - The elements from the parsed query.
 								         * @param {[FunctionType]} whereClause - Trait bounds for generic items.
 								         * @param {Map<number,number>|null} mgensIn
 								         *     - Map functions generics to query generics (never modified).
 								         * @param {null|Map<number,number> -> bool} solutionCb - Called for each `mgens` solution.
-												rustdoc-search: build args, return, and generics on one unifier

This enhances generics with the "unboxing" behavior where A<T>
matches T. It makes this unboxing transitive over generics.

											
										
										
											2023-06-02 19:58:44 -07:00
+								         *
 								         * @return {boolean} - Returns true if a match, false otherwise.
 								         */
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								        function unifyFunctionTypes(fnTypesIn, queryElems, whereClause, mgensIn, solutionCb) {
 								            /**
-												rustdoc-search: less new Maps in unifyFunctionType

This is a major source of expense on generic queries,
and this commit reduces them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-2/index.html

											
										
										
											2023-11-17 13:05:18 -07:00
+								             * @type Map<integer, integer>|null
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								             */
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								            const mgens = mgensIn === null ? null : new Map(mgensIn);
-												rustdoc-search: build args, return, and generics on one unifier

This enhances generics with the "unboxing" behavior where A<T>
matches T. It makes this unboxing transitive over generics.

											
										
										
											2023-06-02 19:58:44 -07:00
+								            if (queryElems.length === 0) {
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								                return !solutionCb || solutionCb(mgens);
-												rustdoc-search: build args, return, and generics on one unifier

This enhances generics with the "unboxing" behavior where A<T>
matches T. It makes this unboxing transitive over generics.

											
										
										
											2023-06-02 19:58:44 -07:00
+								            }
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								            if (!fnTypesIn || fnTypesIn.length === 0) {
-												rustdoc-search: simplify JS in `checkGenerics`

											
										
										
											2023-06-02 18:31:51 -07:00
+								                return false;
 								            }
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								            const ql = queryElems.length;
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								            const fl = fnTypesIn.length;
-												rustdoc-search: fast path for 1-query unification

Short queries, in addition to being common, are also the base
case for a lot of more complicated queries. We can avoid
most of the backtracking data structures, and use simple
recursive matching instead, by special casing them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-3/index.html

											
										
										
											2023-11-17 14:44:53 -07:00
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								            // One element fast path / base case
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            if (ql === 1 && queryElems[0].generics.length === 0
 								                && queryElems[0].bindings.size === 0) {
-												rustdoc-search: fast path for 1-query unification

Short queries, in addition to being common, are also the base
case for a lot of more complicated queries. We can avoid
most of the backtracking data structures, and use simple
recursive matching instead, by special casing them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-3/index.html

											
										
										
											2023-11-17 14:44:53 -07:00
+								                const queryElem = queryElems[0];
 								                for (const fnType of fnTypesIn) {
 								                    if (!unifyFunctionTypeIsMatchCandidate(fnType, queryElem, whereClause, mgens)) {
 								                        continue;
 								                    }
 								                    if (fnType.id < 0 && queryElem.id < 0) {
-												rustdoc-search: fix accidental shared, mutable map

											
										
										
											2023-11-17 15:44:29 -07:00
+								                        if (mgens && mgens.has(fnType.id) &&
 								                            mgens.get(fnType.id) !== queryElem.id) {
 								                            continue;
-												rustdoc-search: fast path for 1-query unification

Short queries, in addition to being common, are also the base
case for a lot of more complicated queries. We can avoid
most of the backtracking data structures, and use simple
recursive matching instead, by special casing them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-3/index.html

											
										
										
											2023-11-17 14:44:53 -07:00
+								                        }
-												rustdoc-search: fix accidental shared, mutable map

											
										
										
											2023-11-17 15:44:29 -07:00
+								                        const mgensScratch = new Map(mgens);
 								                        mgensScratch.set(fnType.id, queryElem.id);
 								                        if (!solutionCb || solutionCb(mgensScratch)) {
-												rustdoc-search: fast path for 1-query unification

Short queries, in addition to being common, are also the base
case for a lot of more complicated queries. We can avoid
most of the backtracking data structures, and use simple
recursive matching instead, by special casing them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-3/index.html

											
										
										
											2023-11-17 14:44:53 -07:00
+								                            return true;
 								                        }
-												rustdoc-search: fix accidental shared, mutable map

											
										
										
											2023-11-17 15:44:29 -07:00
+								                    } else if (!solutionCb || solutionCb(mgens ? new Map(mgens) : null)) {
-												rustdoc-search: fast path for 1-query unification

Short queries, in addition to being common, are also the base
case for a lot of more complicated queries. We can avoid
most of the backtracking data structures, and use simple
recursive matching instead, by special casing them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-3/index.html

											
										
										
											2023-11-17 14:44:53 -07:00
+								                        // unifyFunctionTypeIsMatchCandidate already checks that ids match
 								                        return true;
 								                    }
 								                }
 								                for (const fnType of fnTypesIn) {
 								                    if (!unifyFunctionTypeIsUnboxCandidate(fnType, queryElem, whereClause, mgens)) {
 								                        continue;
 								                    }
 								                    if (fnType.id < 0) {
-												rustdoc-search: fix accidental shared, mutable map

											
										
										
											2023-11-17 15:44:29 -07:00
+								                        if (mgens && mgens.has(fnType.id) &&
 								                            mgens.get(fnType.id) !== 0) {
 								                            continue;
-												rustdoc-search: fast path for 1-query unification

Short queries, in addition to being common, are also the base
case for a lot of more complicated queries. We can avoid
most of the backtracking data structures, and use simple
recursive matching instead, by special casing them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-3/index.html

											
										
										
											2023-11-17 14:44:53 -07:00
+								                        }
-												rustdoc-search: fix accidental shared, mutable map

											
										
										
											2023-11-17 15:44:29 -07:00
+								                        const mgensScratch = new Map(mgens);
 								                        mgensScratch.set(fnType.id, 0);
-												rustdoc-search: fast path for 1-query unification

Short queries, in addition to being common, are also the base
case for a lot of more complicated queries. We can avoid
most of the backtracking data structures, and use simple
recursive matching instead, by special casing them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-3/index.html

											
										
										
											2023-11-17 14:44:53 -07:00
+								                        if (unifyFunctionTypes(
 								                            whereClause[(-fnType.id) - 1],
 								                            queryElems,
 								                            whereClause,
-												rustdoc-search: fix accidental shared, mutable map

											
										
										
											2023-11-17 15:44:29 -07:00
+								                            mgensScratch,
-												rustdoc-search: fast path for 1-query unification

Short queries, in addition to being common, are also the base
case for a lot of more complicated queries. We can avoid
most of the backtracking data structures, and use simple
recursive matching instead, by special casing them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-3/index.html

											
										
										
											2023-11-17 14:44:53 -07:00
+								                            solutionCb
 								                        )) {
 								                            return true;
 								                        }
 								                    } else if (unifyFunctionTypes(
-												rustdoc-search: fix fast path unboxing bindings

											
										
										
											2023-12-10 20:53:53 -07:00
+								                        [...fnType.generics, ...Array.from(fnType.bindings.values()).flat() ],
-												rustdoc-search: fast path for 1-query unification

Short queries, in addition to being common, are also the base
case for a lot of more complicated queries. We can avoid
most of the backtracking data structures, and use simple
recursive matching instead, by special casing them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-3/index.html

											
										
										
											2023-11-17 14:44:53 -07:00
+								                        queryElems,
 								                        whereClause,
-												rustdoc-search: fix accidental shared, mutable map

											
										
										
											2023-11-17 15:44:29 -07:00
+								                        mgens ? new Map(mgens) : null,
-												rustdoc-search: fast path for 1-query unification

Short queries, in addition to being common, are also the base
case for a lot of more complicated queries. We can avoid
most of the backtracking data structures, and use simple
recursive matching instead, by special casing them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-3/index.html

											
										
										
											2023-11-17 14:44:53 -07:00
+								                        solutionCb
 								                    )) {
 								                        return true;
 								                    }
 								                }
 								                return false;
 								            }
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								            // Multiple element recursive case
-												rustdoc-search: fix order-independence bug

											
										
										
											2023-06-08 23:12:36 -07:00
+								            /**
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								             * @type Array<FunctionType>
-												rustdoc-search: fix order-independence bug

											
										
										
											2023-06-08 23:12:36 -07:00
+								             */
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								            const fnTypes = fnTypesIn.slice();
-												rustdoc-search: build args, return, and generics on one unifier

This enhances generics with the "unboxing" behavior where A<T>
matches T. It makes this unboxing transitive over generics.

											
										
										
											2023-06-02 19:58:44 -07:00
+								            /**
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								             * Algorithm works by building up a solution set in the working arrays
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								             * fnTypes gets mutated in place to make this work, while queryElems
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								             * is left alone.
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								             *
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								             * It works backwards, because arrays can be cheaply truncated that way.
 								             *
 								             *                         vvvvvvv `queryElem`
 								             * queryElems = [ unknown, unknown, good, good, good ]
 								             * fnTypes    = [ unknown, unknown, good, good, good ]
 								             *                ^^^^^^^^^^^^^^^^ loop over these elements to find candidates
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								             *
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								             * Everything in the current working solution is known to be a good
 								             * match, but it might not be the match we wind up going with, because
 								             * there might be more than one candidate match, and we need to try them all
 								             * before giving up. So, to handle this, it backtracks on failure.
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								             */
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								            const flast = fl - 1;
 								            const qlast = ql - 1;
 								            const queryElem = queryElems[qlast];
 								            let queryElemsTmp = null;
 								            for (let i = flast; i >= 0; i -= 1) {
 								                const fnType = fnTypes[i];
 								                if (!unifyFunctionTypeIsMatchCandidate(fnType, queryElem, whereClause, mgens)) {
 								                    continue;
 								                }
 								                let mgensScratch;
 								                if (fnType.id < 0) {
 								                    mgensScratch = new Map(mgens);
 								                    if (mgensScratch.has(fnType.id)
 								                        && mgensScratch.get(fnType.id) !== queryElem.id) {
 								                        continue;
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								                    }
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								                    mgensScratch.set(fnType.id, queryElem.id);
 								                } else {
 								                    mgensScratch = mgens;
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								                }
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								                // fnTypes[i] is a potential match
 								                // fnTypes[flast] is the last item in the list
 								                // swap them, and drop the potential match from the list
 								                // check if the remaining function types also match
 								                fnTypes[i] = fnTypes[flast];
 								                fnTypes.length = flast;
 								                if (!queryElemsTmp) {
 								                    queryElemsTmp = queryElems.slice(0, qlast);
 								                }
 								                const passesUnification = unifyFunctionTypes(
 								                    fnTypes,
 								                    queryElemsTmp,
 								                    whereClause,
 								                    mgensScratch,
 								                    mgensScratch => {
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                        if (fnType.generics.length === 0 && queryElem.generics.length === 0
 								                            && fnType.bindings.size === 0 && queryElem.bindings.size === 0) {
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								                            return !solutionCb || solutionCb(mgensScratch);
-												[rustdoc] Fix path in type-based search

											
										
										
											2023-09-01 14:30:31 +02:00
+								                        }
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                        const solution = unifyFunctionTypeCheckBindings(
 								                            fnType,
 								                            queryElem,
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								                            whereClause,
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                            mgensScratch
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								                        );
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                        if (!solution) {
 								                            return false;
 								                        }
 								                        const simplifiedGenerics = solution.simplifiedGenerics;
 								                        for (const simplifiedMgens of solution.mgens) {
 								                            const passesUnification = unifyFunctionTypes(
 								                                simplifiedGenerics,
 								                                queryElem.generics,
 								                                whereClause,
 								                                simplifiedMgens,
 								                                solutionCb
 								                            );
 								                            if (passesUnification) {
 								                                return true;
 								                            }
 								                        }
 								                        return false;
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								                    }
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								                );
 								                if (passesUnification) {
 								                    return true;
-												rustdoc-search: simplify JS in `checkGenerics`

											
										
										
											2023-06-02 18:31:51 -07:00
+								                }
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								                // backtrack
 								                fnTypes[flast] = fnTypes[i];
 								                fnTypes[i] = fnType;
 								                fnTypes.length = fl;
 								            }
 								            for (let i = flast; i >= 0; i -= 1) {
 								                const fnType = fnTypes[i];
 								                if (!unifyFunctionTypeIsUnboxCandidate(fnType, queryElem, whereClause, mgens)) {
 								                    continue;
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								                }
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								                let mgensScratch;
 								                if (fnType.id < 0) {
 								                    mgensScratch = new Map(mgens);
 								                    if (mgensScratch.has(fnType.id) && mgensScratch.get(fnType.id) !== 0) {
 								                        continue;
-												rustdoc-search: less new Maps in unifyFunctionType

This is a major source of expense on generic queries,
and this commit reduces them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-2/index.html

											
										
										
											2023-11-17 13:05:18 -07:00
+								                    }
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								                    mgensScratch.set(fnType.id, 0);
 								                } else {
 								                    mgensScratch = mgens;
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								                }
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								                const generics = fnType.id < 0 ?
 								                    whereClause[(-fnType.id) - 1] :
 								                    fnType.generics;
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                const bindings = fnType.bindings ?
 								                    Array.from(fnType.bindings.values()).flat() :
 								                    [];
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								                const passesUnification = unifyFunctionTypes(
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                    fnTypes.toSpliced(i, 1, ...generics, ...bindings),
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								                    queryElems,
 								                    whereClause,
 								                    mgensScratch,
 								                    solutionCb
 								                );
 								                if (passesUnification) {
 								                    return true;
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								                }
 								            }
-												rustdoc-search: switch to recursive backtracking

This is significantly faster, because

- It allows the one-element fast path to kick in on multi-
  element queries.
- It constructs intermediate data structures more lazily
  than the old system did.

It's measurably faster than the old algo even without the fast path, but
that fast path still helps significantly.

											
										
										
											2023-11-18 12:31:46 -07:00
+								            return false;
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								        }
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								        /**
 								         * Check if this function is a match candidate.
 								         *
 								         * This function is all the fast checks that don't require backtracking.
 								         * It checks that two items are not named differently, and is load-bearing for that.
 								         * It also checks that, if the query has generics, the function type must have generics
 								         * or associated type bindings: that's not load-bearing, but it prevents unnecessary
 								         * backtracking later.
 								         *
 								         * @param {FunctionType} fnType
 								         * @param {QueryElement} queryElem
 								         * @param {[FunctionSearchType]} whereClause - Trait bounds for generic items.
 								         * @param {Map<number,number>|null} mgensIn - Map functions generics to query generics.
 								         * @returns {boolean}
 								         */
 								        function unifyFunctionTypeIsMatchCandidate(fnType, queryElem, whereClause, mgensIn) {
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								            // type filters look like `trait:Read` or `enum:Result`
 								            if (!typePassesFilter(queryElem.typeFilter, fnType.ty)) {
-												rustdoc-search: fix order-independence bug

											
										
										
											2023-06-08 23:12:36 -07:00
+								                return false;
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								            }
 								            // fnType.id < 0 means generic
 								            // queryElem.id < 0 does too
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            // mgensIn[fnType.id] = queryElem.id
 								            // or, if mgensIn[fnType.id] = 0, then we've matched this generic with a bare trait
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								            // and should make that same decision everywhere it appears
 								            if (fnType.id < 0 && queryElem.id < 0) {
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                if (mgensIn) {
 								                    if (mgensIn.has(fnType.id) && mgensIn.get(fnType.id) !== queryElem.id) {
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								                        return false;
 								                    }
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                    for (const [fid, qid] of mgensIn.entries()) {
-												rustdoc-search: less new Maps in unifyFunctionType

This is a major source of expense on generic queries,
and this commit reduces them.

Profile output:
https://notriddle.com/rustdoc-html-demo-5/profile-2/index.html

											
										
										
											2023-11-17 13:05:18 -07:00
+								                        if (fnType.id !== fid && queryElem.id === qid) {
 								                            return false;
 								                        }
 								                        if (fnType.id === fid && queryElem.id !== qid) {
 								                            return false;
 								                        }
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								                    }
 								                }
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                return true;
-												rustdoc-search: fix bug with multi-item impl trait

											
										
										
											2023-10-05 22:32:37 -07:00
+								            } else {
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								                if (queryElem.id === typeNameIdOfArrayOrSlice &&
 								                    (fnType.id === typeNameIdOfSlice || fnType.id === typeNameIdOfArray)
 								                ) {
 								                    // [] matches primitive:array or primitive:slice
 								                    // if it matches, then we're fine, and this is an appropriate match candidate
-												rustdoc-search: simplify the checkTypes fast path

This reduces code size while still matching the common case
for plain, concrete types.

											
										
										
											2023-10-25 08:52:12 -07:00
+								                } else if (fnType.id !== queryElem.id || queryElem.id === null) {
-												rustdoc-search: fix order-independence bug

											
										
										
											2023-06-08 23:12:36 -07:00
+								                    return false;
-												rustdoc-search: simplify JS in `checkGenerics`

											
										
										
											2023-06-02 18:31:51 -07:00
+								                }
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								                // If the query elem has generics, and the function doesn't,
 								                // it can't match.
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                if ((fnType.generics.length + fnType.bindings.size) === 0 &&
 								                    queryElem.generics.length !== 0
 								                ) {
 								                    return false;
 								                }
 								                if (fnType.bindings.size < queryElem.bindings.size) {
-												rustdoc-search: fix order-independence bug

											
										
										
											2023-06-08 23:12:36 -07:00
+								                    return false;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                }
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								                // If the query element is a path (it contains `::`), we need to check if this
 								                // path is compatible with the target type.
 								                const queryElemPathLength = queryElem.pathWithoutLast.length;
 								                if (queryElemPathLength > 0) {
 								                    const fnTypePath = fnType.path !== undefined && fnType.path !== null ?
 								                        fnType.path.split("::") : [];
 								                    // If the path provided in the query element is longer than this type,
 								                    // no need to check it since it won't match in any case.
 								                    if (queryElemPathLength > fnTypePath.length) {
 								                        return false;
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								                    }
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								                    let i = 0;
 								                    for (const path of fnTypePath) {
 								                        if (path === queryElem.pathWithoutLast[i]) {
 								                            i += 1;
 								                            if (i >= queryElemPathLength) {
 								                                break;
 								                            }
 								                        }
 								                    }
 								                    if (i < queryElemPathLength) {
 								                        // If we didn't find all parts of the path of the query element inside
 								                        // the fn type, then it's not the right one.
 								                        return false;
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								                    }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                }
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                return true;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            }
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								        }
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								        /**
 								         * This function checks the associated type bindings. Any that aren't matched get converted
 								         * to generics, and this function returns an array of the function's generics with these
 								         * simplified bindings added to them. That is, it takes a path like this:
 								         *
 								         *     Iterator<Item=u32>
 								         *
 								         * ... if queryElem itself has an `Item=` in it, then this function returns an empty array.
 								         * But if queryElem contains no Item=, then this function returns a one-item array with the
 								         * ID of u32 in it, and the rest of the matching engine acts as if `Iterator<u32>` were
 								         * the type instead.
 								         *
 								         * @param {FunctionType} fnType
 								         * @param {QueryElement} queryElem
 								         * @param {[FunctionType]} whereClause - Trait bounds for generic items.
 								         * @param {Map<number,number>} mgensIn - Map functions generics to query generics.
 								         *                                            Never modified.
 								         * @returns {false|{mgens: [Map<number,number>], simplifiedGenerics: [FunctionType]}}
 								         */
 								        function unifyFunctionTypeCheckBindings(fnType, queryElem, whereClause, mgensIn) {
 								            if (fnType.bindings.size < queryElem.bindings.size) {
 								                return false;
 								            }
 								            let simplifiedGenerics = fnType.generics || [];
 								            if (fnType.bindings.size > 0) {
 								                let mgensSolutionSet = [mgensIn];
 								                for (const [name, constraints] of queryElem.bindings.entries()) {
 								                    if (mgensSolutionSet.length === 0) {
 								                        return false;
 								                    }
 								                    if (!fnType.bindings.has(name)) {
 								                        return false;
 								                    }
 								                    const fnTypeBindings = fnType.bindings.get(name);
 								                    mgensSolutionSet = mgensSolutionSet.flatMap(mgens => {
 								                        const newSolutions = [];
 								                        unifyFunctionTypes(
 								                            fnTypeBindings,
 								                            constraints,
 								                            whereClause,
 								                            mgens,
 								                            newMgens => {
 								                                newSolutions.push(newMgens);
 								                                // return `false` makes unifyFunctionTypes return the full set of
 								                                // possible solutions
 								                                return false;
 								                            }
 								                        );
 								                        return newSolutions;
 								                    });
 								                }
 								                if (mgensSolutionSet.length === 0) {
 								                    return false;
 								                }
 								                const binds = Array.from(fnType.bindings.entries()).flatMap(entry => {
 								                    const [name, constraints] = entry;
 								                    if (queryElem.bindings.has(name)) {
 								                        return [];
 								                    } else {
 								                        return constraints;
 								                    }
 								                });
 								                if (simplifiedGenerics.length > 0) {
 								                    simplifiedGenerics = [...simplifiedGenerics, ...binds];
 								                } else {
 								                    simplifiedGenerics = binds;
 								                }
 								                return { simplifiedGenerics, mgens: mgensSolutionSet };
 								            }
 								            return { simplifiedGenerics, mgens: [mgensIn] };
 								        }
 								        /**
 								         * Checks whether `queryElem` can be found by looking inside `fnType`.
 								         *
 								         * For a generic parameter (`fnType.id < 0`) searched with a concrete query element
 								         * (`queryElem.id >= 0`), the where clause entry for that generic is scanned.
 								         * Otherwise, if `fnType` has generics or bindings, those are scanned instead.
 								         *
 								         * @param {FunctionType} fnType
 								         * @param {QueryElement} queryElem
 								         * @param {[FunctionType]} whereClause - Trait bounds for generic items.
 								         * @param {Map<number,number>|null} mgens - Map functions generics to query generics.
 								         * @returns {boolean}
 								         */
 								        function unifyFunctionTypeIsUnboxCandidate(fnType, queryElem, whereClause, mgens) {
 								            if (fnType.id < 0 && queryElem.id >= 0) {
 								                if (!whereClause) {
 								                    return false;
 								                }
 								                // mgens[fnType.id] === 0 indicates that we committed to unboxing this generic
 								                // mgens[fnType.id] === null indicates that we haven't decided yet
 								                if (mgens && mgens.has(fnType.id) && mgens.get(fnType.id) !== 0) {
 								                    return false;
 								                }
 								                // Where clauses can represent cyclical data.
 								                // `null` prevents it from trying to unbox in an infinite loop
 								                const mgensTmp = new Map(mgens);
 								                mgensTmp.set(fnType.id, null);
 								                // This is only a potential unbox if the search query appears in the where clause
 								                // for example, searching `Read -> usize` should find
 								                // `fn read_all<R: Read>(R) -> Result<usize>`
 								                // generic `R` is considered "unboxed"
 								                return checkIfInList(
 								                    whereClause[(-fnType.id) - 1],
 								                    queryElem,
 								                    whereClause,
 								                    mgensTmp
 								                );
 								            } else if (fnType.generics.length > 0 || fnType.bindings.size > 0) {
 								                // Generics and every binding's constraints are searched as one flat list.
 								                const simplifiedGenerics = [
 								                    ...fnType.generics,
 								                    ...Array.from(fnType.bindings.values()).flat(),
 								                ];
 								                return checkIfInList(simplifiedGenerics, queryElem, whereClause, mgens);
 								            }
 								            return false;
 								        }
-												Clean up search code and unify function returned values

											
										
										
											2021-12-15 20:52:37 +01:00
+								        /**
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								          * This function checks if the object (`row`) matches the given type (`elem`) and its
-												Clean up search code and unify function returned values

											
										
										
											2021-12-15 20:52:37 +01:00
+								          * generics (if any).
 								          *
-												rustdoc-search: build args, return, and generics on one unifier

This enhances generics with the "unboxing" behavior where A<T>
matches T. It makes this unboxing transitive over generics.

											
										
										
											2023-06-02 19:58:44 -07:00
+								          * @param {Array<FunctionType>} list
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>`` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								          * @param {QueryElement} elem          - The element from the parsed query.
 								          * @param {[FunctionType]} whereClause - Trait bounds for generic items.
-												rustdoc-search: avoid infinite where clause unbox

Fixes #118242

											
										
										
											2023-11-24 09:47:55 -07:00
+								         * @param {Map<number,number>|null} mgens - Map functions generics to query generics.
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								          *
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								          * @return {boolean} - Returns true if found, false otherwise.
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								          */
-												rustdoc-search: avoid infinite where clause unbox

Fixes #118242

											
										
										
											2023-11-24 09:47:55 -07:00
+								        function checkIfInList(list, elem, whereClause, mgens) {
-												rustdoc-search: build args, return, and generics on one unifier

This enhances generics with the "unboxing" behavior where A<T>
matches T. It makes this unboxing transitive over generics.

											
										
										
											2023-06-02 19:58:44 -07:00
+								            for (const entry of list) {
-												rustdoc-search: avoid infinite where clause unbox

Fixes #118242

											
										
										
											2023-11-24 09:47:55 -07:00
+								                if (checkType(entry, elem, whereClause, mgens)) {
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								                    return true;
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                }
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								            }
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								            return false;
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								        }
 								        /**
 								         * This function checks if the object (`row`) matches the given type (`elem`) and its
 								         * generics (if any).
 								         *
 								         * When neither side has associated type bindings, two fast paths are tried: a
 								         * generic query element, and a plain query element with no path, no generics and
 								         * an id other than the array/slice special case. Everything else is delegated to
 								         * `unifyFunctionTypes`.
 								         *
 								         * @param {Row} row
 								         * @param {QueryElement} elem          - The element from the parsed query.
 								         * @param {[FunctionType]} whereClause - Trait bounds for generic items.
 								         * @param {Map<number,number>|null} mgens - Map functions generics to query generics.
 								         *
 								         * @return {boolean} - Returns true if the type matches, false otherwise.
 								         */
 								        function checkType(row, elem, whereClause, mgens) {
 								            if (row.bindings.size === 0 && elem.bindings.size === 0) {
 								                if (elem.id < 0) {
 								                    // A generic query element matches a generic row directly,
 								                    // or anything found among the row's generics.
 								                    return row.id < 0 || checkIfInList(row.generics, elem, whereClause, mgens);
 								                }
 								                if (row.id > 0 && elem.id > 0 && elem.pathWithoutLast.length === 0 &&
 								                    typePassesFilter(elem.typeFilter, row.ty) && elem.generics.length === 0 &&
 								                    // special case
 								                    elem.id !== typeNameIdOfArrayOrSlice
 								                ) {
 								                    return row.id === elem.id || checkIfInList(
 								                        row.generics,
 								                        elem,
 								                        whereClause,
 								                        mgens
 								                    );
 								                }
 								            }
 								            return unifyFunctionTypes([row], [elem], whereClause, mgens);
 								        }
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								        function checkPath(contains, ty, maxEditDistance) {
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            if (contains.length === 0) {
 								                return 0;
 								            }
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								            let ret_dist = maxEditDistance + 1;
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const path = ty.path.split("::");
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								            if (ty.parent && ty.parent.name) {
 								                path.push(ty.parent.name.toLowerCase());
 								            }
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const length = path.length;
 								            const clength = contains.length;
-												rustdoc-search: clean up `checkPath`

This computes the same result with less code by computing many of
the old checks at once:

* It won't enter the loop if clength > length, because then the
  result of length - clength will be negative and the
  loop conditional will fail.
* i + clength will never be greater than length, because it
  starts out as i = length - clength, implying that i + clength
  equals length, and it only goes down from there.
* The aborted variable is replaced with control flow.

											
										
										
											2023-11-20 13:15:47 -07:00
+								            pathiter: for (let i = length - clength; i >= 0; i -= 1) {
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								                let dist_total = 0;
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                for (let x = 0; x < clength; ++x) {
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								                    const dist = editDistance(path[i + x], contains[x], maxEditDistance);
 								                    if (dist > maxEditDistance) {
-												rustdoc-search: clean up `checkPath`

This computes the same result with less code by computing many of
the old checks at once:

* It won't enter the loop if clength > length, because then the
  result of length - clength will be negative and the
  loop conditional will fail.
* i + clength will never be greater than length, because it
  starts out as i = length - clength, implying that i + clength
  equals length, and it only goes down from there.
* The aborted variable is replaced with control flow.

											
										
										
											2023-11-20 13:15:47 -07:00
+								                        continue pathiter;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                    }
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								                    dist_total += dist;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                }
-												rustdoc-search: clean up `checkPath`

This computes the same result with less code by computing many of
the old checks at once:

* It won't enter the loop if clength > length, because then the
  result of length - clength will be negative and the
  loop conditional will fail.
* i + clength will never be greater than length, because it
  starts out as i = length - clength, implying that i + clength
  equals length, and it only goes down from there.
* The aborted variable is replaced with control flow.

											
										
										
											2023-11-20 13:15:47 -07:00
+								                ret_dist = Math.min(ret_dist, Math.round(dist_total / clength));
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            }
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								            return ret_dist;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        }
 								        function typePassesFilter(filter, type) {
-												Refactor conditional

											
										
										
											2022-02-04 14:59:22 -05:00
+								            // No filter or Exact match
 								            if (filter <= NO_TYPE_FILTER || filter === type) return true;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								            // Match related items
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const name = itemTypes[type];
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            switch (itemTypes[filter]) {
 								                case "constant":
 								                    return name === "associatedconstant";
 								                case "fn":
 								                    return name === "method" || name === "tymethod";
 								                case "type":
 								                    return name === "primitive" || name === "associatedtype";
 								                case "trait":
 								                    return name === "traitalias";
 								            }
 								            // No match
 								            return false;
 								        }
 								        function createAliasFromItem(item) {
 								            return {
 								                crate: item.crate,
 								                name: item.name,
 								                path: item.path,
 								                desc: item.desc,
 								                ty: item.ty,
 								                parent: item.parent,
 								                type: item.type,
 								                is_alias: true,
-												rustdoc: sort deprecated items lower in search

serialize `q` (`itemPaths`) sparsely
overall 4% reduction in search index size

											
										
										
											2023-02-03 00:08:57 -07:00
+								                deprecated: item.deprecated,
-												rustdoc-search: add impl disambiguator to duplicate assoc items

Helps with #90929

This changes the search results, specifically, when there's more than
one impl with an associated item with the same name. For example,
the search queries `simd<i8> -> simd<i8>` and `simd<i64> -> simd<i64>`
don't link to the same function, but most of the functions have the
same names.

This change should probably be FCP-ed, especially since it adds a new
anchor link format for `main.js` to handle, so that URLs like
`struct.Vec.html#impl-AsMut<[T]>-for-Vec<T,+A>/method.as_mut` redirect
to `struct.Vec.html#method.as_mut-2`. It's a strange design, but there
are a few reasons for it:

* I'd like to avoid making the HTML bigger. Obviously, fixing this bug
  is going to add at least a little more data to the search index, but
  adding more HTML penalises viewers for the benefit of searchers.

* Breaking `struct.Vec.html#method.len` would also be a disappointment.

On the other hand:

* The path-style anchors might be less prone to link rot than the numbered
  anchors. It's definitely less likely to have URLs that appear to "work",
  but silently point at the wrong thing.

* This commit arranges the path-style anchor to redirect to the numbered
  anchor. Nothing stops rustdoc from doing the opposite, making path-style
  anchors the default and redirecting the "legacy" numbered ones.

											
										
										
											2023-03-20 16:02:51 -07:00
+								                implDisambiguator: item.implDisambiguator,
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            };
 								        }
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								        function handleAliases(ret, query, filterCrates, currentCrate) {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const lowerQuery = query.toLowerCase();
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            // We separate aliases and crate aliases because we want to have current crate
 								            // aliases to be before the others in the displayed results.
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const aliases = [];
 								            const crateAliases = [];
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
+								            if (filterCrates !== null) {
-												rustdoc-search: use ES6 `Map` for aliases instead of `Object`

											
										
										
											2023-04-13 16:30:02 -07:00
+								                if (ALIASES.has(filterCrates) && ALIASES.get(filterCrates).has(lowerQuery)) {
 								                    const query_aliases = ALIASES.get(filterCrates).get(lowerQuery);
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                    for (const alias of query_aliases) {
 								                        aliases.push(createAliasFromItem(searchIndex[alias]));
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                    }
 								                }
 								            } else {
-												rustdoc-search: use ES6 `Map` for aliases instead of `Object`

											
										
										
											2023-04-13 16:30:02 -07:00
+								                for (const [crate, crateAliasesIndex] of ALIASES) {
 								                    if (crateAliasesIndex.has(lowerQuery)) {
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								                        const pushTo = crate === currentCrate ? crateAliases : aliases;
-												rustdoc-search: use ES6 `Map` for aliases instead of `Object`

											
										
										
											2023-04-13 16:30:02 -07:00
+								                        const query_aliases = crateAliasesIndex.get(lowerQuery);
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                        for (const alias of query_aliases) {
 								                            pushTo.push(createAliasFromItem(searchIndex[alias]));
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                        }
 								                    }
-												rustdoc-search: use ES6 `Map` for aliases instead of `Object`

											
										
										
											2023-04-13 16:30:02 -07:00
+								                }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            }
-												Move callback to the () => {} syntax.

Fix lint

Fix main.js

Restore anonymous functions

Fix

Fix more

											
										
										
											2022-05-03 12:03:17 +08:00
+								            const sortFunc = (aaa, bbb) => {
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                if (aaa.path < bbb.path) {
 								                    return 1;
 								                } else if (aaa.path === bbb.path) {
 								                    return 0;
 								                }
 								                return -1;
 								            };
 								            crateAliases.sort(sortFunc);
 								            aliases.sort(sortFunc);
-												Move callback to the () => {} syntax.

Fix lint

Fix main.js

Restore anonymous functions

Fix

Fix more

											
										
										
											2022-05-03 12:03:17 +08:00
+								            const pushFunc = alias => {
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								                alias.alias = query;
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                const res = buildHrefAndPath(alias);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                alias.displayPath = pathSplitter(res[0]);
 								                alias.fullPath = alias.displayPath + alias.name;
 								                alias.href = res[1];
 								                ret.others.unshift(alias);
 								                if (ret.others.length > MAX_RESULTS) {
 								                    ret.others.pop();
 								                }
 								            };
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
 								            aliases.forEach(pushFunc);
 								            crateAliases.forEach(pushFunc);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        }
-												Clean up search code and unify function returned values

											
										
										
											2021-12-15 20:52:37 +01:00
+								        /**
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								         * This function adds the given result into the provided `results` map if it matches the
-												Clean up search code and unify function returned values

											
										
										
											2021-12-15 20:52:37 +01:00
+								         * following condition:
 								         *
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								         * * If it is a "literal search" (`parsedQuery.literalSearch`), then `dist` must be 0.
 								         * * If it is not a "literal search", `dist` must be <= `maxEditDistance`.
-												Clean up search code and unify function returned values

											
										
										
											2021-12-15 20:52:37 +01:00
+								         *
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								         * The `results` map contains information which will be used to sort the search results:
-												Clean up search code and unify function returned values

											
										
										
											2021-12-15 20:52:37 +01:00
+								         *
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								         * * `fullId` is a `string` used as the key of the object we use for the `results` map.
-												Clean up search code and unify function returned values

											
										
										
											2021-12-15 20:52:37 +01:00
+								         * * `id` is the index in both `searchWords` and `searchIndex` arrays for this element.
 								         * * `index` is an `integer` used to sort by the position of the word in the item's name.
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								         * * `dist` is the main metric used to sort the search results.
 								         * * `path_dist` is zero if a single-component search query is used, otherwise it's the
-												rustdoc: simplify JS search routine by not messing with lev distance

Since the sorting function accounts for an `index` field, there's not much
reason to also be applying changes to the levenshtein distance. Instead,
we can just not treat `lev` as a filter if there's already a non-sentinel
value for `index`.

This change gives slightly more weight to the index and path part, as
search criteria, than it used to. This changes some of the test cases,
but not in any obviously-"worse" way, and, in particular, substring matches
are a bigger deal than levenshtein distances (we're assuming that a typo
is less likely than someone just not typing the entire name).

Based on
https://github.com/rust-lang/rust/pull/103710#issuecomment-1296894296

											
										
										
											2022-12-16 11:12:59 -07:00
+								         *   distance computed for everything other than the last path component.
-												Clean up search code and unify function returned values

											
										
										
											2021-12-15 20:52:37 +01:00
+								         *
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								         * @param {Results} results
-												Clean up search code and unify function returned values

											
										
										
											2021-12-15 20:52:37 +01:00
+								         * @param {string} fullId
 								         * @param {integer} id
 								         * @param {integer} index
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								         * @param {integer} dist
 								         * @param {integer} path_dist
-												Clean up search code and unify function returned values

											
										
										
											2021-12-15 20:52:37 +01:00
+								         */
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								        function addIntoResults(results, fullId, id, index, dist, path_dist, maxEditDistance) {
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the functions name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Functions signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|}{|F|}-\frac{1}{|F|} = |F|-1$. And, since
  the values are only being compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature).

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								            if (dist <= maxEditDistance || index !== -1) {
-												rustdoc-search: use ES6 Map for `Result` instead of Object

											
										
										
											2023-04-13 17:05:12 -07:00
+								                if (results.has(fullId)) {
 								                    const result = results.get(fullId);
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								                    if (result.dontValidate || result.dist <= dist) {
-												Clean up search code and unify function returned values

											
										
										
											2021-12-15 20:52:37 +01:00
+								                        return;
 								                    }
 								                }
-												rustdoc-search: use ES6 Map for `Result` instead of Object

											
										
										
											2023-04-13 17:05:12 -07:00
+								                results.set(fullId, {
-												Clean up search code and unify function returned values

											
										
										
											2021-12-15 20:52:37 +01:00
+								                    id: id,
 								                    index: index,
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                    dontValidate: parsedQuery.literalSearch,
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								                    dist: dist,
 								                    path_dist: path_dist,
-												rustdoc-search: use ES6 Map for `Result` instead of Object

											
										
										
											2023-04-13 17:05:12 -07:00
+								                });
-												Clean up search code and unify function returned values

											
										
										
											2021-12-15 20:52:37 +01:00
+								            }
 								        }
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								        /**
 								         * This function is called in case the query is only one element (with or without generics).
-												Extend `handleSingleArg` documentation

											
										
										
											2022-04-20 21:11:39 +02:00
+								         * This element will be compared to arguments' and returned values' items and also to items.
 								         *
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								         * Other important thing to note: since there is only one element, we use edit
-												Extend `handleSingleArg` documentation

											
										
										
											2022-04-20 21:11:39 +02:00
+								         * distance for name comparisons.
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								         *
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								         * @param {Row} row
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								         * @param {integer} pos              - Position in the `searchIndex`.
 								         * @param {QueryElement} elem        - The element from the parsed query.
 								         * @param {Results} results_others   - Unqualified results (not in arguments nor in
 								         *                                     returned values).
 								         * @param {Results} results_in_args  - Matching arguments results.
 								         * @param {Results} results_returned - Matching returned arguments results.
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								         */
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								        function handleSingleArg(
 								            row,
 								            pos,
 								            elem,
 								            results_others,
 								            results_in_args,
-												rustdoc: compute maximum Levenshtein distance based on the query

The heuristic is pretty close to the name resolver.

Fixes #103357

											
										
										
											2022-10-28 21:54:09 -07:00
+								            results_returned,
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								            maxEditDistance
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								        ) {
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            if (!row || (filterCrates !== null && row.crate !== filterCrates)) {
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								                return;
 								            }
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								            let index = -1, path_dist = 0;
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const fullId = row.id;
-												rustdoc: simplify JS search routine by not messing with lev distance

Since the sorting function accounts for an `index` field, there's not much
reason to also be applying changes to the levenshtein distance. Instead,
we can just not treat `lev` as a filter if there's already a non-sentinel
value for `index`.

This change gives slightly more weight to the index and path part, as
search criteria, than it used to. This changes some of the test cases,
but not in any obviously-"worse" way, and, in particular, substring matches
are a bigger deal than levenshtein distances (we're assuming that a typo
is less likely than someone just not typing the entire name).

Based on
https://github.com/rust-lang/rust/pull/103710#issuecomment-1296894296

											
										
										
											2022-12-16 11:12:59 -07:00
+								            const searchWord = searchWords[pos];
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the functions name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Functions signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|}{|F|}-\frac{1}{|F|} = \frac{|F|-1}{|F|}$. And, since
  this grows with $|F|$ and the values are only being compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature).

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								            // fpDist is a minimum possible type distance, where "type distance" is the number of
 								            // atoms in the function not present in the query
 								            const tfpDist = compareTypeFingerprints(
 								                fullId,
 								                parsedQuery.typeFingerprint
 								            );
 								            if (tfpDist !== null &&
 								                !(results_in_args.size >= MAX_RESULTS && tfpDist > results_in_args.max_dist)
 								            ) {
 								                const in_args = row.type && row.type.inputs
 								                    && checkIfInList(row.type.inputs, elem, row.type.where_clause);
 								                if (in_args) {
 								                    results_in_args.max_dist = Math.max(results_in_args.max_dist || 0, tfpDist);
 								                    const maxDist = results_in_args.size < MAX_RESULTS ?
 								                        (tfpDist + 1) :
 								                        results_in_args.max_dist;
 								                    addIntoResults(results_in_args, fullId, pos, -1, tfpDist, 0, maxDist);
 								                }
 								            }
 								            if (tfpDist !== false &&
 								                !(results_returned.size >= MAX_RESULTS && tfpDist > results_returned.max_dist)
 								            ) {
 								                const returned = row.type && row.type.output
 								                    && checkIfInList(row.type.output, elem, row.type.where_clause);
 								                if (returned) {
 								                    results_returned.max_dist = Math.max(results_returned.max_dist || 0, tfpDist);
 								                    const maxDist = results_returned.size < MAX_RESULTS ?
 								                        (tfpDist + 1) :
 								                        results_returned.max_dist;
 								                    addIntoResults(results_returned, fullId, pos, -1, tfpDist, 0, maxDist);
 								                }
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								            }
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
-												rustdoc: add support for type filters in arguments and generics

This makes sense, since the search index has the information in it,
and it's more useful for function signature searches since a
function signature search's item type is, by definition, some type
of function (there's more than one, but not very many).

											
										
										
											2023-02-28 18:17:59 -07:00
+								            if (!typePassesFilter(elem.typeFilter, row.ty)) {
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								                return;
 								            }
-												rustdoc: simplify JS search routine by not messing with lev distance

Since the sorting function accounts for an `index` field, there's not much
reason to also be applying changes to the levenshtein distance. Instead,
we can just not treat `lev` as a filter if there's already a non-sentinel
value for `index`.

This change gives slightly more weight to the index and path part, as
search criteria, than it used to. This changes some of the test cases,
but not in any obviously-"worse" way, and, in particular, substring matches
are a bigger deal than levenshtein distances (we're assuming that a typo
is less likely than someone just not typing the entire name).

Based on
https://github.com/rust-lang/rust/pull/103710#issuecomment-1296894296

											
										
										
											2022-12-16 11:12:59 -07:00
+								            const row_index = row.normalizedName.indexOf(elem.pathLast);
 								            const word_index = searchWord.indexOf(elem.pathLast);
 								            // lower indexes are "better" matches
 								            // rank based on the "best" match
 								            if (row_index === -1) {
 								                index = word_index;
 								            } else if (word_index === -1) {
 								                index = row_index;
 								            } else if (word_index < row_index) {
 								                index = word_index;
 								            } else {
 								                index = row_index;
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								            }
 								            if (elem.fullPath.length > 1) {
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								                path_dist = checkPath(elem.pathWithoutLast, row, maxEditDistance);
 								                if (path_dist > maxEditDistance) {
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								                    return;
 								                }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            }
-												rustdoc: simplify JS search routine by not messing with lev distance

Since the sorting function accounts for an `index` field, there's not much
reason to also be applying changes to the levenshtein distance. Instead,
we can just not treat `lev` as a filter if there's already a non-sentinel
value for `index`.

This change gives slightly more weight to the index and path part, as
search criteria, than it used to. This changes some of the test cases,
but not in any obviously-"worse" way, and, in particular, substring matches
are a bigger deal than levenshtein distances (we're assuming that a typo
is less likely than someone just not typing the entire name).

Based on
https://github.com/rust-lang/rust/pull/103710#issuecomment-1296894296

											
										
										
											2022-12-16 11:12:59 -07:00
+								            if (parsedQuery.literalSearch) {
 								                if (searchWord === elem.name) {
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								                    addIntoResults(results_others, fullId, pos, index, 0, path_dist);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                }
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								                return;
 								            }
-												rustdoc: simplify JS search routine by not messing with lev distance

Since the sorting function accounts for an `index` field, there's not much
reason to also be applying changes to the levenshtein distance. Instead,
we can just not treat `lev` as a filter if there's already a non-sentinel
value for `index`.

This change gives slightly more weight to the index and path part, as
search criteria, than it used to. This changes some of the test cases,
but not in any obviously-"worse" way, and, in particular, substring matches
are a bigger deal than levenshtein distances (we're assuming that a typo
is less likely than someone just not typing the entire name).

Based on
https://github.com/rust-lang/rust/pull/103710#issuecomment-1296894296

											
										
										
											2022-12-16 11:12:59 -07:00
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								            const dist = editDistance(searchWord, elem.pathLast, maxEditDistance);
-												rustdoc: simplify JS search routine by not messing with lev distance

Since the sorting function accounts for an `index` field, there's not much
reason to also be applying changes to the levenshtein distance. Instead,
we can just not treat `lev` as a filter if there's already a non-sentinel
value for `index`.

This change gives slightly more weight to the index and path part, as
search criteria, than it used to. This changes some of the test cases,
but not in any obviously-"worse" way, and, in particular, substring matches
are a bigger deal than levenshtein distances (we're assuming that a typo
is less likely than someone just not typing the entire name).

Based on
https://github.com/rust-lang/rust/pull/103710#issuecomment-1296894296

											
										
										
											2022-12-16 11:12:59 -07:00
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								            if (index === -1 && dist + path_dist > maxEditDistance) {
-												rustdoc: simplify JS search routine by not messing with lev distance

Since the sorting function accounts for an `index` field, there's not much
reason to also be applying changes to the levenshtein distance. Instead,
we can just not treat `lev` as a filter if there's already a non-sentinel
value for `index`.

This change gives slightly more weight to the index and path part, as
search criteria, than it used to. This changes some of the test cases,
but not in any obviously-"worse" way, and, in particular, substring matches
are a bigger deal than levenshtein distances (we're assuming that a typo
is less likely than someone just not typing the entire name).

Based on
https://github.com/rust-lang/rust/pull/103710#issuecomment-1296894296

											
										
										
											2022-12-16 11:12:59 -07:00
+								                return;
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								            }
-												rustdoc: simplify JS search routine by not messing with lev distance

Since the sorting function accounts for an `index` field, there's not much
reason to also be applying changes to the levenshtein distance. Instead,
we can just not treat `lev` as a filter if there's already a non-sentinel
value for `index`.

This change gives slightly more weight to the index and path part, as
search criteria, than it used to. This changes some of the test cases,
but not in any obviously-"worse" way, and, in particular, substring matches
are a bigger deal than levenshtein distances (we're assuming that a typo
is less likely than someone just not typing the entire name).

Based on
https://github.com/rust-lang/rust/pull/103710#issuecomment-1296894296

											
										
										
											2022-12-16 11:12:59 -07:00
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								            addIntoResults(results_others, fullId, pos, index, dist, path_dist, maxEditDistance);
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								        }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								        /**
-												Improve documentation and add some explanations in the code

											
										
										
											2022-02-11 15:48:57 +01:00
+								         * This function is called in case the query has more than one element. In this case, it'll
 								         * try to match the items which validates all the elements. For `aa -> bb` will look for
 								         * functions which have a parameter `aa` and has `bb` in its returned values.
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								         *
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								         * @param {Row} row
 								         * @param {integer} pos      - Position in the `searchIndex`.
 								         * @param {Object} results
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								         */
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								        function handleArgs(row, pos, results) {
-												rustdoc-search: build args, return, and generics on one unifier

This enhances generics with the "unboxing" behavior where A<T>
matches T. It makes this unboxing transitive over generics.

											
										
										
											2023-06-02 19:58:44 -07:00
+								            if (!row || (filterCrates !== null && row.crate !== filterCrates) || !row.type) {
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								                return;
 								            }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the function's name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Functions signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|}{|F|}-\frac{1}{|F|} = \frac{|F|-1}{|F|}$. And, since
  the values are only being compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature).

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								            const tfpDist = compareTypeFingerprints(
 								                row.id,
 								                parsedQuery.typeFingerprint
 								            );
 								            if (tfpDist === null) {
 								                return;
 								            }
 								            if (results.size >= MAX_RESULTS && tfpDist > results.max_dist) {
 								                return;
 								            }
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								            // If the result is too "bad", we return false and it ends this search.
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								            if (!unifyFunctionTypes(
 								                row.type.inputs,
 								                parsedQuery.elems,
 								                row.type.where_clause,
-												rustdoc-search: fix bugs when unboxing and reordering combine

											
										
										
											2023-09-09 16:49:29 -07:00
+								                null,
 								                mgens => {
 								                    return unifyFunctionTypes(
 								                        row.type.output,
 								                        parsedQuery.returned,
 								                        row.type.where_clause,
 								                        mgens
 								                    );
 								                }
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								            )) {
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								                return;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            }
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the function's name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Functions signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|}{|F|}-\frac{1}{|F|} = \frac{|F|-1}{|F|}$. And, since
  the values are only being compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature).

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								            results.max_dist = Math.max(results.max_dist || 0, tfpDist);
 								            addIntoResults(results, row.id, pos, 0, tfpDist, 0, Number.MAX_VALUE);
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								        }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								        function innerRunQuery() {
-												rustdoc: compute maximum Levenshtein distance based on the query

The heuristic is pretty close to the name resolver.

Fixes #103357

											
										
										
											2022-10-28 21:54:09 -07:00
+								            let queryLen = 0;
 								            for (const elem of parsedQuery.elems) {
 								                queryLen += elem.name.length;
 								            }
 								            for (const elem of parsedQuery.returned) {
 								                queryLen += elem.name.length;
 								            }
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								            const maxEditDistance = Math.floor(queryLen / 3);
-												rustdoc: compute maximum Levenshtein distance based on the query

The heuristic is pretty close to the name resolver.

Fixes #103357

											
										
										
											2022-10-28 21:54:09 -07:00
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								            /**
 								             * @type {Map<string, integer>}
 								             */
 								            const genericSymbols = new Map();
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								            /**
 								             * Convert names to ids in parsed query elements.
 								             * This is not used for the "In Names" tab, but is used for the
 								             * "In Params", "In Returns", and "In Function Signature" tabs.
 								             *
 								             * If there is no matching item, but a close-enough match, this
 								             * function also records that correction.
 								             *
 								             * See `buildTypeMapIndex` for more information.
 								             *
 								             * @param {QueryElement} elem
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								             * @param {boolean} isAssocType
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								             */
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								            function convertNameToId(elem, isAssocType) {
 								                if (typeNameIdMap.has(elem.pathLast) &&
 								                    (isAssocType || !typeNameIdMap.get(elem.pathLast).assocOnly)) {
 								                    elem.id = typeNameIdMap.get(elem.pathLast).id;
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								                } else if (!parsedQuery.literalSearch) {
-												rustdoc-search: `null`, not `-1`, for missing id

This allows us to use negative numbers for others purposes.

											
										
										
											2023-06-15 13:55:45 -07:00
+								                    let match = null;
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								                    let matchDist = maxEditDistance + 1;
 								                    let matchName = "";
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								                    for (const [name, {id, assocOnly}] of typeNameIdMap) {
-												[rustdoc] Fix path in type-based search

											
										
										
											2023-09-01 14:30:31 +02:00
+								                        const dist = editDistance(name, elem.pathLast, maxEditDistance);
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								                        if (dist <= matchDist && dist <= maxEditDistance &&
 								                            (isAssocType || !assocOnly)) {
-												rustdoc-search: make type name correction choice deterministic

											
										
										
											2023-04-20 12:34:17 -07:00
+								                            if (dist === matchDist && matchName > name) {
 								                                continue;
 								                            }
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								                            match = id;
 								                            matchDist = dist;
 								                            matchName = name;
 								                        }
 								                    }
-												rustdoc-search: `null`, not `-1`, for missing id

This allows us to use negative numbers for others purposes.

											
										
										
											2023-06-15 13:55:45 -07:00
+								                    if (match !== null) {
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								                        parsedQuery.correction = matchName;
 								                    }
 								                    elem.id = match;
 								                }
-												rustdoc: fix test case for generics that look like names

											
										
										
											2023-08-05 12:27:58 -07:00
+								                if ((elem.id === null && parsedQuery.totalElems > 1 && elem.typeFilter === -1
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                     && elem.generics.length === 0 && elem.bindings.size === 0)
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								                    || elem.typeFilter === TY_GENERIC) {
 								                    if (genericSymbols.has(elem.name)) {
 								                        elem.id = genericSymbols.get(elem.name);
 								                    } else {
 								                        elem.id = -(genericSymbols.size + 1);
 								                        genericSymbols.set(elem.name, elem.id);
 								                    }
 								                    if (elem.typeFilter === -1 && elem.name.length >= 3) {
 								                        // Silly heuristic to catch if the user probably meant
 								                        // to not write a generic parameter. We don't use it,
 								                        // just bring it up.
 								                        const maxPartDistance = Math.floor(elem.name.length / 3);
 								                        let matchDist = maxPartDistance + 1;
 								                        let matchName = "";
 								                        for (const name of typeNameIdMap.keys()) {
 								                            const dist = editDistance(name, elem.name, maxPartDistance);
 								                            if (dist <= matchDist && dist <= maxPartDistance) {
 								                                if (dist === matchDist && matchName > name) {
 								                                    continue;
 								                                }
 								                                matchDist = dist;
 								                                matchName = name;
 								                            }
 								                        }
 								                        if (matchName !== "") {
 								                            parsedQuery.proposeCorrectionFrom = elem.name;
 								                            parsedQuery.proposeCorrectionTo = matchName;
 								                        }
 								                    }
 								                    elem.typeFilter = TY_GENERIC;
 								                }
 								                if (elem.generics.length > 0 && elem.typeFilter === TY_GENERIC) {
 								                    // Rust does not have HKT
 								                    parsedQuery.error = [
 								                        "Generic type parameter ",
 								                        elem.name,
 								                        " does not accept generic parameters",
 								                    ];
 								                }
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								                for (const elem2 of elem.generics) {
 								                    convertNameToId(elem2);
 								                }
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                elem.bindings = new Map(Array.from(elem.bindings.entries())
 								                    .map(entry => {
 								                        const [name, constraints] = entry;
 								                        if (!typeNameIdMap.has(name)) {
 								                            parsedQuery.error = [
 								                                "Type parameter ",
 								                                name,
 								                                " does not exist",
 								                            ];
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								                            return [null, []];
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                        }
 								                        for (const elem2 of constraints) {
 								                            convertNameToId(elem2);
 								                        }
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								                        return [typeNameIdMap.get(name).id, constraints];
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                    })
 								                );
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								            }
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the function's name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Functions signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|}{|F|}-\frac{1}{|F|} = \frac{|F|-1}{|F|}$,
  which grows monotonically with $|F|$. And, since the values are only being
  compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature.

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								            const fps = new Set();
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								            for (const elem of parsedQuery.elems) {
 								                convertNameToId(elem);
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the function's name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Functions signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|}{|F|}-\frac{1}{|F|} = \frac{|F|-1}{|F|}$,
  which grows monotonically with $|F|$. And, since the values are only being
  compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature.

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								                buildFunctionTypeFingerprint(elem, parsedQuery.typeFingerprint, fps);
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								            }
 								            for (const elem of parsedQuery.returned) {
 								                convertNameToId(elem);
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the function's name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Functions signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|}{|F|}-\frac{1}{|F|} = \frac{|F|-1}{|F|}$,
  which grows monotonically with $|F|$. And, since the values are only being
  compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature.

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								                buildFunctionTypeFingerprint(elem, parsedQuery.typeFingerprint, fps);
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								            }
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the function's name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Functions signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|}{|F|}-\frac{1}{|F|} = \frac{|F|-1}{|F|}$,
  which grows monotonically with $|F|$. And, since the values are only being
  compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature.

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								            if (parsedQuery.foundElems === 1 && parsedQuery.returned.length === 0) {
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								                if (parsedQuery.elems.length === 1) {
-												Clean up variables in `search.js`

											
										
										
											2023-12-12 19:31:43 +01:00
+								                    const elem = parsedQuery.elems[0];
 								                    for (let i = 0, nSearchWords = searchWords.length; i < nSearchWords; ++i) {
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								                        // It means we want to check for this element everywhere (in names, args and
 								                        // returned).
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								                        handleSingleArg(
 								                            searchIndex[i],
 								                            i,
 								                            elem,
 								                            results_others,
 								                            results_in_args,
-												rustdoc: compute maximum Levenshtein distance based on the query

The heuristic is pretty close to the name resolver.

Fixes #103357

											
										
										
											2022-10-28 21:54:09 -07:00
+								                            results_returned,
-												rustdoc: use restricted Damerau-Levenshtein distance for search

Based on https://github.com/rust-lang/rust/pull/108200, for the same
rationale.

> This replaces the existing Levenshtein algorithm with the
> Damerau-Levenshtein algorithm. This means that "ab" to "ba" is one change
> (a transposition) instead of two (a deletion and insertion). More
> specifically, this is a restricted implementation, in that "ca" to "abc"
> cannot be performed as "ca" → "ac" → "abc", as there is an insertion in the
> middle of a transposition. I believe that errors like that are sufficiently
> rare that it's not worth taking into account.

Before this change, searching `prinltn!` listed `print!` first, followed
by `println!`. With this change, `println!` matches more closely.

											
										
										
											2023-03-10 18:18:43 -07:00
+								                            maxEditDistance
-												Apply suggestions:

 * Forbid generics without a path (so "<p>" is forbidden).
 * Change `handleSingleArg` so that it takes `results_others`, `results_in_args` and `results_returned` as arguments instead of using the "global" variables.
 * Change `createQueryElement` so that it returns the newly created element instead of taking `elems` as argument.
 * Improve documentation

											
										
										
											2022-03-20 15:03:17 +01:00
+								                        );
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                    }
 								                }
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            } else if (parsedQuery.foundElems > 0) {
-												rustdoc-search: better hashing, faster unification

The hash changes are based on some tests with `arti` and various
specific queries, aimed at reducing the false positive rate.

Sorting the query elements so that generics always come first is
instead aimed at reducing the number of Map operations on mgens,
assuming if the bloom filter does find a false positive, it'll
be able to reject the row without having to track a mapping.

- https://hur.st/bloomfilter/?n=3&p=&m=96&k=6

  Different functions have different amounts of inputs, and
  unification isn't very slow anyway, so figuring out a single
  ideal number of hash functions is nasty, but 6 keeps things
  low even up to 10 inputs.

- https://web.archive.org/web/20210927123933/https://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.72.2442&rep=rep1&type=pdf

  This is the `h1` and `h2`, both derived from `h0`.

											
										
										
											2023-12-10 22:46:40 -07:00
+								                // Sort input and output so that types with generic parameters or bindings
 								                // go first, then generic type variables, and simple concrete types go last.
 								                // That's because of the way unification is structured: it eats off
 								                // the end, and hits a fast path if the last item is a simple atom.
 								                // Comparator for query elements, used with Array.prototype.sort.
 								                // Primary key: elements with generics or bindings sort before
 								                // plain atoms (no generics, no bindings).
 								                // Secondary key: elements whose id is not positive sort before
 								                // elements with a positive id (presumably non-positive ids are
 								                // generic type variables -- confirm against the id assignment).
 								                const sortQ = (a, b) => {
 								                    const isAtom = elem =>
 								                        elem.generics.length === 0 && elem.bindings.size === 0;
 								                    // Booleans coerce to 0/1 under subtraction, giving -1, 0 or 1.
 								                    const atomDelta = isAtom(a) - isAtom(b);
 								                    if (atomDelta !== 0) {
 								                        return atomDelta;
 								                    }
 								                    return (a.id > 0) - (b.id > 0);
 								                };
 								                parsedQuery.elems.sort(sortQ);
 								                parsedQuery.returned.sort(sortQ);
-												Clean up variables in `search.js`

											
										
										
											2023-12-12 19:31:43 +01:00
+								                for (let i = 0, nSearchWords = searchWords.length; i < nSearchWords; ++i) {
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								                    handleArgs(searchIndex[i], i, results_others);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                }
 								            }
 								        }
-												Make query parser more strict and improve display of errors

											
										
										
											2022-01-09 15:12:46 +01:00
 								        if (parsedQuery.error === null) {
 								            innerRunQuery();
 								        }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const ret = createQueryResults(
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								            sortResults(results_in_args, true, currentCrate),
 								            sortResults(results_returned, true, currentCrate),
 								            sortResults(results_others, false, currentCrate),
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								            parsedQuery);
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								        handleAliases(ret, parsedQuery.original.replace(/"/g, ""), filterCrates, currentCrate);
-												Make query parser more strict and improve display of errors

											
										
										
											2022-01-09 15:12:46 +01:00
+								        if (parsedQuery.error !== null && ret.others.length !== 0) {
 								            // It means some doc aliases were found so let's "remove" the error!
 								            ret.query.error = null;
 								        }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        return ret;
 								    }
-												rustdoc: use focus for search navigation

Rather than keeping track of highlighted element inside the JS, take
advantage of `.focus()` and the :focus CSS pseudo-class.

This required wrapping each row of results in one big <a> tag (because
anchors can be focused, but table rows cannot). That in turn required
moving from a table layout to a div layout with float.

This makes it so Ctrl+Enter opens links in new tabs, and using the arrow
keys to navigate off the bottom of the page scrolls the rest of the page
into view. It also simplifies the keyboard event handling. It eliminates
the need for click handlers on the search results, and for tracking
mouse movements.

This changes the UI treatment of mouse hovering. A hovered element now
gets a light grey background, but does not change the focused element.
It's possible to have two highlighted search results: one that is
focused (via keyboard) and one that is hovered (via mouse). Pressing
enter will activate the focused link; clicking will activate the hovered
link. This matches up with how Firefox and Chrome handle suggestions in
their URL bar, and avoids stray mouse movements changing the focus.

Selecting tabs is now done with left/right arrows while any search
result is focused. The visibility of results on each search tab is
controlled with the "active" class, rather than by setting display: none
directly. Note that the old code kept track of highlighted search
element when tabbing back and forth. The new code doesn't.

											
										
										
											2021-05-09 12:56:21 -07:00
+								    function nextTab(direction) {
 								        // Move to the tab that is direction positions away from the current one.
 								        // The index wraps around through the modulo by the length of
 								        // searchState.focusedByTab; the + 3 presumably keeps the left operand
 								        // non-negative when direction is -1 (TODO confirm).
 								        // The element that has focus right now is remembered for the tab being
 								        // left, then printTab switches tabs and focusSearchResult moves focus.
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const next = (searchState.currentTab + direction + 3) % searchState.focusedByTab.length;
-												rustdoc: use focus for search navigation

Rather than keeping track of highlighted element inside the JS, take
advantage of `.focus()` and the :focus CSS pseudo-class.

This required wrapping each row of results in one big <a> tag (because
anchors can be focused, but table rows cannot). That in turn required
moving from a table layout to a div layout with float.

This makes it so Ctrl+Enter opens links in new tabs, and using the arrow
keys to navigate off the bottom of the page scrolls the rest of the page
into view. It also simplifies the keyboard event handling. It eliminates
the need for click handlers on the search results, and for tracking
mouse movements.

This changes the UI treatment of mouse hovering. A hovered element now
gets a light grey background, but does not change the focused element.
It's possible to have two highlighted search results: one that is
focused (via keyboard) and one that is hovered (via mouse). Pressing
enter will activate the focused link; clicking will activate the hovered
link. This matches up with how Firefox and Chrome handle suggestions in
their URL bar, and avoids stray mouse movements changing the focus.

Selecting tabs is now done with left/right arrows while any search
result is focused. The visibility of results on each search tab is
controlled with the "active" class, rather than by setting display: none
directly. Note that the old code kept track of highlighted search
element when tabbing back and forth. The new code doesn't.

											
										
										
											2021-05-09 12:56:21 -07:00
+								        searchState.focusedByTab[searchState.currentTab] = document.activeElement;
 								        printTab(next);
 								        focusSearchResult();
 								    }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												Reset "focusedByTab" field when doing another search

											
										
										
											2021-05-20 12:45:25 +02:00
+								    // Focus the first search result on the active tab, or the result that
-												rustdoc: use focus for search navigation

Rather than keeping track of highlighted element inside the JS, take
advantage of `.focus()` and the :focus CSS pseudo-class.

This required wrapping each row of results in one big <a> tag (because
anchors can be focused, but table rows cannot). That in turn required
moving from a table layout to a div layout with float.

This makes it so Ctrl+Enter opens links in new tabs, and using the arrow
keys to navigate off the bottom of the page scrolls the rest of the page
into view. It also simplifies the keyboard event handling. It eliminates
the need for click handlers on the search results, and for tracking
mouse movements.

This changes the UI treatment of mouse hovering. A hovered element now
gets a light grey background, but does not change the focused element.
It's possible to have two highlighted search results: one that is
focused (via keyboard) and one that is hovered (via mouse). Pressing
enter will activate the focused link; clicking will activate the hovered
link. This matches up with how Firefox and Chrome handle suggestions in
their URL bar, and avoids stray mouse movements changing the focus.

Selecting tabs is now done with left/right arrows while any search
result is focused. The visibility of results on each search tab is
controlled with the "active" class, rather than by setting display: none
directly. Note that the old code kept track of highlighted search
element when tabbing back and forth. The new code doesn't.

											
										
										
											2021-05-09 12:56:21 -07:00
+								    // was focused last time this tab was active.
 								    function focusSearchResult() {
 								        // Candidates are tried in order: the element remembered for the current
 								        // tab, then the first link inside the active results list, then the
 								        // button of the current tab. The remembered element is cleared after it
 								        // has been read, and focus is only moved when a candidate was found.
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const target = searchState.focusedByTab[searchState.currentTab] ||
-												Reset "focusedByTab" field when doing another search

											
										
										
											2021-05-20 12:45:25 +02:00
+								            document.querySelectorAll(".search-results.active a").item(0) ||
-												rustdoc: use a more evocative name for CSS/JS `#titles`

This renames the ID, which is only used in search results, to
`#search-tabs`. Also changes the `.count` to a span, so it doesn't need its
display mode to be overridden.

											
										
										
											2022-12-22 15:52:34 -07:00
+								            document.querySelectorAll("#search-tabs button").item(searchState.currentTab);
-												rustdoc: fix corner case in search keyboard commands

											
										
										
											2022-11-14 10:41:07 -07:00
+								        searchState.focusedByTab[searchState.currentTab] = null;
-												rustdoc: use focus for search navigation

Rather than keeping track of highlighted element inside the JS, take
advantage of `.focus()` and the :focus CSS pseudo-class.

This required wrapping each row of results in one big <a> tag (because
anchors can be focused, but table rows cannot). That in turn required
moving from a table layout to a div layout with float.

This makes it so Ctrl+Enter opens links in new tabs, and using the arrow
keys to navigate off the bottom of the page scrolls the rest of the page
into view. It also simplifies the keyboard event handling. It eliminates
the need for click handlers on the search results, and for tracking
mouse movements.

This changes the UI treatment of mouse hovering. A hovered element now
gets a light grey background, but does not change the focused element.
It's possible to have two highlighted search results: one that is
focused (via keyboard) and one that is hovered (via mouse). Pressing
enter will activate the focused link; clicking will activate the hovered
link. This matches up with how Firefox and Chrome handle suggestions in
their URL bar, and avoids stray mouse movements changing the focus.

Selecting tabs is now done with left/right arrows while any search
result is focused. The visibility of results on each search tab is
controlled with the "active" class, rather than by setting display: none
directly. Note that the old code kept track of highlighted search
element when tabbing back and forth. The new code doesn't.

											
										
										
											2021-05-09 12:56:21 -07:00
+								        if (target) {
 								            target.focus();
 								        }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								    }
 								    /**
 								     * Compute the path text to display for a search result and the URL
 								     * that the result links to.
 								     *
 								     * The URL layout depends on the item type: modules and extern crates
 								     * point at an index.html page, re-exports at a reexport anchor on the
 								     * index page of their path, items with a parent at an anchor on the
 								     * page of that parent (prefixed with the impl disambiguator when one
 								     * is set), and everything else at a page named after type and name.
 								     * Primitives, keywords and extern crates get an empty display path.
 								     *
 								     * @param {Object} item - Search result row; the fields read here are
 								     *                        ty, name, path, parent and implDisambiguator.
 								     * @return {Array<string>} Two entries: the display path, then the href.
 								     */
 								    function buildHrefAndPath(item) {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        let displayPath;
 								        let href;
 								        const type = itemTypes[item.ty];
 								        const name = item.name;
 								        let path = item.path;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								        if (type === "mod") {
 								            displayPath = path + "::";
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								            href = ROOT_PATH + path.replace(/::/g, "/") + "/" +
 								                name + "/index.html";
-												Fix reexports missing from the search index

											
										
										
											2022-05-05 21:56:03 +02:00
+								        } else if (type === "import") {
 								            displayPath = item.path + "::";
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								            href = ROOT_PATH + item.path.replace(/::/g, "/") + "/index.html#reexport." + name;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        } else if (type === "primitive" || type === "keyword") {
 								            displayPath = "";
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								            href = ROOT_PATH + path.replace(/::/g, "/") +
 								                "/" + type + "." + name + ".html";
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        } else if (type === "externcrate") {
 								            displayPath = "";
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								            href = ROOT_PATH + name + "/index.html";
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        } else if (item.parent !== undefined) {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const myparent = item.parent;
-												rustdoc-search: add impl disambiguator to duplicate assoc items

Helps with #90929

This changes the search results, specifically, when there's more than
one impl with an associated item with the same name. For example,
the search queries `simd<i8> -> simd<i8>` and `simd<i64> -> simd<i64>`
don't link to the same function, but most of the functions have the
same names.

This change should probably be FCP-ed, especially since it adds a new
anchor link format for `main.js` to handle, so that URLs like
`struct.Vec.html#impl-AsMut<[T]>-for-Vec<T,+A>/method.as_mut` redirect
to `struct.Vec.html#method.as_mut-2`. It's a strange design, but there
are a few reasons for it:

* I'd like to avoid making the HTML bigger. Obviously, fixing this bug
  is going to add at least a little more data to the search index, but
  adding more HTML penalises viewers for the benefit of searchers.

* Breaking `struct.Vec.html#method.len` would also be a disappointment.

On the other hand:

* The path-style anchors might be less prone to link rot than the numbered
  anchors. It's definitely less likely to have URLs that appear to "work",
  but silently point at the wrong thing.

* This commit arranges the path-style anchor to redirect to the numbered
  anchor. Nothing stops rustdoc from doing the opposite, making path-style
  anchors the default and redirecting the "legacy" numbered ones.

											
										
										
											2023-03-20 16:02:51 -07:00
+								            let anchor = type + "." + name;
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const parentType = itemTypes[myparent.ty];
 								            let pageType = parentType;
 								            let pageName = myparent.name;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								            if (parentType === "primitive") {
 								                displayPath = myparent.name + "::";
 								            } else if (type === "structfield" && parentType === "variant") {
 								                // Structfields belonging to variants are special: the
 								                // final path element is the enum name.
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                const enumNameIdx = item.path.lastIndexOf("::");
 								                const enumName = item.path.substr(enumNameIdx + 2);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                path = item.path.substr(0, enumNameIdx);
 								                displayPath = path + "::" + enumName + "::" + myparent.name + "::";
-												rustdoc-search: add impl disambiguator to duplicate assoc items

Helps with #90929

This changes the search results, specifically, when there's more than
one impl with an associated item with the same name. For example,
the search queries `simd<i8> -> simd<i8>` and `simd<i64> -> simd<i64>`
don't link to the same function, but most of the functions have the
same names.

This change should probably be FCP-ed, especially since it adds a new
anchor link format for `main.js` to handle, so that URLs like
`struct.Vec.html#impl-AsMut<[T]>-for-Vec<T,+A>/method.as_mut` redirect
to `struct.Vec.html#method.as_mut-2`. It's a strange design, but there
are a few reasons for it:

* I'd like to avoid making the HTML bigger. Obviously, fixing this bug
  is going to add at least a little more data to the search index, but
  adding more HTML penalises viewers for the benefit of searchers.

* Breaking `struct.Vec.html#method.len` would also be a disappointment.

On the other hand:

* The path-style anchors might be less prone to link rot than the numbered
  anchors. It's definitely less likely to have URLs that appear to "work",
  but silently point at the wrong thing.

* This commit arranges the path-style anchor to redirect to the numbered
  anchor. Nothing stops rustdoc from doing the opposite, making path-style
  anchors the default and redirecting the "legacy" numbered ones.

											
										
										
											2023-03-20 16:02:51 -07:00
+								                anchor = "variant." + myparent.name + ".field." + name;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                pageType = "enum";
 								                pageName = enumName;
 								            } else {
 								                displayPath = path + "::" + myparent.name + "::";
 								            }
-												rustdoc-search: add impl disambiguator to duplicate assoc items

Helps with #90929

This changes the search results, specifically, when there's more than
one impl with an associated item with the same name. For example,
the search queries `simd<i8> -> simd<i8>` and `simd<i64> -> simd<i64>`
don't link to the same function, but most of the functions have the
same names.

This change should probably be FCP-ed, especially since it adds a new
anchor link format for `main.js` to handle, so that URLs like
`struct.Vec.html#impl-AsMut<[T]>-for-Vec<T,+A>/method.as_mut` redirect
to `struct.Vec.html#method.as_mut-2`. It's a strange design, but there
are a few reasons for it:

* I'd like to avoid making the HTML bigger. Obviously, fixing this bug
  is going to add at least a little more data to the search index, but
  adding more HTML penalises viewers for the benefit of searchers.

* Breaking `struct.Vec.html#method.len` would also be a disappointment.

On the other hand:

* The path-style anchors might be less prone to link rot than the numbered
  anchors. It's definitely less likely to have URLs that appear to "work",
  but silently point at the wrong thing.

* This commit arranges the path-style anchor to redirect to the numbered
  anchor. Nothing stops rustdoc from doing the opposite, making path-style
  anchors the default and redirecting the "legacy" numbered ones.

											
										
										
											2023-03-20 16:02:51 -07:00
+								            if (item.implDisambiguator !== null) {
 								                anchor = item.implDisambiguator + "/" + anchor;
 								            }
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								            href = ROOT_PATH + path.replace(/::/g, "/") +
 								                "/" + pageType +
 								                "." + pageName +
-												rustdoc-search: add impl disambiguator to duplicate assoc items

Helps with #90929

This changes the search results, specifically, when there's more than
one impl with an associated item with the same name. For example,
the search queries `simd<i8> -> simd<i8>` and `simd<i64> -> simd<i64>`
don't link to the same function, but most of the functions have the
same names.

This change should probably be FCP-ed, especially since it adds a new
anchor link format for `main.js` to handle, so that URLs like
`struct.Vec.html#impl-AsMut<[T]>-for-Vec<T,+A>/method.as_mut` redirect
to `struct.Vec.html#method.as_mut-2`. It's a strange design, but there
are a few reasons for it:

* I'd like to avoid making the HTML bigger. Obviously, fixing this bug
  is going to add at least a little more data to the search index, but
  adding more HTML penalises viewers for the benefit of searchers.

* Breaking `struct.Vec.html#method.len` would also be a disappointment.

On the other hand:

* The path-style anchors might be less prone to link rot than the numbered
  anchors. It's definitely less likely to have URLs that appear to "work",
  but silently point at the wrong thing.

* This commit arranges the path-style anchor to redirect to the numbered
  anchor. Nothing stops rustdoc from doing the opposite, making path-style
  anchors the default and redirecting the "legacy" numbered ones.

											
										
										
											2023-03-20 16:02:51 -07:00
+								                ".html#" + anchor;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        } else {
 								            displayPath = item.path + "::";
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								            href = ROOT_PATH + item.path.replace(/::/g, "/") +
 								                "/" + type + "." + name + ".html";
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        }
 								        return [displayPath, href];
 								    }
 								    /**
 								     * Turn a path into HTML in which every segment ending in :: sits in
 								     * its own <span>. When the path itself ends with ::, the empty
 								     * <span> opened after the last separator is trimmed off again. A
 								     * final segment without a trailing :: is left inside an unclosed
 								     * <span>.
 								     *
 								     * @param {string} path
 								     * @return {string}
 								     */
 								    function pathSplitter(path) {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const tmp = "<span>" + path.replace(/::/g, "::</span><span>");
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        if (tmp.endsWith("<span>")) {
 								            return tmp.slice(0, tmp.length - 6);
 								        }
 								        return tmp;
 								    }
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								    /**
 								     * Render a set of search results for a single tab.
 								     * @param {Array<?>}    array   - The search results for this tab
 								     * @param {ParsedQuery} query
 								     * @param {boolean}     display - True if this is the active tab
 								     */
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								    function addTab(array, query, display) {
-												rustdoc-search: clean up some DOM code

											
										
										
											2023-11-25 10:39:45 -07:00
+								        const extraClass = display ? " active" : "";
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const output = document.createElement("div");
-												Make query parser more strict and improve display of errors

											
										
										
											2022-01-09 15:12:46 +01:00
+								        if (array.length > 0) {
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
+								            output.className = "search-results " + extraClass;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												Move callback to the () => {} syntax.

Fix lint

Fix main.js

Restore anonymous functions

Fix

Fix more

											
										
										
											2022-05-03 12:03:17 +08:00
+								            array.forEach(item => {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                const name = item.name;
 								                const type = itemTypes[item.ty];
-												Add search result item types after their name

											
										
										
											2023-04-22 16:00:20 +02:00
+								                const longType = longItemTypes[item.ty];
-												Move item kind before the item name

											
										
										
											2023-05-18 16:16:13 +02:00
+								                const typeName = longType.length !== 0 ? `${longType}` : "?";
-												Move extra search result information for keywords and primitives from CSS to DOM

											
										
										
											2021-05-24 14:24:34 +02:00
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                const link = document.createElement("a");
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
+								                link.className = "result-" + type;
 								                link.href = item.href;
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                const resultName = document.createElement("div");
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
+								                resultName.className = "result-name";
-												Fix display of aliases in rustdoc search results

											
										
										
											2023-07-18 14:22:27 +02:00
+								                resultName.insertAdjacentHTML(
 								                    "beforeend",
 								                    `<span class="typename">${typeName}</span>`);
 								                link.appendChild(resultName);
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
-												Fix display of aliases in rustdoc search results

											
										
										
											2023-07-18 14:22:27 +02:00
+								                let alias = " ";
 								                if (item.is_alias) {
 								                    alias = ` <div class="alias">\
 								<b>${item.alias}</b><i class="grey">&nbsp;- see&nbsp;</i>\
 								</div>`;
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
+								                }
 								                resultName.insertAdjacentHTML(
 								                    "beforeend",
-												Fix display of aliases in rustdoc search results

											
										
										
											2023-07-18 14:22:27 +02:00
+								                    `<div class="path">${alias}\
 								${item.displayPath}<span class="${type}">${name}</span>\
-												Fix display of long items in search results

											
										
										
											2023-06-27 15:05:43 +02:00
+								</div>`);
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                const description = document.createElement("div");
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
+								                description.className = "desc";
-												rustdoc: get rid of CSS/DOM `div.desc span`, which isn't really needed

											
										
										
											2022-11-04 13:19:33 -07:00
+								                description.insertAdjacentHTML("beforeend", item.desc);
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
-												rustdoc: simplify search results CSS and DOM

There is a layout change caused by this commit, but it's subtle. You won't
notice it unless you're looking for it.

											
										
										
											2022-11-04 12:34:24 -07:00
+								                link.appendChild(description);
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
+								                output.appendChild(link);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            });
-												Make query parser more strict and improve display of errors

											
										
										
											2022-01-09 15:12:46 +01:00
+								        } else if (query.error === null) {
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
+								            output.className = "search-failed" + extraClass;
 								            output.innerHTML = "No results :(<br/>" +
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                "Try on <a href=\"https://duckduckgo.com/?q=" +
-												Improve naming of "val" field

											
										
										
											2022-01-03 16:43:30 +01:00
+								                encodeURIComponent("rust " + query.userQuery) +
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                "\">DuckDuckGo</a>?<br/><br/>" +
 								                "Or try looking in one of these:<ul><li>The <a " +
 								                "href=\"https://doc.rust-lang.org/reference/index.html\">Rust Reference</a> " +
 								                " for technical details about the language.</li><li><a " +
 								                "href=\"https://doc.rust-lang.org/rust-by-example/index.html\">Rust By " +
 								                "Example</a> for expository code examples.</a></li><li>The <a " +
 								                "href=\"https://doc.rust-lang.org/book/index.html\">Rust Book</a> for " +
 								                "introductions to language features and the language itself.</li><li><a " +
 								                "href=\"https://docs.rs\">Docs.rs</a> for documentation of crates released on" +
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
+								                " <a href=\"https://crates.io/\">crates.io</a>.</li></ul>";
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        }
-												Clean up variables in `search.js`

											
										
										
											2023-12-12 19:31:43 +01:00
+								        return [output, array.length];
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								    }
 								    /**
 								     * Build the HTML markup for one search-results tab button.
 								     *
 								     * The button carries the `selected` class when `tabNb` is equal to
 								     * `searchState.currentTab`. The element count is appended inside a
 								     * `<span class="count">` and padded with figure spaces (U+2007) so that
 								     * one-, two- and three-digit counts take up the same width.
 								     *
 								     * @param {number} tabNb - index of the tab this header stands for
 								     * @param {string} text - label displayed on the button
 								     * @param {number} nbElems - number of results listed under the tab
 								     * @returns {string} the `<button>` markup as a string
 								     */
 								    function makeTabHeader(tabNb, text, nbElems) {
-												rustdoc: add test cases, and fix, search tabs

											
										
										
											2023-09-19 19:40:36 -07:00
+								        // https://blog.horizon-eda.org/misc/2020/02/19/ui.html
-												rustdoc: add comment about numeric spacing

											
										
										
											2023-09-20 07:51:30 -07:00
+								        //
 								        // CSS runs with `font-variant-numeric: tabular-nums` to ensure all
 								        // digits are the same width. \u{2007} is a Unicode space character
 								        // that is defined to be the same width as a digit.
-												rustdoc: add test cases, and fix, search tabs

											
										
										
											2023-09-19 19:40:36 -07:00
+								        const fmtNbElems =
 								            nbElems < 10  ? `\u{2007}(${nbElems})\u{2007}\u{2007}` :
 								            nbElems < 100 ? `\u{2007}(${nbElems})\u{2007}` :
 								            `\u{2007}(${nbElems})`;
-												Consolidate search-related vars and functions.

This allows sharing across main.js and search.js without exporting too
many symbols into the global namespace.

											
										
										
											2021-04-12 23:50:18 -07:00
+								        if (searchState.currentTab === tabNb) {
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            return "<button class=\"selected\">" + text +
-												rustdoc: add test cases, and fix, search tabs

											
										
										
											2023-09-19 19:40:36 -07:00
+								                   "<span class=\"count\">" + fmtNbElems + "</span></button>";
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        }
-												rustdoc: add test cases, and fix, search tabs

											
										
										
											2023-09-19 19:40:36 -07:00
+								        return "<button>" + text + "<span class=\"count\">" + fmtNbElems + "</span></button>";
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								    }
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								    /**
 								     * @param {ResultsTable} results
 								     * @param {boolean} go_to_first
 								     * @param {string} filterCrates
 								     */
-												Move crate drop-down to search results page

This reduces clutter on doc pages.

											
										
										
											2022-01-01 23:48:34 -05:00
+								    function showResults(results, go_to_first, filterCrates) {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const search = searchState.outputElement();
-												Add go_to_first boolean query param to immediately jump to the first search result

											
										
										
											2021-05-31 19:20:41 -07:00
+								        if (go_to_first || (results.others.length === 1
-												Fix "Directly go to item in search if there is only one result" setting

											
										
										
											2023-03-26 17:50:02 +02:00
+								            && getSettingValue("go-to-only-result") === "true")
-												Add new eslint rule about brace style

											
										
										
											2022-05-14 13:50:52 +02:00
+								        ) {
-												Fix invalid handling of "going back in history" when "Directly go to item in search if there is only one result" setting is set to true

											
										
										
											2023-06-16 16:56:13 +02:00
+								            // Needed to force re-execution of JS when coming back to a page. Let's take this
 								            // scenario as example:
 								            //
 								            // 1. You have the "Directly go to item in search if there is only one result" option
 								            //    enabled.
 								            // 2. You make a search which yields only one result, leading you automatically to
 								            //    this result.
 								            // 3. You go back to previous page.
 								            //
 								            // Now, without the call below, the JS will not be re-executed and the previous state
 								            // will be used, starting search again since the search input is not empty, leading you
 								            // back to the previous page again.
 								            window.onunload = () => {};
 								            searchState.removeQueryParameters();
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const elem = document.createElement("a");
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            elem.href = results.others[0].href;
-												rustdoc: use focus for search navigation

Rather than keeping track of highlighted element inside the JS, take
advantage of `.focus()` and the :focus CSS pseudo-class.

This required wrapping each row of results in one big <a> tag (because
anchors can be focused, but table rows cannot). That in turn required
moving from a table layout to a div layout with float.

This makes it so Ctrl+Enter opens links in new tabs, and using the arrow
keys to navigate off the bottom of the page scrolls the rest of the page
into view. It also simplifies the keyboard event handling. It eliminates
the need for click handlers on the search results, and for tracking
mouse movements.

This changes the UI treatment of mouse hovering. A hovered element now
gets a light grey background, but does not change the focused element.
It's possible to have two highlighted search results: one that is
focused (via keyboard) and one that is hovered (via mouse). Pressing
enter will activate the focused link; clicking will activate the hovered
link. This matches up with how Firefox and Chrome handle suggestions in
their URL bar, and avoids stray mouse movements changing the focus.

Selecting tabs is now done with left/right arrows while any search
result is focused. The visibility of results on each search tab is
controlled with the "active" class, rather than by setting display: none
directly. Note that the old code kept track of highlighted search
element when tabbing back and forth. The new code doesn't.

											
										
										
											2021-05-09 12:56:21 -07:00
+								            removeClass(elem, "active");
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            // For firefox, we need the element to be in the DOM so it can be clicked.
 								            document.body.appendChild(elem);
 								            elem.click();
 								            return;
 								        }
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								        if (results.query === undefined) {
 								            results.query = parseQuery(searchState.input.value);
 								        }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												* Greatly improve the rustdoc search parser source code
* Move all functions outside parseQuery

											
										
										
											2022-01-04 15:44:00 +01:00
+								        currentResults = results.query.userQuery;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const ret_others = addTab(results.others, results.query, true);
 								        const ret_in_args = addTab(results.in_args, results.query, false);
 								        const ret_returned = addTab(results.returned, results.query, false);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								        // Navigate to the relevant tab if the current tab is empty, like in case users search
 								        // for "-> String". If they had selected another tab previously, they have to click on
 								        // it again.
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        let currentTab = searchState.currentTab;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        if ((currentTab === 0 && ret_others[1] === 0) ||
 								                (currentTab === 1 && ret_in_args[1] === 0) ||
 								                (currentTab === 2 && ret_returned[1] === 0)) {
 								            if (ret_others[1] !== 0) {
 								                currentTab = 0;
 								            } else if (ret_in_args[1] !== 0) {
 								                currentTab = 1;
 								            } else if (ret_returned[1] !== 0) {
 								                currentTab = 2;
 								            }
 								        }
-												Rustdoc style cleanups

 - Make "since" version numbers grey again (regressed in #92602).
 - Remove unneeded selectors for when crate filter dropdown is a
   sibling of search-input.
 - Crate filter dropdown doesn't need to be 100% width on mobile.
 - Only build crate filter dropdown when there is more than one crate.
 - Remove unused addCrateDropdown.

											
										
										
											2022-01-12 15:05:47 -08:00
+								        let crates = "";
-												Improve loading of crates.js and sidebar-items.js

Now that the "All Crates" dropdown is only rendered on the search results page,
there is no need to load crates.js on most pages. Load it only on crate pages.
Also, add the `defer` attribute so it does not block page rendering.

For sidebar-items.js, move the script tag to `<head>`. Since it already has the
defer attribute it won't block loading. The defer attribute does preserve
ordering between scripts, so instead of the callback on load, it can set a
global variable on load, which is slightly simpler. Also, since it is required
to finish rendering the page, beginning its load earlier is better.

Remove generation and handling of sidebar-vars. Everything there can be computed
with information available in JS via other means.

Remove the "other" wrapper in the sidebar. It was unnecessary.

Remove excess script fields

											
										
										
											2022-06-14 23:25:51 -07:00
+								        const crates_list = Object.keys(rawSearchIndex);
 								        if (crates_list.length > 1) {
-												Improve crate selection on rustdoc search results page

Resolves all of issue #93240

Reproduces a similar change as #99086, but with improvements

In particular, this PR includes:
* redesigning the crate-search selector so the background color matches its surroundings
* decrease the font of the dropdown menu to a reasonable size
* add a hover effect
* make the color of the arrow theme-dependent, using a surrounding div, with :after pseudo-element
  that can then be transformed using CSS filters to approximate the desired color
* fix the text "in" to match the title font
* remove the "for xyz" in the "Results for xyz in [All crates]" title when
  searching for search term "xyz"; you can already see what you're searching for
  as it's typed in the search bar!
* in line with #99086, handle super-long crate names appropriately without a long <select>
  element escaping the screen area; the improvement is that we also keep the title
  within a single line now; uses some flex layout shenanigans...
* the margins / paddings are adjusted so the selected label of the <select> fits within
  the rest of that title nicely; also some inconsistency in the way that Firefox renders
  a <select> with "appearance: none" (roughly 4px more padding left and right of the text
  than e.g. Chrome) is worked around, and it now produces a result that looks (essentially)
  identical to Chrome
* the color of the help menu and settings menu border in light theme is made to match with
  the color of the corresponding buttons, like they do (match) in the ayu theme
* the casing of "All crates" changes to "all crates"
* the new tests from #99086 are temporarily disabled, until they can be adapted later

											
										
										
											2022-07-03 20:10:19 +02:00
+								            crates = " in&nbsp;<div id=\"crate-search-div\"><select id=\"crate-search\">" +
 								                "<option value=\"all crates\">all crates</option>";
-												Improve loading of crates.js and sidebar-items.js

Now that the "All Crates" dropdown is only rendered on the search results page,
there is no need to load crates.js on most pages. Load it only on crate pages.
Also, add the `defer` attribute so it does not block page rendering.

For sidebar-items.js, move the script tag to `<head>`. Since it already has the
defer attribute it won't block loading. The defer attribute does preserve
ordering between scripts, so instead of the callback on load, it can set a
global variable on load, which is slightly simpler. Also, since it is required
to finish rendering the page, beginning its load earlier is better.

Remove generation and handling of sidebar-vars. Everything there can be computed
with information available in JS via other means.

Remove the "other" wrapper in the sidebar. It was unnecessary.

Remove excess script fields

											
										
										
											2022-06-14 23:25:51 -07:00
+								            for (const c of crates_list) {
-												Add "eqeqeq" eslint rule

											
										
										
											2022-05-27 22:30:19 +02:00
+								                crates += `<option value="${c}" ${c === filterCrates && "selected"}>${c}</option>`;
-												Rustdoc style cleanups

 - Make "since" version numbers grey again (regressed in #92602).
 - Remove unneeded selectors for when crate filter dropdown is a
   sibling of search-input.
 - Crate filter dropdown doesn't need to be 100% width on mobile.
 - Only build crate filter dropdown when there is more than one crate.
 - Remove unused addCrateDropdown.

											
										
										
											2022-01-12 15:05:47 -08:00
+								            }
-												Improve crate selection on rustdoc search results page

Resolves all of issue #93240

Reproduces a similar change as #99086, but with improvements

In particular, this PR includes:
* redesigning the crate-search selector so the background color matches its surroundings
* decrease the font of the dropdown menu to a reasonable size
* add a hover effect
* make the color of the arrow theme-dependent, using a surrounding div, with :after pseudo-element
  that can then be transformed using CSS filters to approximate the desired color
* fix the text "in" to match the title font
* remove the "for xyz" in the "Results for xyz in [All crates]" title when
  searching for search term "xyz"; you can already see what you're searching for
  as it's typed in the search bar!
* in line with #99086, handle super-long crate names appropriately without a long <select>
  element escaping the screen area; the improvement is that we also keep the title
  within a single line now; uses some flex layout shenanigans...
* the margins / paddings are adjusted so the selected label of the <select> fits within
  the rest of that title nicely; also some inconsistency in the way that Firefox renders
  a <select> with "appearance: none" (roughly 4px more padding left and right of the text
  than e.g. Chrome) is worked around, and it now produces a result that looks (essentially)
  identical to Chrome
* the color of the help menu and settings menu border in light theme is made to match with
  the color of the corresponding buttons, like they do (match) in the ayu theme
* the casing of "All crates" changes to "all crates"
* the new tests from #99086 are temporarily disabled, until they can be adapted later

											
										
										
											2022-07-03 20:10:19 +02:00
+								            crates += "</select></div>";
-												Greatly improve rustdoc search

											
										
										
											2021-12-20 15:42:08 +01:00
+								        }
-												Improve crate selection on rustdoc search results page

Resolves all of issue #93240

Reproduces a similar change as #99086, but with improvements

In particular, this PR includes:
* redesigning the crate-search selector so the background color matches its surroundings
* decrease the font of the dropdown menu to a reasonable size
* add a hover effect
* make the color of the arrow theme-dependent, using a surrounding div, with :after pseudo-element
  that can then be transformed using CSS filters to approximate the desired color
* fix the text "in" to match the title font
* remove the "for xyz" in the "Results for xyz in [All crates]" title when
  searching for search term "xyz"; you can already see what you're searching for
  as it's typed in the search bar!
* in line with #99086, handle super-long crate names appropriately without a long <select>
  element escaping the screen area; the improvement is that we also keep the title
  within a single line now; uses some flex layout shenanigans...
* the margins / paddings are adjusted so the selected label of the <select> fits within
  the rest of that title nicely; also some inconsistency in the way that Firefox renders
  a <select> with "appearance: none" (roughly 4px more padding left and right of the text
  than e.g. Chrome) is worked around, and it now produces a result that looks (essentially)
  identical to Chrome
* the color of the help menu and settings menu border in light theme is made to match with
  the color of the corresponding buttons, like they do (match) in the ayu theme
* the casing of "All crates" changes to "all crates"
* the new tests from #99086 are temporarily disabled, until they can be adapted later

											
										
										
											2022-07-03 20:10:19 +02:00
+								        let output = `<h1 class="search-results-title">Results${crates}</h1>`;
-												Make query parser more strict and improve display of errors

											
										
										
											2022-01-09 15:12:46 +01:00
+								        if (results.query.error !== null) {
-												Put backtick content from rustdoc search errors into <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								            const error = results.query.error;
 								            error.forEach((value, index) => {
 								                value = value.split("<").join("&lt;").split(">").join("&gt;");
 								                if (index % 2 !== 0) {
-												Correctly display whitespace characters in search error

											
										
										
											2023-06-13 10:50:16 +02:00
+								                    error[index] = `<code>${value.replaceAll(" ", "&nbsp;")}</code>`;
-												Put backtick content from rustdoc search errors into <code> elements

											
										
										
											2023-02-28 22:37:52 +01:00
+								                } else {
 								                    error[index] = value;
 								                }
 								            });
 								            output += `<h3 class="error">Query parser error: "${error.join("")}".</h3>`;
-												rustdoc: use a more evocative name for CSS/JS `#titles`

This renames the ID, which is only used in search results, to
`#search-tabs`. Also changes the `.count` to a span, so it doesn't need its
display mode to be overridden.

											
										
										
											2022-12-22 15:52:34 -07:00
+								            output += "<div id=\"search-tabs\">" +
-												rustdoc: fix JS error when rendering parse error

											
										
										
											2022-05-03 09:20:45 -07:00
+								                makeTabHeader(0, "In Names", ret_others[1]) +
 								                "</div>";
 								            currentTab = 0;
-												rustdoc: when running a function-signature search, tweak the tab bar

											
										
										
											2022-04-30 13:05:40 -07:00
+								        } else if (results.query.foundElems <= 1 && results.query.returned.length === 0) {
-												rustdoc: use a more evocative name for CSS/JS `#titles`

This renames the ID, which is only used in search results, to
`#search-tabs`. Also changes the `.count` to a span, so it doesn't need its
display mode to be overridden.

											
										
										
											2022-12-22 15:52:34 -07:00
+								            output += "<div id=\"search-tabs\">" +
-												rustdoc: when running a function-signature search, tweak the tab bar

											
										
										
											2022-04-30 13:05:40 -07:00
+								                makeTabHeader(0, "In Names", ret_others[1]) +
 								                makeTabHeader(1, "In Parameters", ret_in_args[1]) +
 								                makeTabHeader(2, "In Return Types", ret_returned[1]) +
 								                "</div>";
 								        } else {
-												rustdoc: change the "In Function Signatures" to context-sensitive

* If it's just `-> a`, use "In Function Return Types"
* If it's just `a b`, use "In Function Parameters"
* Otherwise, still use "In Function Signatures"

											
										
										
											2022-05-02 09:45:32 -07:00
+								            const signatureTabTitle =
 								                results.query.elems.length === 0 ? "In Function Return Types" :
 								                results.query.returned.length === 0 ? "In Function Parameters" :
 								                "In Function Signatures";
-												rustdoc: use a more evocative name for CSS/JS `#titles`

This renames the ID, which is only used in search results, to
`#search-tabs`. Also changes the `.count` to a span, so it doesn't need its
display mode to be overridden.

											
										
										
											2022-12-22 15:52:34 -07:00
+								            output += "<div id=\"search-tabs\">" +
-												rustdoc: change the "In Function Signatures" to context-sensitive

* If it's just `-> a`, use "In Function Return Types"
* If it's just `a b`, use "In Function Parameters"
* Otherwise, still use "In Function Signatures"

											
										
										
											2022-05-02 09:45:32 -07:00
+								                makeTabHeader(0, signatureTabTitle, ret_others[1]) +
-												rustdoc: when running a function-signature search, tweak the tab bar

											
										
										
											2022-04-30 13:05:40 -07:00
+								                "</div>";
-												rustdoc: fix keyboard shortcuts and console log on search page

											
										
										
											2022-05-02 15:50:01 -07:00
+								            currentTab = 0;
-												Make query parser more strict and improve display of errors

											
										
										
											2022-01-09 15:12:46 +01:00
+								        }
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								        if (results.query.correction !== null) {
-												rustdoc-search: give longer notification for type corrections

											
										
										
											2023-04-19 10:16:14 -07:00
+								            const orig = results.query.returned.length > 0
 								                ? results.query.returned[0].name
 								                : results.query.elems[0].name;
 								            output += "<h3 class=\"search-corrections\">" +
 								                `Type "${orig}" not found. ` +
-												rustdoc-search: use more descriptive "x not found; y instead" message

											
										
										
											2023-04-20 14:32:02 -07:00
+								                "Showing results for closest type name " +
-												rustdoc-search: give longer notification for type corrections

											
										
										
											2023-04-19 10:16:14 -07:00
+								                `"${results.query.correction}" instead.</h3>`;
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								        }
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								        if (results.query.proposeCorrectionFrom !== null) {
 								            const orig = results.query.proposeCorrectionFrom;
 								            const targ = results.query.proposeCorrectionTo;
 								            output += "<h3 class=\"search-corrections\">" +
 								                `Type "${orig}" not found and used as generic parameter. ` +
 								                `Consider searching for "${targ}" instead.</h3>`;
 								        }
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const resultsElem = document.createElement("div");
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
+								        resultsElem.id = "results";
 								        resultsElem.appendChild(ret_others[0]);
 								        resultsElem.appendChild(ret_in_args[0]);
 								        resultsElem.appendChild(ret_returned[0]);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
 								        search.innerHTML = output;
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const crateSearch = document.getElementById("crate-search");
-												Rustdoc style cleanups

 - Make "since" version numbers grey again (regressed in #92602).
 - Remove unneeded selectors for when crate filter dropdown is a
   sibling of search-input.
 - Crate filter dropdown doesn't need to be 100% width on mobile.
 - Only build crate filter dropdown when there is more than one crate.
 - Remove unused addCrateDropdown.

											
										
										
											2022-01-12 15:05:47 -08:00
+								        if (crateSearch) {
 								            crateSearch.addEventListener("input", updateCrate);
 								        }
-												Generate DOM more securely

											
										
										
											2021-05-20 15:14:50 +02:00
+								        search.appendChild(resultsElem);
-												Reset "focusedByTab" field when doing another search

											
										
										
											2021-05-20 12:45:25 +02:00
+								        // Reset focused elements.
-												Consolidate search-related vars and functions.

This allows sharing across main.js and search.js without exporting too
many symbols into the global namespace.

											
										
										
											2021-04-12 23:50:18 -07:00
+								        searchState.showResults(search);
-												rustdoc: use a more evocative name for CSS/JS `#titles`

This renames the ID, which is only used in search results, to
`#search-tabs`. Also changes the `.count` to a span, so it doesn't need its
display mode to be overridden.

											
										
										
											2022-12-22 15:52:34 -07:00
+								        const elems = document.getElementById("search-tabs").childNodes;
-												rustdoc: fix keyboard shortcuts and console log on search page

											
										
										
											2022-05-02 15:50:01 -07:00
+								        searchState.focusedByTab = [];
 								        let i = 0;
 								        for (const elem of elems) {
 								            const j = i;
-												Add new eslint rule about brace style

											
										
										
											2022-05-14 13:50:52 +02:00
+								            elem.onclick = () => printTab(j);
-												rustdoc: fix keyboard shortcuts and console log on search page

											
										
										
											2022-05-02 15:50:01 -07:00
+								            searchState.focusedByTab.push(null);
 								            i += 1;
 								        }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        printTab(currentTab);
 								    }
-												Unify history interactions in search

											
										
										
											2023-06-16 13:43:55 +02:00
/**
 * Record `url` in the browser's session history for the current search.
 *
 * Nothing happens when `browserSupportsHistoryApi()` reports false. A new
 * history entry is pushed only when there is neither a history state nor a
 * `search` query string parameter; in every other case the current entry is
 * replaced in place.
 *
 * @param {string} url - Forwarded unchanged to the History API.
 */
function updateSearchHistory(url) {
    if (browserSupportsHistoryApi()) {
        const queryParams = searchState.getQueryStringParams();
        const hasSearchEntry = history.state || queryParams.search;
        if (hasSearchEntry) {
            history.replaceState(null, "", url);
        } else {
            history.pushState(null, "", url);
        }
    }
}
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
/**
 * Run a search for whatever is currently typed into the search input element
 * and display the results.
 *
 * If the parsed query matches `currentResults`, the search is not repeated
 * unless `forced` is truthy.
 *
 * @param {boolean} [forced]
 */
function search(forced) {
    const query = parseQuery(searchState.input.value.trim());
    let filterCrates = getFilterCrates();

    if (!forced && query.userQuery === currentResults) {
        // Same query as before: no new search is run, and `putBackSearch`
        // is only called when the query is non-empty.
        if (query.userQuery.length > 0) {
            putBackSearch();
        }
        return;
    }

    searchState.setLoadingSearch();

    const params = searchState.getQueryStringParams();

    // Without any information about a saved crate, a `filter-crate` URL query
    // parameter (when present) takes its place.
    if (filterCrates === null && params["filter-crate"] !== undefined) {
        filterCrates = params["filter-crate"];
    }

    // Keep the document title meaningful for the browser history.
    searchState.title = `Results for ${query.original} - Rust`;

    // Searching is incremental by character, so only the most recent search
    // query ends up in the browser history.
    updateSearchHistory(buildUrl(query.original, filterCrates));

    const results = execQuery(query, searchWords, filterCrates, window.currentCrate);
    showResults(results, params.go_to_first, filterCrates);
}
-												Add documentation

											
										
										
											2022-06-27 11:07:16 -07:00
/**
 * Convert a list of RawFunctionType / ID to object-based FunctionType.
 *
 * Crates often have lots of functions in them, and it's common to have a large number of
 * functions that operate on a small set of data types, so the search index compresses them
 * by encoding function parameter and return types as indexes into an array of names.
 *
 * Even when a general-purpose compression algorithm is used, this is still a win. I checked.
 * https://github.com/rust-lang/rust/pull/98475#issue-1284395985
 *
 * The format for individual function types is encoded in
 * librustdoc/html/render/mod.rs: impl Serialize for RenderType
 *
 * @param {null|Array<RawFunctionType>} types - Raw types to convert; `null` is treated
 *     as an empty list.
 * @param {Array<{name: string, ty: number}>} lowercasePaths
 *
 * @return {Array<FunctionSearchType>} One converted entry per element of `types`, in order.
 */
function buildItemSearchTypeAll(types, lowercasePaths) {
    // `types` is documented as nullable, so a missing list must not reach `.map`.
    if (types === null) {
        return [];
    }
    return types.map(type => buildItemSearchType(type, lowercasePaths));
}
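 								    /**
 								     * Converts a single type.
 								     *
 								     * @param {RawFunctionType} type
 								     * @param {Array<{name: string, ty: number}>} lowercasePaths
 								     * @param {boolean} [isAssocType] - Forwarded to `buildTypeMapIndex`.
 								     *
 								     * @return {FunctionSearchType}
 								     */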
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								    function buildItemSearchType(type, lowercasePaths, isAssocType) {
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								        const PATH_INDEX_DATA = 0;
 								        const GENERICS_DATA = 1;
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								        const BINDINGS_DATA = 2;
 								        let pathIndex, generics, bindings;
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>`` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								        if (typeof type === "number") {
 								            pathIndex = type;
 								            generics = [];
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            bindings = new Map();
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>`` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								        } else {
 								            pathIndex = type[PATH_INDEX_DATA];
 								            generics = buildItemSearchTypeAll(
 								                type[GENERICS_DATA],
 								                lowercasePaths
 								            );
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            if (type.length > BINDINGS_DATA) {
 								                bindings = new Map(type[BINDINGS_DATA].map(binding => {
 								                    const [assocType, constraints] = binding;
 								                    // Associated type constructors are represented sloppily in rustdoc's
 								                    // type search, to make the engine simpler.
 								                    //
 								                    // MyType<Output<T>=Result<T>> is equivalent to MyType<Output<Result<T>>=T>
 								                    // and both are, essentially
 								                    // MyType<Output=(T, Result<T>)>, except the tuple isn't actually there.
 								                    // It's more like the value of a type binding is naturally an array,
 								                    // which rustdoc calls "constraints".
 								                    //
 								                    // As a result, the key should never have generics on it.
 								                    return [
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								                        buildItemSearchType(assocType, lowercasePaths, true).id,
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                        buildItemSearchTypeAll(constraints, lowercasePaths),
 								                    ];
 								                }));
 								            } else {
 								                bindings = new Map();
 								            }
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>`` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								        }
 								        if (pathIndex < 0) {
 								            // types less than 0 are generic parameters
 								            // the actual names of generic parameters aren't stored, since they aren't API
 								            return {
 								                id: pathIndex,
 								                ty: TY_GENERIC,
 								                path: null,
 								                generics,
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                bindings,
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>`` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								            };
 								        }
 								        if (pathIndex === 0) {
-												Improve `search.js` code

											
										
										
											2023-08-31 18:51:18 +02:00
+								            // `0` is used as a sentinel because it's fewer bytes than `null`
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								            return {
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>`` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								                id: null,
 								                ty: null,
 								                path: null,
 								                generics,
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								                bindings,
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								            };
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>`` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								        }
 								        const item = lowercasePaths[pathIndex - 1];
 								        return {
-												rustdoc-search: do not treat associated type names as types

Before: http://notriddle.com/rustdoc-html-demo-6/tor-before/tor_config/

After: http://notriddle.com/rustdoc-html-demo-6/tor-after/tor_config/

Profile: http://notriddle.com/rustdoc-html-demo-6/tor-profile/

As a bit of background information: in type-based queries, a type
name that does not exist gets treated as a generic type variable.

This causes a counterintuitive behavior in the `tor_config` crate,
which has a trait with an associated type variable called `T`.

This isn't a searchable concrete type, but its name still gets stored
in the typeNameIdMap, as a convenient way to intern its name.

											
										
										
											2023-12-10 16:05:18 -07:00
+								            id: buildTypeMapIndex(item.name, isAssocType),
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>`` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								            ty: item.ty,
 								            path: item.path,
 								            generics,
-												rustdoc-search: add support for associated types

											
										
										
											2023-09-22 17:27:06 -07:00
+								            bindings,
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								        };
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								    }
-												Add documentation

											
										
										
											2022-06-27 11:07:16 -07:00
+								    /**
 								     * Convert from RawFunctionSearchType to FunctionSearchType.
 								     *
 								     * Crates often have lots of functions in them, and function signatures are sometimes complex,
 								     * so rustdoc uses a pretty tight encoding for them. This function converts it to a simpler,
 								     * object-based encoding so that the actual search code is more readable and easier to debug.
 								     *
 								     * The raw function search type format is generated using serde in
 								     * librustdoc/html/render/mod.rs: impl Serialize for IndexItemFunctionType
 								     *
 								     * @param {RawFunctionSearchType} functionSearchType
 								     * @param {Array<{name: string, ty: number}>} lowercasePaths
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								     * @param {Map<string, integer>}
-												Add documentation

											
										
										
											2022-06-27 11:07:16 -07:00
+								     *
 								     * @return {null|FunctionSearchType}
 								     */
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								    function buildFunctionSearchType(functionSearchType, lowercasePaths) {
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								        const INPUTS_DATA = 0;
 								        const OUTPUT_DATA = 1;
-												Add comments, fixes for `0` sentinel

											
										
										
											2022-06-27 14:13:13 -07:00
+								        // `0` is used as a sentinel because it's fewer bytes than `null`
 								        if (functionSearchType === 0) {
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								            return null;
 								        }
-												[rustdoc] Fix path in type-based search

											
										
										
											2023-09-01 14:30:31 +02:00
+								        let inputs, output;
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								        if (typeof functionSearchType[INPUTS_DATA] === "number") {
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>`` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								            inputs = [buildItemSearchType(functionSearchType[INPUTS_DATA], lowercasePaths)];
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								        } else {
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								            inputs = buildItemSearchTypeAll(
 								                functionSearchType[INPUTS_DATA],
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								                lowercasePaths
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								            );
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								        }
 								        if (functionSearchType.length > 1) {
 								            if (typeof functionSearchType[OUTPUT_DATA] === "number") {
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								                output = [buildItemSearchType(functionSearchType[OUTPUT_DATA], lowercasePaths)];
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								            } else {
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								                output = buildItemSearchTypeAll(
 								                    functionSearchType[OUTPUT_DATA],
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								                    lowercasePaths
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								                );
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								            }
 								        } else {
-												Put back, fix ()-output optimization

											
										
										
											2022-06-27 11:07:45 -07:00
+								            output = [];
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								        }
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								        const where_clause = [];
 								        const l = functionSearchType.length;
 								        for (let i = 2; i < l; ++i) {
 								            where_clause.push(typeof functionSearchType[i] === "number"
 								                ? [buildItemSearchType(functionSearchType[i], lowercasePaths)]
 								                : buildItemSearchTypeAll(functionSearchType[i], lowercasePaths));
 								        }
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								        return {
-												rustdoc-search: add support for type parameters

When writing a type-driven search query in rustdoc, specifically one
with more than one query element, non-existent types become generic
parameters instead of auto-correcting (which is currently only done
for single-element queries) or giving no result. You can also force a
generic type parameter by writing `generic:T` (and can force it to not
use a generic type parameter with something like `struct:T` or whatever,
though if this happens it means the thing you're looking for doesn't
exist and will give you no results).

There is no syntax provided for specifying type constraints
for generic type parameters.

When you have a generic type parameter in a search query, it will only
match up with generic type parameters in the actual function, not
concrete types that match, not concrete types that implement a trait.
It also strictly matches based on when they're the same or different,
so `option<T>, option<U> -> option<U>` matches `Option::and`, but not
`Option::or`. Similarly, `option<T>, option<T> -> option<T>` matches
`Option::or`, but not `Option::and`.

											
										
										
											2023-06-16 14:43:28 -07:00
+								            inputs, output, where_clause,
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								        };
 								    }
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the function's name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Function signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|}{|F|}-\frac{1}{|F|} = \frac{|F|-1}{|F|}$,
  which grows monotonically with $|F|$. And, since the values are only being
  compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature).

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								    /**
 								     * Type fingerprints allow fast, approximate matching of types.
 								     *
 								     * This algo creates a compact representation of the type set using a Bloom filter.
 								     * This fingerprint is used three ways:
 								     *
 								     * - It accelerates the matching algorithm by checking the function fingerprint against the
 								     *   query fingerprint. If any bits are set in the query but not in the function, it can't
 								     *   match.
 								     *
 								     * - The fourth section has the number of distinct items in the set.
 								     *   This is the distance function, used for filtering and for sorting.
 								     *
 								     * [^1]: Distance is the relatively naive metric of counting the number of distinct items in
 								     * the function that are not present in the query.
 								     *
 								     * @param {FunctionType|QueryElement} type - a single type
 								     * @param {Uint32Array} output - write the fingerprint to this data structure: uses 128 bits
 								     * @param {Set<number>} fps - Set of distinct items
 								     */
 								    function buildFunctionTypeFingerprint(type, output, fps) {
 								        let input = type.id;
 								        // All forms of `[]` get collapsed down to one thing in the bloom filter.
 								        // Differentiating between arrays and slices, if the user asks for it, is
 								        // still done in the matching algorithm.
 								        if (input === typeNameIdOfArray || input === typeNameIdOfSlice) {
 								            input = typeNameIdOfArrayOrSlice;
 								        }
-												rustdoc-search: better hashing, faster unification

The hash changes are based on some tests with `arti` and various
specific queries, aimed at reducing the false positive rate.

Sorting the query elements so that generics always come first is
instead aimed at reducing the number of Map operations on mgens,
assuming if the bloom filter does find a false positive, it'll
be able to reject the row without having to track a mapping.

- https://hur.st/bloomfilter/?n=3&p=&m=96&k=6

  Different functions have different amounts of inputs, and
  unification isn't very slow anyway, so figuring out a single
  ideal number of hash functions is nasty, but 6 keeps things
  low even up to 10 inputs.

- https://web.archive.org/web/20210927123933/https://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.72.2442&rep=rep1&type=pdf

  This is the `h1` and `h2`, both derived from `h0`.

											
										
										
											2023-12-10 22:46:40 -07:00
+								        // http://burtleburtle.net/bob/hash/integer.html
 								        // ~~ is toInt32. It's used before adding, so
 								        // the number stays in safe integer range.
 								        // Integer mixer: five add/xor/shift rounds followed by a final
 								        // xor-fold. Each round reads only the previous round's value, so
 								        // the rounds are written as separate constants rather than
 								        // reassigning the parameter. The trailing xor makes the result a
 								        // signed 32-bit integer.
 								        const hashint1 = k => {
 								            const round1 = (~~k + 0x7ed55d16) + (k << 12);
 								            const round2 = (round1 ^ 0xc761c23c) ^ (round1 >>> 19);
 								            const round3 = (~~round2 + 0x165667b1) + (round2 << 5);
 								            const round4 = (~~round3 + 0xd3a2646c) ^ (round3 << 9);
 								            const round5 = (~~round4 + 0xfd7046c5) + (round4 << 3);
 								            return (round5 ^ 0xb55a4f09) ^ (round5 >>> 16);
 								        };
 								        // Second integer mixer: bitwise-not plus shift, two xor/shift
 								        // steps around an add/shift step, a 32-bit multiply by 2057
 								        // (via Math.imul), and a final xor-fold with a sign-propagating
 								        // shift. Written as a chain of constants; the result is a signed
 								        // 32-bit integer.
 								        const hashint2 = k => {
 								            const seeded = ~k + (k << 15);
 								            const mixedA = seeded ^ (seeded >>> 12);
 								            const mixedB = mixedA + (mixedA << 2);
 								            const mixedC = mixedB ^ (mixedB >>> 4);
 								            const scaled = Math.imul(mixedC, 2057);
 								            return scaled ^ (scaled >> 16);
 								        };
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the function's name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Functions signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|-1}{|F|}$, which only grows as $|F|$ grows.
  And, since the values are only being compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature.

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								        if (input !== null) {
-												rustdoc-search: better hashing, faster unification

The hash changes are based on some tests with `arti` and various
specific queries, aimed at reducing the false positive rate.

Sorting the query elements so that generics always come first is
instead aimed at reducing the number of Map operations on mgens,
assuming if the bloom filter does find a false positive, it'll
be able to reject the row without having to track a mapping.

- https://hur.st/bloomfilter/?n=3&p=&m=96&k=6

  Different functions have different amounts of inputs, and
  unification isn't very slow anyway, so figuring out a single
  ideal number of hash functions is nasty, but 6 keeps things
  low even up to 10 inputs.

- https://web.archive.org/web/20210927123933/https://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.72.2442&rep=rep1&type=pdf

  This is the `h1` and `h2`, both derived from `h0`.

											
										
										
											2023-12-10 22:46:40 -07:00
+								            const h0a = hashint1(input);
 								            const h0b = hashint2(input);
 								            // Less Hashing, Same Performance: Building a Better Bloom Filter
 								            // doi=10.1.1.72.2442
 								            const h1a = ~~(h0a + Math.imul(h0b, 2));
 								            const h1b = ~~(h0a + Math.imul(h0b, 3));
 								            const h2a = ~~(h0a + Math.imul(h0b, 4));
 								            const h2b = ~~(h0a + Math.imul(h0b, 5));
 								            output[0] |= (1 << (h0a % 32)) | (1 << (h1b % 32));
 								            output[1] |= (1 << (h1a % 32)) | (1 << (h2b % 32));
 								            output[2] |= (1 << (h2a % 32)) | (1 << (h0b % 32));
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the function's name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Functions signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|-1}{|F|}$, which only grows as $|F|$ grows.
  And, since the values are only being compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature.

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								            fps.add(input);
 								        }
 								        for (const g of type.generics) {
 								            buildFunctionTypeFingerprint(g, output, fps);
 								        }
 								        const fb = {
 								            id: null,
 								            ty: 0,
 								            generics: [],
 								            bindings: new Map(),
 								        };
 								        for (const [k, v] of type.bindings.entries()) {
 								            fb.id = k;
 								            fb.generics = v;
 								            buildFunctionTypeFingerprint(fb, output, fps);
 								        }
 								        output[3] = fps.size;
 								    }
 								    /**
 								     * Check a query's bloom-filter fingerprint against one function's fingerprint.
 								     *
 								     * Each function owns four consecutive words of `functionTypeFingerprint`,
 								     * starting at `fullId * 4`: three words of filter bits followed by one word
 								     * that is handed back as the distance.
 								     *
 								     * @param {number} fullId - The function
 								     * @param {Uint32Array} queryFingerprint - The query
 								     * @returns {number|null} - Null if non-match, otherwise the distance.
 								     *                          Zero is a valid distance, so compare against
 								     *                          `null` rather than testing truthiness.
 								     */
 								    function compareTypeFingerprints(fullId, queryFingerprint) {
 								        const offset = fullId * 4;
 								        // Query bits that the function lacks. A bloom filter can report an
 								        // item that isn't really there, but it never hides one that is, so a
 								        // single leftover bit proves the function cannot match the query.
 								        const missing0 = queryFingerprint[0] & ~functionTypeFingerprint[offset];
 								        const missing1 = queryFingerprint[1] & ~functionTypeFingerprint[offset + 1];
 								        const missing2 = queryFingerprint[2] & ~functionTypeFingerprint[offset + 2];
 								        if ((missing0 | missing1 | missing2) !== 0) {
 								            return null;
 								        }
 								        // Every query bit is present, so report the stored distance word.
 								        return functionTypeFingerprint[offset + 3];
 								    }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								    function buildIndex(rawSearchIndex) {
 								        searchIndex = [];
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								        /**
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								         * List of normalized search words (ASCII lowercased, and underscores removed).
 								         *
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								         * @type {Array<string>}
 								         */
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const searchWords = [];
-												rustdoc: restructure type search engine to pick-and-use IDs

This change makes it so, instead of mixing string distance with
type unification, function signature search works by
mapping names to IDs at the start, reporting to the user any
cases where it had to make corrections, and then matches with
IDs when going through the items.

This only changes function searches. Name searches are left alone,
and corrections are only done when there's a single item in the
search query.

											
										
										
											2023-04-15 11:53:50 -07:00
+								        typeNameIdMap = new Map();
-												rustdoc: use a string with one-character codes for search index types

    $ wc -c search-index.old.js search-index.new.js
    3940530 search-index.old.js
    3843222 search-index.new.js

((3940530-3843222)/3940530)*100 = 2.47%

    $ wc -c search-index.old.js.gz search-index.new.js.gz
    380251 search-index.old.js.gz
    379434 search-index.new.js.gz

((380251-379434)/380251)*100 = 0.214%

											
										
										
											2023-02-13 13:39:01 -07:00
+								        const charA = "A".charCodeAt(0);
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        let currentIndex = 0;
 								        let id = 0;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												rustdoc: search for slices and arrays by type with `[]`

Part of #60485

											
										
										
											2023-05-25 12:58:36 -07:00
+								        // Initialize type map indexes for primitive list types
 								        // that can be searched using `[]` syntax.
 								        typeNameIdOfArray = buildTypeMapIndex("array");
 								        typeNameIdOfSlice = buildTypeMapIndex("slice");
 								        typeNameIdOfArrayOrSlice = buildTypeMapIndex("[]");
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the function's name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Functions signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|-1}{|F|}$, which only grows as $|F|$ grows.
  And, since the values are only being compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature.

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								        // Function type fingerprints are 128-bit bloom filters that are used to
 								        // estimate the distance between function and query.
 								        // This loop counts the number of items to allocate a fingerprint for.
 								        for (const crate in rawSearchIndex) {
 								            if (!hasOwnPropertyRustdoc(rawSearchIndex, crate)) {
 								                continue;
 								            }
 								            // Each item gets an entry in the fingerprint array, and the crate
 								            // does, too
 								            id += rawSearchIndex[crate].t.length + 1;
 								        }
 								        functionTypeFingerprint = new Uint32Array((id + 1) * 4);
 								        // This loop actually generates the search item indexes, including
 								        // normalized names, type signature objects and fingerprints, and aliases.
 								        id = 0;
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        for (const crate in rawSearchIndex) {
-												Fix eslint errors

											
										
										
											2021-05-14 13:56:15 +02:00
+								            if (!hasOwnPropertyRustdoc(rawSearchIndex, crate)) {
 								                continue;
 								            }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            let crateSize = 0;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								            /**
-												rustdoc: update comment in search.js for #107629

											
										
										
											2023-09-02 19:26:10 -06:00
+								             * The raw search data for a given crate. `n`, `t`, `d`, `i`, and `f`
 								             * are arrays with the same length. `q`, `a`, and `c` use a sparse
 								             * representation for compactness.
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								             *
-												rustdoc: update comment in search.js for #107629

											
										
										
											2023-09-02 19:26:10 -06:00
+								             * `n[i]` contains the name of an item.
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								             *
-												rustdoc: update comment in search.js for #107629

											
										
										
											2023-09-02 19:26:10 -06:00
+								             * `t[i]` contains the type of that item
 								             * (as a string of characters that represent an offset in `itemTypes`).
 								             *
 								             * `d[i]` contains the description of that item.
 								             *
 								             * `q` contains the full paths of the items. For compactness, it is a set of
 								             * (index, path) pairs used to create a map. If a given index `i` is
 								             * not present, this indicates "same as the last index present".
 								             *
 								             * `i[i]` contains an item's parent, usually a module. For compactness,
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								             * it is a set of indexes into the `p` array.
 								             *
-												rustdoc: update comment in search.js for #107629

											
										
										
											2023-09-02 19:26:10 -06:00
+								             * `f[i]` contains function signatures, or `0` if the item isn't a function.
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								             * Functions are themselves encoded as arrays. The first item is a list of
 								             * types representing the function's inputs, and the second list item is a list
 								             * of types representing the function's output. Tuples are flattened.
 								             * Types are also represented as arrays; the first item is an index into the `p`
 								             * array, while the second is a list of types representing any generic parameters.
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								             *
-												rustdoc-search: add impl disambiguator to duplicate assoc items

Helps with #90929

This changes the search results, specifically, when there's more than
one impl with an associated item with the same name. For example,
the search queries `simd<i8> -> simd<i8>` and `simd<i64> -> simd<i64>`
don't link to the same function, but most of the functions have the
same names.

This change should probably be FCP-ed, especially since it adds a new
anchor link format for `main.js` to handle, so that URLs like
`struct.Vec.html#impl-AsMut<[T]>-for-Vec<T,+A>/method.as_mut` redirect
to `struct.Vec.html#method.as_mut-2`. It's a strange design, but there
are a few reasons for it:

* I'd like to avoid making the HTML bigger. Obviously, fixing this bug
  is going to add at least a little more data to the search index, but
  adding more HTML penalises viewers for the benefit of searchers.

* Breaking `struct.Vec.html#method.len` would also be a disappointment.

On the other hand:

* The path-style anchors might be less prone to link rot than the numbered
  anchors. It's definitely less likely to have URLs that appear to "work",
  but silently point at the wrong thing.

* This commit arranges the path-style anchor to redirect to the numbered
  anchor. Nothing stops rustdoc from doing the opposite, making path-style
  anchors the default and redirecting the "legacy" numbered ones.

											
										
										
											2023-03-20 16:02:51 -07:00
+								             * b[i] contains an item's impl disambiguator. This is only present if an item
 								             * is defined in an impl block and, the impl block's type has more than one associated
 								             * item with the same name.
 								             *
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								             * `a` defines aliases with an Array of pairs: [name, offset], where `offset`
 								             * points into the n/t/d/q/i/f arrays.
 								             *
 								             * `doc` contains the description of the crate.
 								             *
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								             * `p` is a list of path/type pairs. It is used for parents and function parameters.
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								             *
-												rustdoc: update comment in search.js for #107629

											
										
										
											2023-09-02 19:26:10 -06:00
+								             * `c` is an array of item indices that are deprecated.
 								             *
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								             * @type {{
 								             *   doc: string,
 								             *   a: Object,
 								             *   n: Array<string>,
-												rustdoc: use a string with one-character codes for search index types

    $ wc -c search-index.old.js search-index.new.js
    3940530 search-index.old.js
    3843222 search-index.new.js

((3940530-3843222)/3940530)*100 = 2.47%

    $ wc -c search-index.old.js.gz search-index.new.js.gz
    380251 search-index.old.js.gz
    379434 search-index.new.js.gz

((380251-379434)/380251)*100 = 0.214%

											
										
										
											2023-02-13 13:39:01 -07:00
+								             *   t: String,
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								             *   d: Array<string>,
-												rustdoc: sort deprecated items lower in search

serialize `q` (`itemPaths`) sparsely
overall 4% reduction in search index size

											
										
										
											2023-02-03 00:08:57 -07:00
+								             *   q: Array<[Number, string]>,
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								             *   i: Array<Number>,
-												Add documentation

											
										
										
											2022-06-27 11:07:16 -07:00
+								             *   f: Array<RawFunctionSearchType>,
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								             *   p: Array<Object>,
-												rustdoc-search: add impl disambiguator to duplicate assoc items

Helps with #90929

This changes the search results, specifically, when there's more than
one impl with an associated item with the same name. For example,
the search queries `simd<i8> -> simd<i8>` and `simd<i64> -> simd<i64>`
don't link to the same function, but most of the functions have the
same names.

This change should probably be FCP-ed, especially since it adds a new
anchor link format for `main.js` to handle, so that URLs like
`struct.Vec.html#impl-AsMut<[T]>-for-Vec<T,+A>/method.as_mut` redirect
to `struct.Vec.html#method.as_mut-2`. It's a strange design, but there
are a few reasons for it:

* I'd like to avoid making the HTML bigger. Obviously, fixing this bug
  is going to add at least a little more data to the search index, but
  adding more HTML penalises viewers for the benefit of searchers.

* Breaking `struct.Vec.html#method.len` would also be a disappointment.

On the other hand:

* The path-style anchors might be less prone to link rot than the numbered
  anchors. It's definitely less likely to have URLs that appear to "work",
  but silently point at the wrong thing.

* This commit arranges the path-style anchor to redirect to the numbered
  anchor. Nothing stops rustdoc from doing the opposite, making path-style
  anchors the default and redirecting the "legacy" numbered ones.

											
										
										
											2023-03-20 16:02:51 -07:00
+								             *   b: Array<[Number, String]>,
-												rustdoc: sort deprecated items lower in search

serialize `q` (`itemPaths`) sparsely
overall 4% reduction in search index size

											
										
										
											2023-02-03 00:08:57 -07:00
+								             *   c: Array<Number>
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								             * }}
 								             */
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const crateCorpus = rawSearchIndex[crate];
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            searchWords.push(crate);
 								            // This object should have exactly the same set of fields as the "row"
 								            // object defined below. Your JavaScript runtime will thank you.
 								            // https://mathiasbynens.be/notes/shapes-ics
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const crateRow = {
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                crate: crate,
-												rustdoc-search: make primitives and keywords less special

The search sorting code already sorts by item type discriminant,
putting things with smaller discriminants first. There was
also a special case for sorting keywords and primitives earlier,
and this commit removes it by giving them lower discriminants.

The sorting code has another criteria where items with descriptions
appear earlier than items without, and that criteria has higher
priority than the item type. This shouldn't matter, though,
because primitives and keywords normally only appear in the
standard library, and it always gives them descriptions.

											
										
										
											2023-11-20 13:37:57 -07:00
+								                ty: 3, // == ExternCrate
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                name: crate,
 								                path: "",
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								                desc: crateCorpus.doc,
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                parent: undefined,
 								                type: null,
 								                id: id,
-												Fix eslint errors

											
										
										
											2021-05-14 13:56:15 +02:00
+								                normalizedName: crate.indexOf("_") === -1 ? crate : crate.replace(/_/g, ""),
-												rustdoc: sort deprecated items lower in search

serialize `q` (`itemPaths`) sparsely
overall 4% reduction in search index size

											
										
										
											2023-02-03 00:08:57 -07:00
+								                deprecated: null,
-												rustdoc-search: add impl disambiguator to duplicate assoc items

Helps with #90929

This changes the search results, specifically, when there's more than
one impl with an associated item with the same name. For example,
the search queries `simd<i8> -> simd<i8>` and `simd<i64> -> simd<i64>`
don't link to the same function, but most of the functions have the
same names.

This change should probably be FCP-ed, especially since it adds a new
anchor link format for `main.js` to handle, so that URLs like
`struct.Vec.html#impl-AsMut<[T]>-for-Vec<T,+A>/method.as_mut` redirect
to `struct.Vec.html#method.as_mut-2`. It's a strange design, but there
are a few reasons for it:

* I'd like to avoid making the HTML bigger. Obviously, fixing this bug
  is going to add at least a little more data to the search index, but
  adding more HTML penalises viewers for the benefit of searchers.

* Breaking `struct.Vec.html#method.len` would also be a disappointment.

On the other hand:

* The path-style anchors might be less prone to link rot than the numbered
  anchors. It's definitely less likely to have URLs that appear to "work",
  but silently point at the wrong thing.

* This commit arranges the path-style anchor to redirect to the numbered
  anchor. Nothing stops rustdoc from doing the opposite, making path-style
  anchors the default and redirecting the "legacy" numbered ones.

											
										
										
											2023-03-20 16:02:51 -07:00
+								                implDisambiguator: null,
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            };
 								            id += 1;
 								            searchIndex.push(crateRow);
 								            currentIndex += 1;
-												rustdoc: use a string with one-character codes for search index types

    $ wc -c search-index.old.js search-index.new.js
    3940530 search-index.old.js
    3843222 search-index.new.js

((3940530-3843222)/3940530)*100 = 2.47%

    $ wc -c search-index.old.js.gz search-index.new.js.gz
    380251 search-index.old.js.gz
    379434 search-index.new.js.gz

((380251-379434)/380251)*100 = 0.214%

											
										
										
											2023-02-13 13:39:01 -07:00
+								            // a String of one character item type codes
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const itemTypes = crateCorpus.t;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            // an array of (String) item names
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const itemNames = crateCorpus.n;
-												rustdoc: sort deprecated items lower in search

serialize `q` (`itemPaths`) sparsely
overall 4% reduction in search index size

											
										
										
											2023-02-03 00:08:57 -07:00
+								            // an array of [(Number) item index,
 								            //              (String) full path]
 								            // an item whose index is not present will fall back to the previous present path
 								            // i.e. if indices 4 and 11 are present, but 5-10 and 12-13 are not present,
 								            // 5-10 will fall back to the path for 4 and 12-13 will fall back to the path for 11
 								            const itemPaths = new Map(crateCorpus.q);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            // an array of (String) descriptions
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const itemDescs = crateCorpus.d;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            // an array of (Number) the parent path index + 1 to `paths`, or 0 if none
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const itemParentIdxs = crateCorpus.i;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            // an array of (Object | null) the type of the function, if any
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const itemFunctionSearchTypes = crateCorpus.f;
-												rustdoc: sort deprecated items lower in search

serialize `q` (`itemPaths`) sparsely
overall 4% reduction in search index size

											
										
										
											2023-02-03 00:08:57 -07:00
+								            // an array of (Number) indices for the deprecated items
 								            const deprecatedItems = new Set(crateCorpus.c);
-												rustdoc-search: add impl disambiguator to duplicate assoc items

Helps with #90929

This changes the search results, specifically, when there's more than
one impl with an associated item with the same name. For example,
the search queries `simd<i8> -> simd<i8>` and `simd<i64> -> simd<i64>`
don't link to the same function, but most of the functions have the
same names.

This change should probably be FCP-ed, especially since it adds a new
anchor link format for `main.js` to handle, so that URLs like
`struct.Vec.html#impl-AsMut<[T]>-for-Vec<T,+A>/method.as_mut` redirect
to `struct.Vec.html#method.as_mut-2`. It's a strange design, but there
are a few reasons for it:

* I'd like to avoid making the HTML bigger. Obviously, fixing this bug
  is going to add at least a little more data to the search index, but
  adding more HTML penalises viewers for the benefit of searchers.

* Breaking `struct.Vec.html#method.len` would also be a disappointment.

On the other hand:

* The path-style anchors might be less prone to link rot than the numbered
  anchors. It's definitely less likely to have URLs that appear to "work",
  but silently point at the wrong thing.

* This commit arranges the path-style anchor to redirect to the numbered
  anchor. Nothing stops rustdoc from doing the opposite, making path-style
  anchors the default and redirecting the "legacy" numbered ones.

											
										
										
											2023-03-20 16:02:51 -07:00
+								            // an array of [(Number) item index, (String) impl disambiguator]
 								            const implDisambiguator = new Map(crateCorpus.b);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            // an array of [(Number) item type,
 								            //              (String) name]
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const paths = crateCorpus.p;
-												Fix typos “a”→“an”

											
										
										
											2021-08-22 14:46:15 +02:00
+								            // an array of [(String) alias name
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            //             [Number] index to items]
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const aliases = crateCorpus.a;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								            // an array of [{name: String, ty: Number}]
 								            const lowercasePaths = [];
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            // convert `rawPaths` entries into object form
-												rustdoc: reference function signature types from the `p` array

This reduces the size of the function signature index, because
it's common to have many functions that operate on the same types.

    $ wc -c search-index-old.js search-index-new.js
    5224374 search-index-old.js
    3932314 search-index-new.js

By my math, this reduces the uncompressed size of the search index by 32%.
On compressed signatures, the wins are less drastic, a mere 8%:

    $ wc -c search-index-old.js.gz search-index-new.js.gz
    404532 search-index-old.js.gz
    371635 search-index-new.js.gz

											
										
										
											2022-06-24 17:12:58 -07:00
+								            // generate normalizedPaths for function search mode
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            let len = paths.length;
-												[rustdoc] Fix path in type-based search

											
										
										
											2023-09-01 14:30:31 +02:00
+								            let lastPath = itemPaths.get(0);
-												Clean up JS files code a bit

											
										
										
											2023-02-26 16:26:59 +01:00
+								            for (let i = 0; i < len; ++i) {
-												[rustdoc] Fix path in type-based search

											
										
										
											2023-09-01 14:30:31 +02:00
+								                const elem = paths[i];
 								                const ty = elem[0];
 								                const name = elem[1];
 								                let path = null;
 								                if (elem.length > 2) {
 								                    path = itemPaths.has(elem[2]) ? itemPaths.get(elem[2]) : lastPath;
 								                    lastPath = path;
 								                }
 								                lowercasePaths.push({ty: ty, name: name.toLowerCase(), path: path});
 								                paths[i] = {ty: ty, name: name, path: path};
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            }
 								            // convert `item*` into an object form, and construct word indices.
 								            //
 								            // before any analysis is performed lets gather the search terms to
 								            // search against apart from the rest of the data.  This is a quick
 								            // operation that is cached for the life of the page state so that
 								            // all other search operations have access to this cached data for
 								            // faster analysis operations
-												[rustdoc] Fix path in type-based search

											
										
										
											2023-09-01 14:30:31 +02:00
+								            lastPath = "";
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            len = itemTypes.length;
-												Clean up JS files code a bit

											
										
										
											2023-02-26 16:26:59 +01:00
+								            for (let i = 0; i < len; ++i) {
 								                let word = "";
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                // This object should have exactly the same set of fields as the "crateRow"
 								                // object defined above.
 								                if (typeof itemNames[i] === "string") {
 								                    word = itemNames[i].toLowerCase();
 								                }
-												Clean up JS files code a bit

											
										
										
											2023-02-26 16:26:59 +01:00
+								                searchWords.push(word);
-												[rustdoc] Fix path in type-based search

											
										
										
											2023-09-01 14:30:31 +02:00
+								                const path = itemPaths.has(i) ? itemPaths.get(i) : lastPath;
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the function's name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Functions signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|}{|F|}-\frac{1}{|F|} = \frac{|F|-1}{|F|}$,
  which grows monotonically with $|F|$. And, since the values are only being
  compared with each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature).

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								                let type = null;
 								                if (itemFunctionSearchTypes[i] !== 0) {
 								                    type = buildFunctionSearchType(
 								                        itemFunctionSearchTypes[i],
 								                        lowercasePaths
 								                    );
 								                    if (type) {
 								                        const fp = functionTypeFingerprint.subarray(id * 4, (id + 1) * 4);
 								                        const fps = new Set();
 								                        for (const t of type.inputs) {
 								                            buildFunctionTypeFingerprint(t, fp, fps);
 								                        }
 								                        for (const t of type.output) {
 								                            buildFunctionTypeFingerprint(t, fp, fps);
 								                        }
 								                        for (const w of type.where_clause) {
 								                            for (const t of w) {
 								                                buildFunctionTypeFingerprint(t, fp, fps);
 								                            }
 								                        }
 								                    }
 								                }
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                const row = {
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                    crate: crate,
-												rustdoc: use a string with one-character codes for search index types

    $ wc -c search-index.old.js search-index.new.js
    3940530 search-index.old.js
    3843222 search-index.new.js

((3940530-3843222)/3940530)*100 = 2.47%

    $ wc -c search-index.old.js.gz search-index.new.js.gz
    380251 search-index.old.js.gz
    379434 search-index.new.js.gz

((380251-379434)/380251)*100 = 0.214%

											
										
										
											2023-02-13 13:39:01 -07:00
+								                    ty: itemTypes.charCodeAt(i) - charA,
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                    name: itemNames[i],
-												[rustdoc] Fix path in type-based search

											
										
										
											2023-09-01 14:30:31 +02:00
+								                    path: path,
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                    desc: itemDescs[i],
 								                    parent: itemParentIdxs[i] > 0 ? paths[itemParentIdxs[i] - 1] : undefined,
-												rustdoc-search: use set ops for ranking and filtering

This commit adds ranking and quick filtering to type-based search,
improving performance and having it order results based on their
type signatures.

Motivation
----------

If I write a query like `str -> String`, a lot of functions come up.
That's to be expected, but `String::from_str` should come up on top, and
it doesn't right now. This is because the sorting algorithm is based
on the functions name, and doesn't consider the type signature at all.
`slice::join` even comes up above it!

To fix this, the sorting should take into account the function's
signature, and the closer match should come up on top.

Guide-level description
-----------------------

When searching by type signature, types with a "closer" match will
show up above types that match less precisely.

Reference-level explanation
---------------------------

Functions signature search works in three major phases:

* A compact "fingerprint," based on the [bloom filter] technique, is used to
  check for matches and to estimate the distance. It sometimes has false
  positive matches, but it also operates on 128 bit contiguous memory and
  requires no backtracking, so it performs a lot better than real
  unification.

  The fingerprint represents the set of items in the type signature, but it
  does not represent nesting, and it ignores when the same item appears more
  than once.

  The result is rejected if any query bits are absent in the function, or
  if the distance is higher than the current maximum and 200
  results have already been found.

* The second step performs unification. This is where nesting and true bag
  semantics are taken into account, and it has no false positives. It uses a
  recursive, backtracking algorithm.

  The result is rejected if any query elements are absent in the function.

[bloom filter]: https://en.wikipedia.org/wiki/Bloom_filter

Drawbacks
---------

This makes the code bigger.

More than that, this design is a subtle trade-off. It makes the cases I've
tested against measurably faster, but it's not clear how well this extends
to other crates with potentially more functions and fewer types.

The more complex things get, the more important it is to gather a good set
of data to test with (this is arguably more important than the actual
benchmarking infrastructure right now).

Rationale and alternatives
--------------------------

Throwing a bloom filter in front makes it faster.

More than that, it tries to take a tactic where the system can not only check
for potential matches, but also gets an accurate distance function without
needing to do unification. That way it can skip unification even on items
that have the needed elems, as long as they have more items than the
currently found maximum.

If I didn't want to be able to cheaply do set operations on the fingerprint,
a [cuckoo filter] is supposed to have better performance.
But the nice bit-banging set intersection doesn't work AFAIK.

I also looked into [minhashing], but since it's actually an unbiased
estimate of the similarity coefficient, I'm not sure how it could be used
to skip unification (I wouldn't know if the estimate was too low or
too high).

This function actually uses the number of distinct items as its
"distance function."
This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|F\cap{}Q|}{|F\cup{}Q|}$, while being cheaper to compute.
This is because:

* The function $F$ must be a superset of the query $Q$, so their union is
  just $F$ and the intersection is $Q$ and it can be reduced to
  $1-\frac{|Q|}{|F|}$.

* There are no magic thresholds. These values are only being used to
  compare against each other while sorting (and, if 200 results are found,
  to compare with the maximum match). This means we only care if one value
  is bigger than the other, not what its actual value is, and since $Q$ is
  the same for everything, it can be safely left out, reducing the formula
  to $1-\frac{1}{|F|} = \frac{|F|}{|F|}-\frac{1}{|F|} = \frac{|F|-1}{|F|}$.
  This grows with $|F|$, and since the values are only being compared with
  each other, $|F|$ is fine.

Prior art
---------

This is significantly different from how Hoogle does it.
It doesn't account for order, and it has no special account for nesting,
though `Box<t>` is still two items, while `t` is only one.

This should give the same results that it would have gotten from a Jaccard
Distance $1-\frac{|A\cap{}B|}{|A\cup{}B|}$, while being cheaper to compute.

Unresolved questions
--------------------

`[]` and `()`, the slice/array and tuple/union operators, are ignored while
building the signature for the query. This is because they match more than
one thing, making them ambiguous. Unfortunately, this also makes them
a performance cliff. Is this likely to be a problem?

Right now, the system just stashes the type distance into the
same field that levenshtein distance normally goes in. This means exact
query matches show up on top (for example, if you have a function like
`fn nothing(a: Nothing, b: i32)`, then searching for `nothing` will show it
on top even if there's another function with `fn bar(x: Nothing)` that's
technically a closer match in type signature).

Future possibilities
--------------------

It should be possible to adopt more sorting criteria to act as a tie breaker,
which could be determined during unification.

[cuckoo filter]: https://en.wikipedia.org/wiki/Cuckoo_filter
[minhashing]: https://en.wikipedia.org/wiki/MinHash

											
										
										
											2023-11-27 22:41:45 -07:00
+								                    type,
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                    id: id,
-												Fix eslint errors

											
										
										
											2021-05-14 13:56:15 +02:00
+								                    normalizedName: word.indexOf("_") === -1 ? word : word.replace(/_/g, ""),
-												rustdoc: sort deprecated items lower in search

serialize `q` (`itemPaths`) sparsely
overall 4% reduction in search index size

											
										
										
											2023-02-03 00:08:57 -07:00
+								                    deprecated: deprecatedItems.has(i),
-												rustdoc-search: add impl disambiguator to duplicate assoc items

Helps with #90929

This changes the search results, specifically, when there's more than
one impl with an associated item with the same name. For example,
the search queries `simd<i8> -> simd<i8>` and `simd<i64> -> simd<i64>`
don't link to the same function, but most of the functions have the
same names.

This change should probably be FCP-ed, especially since it adds a new
anchor link format for `main.js` to handle, so that URLs like
`struct.Vec.html#impl-AsMut<[T]>-for-Vec<T,+A>/method.as_mut` redirect
to `struct.Vec.html#method.as_mut-2`. It's a strange design, but there
are a few reasons for it:

* I'd like to avoid making the HTML bigger. Obviously, fixing this bug
  is going to add at least a little more data to the search index, but
  adding more HTML penalises viewers for the benefit of searchers.

* Breaking `struct.Vec.html#method.len` would also be a disappointment.

On the other hand:

* The path-style anchors might be less prone to link rot than the numbered
  anchors. It's definitely less likely to have URLs that appear to "work",
  but silently point at the wrong thing.

* This commit arranges the path-style anchor to redirect to the numbered
  anchor. Nothing stops rustdoc from doing the opposite, making path-style
  anchors the default and redirecting the "legacy" numbered ones.

											
										
										
											2023-03-20 16:02:51 -07:00
+								                    implDisambiguator: implDisambiguator.has(i) ? implDisambiguator.get(i) : null,
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                };
 								                id += 1;
 								                searchIndex.push(row);
 								                lastPath = row.path;
 								                crateSize += 1;
 								            }
 								            if (aliases) {
-												rustdoc-search: use ES6 `Map` for aliases instead of `Object`

											
										
										
											2023-04-13 16:30:02 -07:00
+								                const currentCrateAliases = new Map();
 								                ALIASES.set(crate, currentCrateAliases);
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                for (const alias_name in aliases) {
-												Fix eslint errors

											
										
										
											2021-05-14 13:56:15 +02:00
+								                    if (!hasOwnPropertyRustdoc(aliases, alias_name)) {
 								                        continue;
 								                    }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												rustdoc-search: use ES6 `Map` for aliases instead of `Object`

											
										
										
											2023-04-13 16:30:02 -07:00
+								                    let currentNameAliases;
 								                    if (currentCrateAliases.has(alias_name)) {
 								                        currentNameAliases = currentCrateAliases.get(alias_name);
 								                    } else {
 								                        currentNameAliases = [];
 								                        currentCrateAliases.set(alias_name, currentNameAliases);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                    }
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                    for (const local_alias of aliases[alias_name]) {
-												rustdoc-search: use ES6 `Map` for aliases instead of `Object`

											
										
										
											2023-04-13 16:30:02 -07:00
+								                        currentNameAliases.push(local_alias + currentIndex);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                    }
 								                }
 								            }
 								            currentIndex += crateSize;
 								        }
 								        return searchWords;
 								    }
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								    /**
 								     * Callback for when the search form is submitted.
 								     *
 								     * Suppresses the event's default action (when an event is supplied), calls
 								     * `searchState.clearInputTimeout()`, and then runs `search()` right away.
 								     *
 								     * @param {Event} [e] - The event that triggered this call, if any
 								     */
 								    function onSearchSubmit(e) {
 								        // `e` is documented as optional, so only touch it when it was passed.
 								        if (e) {
 								            e.preventDefault();
 								        }
 								        searchState.clearInputTimeout();
 								        search();
 								    }
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
+								    function putBackSearch() {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								        const search_input = searchState.input;
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
+								        if (!searchState.input) {
 								            return;
 								        }
-												Move settings into full JS

											
										
										
											2022-01-19 22:36:15 +01:00
+								        if (search_input.value !== "" && !searchState.isDisplayed()) {
 								            searchState.showResults();
 								            if (browserSupportsHistoryApi()) {
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
+								                history.replaceState(null, "",
 								                    buildUrl(search_input.value, getFilterCrates()));
 								            }
 								            document.title = searchState.title;
 								        }
 								    }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								    function registerSearchEvents() {
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								        const params = searchState.getQueryStringParams();
 								        // Populate search bar with query string search term when provided,
 								        // but only if the input bar is empty. This avoids the obnoxious issue
 								        // where you start trying to do a search, and the index loads, and
 								        // suddenly your search is gone!
 								        if (searchState.input.value === "") {
 								            searchState.input.value = params.search || "";
 								        }
-												Move callback to the () => {} syntax.

Fix lint

Fix main.js

Restore anonymous functions

Fix

Fix more

											
										
										
											2022-05-03 12:03:17 +08:00
+								        const searchAfter500ms = () => {
-												Consolidate search-related vars and functions.

This allows sharing across main.js and search.js without exporting too
many symbols into the global namespace.

											
										
										
											2021-04-12 23:50:18 -07:00
+								            searchState.clearInputTimeout();
 								            if (searchState.input.value.length === 0) {
 								                searchState.hideResults();
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            } else {
-												Consolidate search-related vars and functions.

This allows sharing across main.js and search.js without exporting too
many symbols into the global namespace.

											
										
										
											2021-04-12 23:50:18 -07:00
+								                searchState.timeout = setTimeout(search, 500);
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            }
 								        };
-												Consolidate search-related vars and functions.

This allows sharing across main.js and search.js without exporting too
many symbols into the global namespace.

											
										
										
											2021-04-12 23:50:18 -07:00
+								        searchState.input.onkeyup = searchAfter500ms;
 								        searchState.input.oninput = searchAfter500ms;
-												Add some JSDoc comments to rustdoc JS

This follows the Closure Compiler dialect of JSDoc, so we
can use it to do some basic type checking. We don't plan to
compile with Closure Compiler, just use it to check types. See
https://github.com/google/closure-compiler/wiki/ for details.

											
										
										
											2021-12-16 21:17:22 -08:00
+								        document.getElementsByClassName("search-form")[0].onsubmit = onSearchSubmit;
-												Move callback to the () => {} syntax.

Fix lint

Fix main.js

Restore anonymous functions

Fix

Fix more

											
										
										
											2022-05-03 12:03:17 +08:00
+								        searchState.input.onchange = e => {
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            if (e.target !== document.activeElement) {
 								                // To prevent doing anything when it's from a blur event.
 								                return;
 								            }
 								            // Do NOT e.preventDefault() here. It will prevent pasting.
-												Consolidate search-related vars and functions.

This allows sharing across main.js and search.js without exporting too
many symbols into the global namespace.

											
										
										
											2021-04-12 23:50:18 -07:00
+								            searchState.clearInputTimeout();
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            // zero-timeout necessary here because at the time of event handler execution the
 								            // pasted content is not in the input field yet. Shouldn’t make any difference for
 								            // change, though.
 								            setTimeout(search, 0);
 								        };
-												Consolidate search-related vars and functions.

This allows sharing across main.js and search.js without exporting too
many symbols into the global namespace.

											
										
										
											2021-04-12 23:50:18 -07:00
+								        searchState.input.onpaste = searchState.input.onchange;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												Move callback to the () => {} syntax.

Fix lint

Fix main.js

Restore anonymous functions

Fix

Fix more

											
										
										
											2022-05-03 12:03:17 +08:00
+								        searchState.outputElement().addEventListener("keydown", e => {
-												rustdoc: use focus for search navigation

Rather than keeping track of highlighted element inside the JS, take
advantage of `.focus()` and the :focus CSS pseudo-class.

This required wrapping each row of results in one big <a> tag (because
anchors can be focused, but table rows cannot). That in turn required
moving from a table layout to a div layout with float.

This makes it so Ctrl+Enter opens links in new tabs, and using the arrow
keys to navigate off the bottom of the page scrolls the rest of the page
into view. It also simplifies the keyboard event handling. It eliminates
the need for click handlers on the search results, and for tracking
mouse movements.

This changes the UI treatment of mouse hovering. A hovered element now
gets a light grey background, but does not change the focused element.
It's possible to have two highlighted search results: one that is
focused (via keyboard) and one that is hovered (via mouse). Pressing
enter will activate the focused link; clicking will activate the hovered
link. This matches up with how Firefox and Chrome handle suggestions in
their URL bar, and avoids stray mouse movements changing the focus.

Selecting tabs is now done with left/right arrows while any search
result is focused. The visibility of results on each search tab is
controlled with the "active" class, rather than by setting display: none
directly. Note that the old code kept track of highlighted search
element when tabbing back and forth. The new code doesn't.

											
										
										
											2021-05-09 12:56:21 -07:00
+								            // We only handle unmodified keystrokes here. We don't want to interfere with,
 								            // for instance, alt-left and alt-right for history navigation.
 								            if (e.altKey || e.ctrlKey || e.shiftKey || e.metaKey) {
 								                return;
 								            }
 								            // up and down arrow select next/previous search result, or the
 								            // search box if we're already at the top.
 								            if (e.which === 38) { // up
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                const previous = document.activeElement.previousElementSibling;
-												rustdoc: use focus for search navigation

Rather than keeping track of highlighted element inside the JS, take
advantage of `.focus()` and the :focus CSS pseudo-class.

This required wrapping each row of results in one big <a> tag (because
anchors can be focused, but table rows cannot). That in turn required
moving from a table layout to a div layout with float.

This makes it so Ctrl+Enter opens links in new tabs, and using the arrow
keys to navigate off the bottom of the page scrolls the rest of the page
into view. It also simplifies the keyboard event handling. It eliminates
the need for click handlers on the search results, and for tracking
mouse movements.

This changes the UI treatment of mouse hovering. A hovered element now
gets a light grey background, but does not change the focused element.
It's possible to have two highlighted search results: one that is
focused (via keyboard) and one that is hovered (via mouse). Pressing
enter will activate the focused link; clicking will activate the hovered
link. This matches up with how Firefox and Chrome handle suggestions in
their URL bar, and avoids stray mouse movements changing the focus.

Selecting tabs is now done with left/right arrows while any search
result is focused. The visibility of results on each search tab is
controlled with the "active" class, rather than by setting display: none
directly. Note that the old code kept track of highlighted search
element when tabbing back and forth. The new code doesn't.

											
										
										
											2021-05-09 12:56:21 -07:00
+								                if (previous) {
 								                    previous.focus();
 								                } else {
 								                    searchState.focus();
 								                }
 								                e.preventDefault();
 								            } else if (e.which === 40) { // down
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                const next = document.activeElement.nextElementSibling;
-												rustdoc: use focus for search navigation

Rather than keeping track of highlighted element inside the JS, take
advantage of `.focus()` and the :focus CSS pseudo-class.

This required wrapping each row of results in one big <a> tag (because
anchors can be focused, but table rows cannot). That in turn required
moving from a table layout to a div layout with float.

This makes it so Ctrl+Enter opens links in new tabs, and using the arrow
keys to navigate off the bottom of the page scrolls the rest of the page
into view. It also simplifies the keyboard event handling. It eliminates
the need for click handlers on the search results, and for tracking
mouse movements.

This changes the UI treatment of mouse hovering. A hovered element now
gets a light grey background, but does not change the focused element.
It's possible to have two highlighted search results: one that is
focused (via keyboard) and one that is hovered (via mouse). Pressing
enter will activate the focused link; clicking will activate the hovered
link. This matches up with how Firefox and Chrome handle suggestions in
their URL bar, and avoids stray mouse movements changing the focus.

Selecting tabs is now done with left/right arrows while any search
result is focused. The visibility of results on each search tab is
controlled with the "active" class, rather than by setting display: none
directly. Note that the old code kept track of highlighted search
element when tabbing back and forth. The new code doesn't.

											
										
										
											2021-05-09 12:56:21 -07:00
+								                if (next) {
 								                    next.focus();
 								                }
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                const rect = document.activeElement.getBoundingClientRect();
-												rustdoc: use focus for search navigation

Rather than keeping track of highlighted element inside the JS, take
advantage of `.focus()` and the :focus CSS pseudo-class.

This required wrapping each row of results in one big <a> tag (because
anchors can be focused, but table rows cannot). That in turn required
moving from a table layout to a div layout with float.

This makes it so Ctrl+Enter opens links in new tabs, and using the arrow
keys to navigate off the bottom of the page scrolls the rest of the page
into view. It also simplifies the keyboard event handling. It eliminates
the need for click handlers on the search results, and for tracking
mouse movements.

This changes the UI treatment of mouse hovering. A hovered element now
gets a light grey background, but does not change the focused element.
It's possible to have two highlighted search results: one that is
focused (via keyboard) and one that is hovered (via mouse). Pressing
enter will activate the focused link; clicking will activate the hovered
link. This matches up with how Firefox and Chrome handle suggestions in
their URL bar, and avoids stray mouse movements changing the focus.

Selecting tabs is now done with left/right arrows while any search
result is focused. The visibility of results on each search tab is
controlled with the "active" class, rather than by setting display: none
directly. Note that the old code kept track of highlighted search
element when tabbing back and forth. The new code doesn't.

											
										
										
											2021-05-09 12:56:21 -07:00
+								                if (window.innerHeight - rect.bottom < rect.height) {
 								                    window.scrollBy(0, rect.height);
 								                }
 								                e.preventDefault();
 								            } else if (e.which === 37) { // left
 								                nextTab(-1);
 								                e.preventDefault();
 								            } else if (e.which === 39) { // right
 								                nextTab(1);
 								                e.preventDefault();
 								            }
 								        });
-												Move callback to the () => {} syntax.

Fix lint

Fix main.js

Restore anonymous functions

Fix

Fix more

											
										
										
											2022-05-03 12:03:17 +08:00
+								        searchState.input.addEventListener("keydown", e => {
-												rustdoc: use focus for search navigation

Rather than keeping track of highlighted element inside the JS, take
advantage of `.focus()` and the :focus CSS pseudo-class.

This required wrapping each row of results in one big <a> tag (because
anchors can be focused, but table rows cannot). That in turn required
moving from a table layout to a div layout with float.

This makes it so Ctrl+Enter opens links in new tabs, and using the arrow
keys to navigate off the bottom of the page scrolls the rest of the page
into view. It also simplifies the keyboard event handling. It eliminates
the need for click handlers on the search results, and for tracking
mouse movements.

This changes the UI treatment of mouse hovering. A hovered element now
gets a light grey background, but does not change the focused element.
It's possible to have two highlighted search results: one that is
focused (via keyboard) and one that is hovered (via mouse). Pressing
enter will activate the focused link; clicking will activate the hovered
link. This matches up with how Firefox and Chrome handle suggestions in
their URL bar, and avoids stray mouse movements changing the focus.

Selecting tabs is now done with left/right arrows while any search
result is focused. The visibility of results on each search tab is
controlled with the "active" class, rather than by setting display: none
directly. Note that the old code kept track of highlighted search
element when tabbing back and forth. The new code doesn't.

											
										
										
											2021-05-09 12:56:21 -07:00
+								            if (e.which === 40) { // down
 								                focusSearchResult();
 								                e.preventDefault();
 								            }
 								        });
-												Move callback to the () => {} syntax.

Fix lint

Fix main.js

Restore anonymous functions

Fix

Fix more

											
										
										
											2022-05-03 12:03:17 +08:00
+								        searchState.input.addEventListener("focus", () => {
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
+								            putBackSearch();
 								        });
-												Move callback to the () => {} syntax.

Fix lint

Fix main.js

Restore anonymous functions

Fix

Fix more

											
										
										
											2022-05-03 12:03:17 +08:00
+								        searchState.input.addEventListener("blur", () => {
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
+								            searchState.input.placeholder = searchState.input.origPlaceholder;
 								        });
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								        // Push and pop states are used to add search results to the browser
 								        // history.
-												Move settings into full JS

											
										
										
											2022-01-19 22:36:15 +01:00
+								        if (browserSupportsHistoryApi()) {
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            // Store the previous <title> so we can revert back to it later.
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const previousTitle = document.title;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												Move callback to the () => {} syntax.

Fix lint

Fix main.js

Restore anonymous functions

Fix

Fix more

											
										
										
											2022-05-03 12:03:17 +08:00
+								            window.addEventListener("popstate", e => {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								                const params = searchState.getQueryStringParams();
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                // Revert to the previous title manually since the History
 								                // API ignores the title parameter.
 								                document.title = previousTitle;
 								                // When browsing forward to search results the previous
 								                // search will be repeated, so the currentResults are
 								                // cleared to ensure the search is successful.
 								                currentResults = null;
 								                // Synchronize search bar with query string state and
 								                // perform the search. This will empty the bar if there's
 								                // nothing there, which lets you really go back to a
 								                // previous state with nothing in the bar.
 								                if (params.search && params.search.length > 0) {
-												Consolidate search-related vars and functions.

This allows sharing across main.js and search.js without exporting too
many symbols into the global namespace.

											
										
										
											2021-04-12 23:50:18 -07:00
+								                    searchState.input.value = params.search;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                    // Some browsers fire "onpopstate" for every page load
 								                    // (Chrome), while others fire the event only when actually
 								                    // popping a state (Firefox), which is why search() is
 								                    // called both here and at the end of the startSearch()
 								                    // function.
-												rustdoc-search: clean up some DOM code

											
										
										
											2023-11-25 10:39:45 -07:00
+								                    e.preventDefault();
 								                    search();
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                } else {
-												Consolidate search-related vars and functions.

This allows sharing across main.js and search.js without exporting too
many symbols into the global namespace.

											
										
										
											2021-04-12 23:50:18 -07:00
+								                    searchState.input.value = "";
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                    // When browsing back from search results the main page
 								                    // visibility must be reset.
-												Consolidate search-related vars and functions.

This allows sharing across main.js and search.js without exporting too
many symbols into the global namespace.

											
										
										
											2021-04-12 23:50:18 -07:00
+								                    searchState.hideResults();
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								                }
 								            });
 								        }
 								        // This is required in firefox to avoid this problem: Navigating to a search result
 								        // with the keyboard, hitting enter, and then hitting back would take you back to
 								        // the doc page, rather than the search that should overlay it.
 								        // This was an interaction between the back-forward cache and our handlers
 								        // that try to sync state between the URL and the search input. To work around it,
 								        // do a small amount of re-init on page show.
-												Move callback to the () => {} syntax.

Fix lint

Fix main.js

Restore anonymous functions

Fix

Fix more

											
										
										
											2022-05-03 12:03:17 +08:00
+								        window.onpageshow = () => {
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const qSearch = searchState.getQueryStringParams().search;
-												Consolidate search-related vars and functions.

This allows sharing across main.js and search.js without exporting too
many symbols into the global namespace.

											
										
										
											2021-04-12 23:50:18 -07:00
+								            if (searchState.input.value === "" && qSearch) {
 								                searchState.input.value = qSearch;
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								            }
 								            search();
 								        };
 								    }
-												Move crate drop-down to search results page

This reduces clutter on doc pages.

											
										
										
											2022-01-01 23:48:34 -05:00
+								    function updateCrate(ev) {
-												Improve crate selection on rustdoc search results page

Resolves all of issue #93240

Reproduces a similar change as #99086, but with improvements

In particular, this PR includes:
* redesigning the crate-search selector so the background color matches its surroundings
* decrease the font of the dropdown menu to a reasonable size
* add a hover effect
* make the color of the arrow theme-dependent, using a surrounding div, with :after pseudo-element
  that can then be transformed using CSS filters to approximate the desired color
* fix the text "in" to match the title font
* remove the "for xyz" in the "Results for xyz in [All crates]" title when
  searching for search term "xyz"; you can already see what you're searching for
  as it's typed in the search bar!
* in line with #99086, handle super-long crate names appropriately without a long <select>
  element escaping the screen area; the improvement is that we also keep the title
  within a single line now; uses some flex layout shenanigans...
* the margins / paddings are adjusted so the selected label of the <select> fits within
  the rest of that title nicely; also some inconsistency in the way that Firefox renders
  a <select> with "appearance: none" (roughly 4px more padding left and right of the text
  than e.g. Chrome) is worked around, and it now produces a result that looks (essentially)
  identical to Chrome
* the color of the help menu and settings menu border in light theme is made to match with
  the color of the corresponding buttons, like they do (match) in the ayu theme
* the casing of "All crates" changes to "all crates"
* the new tests from #99086 are temporarily disabled, until they can be adapted later

											
										
										
											2022-07-03 20:10:19 +02:00
+								        if (ev.target.value === "all crates") {
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
+								            // If we don't remove it from the URL, it'll be picked up again by the search.
-												Update search.js to ES6

											
										
										
											2022-04-24 15:36:02 +02:00
+								            const query = searchState.input.value.trim();
-												Unify history interactions in search

											
										
										
											2023-06-16 13:43:55 +02:00
+								            updateSearchHistory(buildUrl(query, null));
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
+								        }
-												Move crate drop-down to search results page

This reduces clutter on doc pages.

											
										
										
											2022-01-01 23:48:34 -05:00
+								        // In case you "cut" the entry from the search input, then change the crate filter
 								        // before paste back the previous search, you get the old search results without
 								        // the filter. To prevent this, we need to remove the previous results.
 								        currentResults = null;
-												rustdoc-search: clean up some DOM code

											
										
										
											2023-11-25 10:39:45 -07:00
+								        search(true);
-												Move crate drop-down to search results page

This reduces clutter on doc pages.

											
										
										
											2022-01-01 23:48:34 -05:00
+								    }
-												Small JS code improvements

											
										
										
											2022-04-25 14:12:12 +02:00
+								    /**
 								     *  @type {Array<string>}
 								     */
 								    const searchWords = buildIndex(rawSearchIndex);
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								    if (typeof window !== "undefined") {
 								        registerSearchEvents();
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
+								        // If there's a search term in the URL, execute the search now.
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								        if (window.searchState.getQueryStringParams().search) {
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
+								            search();
 								        }
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								    }
-												Add filter-crate URL parameter

											
										
										
											2022-01-10 14:57:43 +01:00
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								    if (typeof exports !== "undefined") {
 								        exports.initSearch = initSearch;
 								        exports.execQuery = execQuery;
 								        exports.parseQuery = parseQuery;
 								    }
 								    return searchWords;
 								}
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
+								if (typeof window !== "undefined") {
 								    window.initSearch = initSearch;
 								    if (window.searchIndex !== undefined) {
 								        initSearch(window.searchIndex);
 								    }
 								} else {
 								    // Running in Node, not a browser. Run initSearch just to produce the
 								    // exports.
 								    initSearch({});
-												Split search.js from search-index.js.

											
										
										
											2021-04-13 14:59:54 -07:00
+								}
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
-												rustdoc: make search.js a module

Previously, search.js relied on the DOM and the `window` object. It can now be
loaded in the absence of the DOM, for instance by Node. The same is true of
search-index.js.

This allows removing a lot of code from src/tools/rustdoc-js/tester.js that
tried to parse search.js and extract specific functions that were needed for
testing.

											
										
										
											2022-05-15 21:09:55 -07:00
-												Move search JS into search-index.js

Export a few variables and functions into the global scope because they
are needed both by main.js and search-index.js.

											
										
										
											2021-04-11 22:19:29 -07:00
+								})();