567 lines
18 KiB
JavaScript
Raw Normal View History

2020-12-30 11:12:35 +01:00
/*
* searchtools.js
* ~~~~~~~~~~~~~~~~
*
* Sphinx JavaScript utilities for the full-text search.
*
* :copyright: Copyright 2007-2023 by the Sphinx team, see AUTHORS.
2020-12-30 11:12:35 +01:00
* :license: BSD, see LICENSE for details.
*
*/
2022-06-22 20:22:26 +02:00
"use strict";
2020-12-30 11:12:35 +01:00
2022-06-22 20:22:26 +02:00
/**
* Simple result scoring code.
*/
if (typeof Scorer === "undefined") {
2020-12-30 11:12:35 +01:00
var Scorer = {
// Implement the following function to further tweak the score for each result
2022-06-22 20:22:26 +02:00
// The function takes a result array [docname, title, anchor, descr, score, filename]
2020-12-30 11:12:35 +01:00
// and returns the new score.
/*
2022-06-22 20:22:26 +02:00
score: result => {
const [docname, title, anchor, descr, score, filename] = result
return score
2020-12-30 11:12:35 +01:00
},
*/
// query matches the full name of an object
objNameMatch: 11,
// or matches in the last dotted part of the object name
objPartialMatch: 6,
// Additive scores depending on the priority of the object
2022-06-22 20:22:26 +02:00
objPrio: {
0: 15, // used to be importantResults
1: 5, // used to be objectResults
2: -5, // used to be unimportantResults
},
2020-12-30 11:12:35 +01:00
// Used when the priority is not in the mapping.
objPrioDefault: 0,
// query found in title
title: 15,
partialTitle: 7,
// query found in terms
term: 5,
2022-06-22 20:22:26 +02:00
partialTerm: 2,
2020-12-30 11:12:35 +01:00
};
}
2022-06-22 20:22:26 +02:00
const _removeChildren = (element) => {
while (element && element.lastChild) element.removeChild(element.lastChild);
};
/**
* See https://developer.mozilla.org/en-US/docs/Web/JavaScript/Guide/Regular_Expressions#escaping
*/
const _escapeRegExp = (string) =>
string.replace(/[.*+\-?^${}()|[\]\\]/g, "\\$&"); // $& means the whole matched string
2022-11-01 19:58:12 +01:00
const _displayItem = (item, searchTerms) => {
2022-06-22 20:22:26 +02:00
const docBuilder = DOCUMENTATION_OPTIONS.BUILDER;
const docUrlRoot = DOCUMENTATION_OPTIONS.URL_ROOT;
const docFileSuffix = DOCUMENTATION_OPTIONS.FILE_SUFFIX;
const docLinkSuffix = DOCUMENTATION_OPTIONS.LINK_SUFFIX;
const showSearchSummary = DOCUMENTATION_OPTIONS.SHOW_SEARCH_SUMMARY;
2022-11-01 19:58:12 +01:00
const [docName, title, anchor, descr, score, _filename] = item;
2022-06-22 20:22:26 +02:00
let listItem = document.createElement("li");
let requestUrl;
let linkUrl;
if (docBuilder === "dirhtml") {
// dirhtml builder
let dirname = docName + "/";
if (dirname.match(/\/index\/$/))
dirname = dirname.substring(0, dirname.length - 6);
else if (dirname === "index/") dirname = "";
requestUrl = docUrlRoot + dirname;
linkUrl = requestUrl;
} else {
// normal html builders
requestUrl = docUrlRoot + docName + docFileSuffix;
linkUrl = docName + docLinkSuffix;
}
let linkEl = listItem.appendChild(document.createElement("a"));
2022-11-01 19:58:12 +01:00
linkEl.href = linkUrl + anchor;
linkEl.dataset.score = score;
2022-06-22 20:22:26 +02:00
linkEl.innerHTML = title;
if (descr)
2022-07-27 11:10:29 +02:00
listItem.appendChild(document.createElement("span")).innerHTML =
2022-06-22 20:22:26 +02:00
" (" + descr + ")";
else if (showSearchSummary)
fetch(requestUrl)
.then((responseData) => responseData.text())
.then((data) => {
if (data)
listItem.appendChild(
2022-11-01 19:58:12 +01:00
Search.makeSearchSummary(data, searchTerms)
2022-06-22 20:22:26 +02:00
);
});
Search.output.appendChild(listItem);
};
const _finishSearch = (resultCount) => {
Search.stopPulse();
Search.title.innerText = _("Search Results");
if (!resultCount)
Search.status.innerText = Documentation.gettext(
"Your search did not match any documents. Please make sure that all words are spelled correctly and that you've selected enough categories."
);
else
Search.status.innerText = _(
`Search finished, found ${resultCount} page(s) matching the search query.`
);
};
const _displayNextItem = (
results,
resultCount,
searchTerms
) => {
// results left, load the summary and display it
// this is intended to be dynamic (don't sub resultsCount)
if (results.length) {
2022-11-01 19:58:12 +01:00
_displayItem(results.pop(), searchTerms);
2022-06-22 20:22:26 +02:00
setTimeout(
2022-11-01 19:58:12 +01:00
() => _displayNextItem(results, resultCount, searchTerms),
2022-06-22 20:22:26 +02:00
5
);
2020-12-30 11:12:35 +01:00
}
2022-06-22 20:22:26 +02:00
// search finished, update title and status message
else _finishSearch(resultCount);
};
/**
* Default splitQuery function. Can be overridden in ``sphinx.search`` with a
* custom function per language.
*
* The regular expression works by splitting the string on consecutive characters
* that are not Unicode letters, numbers, underscores, or emoji characters.
* This is the same as ``\W+`` in Python, preserving the surrogate pair area.
*/
if (typeof splitQuery === "undefined") {
var splitQuery = (query) => query
.split(/[^\p{Letter}\p{Number}_\p{Emoji_Presentation}]+/gu)
.filter(term => term) // remove remaining empty strings
2020-12-30 11:12:35 +01:00
}
/**
* Search Module
*/
2022-06-22 20:22:26 +02:00
const Search = {
_index: null,
_queued_query: null,
_pulse_status: -1,
htmlToText: (htmlString) => {
2022-07-27 11:10:29 +02:00
const htmlElement = new DOMParser().parseFromString(htmlString, 'text/html');
htmlElement.querySelectorAll(".headerlink").forEach((el) => { el.remove() });
2022-06-22 20:22:26 +02:00
const docContent = htmlElement.querySelector('[role="main"]');
if (docContent !== undefined) return docContent.textContent;
console.warn(
"Content block not found. Sphinx search tries to obtain it via '[role=main]'. Could you check your theme or template."
);
return "";
2020-12-30 11:12:35 +01:00
},
2022-06-22 20:22:26 +02:00
init: () => {
const query = new URLSearchParams(window.location.search).get("q");
document
.querySelectorAll('input[name="q"]')
.forEach((el) => (el.value = query));
if (query) Search.performSearch(query);
2020-12-30 11:12:35 +01:00
},
2022-06-22 20:22:26 +02:00
loadIndex: (url) =>
(document.body.appendChild(document.createElement("script")).src = url),
2020-12-30 11:12:35 +01:00
2022-06-22 20:22:26 +02:00
setIndex: (index) => {
Search._index = index;
if (Search._queued_query !== null) {
const query = Search._queued_query;
Search._queued_query = null;
Search.query(query);
2020-12-30 11:12:35 +01:00
}
},
2022-06-22 20:22:26 +02:00
hasIndex: () => Search._index !== null,
2020-12-30 11:12:35 +01:00
2022-06-22 20:22:26 +02:00
deferQuery: (query) => (Search._queued_query = query),
2020-12-30 11:12:35 +01:00
2022-06-22 20:22:26 +02:00
stopPulse: () => (Search._pulse_status = -1),
2020-12-30 11:12:35 +01:00
2022-06-22 20:22:26 +02:00
startPulse: () => {
if (Search._pulse_status >= 0) return;
const pulse = () => {
2020-12-30 11:12:35 +01:00
Search._pulse_status = (Search._pulse_status + 1) % 4;
2022-06-22 20:22:26 +02:00
Search.dots.innerText = ".".repeat(Search._pulse_status);
if (Search._pulse_status >= 0) window.setTimeout(pulse, 500);
};
2020-12-30 11:12:35 +01:00
pulse();
},
/**
* perform a search for something (or wait until index is loaded)
*/
2022-06-22 20:22:26 +02:00
performSearch: (query) => {
2020-12-30 11:12:35 +01:00
// create the required interface elements
2022-06-22 20:22:26 +02:00
const searchText = document.createElement("h2");
searchText.textContent = _("Searching");
const searchSummary = document.createElement("p");
searchSummary.classList.add("search-summary");
searchSummary.innerText = "";
const searchList = document.createElement("ul");
searchList.classList.add("search");
const out = document.getElementById("search-results");
Search.title = out.appendChild(searchText);
Search.dots = Search.title.appendChild(document.createElement("span"));
Search.status = out.appendChild(searchSummary);
Search.output = out.appendChild(searchList);
const searchProgress = document.getElementById("search-progress");
// Some themes don't use the search progress node
if (searchProgress) {
searchProgress.innerText = _("Preparing search...");
}
Search.startPulse();
2020-12-30 11:12:35 +01:00
// index already loaded, the browser was quick!
2022-06-22 20:22:26 +02:00
if (Search.hasIndex()) Search.query(query);
else Search.deferQuery(query);
2020-12-30 11:12:35 +01:00
},
/**
* execute search (requires search index to be loaded)
*/
2022-06-22 20:22:26 +02:00
query: (query) => {
2022-11-01 19:58:12 +01:00
const filenames = Search._index.filenames;
const docNames = Search._index.docnames;
const titles = Search._index.titles;
const allTitles = Search._index.alltitles;
const indexEntries = Search._index.indexentries;
2022-06-22 20:22:26 +02:00
// stem the search terms and add them to the correct list
const stemmer = new Stemmer();
const searchTerms = new Set();
const excludedTerms = new Set();
const highlightTerms = new Set();
const objectTerms = new Set(splitQuery(query.toLowerCase().trim()));
splitQuery(query.trim()).forEach((queryTerm) => {
const queryTermLower = queryTerm.toLowerCase();
// maybe skip this "word"
// stopwords array is from language_data.js
if (
stopwords.indexOf(queryTermLower) !== -1 ||
queryTerm.match(/^\d+$/)
)
return;
2020-12-30 11:12:35 +01:00
// stem the word
2022-06-22 20:22:26 +02:00
let word = stemmer.stemWord(queryTermLower);
2020-12-30 11:12:35 +01:00
// select the correct list
2022-06-22 20:22:26 +02:00
if (word[0] === "-") excludedTerms.add(word.substr(1));
2020-12-30 11:12:35 +01:00
else {
2022-06-22 20:22:26 +02:00
searchTerms.add(word);
highlightTerms.add(queryTermLower);
2020-12-30 11:12:35 +01:00
}
2022-06-22 20:22:26 +02:00
});
2020-12-30 11:12:35 +01:00
2022-11-01 19:58:12 +01:00
if (SPHINX_HIGHLIGHT_ENABLED) { // set in sphinx_highlight.js
localStorage.setItem("sphinx_highlight_terms", [...highlightTerms].join(" "))
}
2022-06-22 20:22:26 +02:00
// console.debug("SEARCH: searching for:");
// console.info("required: ", [...searchTerms]);
// console.info("excluded: ", [...excludedTerms]);
2020-12-30 11:12:35 +01:00
2022-06-22 20:22:26 +02:00
// array of [docname, title, anchor, descr, score, filename]
let results = [];
_removeChildren(document.getElementById("search-progress"));
2020-12-30 11:12:35 +01:00
2022-11-01 19:58:12 +01:00
const queryLower = query.toLowerCase();
for (const [title, foundTitles] of Object.entries(allTitles)) {
if (title.toLowerCase().includes(queryLower) && (queryLower.length >= title.length/2)) {
for (const [file, id] of foundTitles) {
let score = Math.round(100 * queryLower.length / title.length)
results.push([
docNames[file],
titles[file] !== title ? `${titles[file]} > ${title}` : title,
id !== null ? "#" + id : "",
null,
score,
filenames[file],
]);
}
}
}
// search for explicit entries in index directives
for (const [entry, foundEntries] of Object.entries(indexEntries)) {
if (entry.includes(queryLower) && (queryLower.length >= entry.length/2)) {
for (const [file, id] of foundEntries) {
let score = Math.round(100 * queryLower.length / entry.length)
results.push([
docNames[file],
titles[file],
id ? "#" + id : "",
null,
score,
filenames[file],
]);
}
}
}
2020-12-30 11:12:35 +01:00
// lookup as object
2022-06-22 20:22:26 +02:00
objectTerms.forEach((term) =>
results.push(...Search.performObjectSearch(term, objectTerms))
);
2020-12-30 11:12:35 +01:00
// lookup as search terms in fulltext
2022-06-22 20:22:26 +02:00
results.push(...Search.performTermsSearch(searchTerms, excludedTerms));
2020-12-30 11:12:35 +01:00
// let the scorer override scores with a custom scoring function
2022-06-22 20:22:26 +02:00
if (Scorer.score) results.forEach((item) => (item[4] = Scorer.score(item)));
2020-12-30 11:12:35 +01:00
// now sort the results by score (in opposite order of appearance, since the
// display function below uses pop() to retrieve items) and then
// alphabetically
2022-06-22 20:22:26 +02:00
results.sort((a, b) => {
const leftScore = a[4];
const rightScore = b[4];
if (leftScore === rightScore) {
2020-12-30 11:12:35 +01:00
// same score: sort alphabetically
2022-06-22 20:22:26 +02:00
const leftTitle = a[1].toLowerCase();
const rightTitle = b[1].toLowerCase();
if (leftTitle === rightTitle) return 0;
return leftTitle > rightTitle ? -1 : 1; // inverted is intentional
2020-12-30 11:12:35 +01:00
}
2022-06-22 20:22:26 +02:00
return leftScore > rightScore ? 1 : -1;
2020-12-30 11:12:35 +01:00
});
2022-06-22 20:22:26 +02:00
// remove duplicate search results
// note the reversing of results, so that in the case of duplicates, the highest-scoring entry is kept
let seen = new Set();
results = results.reverse().reduce((acc, result) => {
let resultStr = result.slice(0, 4).concat([result[5]]).map(v => String(v)).join(',');
if (!seen.has(resultStr)) {
acc.push(result);
seen.add(resultStr);
}
return acc;
}, []);
results = results.reverse();
2020-12-30 11:12:35 +01:00
// for debugging
//Search.lastresults = results.slice(); // a copy
2022-06-22 20:22:26 +02:00
// console.info("search results:", Search.lastresults);
2020-12-30 11:12:35 +01:00
// print the results
2022-11-01 19:58:12 +01:00
_displayNextItem(results, results.length, searchTerms);
2020-12-30 11:12:35 +01:00
},
/**
* search for object names
*/
2022-06-22 20:22:26 +02:00
performObjectSearch: (object, objectTerms) => {
const filenames = Search._index.filenames;
const docNames = Search._index.docnames;
const objects = Search._index.objects;
const objNames = Search._index.objnames;
const titles = Search._index.titles;
const results = [];
const objectSearchCallback = (prefix, match) => {
const name = match[4]
const fullname = (prefix ? prefix + "." : "") + name;
const fullnameLower = fullname.toLowerCase();
if (fullnameLower.indexOf(object) < 0) return;
let score = 0;
const parts = fullnameLower.split(".");
// check for different match types: exact matches of full name or
// "last name" (i.e. last dotted part)
if (fullnameLower === object || parts.slice(-1)[0] === object)
score += Scorer.objNameMatch;
else if (parts.slice(-1)[0].indexOf(object) > -1)
score += Scorer.objPartialMatch; // matches in last name
const objName = objNames[match[1]][2];
const title = titles[match[0]];
// If more than one term searched for, we require other words to be
// found in the name/title/description
const otherTerms = new Set(objectTerms);
otherTerms.delete(object);
if (otherTerms.size > 0) {
const haystack = `${prefix} ${name} ${objName} ${title}`.toLowerCase();
if (
[...otherTerms].some((otherTerm) => haystack.indexOf(otherTerm) < 0)
)
return;
2020-12-30 11:12:35 +01:00
}
2022-06-22 20:22:26 +02:00
let anchor = match[3];
if (anchor === "") anchor = fullname;
else if (anchor === "-") anchor = objNames[match[1]][1] + "-" + fullname;
const descr = objName + _(", in ") + title;
// add custom score for some objects according to scorer
if (Scorer.objPrio.hasOwnProperty(match[2]))
score += Scorer.objPrio[match[2]];
else score += Scorer.objPrioDefault;
results.push([
docNames[match[0]],
fullname,
"#" + anchor,
descr,
score,
filenames[match[0]],
]);
};
Object.keys(objects).forEach((prefix) =>
objects[prefix].forEach((array) =>
objectSearchCallback(prefix, array)
)
);
2020-12-30 11:12:35 +01:00
return results;
},
/**
* search for full-text terms in the index
*/
2022-06-22 20:22:26 +02:00
performTermsSearch: (searchTerms, excludedTerms) => {
// prepare search
const terms = Search._index.terms;
const titleTerms = Search._index.titleterms;
const filenames = Search._index.filenames;
2022-11-01 19:58:12 +01:00
const docNames = Search._index.docnames;
2022-06-22 20:22:26 +02:00
const titles = Search._index.titles;
2020-12-30 11:12:35 +01:00
2022-06-22 20:22:26 +02:00
const scoreMap = new Map();
const fileMap = new Map();
2020-12-30 11:12:35 +01:00
// perform the search on the required terms
2022-06-22 20:22:26 +02:00
searchTerms.forEach((word) => {
const files = [];
const arr = [
{ files: terms[word], score: Scorer.term },
{ files: titleTerms[word], score: Scorer.title },
2020-12-30 11:12:35 +01:00
];
// add support for partial matches
if (word.length > 2) {
2022-06-22 20:22:26 +02:00
const escapedWord = _escapeRegExp(word);
Object.keys(terms).forEach((term) => {
if (term.match(escapedWord) && !terms[word])
arr.push({ files: terms[term], score: Scorer.partialTerm });
});
Object.keys(titleTerms).forEach((term) => {
if (term.match(escapedWord) && !titleTerms[word])
arr.push({ files: titleTerms[word], score: Scorer.partialTitle });
});
2020-12-30 11:12:35 +01:00
}
// no match but word was a required one
2022-06-22 20:22:26 +02:00
if (arr.every((record) => record.files === undefined)) return;
2020-12-30 11:12:35 +01:00
// found search word in contents
2022-06-22 20:22:26 +02:00
arr.forEach((record) => {
if (record.files === undefined) return;
let recordFiles = record.files;
if (recordFiles.length === undefined) recordFiles = [recordFiles];
files.push(...recordFiles);
// set score for the word in each file
recordFiles.forEach((file) => {
if (!scoreMap.has(file)) scoreMap.set(file, {});
scoreMap.get(file)[word] = record.score;
});
2020-12-30 11:12:35 +01:00
});
// create the mapping
2022-06-22 20:22:26 +02:00
files.forEach((file) => {
if (fileMap.has(file) && fileMap.get(file).indexOf(word) === -1)
fileMap.get(file).push(word);
else fileMap.set(file, [word]);
});
});
2020-12-30 11:12:35 +01:00
// now check if the files don't contain excluded terms
2022-06-22 20:22:26 +02:00
const results = [];
for (const [file, wordList] of fileMap) {
2020-12-30 11:12:35 +01:00
// check if all requirements are matched
2022-06-22 20:22:26 +02:00
// as search terms with length < 3 are discarded
const filteredTermCount = [...searchTerms].filter(
(term) => term.length > 2
).length;
2020-12-30 11:12:35 +01:00
if (
2022-06-22 20:22:26 +02:00
wordList.length !== searchTerms.size &&
wordList.length !== filteredTermCount
)
continue;
2020-12-30 11:12:35 +01:00
// ensure that none of the excluded terms is in the search result
2022-06-22 20:22:26 +02:00
if (
[...excludedTerms].some(
(term) =>
terms[term] === file ||
titleTerms[term] === file ||
(terms[term] || []).includes(file) ||
(titleTerms[term] || []).includes(file)
)
)
break;
2020-12-30 11:12:35 +01:00
2022-06-22 20:22:26 +02:00
// select one (max) score for the file.
const score = Math.max(...wordList.map((w) => scoreMap.get(file)[w]));
// add result to the result list
results.push([
docNames[file],
titles[file],
"",
null,
score,
filenames[file],
]);
2020-12-30 11:12:35 +01:00
}
return results;
},
/**
* helper function to return a node containing the
* search summary for a given text. keywords is a list
2022-11-01 19:58:12 +01:00
* of stemmed words.
2020-12-30 11:12:35 +01:00
*/
2022-11-01 19:58:12 +01:00
makeSearchSummary: (htmlText, keywords) => {
2022-07-27 11:10:29 +02:00
const text = Search.htmlToText(htmlText);
2022-06-22 20:22:26 +02:00
if (text === "") return null;
2022-07-27 11:10:29 +02:00
const textLower = text.toLowerCase();
2022-06-22 20:22:26 +02:00
const actualStartPosition = [...keywords]
2022-07-27 11:10:29 +02:00
.map((k) => textLower.indexOf(k.toLowerCase()))
2022-06-22 20:22:26 +02:00
.filter((i) => i > -1)
.slice(-1)[0];
const startWithContext = Math.max(actualStartPosition - 120, 0);
const top = startWithContext === 0 ? "" : "...";
const tail = startWithContext + 240 < text.length ? "..." : "";
2022-07-27 11:10:29 +02:00
let summary = document.createElement("p");
2022-06-22 20:22:26 +02:00
summary.classList.add("context");
2022-07-27 11:10:29 +02:00
summary.textContent = top + text.substr(startWithContext, 240).trim() + tail;
2022-06-22 20:22:26 +02:00
return summary;
},
2020-12-30 11:12:35 +01:00
};
2022-06-22 20:22:26 +02:00
_ready(Search.init);