// quartz-research-note/assets/js/search.js
// (263 lines, 7.5 KiB, JavaScript)

// code from https://github.com/danestves/markdown-to-text
/**
 * Strip Markdown syntax from a string, producing lightly tagged text that is
 * suitable for indexing and for rendering search previews.
 *
 * Headings are rewritten to `<b>…</b>` and links/wikilinks to `<a>…</a>`;
 * most other Markdown markers (emphasis, code fences, blockquotes, footnotes,
 * callout tags, raw HTML tags) are removed.
 *
 * @param {string} markdown - Markdown source. Falsy values are treated as "".
 * @param {object} [options] - Behaviour flags. NOTE: passing an object replaces
 *   the defaults wholesale; omitted keys are read as `undefined` (falsy).
 * @param {string|false} [options.listUnicodeChar] - When truthy, list leaders
 *   are replaced by this value instead of being dropped.
 * @param {boolean} [options.stripListLeaders] - Remove `*`, `-`, `+`, `1.` list leaders.
 * @param {boolean} [options.gfm] - Remove GFM extras (setext `==` rules, `~~~`/``` fence lines, `~~`).
 * @param {boolean} [options.useImgAltText] - Keep image alt text instead of dropping images.
 * @param {boolean} [options.preserveLinks] - Rewrite `[text](url)` to `text (url)` first.
 * @returns {string} The converted text, or the original `markdown` argument if
 *   any replacement step throws (the error is logged to the console).
 */
const removeMarkdown = (
  markdown,
  options = {
    listUnicodeChar: false,
    stripListLeaders: true,
    gfm: true,
    useImgAltText: false,
    preserveLinks: false,
  },
) => {
  let output = markdown || ""

  // Remove horizontal rules (this step intentionally runs outside the try block,
  // exactly as in the upstream implementation).
  output = output.replace(/^(-\s*?|\*\s*?|_\s*?){3,}\s*$/gm, "")

  try {
    if (options.stripListLeaders) {
      if (options.listUnicodeChar) {
        output = output.replace(/^([\s\t]*)([\*\-\+]|\d+\.)\s+/gm, options.listUnicodeChar + " $1")
      } else {
        output = output.replace(/^([\s\t]*)([\*\-\+]|\d+\.)\s+/gm, "$1")
      }
    }

    if (options.gfm) {
      output = output
        // setext-style header underline
        .replace(/\n={2,}/g, "\n")
        // fenced code block delimiters (~~~)
        .replace(/~{3}.*\n/g, "")
        // strikethrough
        .replace(/~~/g, "")
        // fenced code block delimiters (```)
        .replace(/`{3}.*\n/g, "")
    }

    if (options.preserveLinks) {
      // Must run before the generic link rule below so the URL survives.
      output = output.replace(/\[(.*?)\][\[\(](.*?)[\]\)]/g, "$1 ($2)")
    }

    output = output
      // raw HTML tags
      .replace(/<[^>]*>/g, "")
      // setext-style headers (no `m` flag: only matches when it is the whole string)
      .replace(/^[=\-]{2,}\s*$/g, "")
      // footnote references / definitions
      .replace(/\[\^.+?\](\: .*?$)?/g, "")
      // atx-style headers -> bold
      .replace(/(#{1,6})\s+(.+)\1?/g, "<b>$2</b>")
      // reference-style link definitions
      .replace(/\s{0,2}\[.*?\]: .*?$/g, "")
      // images
      .replace(/\!\[(.*?)\][\[\(].*?[\]\)]/g, options.useImgAltText ? "$1" : "")
      // inline links
      .replace(/\[(.*?)\][\[\(].*?[\]\)]/g, "<a>$1</a>")
      // wikilinks / embeds: [[page|alias]]
      // NOTE(review): the trailing `\S` consumes the final character before `]]`,
      // so the captured alias loses its last character — confirm whether intended.
      .replace(/!?\[\[\S[^\[\]\|]*(?:\|([^\[\]]*))?\S\]\]/g, "<a>$1</a>")
      // blockquote marker at the very start of the text
      .replace(/^\s{0,3}>\s?/g, "")
      // blockquote markers on following lines
      .replace(/(^|\n)\s{0,3}>\s?/g, "\n\n")
      // reference-style links
      .replace(/^\s{1,2}\[(.*?)\]: (\S+)( ".*?")?\s*$/g, "")
      // emphasis; applied twice so nested markers (e.g. ***x***) are unwrapped
      .replace(/([\*_]{1,3})(\S.*?\S{0,1})\1/g, "$2")
      .replace(/([\*_]{1,3})(\S.*?\S{0,1})\1/g, "$2")
      // code blocks on a single line
      .replace(/(`{3,})(.*?)\1/gm, "$2")
      // inline code
      .replace(/`(.+?)`/g, "$1")
      // collapse runs of blank lines
      .replace(/\n{2,}/g, "\n\n")
      // callout tags such as "[!note] " / "[!tip]- "
      .replace(/\[![a-zA-Z]+\][-\+]? /g, "")
  } catch (e) {
    // Best effort: report the failure and fall back to the untouched input.
    console.error(e)
    return markdown
  }

  return output
}
// -----
/**
 * Build an HTML excerpt of `content` in which occurrences of `term` are wrapped
 * in `<span class="search-highlight">…</span>`.
 *
 * Strategy:
 *  1. If `term` occurs verbatim (case-sensitive) in `content`, return up to
 *     `highlightWindow / 2` space-separated words on either side of the first
 *     occurrence.
 *  2. Otherwise split both strings on whitespace, mark every content token that
 *     starts (case-insensitively) with any term token, pick the window of
 *     `highlightWindow` tokens with the most marks, and return the surrounding
 *     tokens with the marked ones highlighted.
 *
 * Neither `content` nor `term` is HTML-escaped here; callers insert the result
 * as HTML.
 *
 * @param {string} content - Text to excerpt.
 * @param {string} term - Search query.
 * @returns {string} HTML snippet; "..." marks truncation.
 */
const highlight = (content, term) => {
  const highlightWindow = 20

  // try to find direct match first
  const directMatchIdx = content.indexOf(term)
  if (directMatchIdx !== -1) {
    const h = highlightWindow / 2
    const before = content.substring(0, directMatchIdx).split(" ").slice(-h)
    // Take everything after the match up to the end of the string. (The
    // previous upper bound of `content.length - 1` dropped the last character.)
    const after = content
      .substring(directMatchIdx + term.length)
      .split(" ")
      .slice(0, h)
    return (
      (before.length === h ? `...${before.join(" ")}` : before.join(" ")) +
      `<span class="search-highlight">${term}</span>` +
      after.join(" ")
    )
  }

  const tokenizedTerm = term.split(/\s+/).filter((t) => t !== "")
  const splitText = content.split(/\s+/).filter((t) => t !== "")
  const includesCheck = (token) =>
    tokenizedTerm.some((termToken) => token.toLowerCase().startsWith(termToken.toLowerCase()))
  const occurrencesIndices = splitText.map(includesCheck)

  // calculate best index: the start of the window holding the most matches.
  // `>=` means later windows win ties.
  let bestSum = 0
  let bestIndex = 0
  // `<=` so that the final window (ending on the last token) is evaluated too;
  // with `<` a match in the last token could never be selected.
  const lastWindowStart = Math.max(occurrencesIndices.length - highlightWindow, 0)
  for (let i = 0; i <= lastWindowStart; i++) {
    const windowFlags = occurrencesIndices.slice(i, i + highlightWindow)
    // Booleans coerce to 0/1 when added.
    const windowSum = windowFlags.reduce((total, cur) => total + cur, 0)
    if (windowSum >= bestSum) {
      bestSum = windowSum
      bestIndex = i
    }
  }

  // Show one window of leading context plus the best window itself.
  const startIndex = Math.max(bestIndex - highlightWindow, 0)
  const endIndex = Math.min(startIndex + 2 * highlightWindow, splitText.length)
  const mappedText = splitText
    .slice(startIndex, endIndex)
    .map((token) => {
      if (includesCheck(token)) {
        return `<span class="search-highlight">${token}</span>`
      }
      return token
    })
    .join(" ")
    // Merge adjacent highlighted tokens into a single span.
    .replaceAll('</span> <span class="search-highlight">', " ")

  return `${startIndex === 0 ? "" : "..."}${mappedText}${
    endIndex === splitText.length ? "" : "..."
  }`
}
// -----
// Builds the FlexSearch index from the fetched content and wires up the search
// UI (input box, result cards, open/close shortcuts).
// Relies on names not defined in this block: `FlexSearch`, `fetchData`,
// `BASE_URL`, `window.Million`, plus `removeMarkdown` and `highlight`.
;(async function () {
  // Lower-case the input and split it on runs of characters outside a-z.
  // The pattern has a capturing group, so `split` also emits captured
  // separator text; kept byte-for-byte to preserve indexing behaviour.
  const encoder = (str) => str.toLowerCase().split(/([^a-z]|[^\x00-\x7F])+/)

  const contentIndex = new FlexSearch.Document({
    cache: true,
    charset: "latin:extra",
    optimize: true,
    index: [
      {
        field: "content",
        tokenize: "reverse",
        encode: encoder,
      },
      {
        field: "title",
        tokenize: "forward",
        encode: encoder,
      },
    ],
  })

  // `fetchData` is awaited and must resolve to an object with a `content` map
  // whose values expose `title` and `content`.
  const { content } = await fetchData
  for (const [key, value] of Object.entries(content)) {
    contentIndex.add({
      id: key,
      title: value.title,
      content: removeMarkdown(value.content),
    })
  }

  // Render one search hit as a result card; the card's `id` carries the target URL.
  const resultToHTML = ({ url, title, content, term }) => {
    const text = removeMarkdown(content)
    const resultTitle = highlight(title, term)
    const resultText = highlight(text, term)
    return `<button class="result-card" id="${url}">
<h3>${resultTitle}</h3>
<p>${resultText}</p>
</button>`
  }

  // Navigate to a result (with a text-fragment for the query) and close the overlay.
  const redir = (id, term) => {
    // SPA navigation
    window.Million.navigate(
      new URL(`${BASE_URL.replace(/\/$/g, "")}${id}#:~:text=${encodeURIComponent(term)}/`),
      ".singlePage",
    )
    closeSearch()
  }

  // Look up the stored page data for an index id.
  const formatForDisplay = (id) => ({
    id,
    url: id,
    title: content[id].title,
    content: content[id].content,
  })

  const source = document.getElementById("search-bar")
  const results = document.getElementById("results-container")
  // Most recent query typed into the search bar; undefined until first input.
  let term

  // Enter jumps to the first result card.
  source.addEventListener("keyup", (e) => {
    if (e.key !== "Enter") {
      return
    }
    const anchor = document.getElementsByClassName("result-card")[0]
    // Nothing to open when no card has been rendered yet, or when the only
    // card is the "No results." placeholder (which has no id).
    if (!anchor?.id) {
      return
    }
    redir(anchor.id, term)
  })

  // Re-run the search and re-render the result list on every keystroke.
  source.addEventListener("input", (e) => {
    term = e.target.value
    const searchResults = contentIndex.search(term, [
      {
        field: "content",
        limit: 10,
      },
      {
        field: "title",
        limit: 5,
      },
    ])

    // Extract the id list returned for one indexed field (empty if absent).
    const getByField = (field) => {
      const fieldResults = searchResults.filter((x) => x.field === field)
      if (fieldResults.length === 0) {
        return []
      }
      return [...fieldResults[0].result]
    }

    // Title hits first, then content hits; the Set removes duplicates.
    const allIds = new Set([...getByField("title"), ...getByField("content")])
    const finalResults = [...allIds].map(formatForDisplay)

    // display
    if (finalResults.length === 0) {
      results.innerHTML = `<button class="result-card">
<h3>No results.</h3>
<p>Try another search term?</p>
</button>`
    } else {
      results.innerHTML = finalResults
        .map((result) =>
          resultToHTML({
            ...result,
            term,
          }),
        )
        .join("\n")
      const anchors = [...document.getElementsByClassName("result-card")]
      anchors.forEach((anchor) => {
        anchor.onclick = () => redir(anchor.id, term)
      })
    }
  })

  const searchContainer = document.getElementById("search-container")

  // Toggle the overlay: show (and reset) it when hidden, hide it when visible.
  function openSearch() {
    if (searchContainer.style.display === "none" || searchContainer.style.display === "") {
      source.value = ""
      results.innerHTML = ""
      searchContainer.style.display = "block"
      source.focus()
    } else {
      searchContainer.style.display = "none"
    }
  }

  function closeSearch() {
    searchContainer.style.display = "none"
  }

  // Ctrl/Cmd+K toggles the overlay; Escape closes it.
  document.addEventListener("keydown", (event) => {
    if (event.key === "k" && (event.ctrlKey || event.metaKey)) {
      event.preventDefault()
      openSearch()
    }
    if (event.key === "Escape") {
      event.preventDefault()
      closeSearch()
    }
  })

  const searchButton = document.getElementById("search-icon")
  searchButton.addEventListener("click", () => {
    openSearch()
  })
  // NOTE(review): any key pressed while the icon has focus toggles the overlay
  // (including Tab) — confirm whether this should be limited to Enter/Space.
  searchButton.addEventListener("keydown", () => {
    openSearch()
  })

  // Clicking the backdrop closes the overlay…
  searchContainer.addEventListener("click", () => {
    closeSearch()
  })
  // …but clicks inside the search panel itself must not bubble up to it.
  document.getElementById("search-space").addEventListener("click", (evt) => {
    evt.stopPropagation()
  })
})()