#373 - Arabic diacritics

This commit is contained in:
Simon Cambier
2024-06-27 21:00:18 +02:00
parent 85a23d8352
commit 87d2085fda
5 changed files with 46 additions and 12 deletions

View File

@@ -13,9 +13,9 @@ export class Query {
}
#inQuotes: string[]
-constructor(text = '', options: { ignoreDiacritics: boolean }) {
+constructor(text = '', options: { ignoreDiacritics: boolean, ignoreArabicDiacritics: boolean}) {
if (options.ignoreDiacritics) {
-text = removeDiacritics(text)
+text = removeDiacritics(text, options.ignoreArabicDiacritics)
}
const parsed = parse(text.toLowerCase(), {
tokenize: true,

View File

@@ -304,7 +304,12 @@ export class SearchEngine {
const title = document?.path.toLowerCase() ?? ''
const content = (document?.cleanedContent ?? '').toLowerCase()
return exactTerms.every(
-q => content.includes(q) || removeDiacritics(title).includes(q)
+q =>
+content.includes(q) ||
+removeDiacritics(
+title,
+this.plugin.settings.ignoreArabicDiacritics
+).includes(q)
)
})
}
@@ -434,7 +439,7 @@ export class SearchEngine {
},
processTerm: (term: string) =>
(this.plugin.settings.ignoreDiacritics
-? removeDiacritics(term)
+? removeDiacritics(term, this.plugin.settings.ignoreArabicDiacritics)
: term
).toLowerCase(),
idField: 'path',