support umlauts in tokenizer

This commit is contained in:
Mario Zechner 2023-06-22 22:36:33 +02:00
parent 7578f544db
commit 8d2d8fd80b

View File

@ -122,7 +122,7 @@ exports.queryItemsAlasql = (query, items) => {
exports.queryItems = (query, items, exactWord) => {
query = query.trim().replace(",", ".").toLowerCase();
if (query.length < 3) return { items: [], queryTokens: [] };
const regex = /([A-Za-z-][A-Za-z0-9-]*)|(>=|<=|=|>|<)|(\d+(\.\d+)?)/g;
const regex = /([\p{L}-][\p{L}\p{N}-]*)|(>=|<=|=|>|<)|(\d+(\.\d+)?)/gu;
let tokens = query.match(regex);
// Find quantity/unit query