mirror of
https://github.com/zadam/trilium.git
synced 2025-11-01 02:45:54 +01:00
skeleton of first tests
This commit is contained in:
@@ -1,117 +0,0 @@
|
||||
function lexer(str) {
|
||||
str = str.toLowerCase();
|
||||
|
||||
const fulltextTokens = [];
|
||||
const expressionTokens = [];
|
||||
|
||||
let quotes = false;
|
||||
let fulltextEnded = false;
|
||||
let currentWord = '';
|
||||
|
||||
function isOperatorSymbol(chr) {
|
||||
return ['=', '*', '>', '<', '!'].includes(chr);
|
||||
}
|
||||
|
||||
function previousOperatorSymbol() {
|
||||
if (currentWord.length === 0) {
|
||||
return false;
|
||||
}
|
||||
else {
|
||||
return isOperatorSymbol(currentWord[currentWord.length - 1]);
|
||||
}
|
||||
}
|
||||
|
||||
function finishWord() {
|
||||
if (currentWord === '') {
|
||||
return;
|
||||
}
|
||||
|
||||
if (fulltextEnded) {
|
||||
expressionTokens.push(currentWord);
|
||||
} else {
|
||||
fulltextTokens.push(currentWord);
|
||||
}
|
||||
|
||||
currentWord = '';
|
||||
}
|
||||
|
||||
for (let i = 0; i < str.length; i++) {
|
||||
const chr = str[i];
|
||||
|
||||
if (chr === '\\') {
|
||||
if ((i + 1) < str.length) {
|
||||
i++;
|
||||
|
||||
currentWord += str[i];
|
||||
}
|
||||
else {
|
||||
currentWord += chr;
|
||||
}
|
||||
|
||||
continue;
|
||||
}
|
||||
else if (['"', "'", '`'].includes(chr)) {
|
||||
if (!quotes) {
|
||||
if (currentWord.length === 0 || fulltextEnded) {
|
||||
if (previousOperatorSymbol()) {
|
||||
finishWord();
|
||||
}
|
||||
|
||||
quotes = chr;
|
||||
}
|
||||
else {
|
||||
// quote inside a word does not have special meening and does not break word
|
||||
// e.g. d'Artagnan is kept as a single token
|
||||
currentWord += chr;
|
||||
}
|
||||
}
|
||||
else if (quotes === chr) {
|
||||
quotes = false;
|
||||
|
||||
finishWord();
|
||||
}
|
||||
else {
|
||||
// it's a quote but within other kind of quotes so it's valid as a literal character
|
||||
currentWord += chr;
|
||||
}
|
||||
continue;
|
||||
}
|
||||
else if (!quotes) {
|
||||
if (currentWord.length === 0 && (chr === '#' || chr === '~')) {
|
||||
fulltextEnded = true;
|
||||
currentWord = chr;
|
||||
|
||||
continue;
|
||||
}
|
||||
else if (chr === ' ') {
|
||||
finishWord();
|
||||
continue;
|
||||
}
|
||||
else if (fulltextEnded && ['(', ')', '.'].includes(chr)) {
|
||||
finishWord();
|
||||
currentWord += chr;
|
||||
finishWord();
|
||||
continue;
|
||||
}
|
||||
else if (fulltextEnded && previousOperatorSymbol() !== isOperatorSymbol(chr)) {
|
||||
finishWord();
|
||||
|
||||
currentWord += chr;
|
||||
continue;
|
||||
}
|
||||
}
|
||||
|
||||
currentWord += chr;
|
||||
}
|
||||
|
||||
finishWord();
|
||||
|
||||
return {
|
||||
fulltextTokens,
|
||||
expressionTokens
|
||||
}
|
||||
}
|
||||
|
||||
export default {
|
||||
lexer
|
||||
}
|
||||
Reference in New Issue
Block a user