perf(tokenizer): skip known-word lookup in MeCab POS enrichment

This commit is contained in:
2026-03-02 01:38:37 -08:00
parent cde231b1ff
commit 83f13df627
3 changed files with 52 additions and 5 deletions

View File

@@ -211,8 +211,7 @@ export function createTokenizerDepsRuntime(
return null;
}
const isKnownWordLookup = options.getNPlusOneEnabled?.() === false ? () => false : options.isKnownWord;
return mergeTokens(rawTokens, isKnownWordLookup, options.getKnownWordMatchMode());
return mergeTokens(rawTokens, options.isKnownWord, options.getKnownWordMatchMode(), false);
},
enrichTokensWithMecab: async (tokens, mecabTokens) =>
enrichTokensWithMecabAsync(tokens, mecabTokens),