aho-corasick.ts 1.8 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889
  1. interface Node {
  2. /** @default false */
  3. wordEnd: boolean,
  4. children: Map<string, Node | undefined>,
  5. fail: Node | undefined
  6. }
  7. const createNode = (): Node => ({
  8. wordEnd: false,
  9. children: new Map(),
  10. fail: undefined
  11. });
  12. const createKeywordFilter = (keys: string[] | Set<string>) => {
  13. const root = createNode();
  14. const put = (key: string, len = key.length) => {
  15. let node = root;
  16. const lastIdx = len - 1;
  17. for (let idx = 0; idx < len; idx++) {
  18. const char = key[idx];
  19. if (node.children.has(char)) {
  20. node = node.children.get(char)!;
  21. } else {
  22. const newNode = createNode();
  23. node.children.set(char, newNode);
  24. node = newNode;
  25. }
  26. if (lastIdx === idx && node !== root) {
  27. node.wordEnd = true;
  28. }
  29. }
  30. };
  31. keys.forEach(k => put(k));
  32. // const build = () => {
  33. const queue: Node[] = [];
  34. queue.push(root);
  35. let idx = 0;
  36. while (queue.length > idx) {
  37. const beginNode = queue[idx];
  38. const children = beginNode.children;
  39. children.forEach((node, char) => {
  40. let failNode = beginNode.fail;
  41. while (failNode && !failNode.children.has(char)) {
  42. failNode = failNode.fail;
  43. }
  44. if (node) {
  45. node.fail = failNode?.children.get(char) || root;
  46. queue.push(node);
  47. }
  48. });
  49. idx++;
  50. }
  51. // };
  52. // build();
  53. return (text: string) => {
  54. let node: Node | undefined = root;
  55. for (let i = 0, textLen = text.length; i < textLen; i++) {
  56. // const key = text.charAt(i);
  57. const char = text[i];
  58. while (node && !node.children.has(char)) {
  59. node = node.fail;
  60. }
  61. node = node?.children.get(char) || root;
  62. if (node.wordEnd) {
  63. return true;
  64. }
  65. }
  66. return false;
  67. };
  68. };
  69. export default createKeywordFilter;