improve: tokenizing function names and camel case strings (#34)

2024-09-11 12:59:09 +03:00 · 2023-04-27 18:38:22 +02:00 · 2023-04-27 18:38:22 +02:00 · 24cacef89e
commit 24cacef89e
parent c707bd74a7
3 changed files with 27 additions and 17 deletions
--- a/website/components/NixFunctions/nixFunctions.tsx
+++ b/website/components/NixFunctions/nixFunctions.tsx
@ -31,9 +31,33 @@ export function NixFunctions(props: FunctionsProps) {
        boost += id.includes(term) ? 10 : 0;
        return boost;
      },
+      boost: {
+        id: 10,
+        name: 8,
+        category: 6,
+        example: 0.5,
+        fn_type: 3,
+        description: 1,
+      },
    },
-    tokenize: (text: string): string[] => {
-      const tokens = text.split(/\W|(?=[A-Z])/);
+    tokenize: (text: string, fieldName): string[] => {
+      // Split the text into words on every non-word character (\W); fieldName is not used here.
+      const wordTokens = text.split(/\W/);
+      const containsUpper = (w: string) => Boolean(w.match(/[A-Z]/)?.length);
+      const tokens = [
+        // Keep each word that contains an uppercase letter (A-Z) as a whole token,
+        // e.g. mapAttrs -> mapAttrs
+        ...wordTokens.filter(containsUpper),
+        // and additionally split those same words in front of every uppercase letter,
+        // e.g. mapAttrs -> [map, Attrs]
+        ...wordTokens
+          .filter(containsUpper)
+          .map((t) => t.split(/(?=[A-Z])/))
+          .flat(),
+        // Words without any uppercase letter are included unchanged, with no further splitting,
+        // e.g. map -> map
+        ...wordTokens.filter((w) => !containsUpper(w)),
+      ];
      return tokens;
    },
  });
--- a/website/components/basicList/basicList.tsx
+++ b/website/components/basicList/basicList.tsx
@ -62,16 +62,7 @@ export function BasicList(props: BasicListProps) {

  const handleSearch = (term: string) => {
    setTerm(term);
-    search(term, {
-      boost: {
-        id: 10,
-        name: 8,
-        category: 6,
-        example: 0.5,
-        fn_type: 3,
-        description: 1,
-      },
-    });
+    search(term);
    setPage(1);
  };

--- a/website/queries/byQuery.ts
+++ b/website/queries/byQuery.ts
@ -1,9 +1,4 @@
 import { DocItem, MetaData } from "../models/nix";
-// import MiniSearch from 'minisearch'
-
-// export const byMinisearch = (term: string, miniSearch: MiniSearch<DocItem> ) => (data: MetaData): MetaData => {
-//    return miniSearch.search(term);
-// }

 export const byQuery =
 (rawTerm: string) =>