Added types

Hugos68 · May 25, 2024 · 8dcc9bc · 8dcc9bc
1 parent 20c545a
commit 8dcc9bc
Show file tree

Hide file tree

Showing 6 changed files with 327 additions and 6 deletions.
diff --git a/.changeset/poor-lizards-greet.md b/.changeset/poor-lizards-greet.md
@@ -0,0 +1,5 @@
+---
+"vite-plugin-pagefind": patch
+---
+
+Added defaults per config options
diff --git a/.changeset/small-dogs-fail.md b/.changeset/small-dogs-fail.md
@@ -0,0 +1,5 @@
+---
+"vite-plugin-pagefind": patch
+---
+
+Added `/types` export for easier use
diff --git a/README.md b/README.md
@@ -57,22 +57,44 @@ Note: If your framework does not have a `vite.config` checkout the [examples](#e
 }
 ```
 
+Note: `vite-plugin-pagefind` currently only supports `.json` files, more will be supported in the future.
+
 ## Config
 
+### site
+
+The directory where your build output lives, this is required for both pagefind and this plugin.
+
 ### assets_dir
 
 The directory where the static assets are located relative to the project's root as specified in the vite config.
 
+_default_: 'public'
+
+### build_command
+
+The command to build and index the project.
+
+_default_: 'npm run build'
+
 ### dev_strategy
 
 The indexing strategy used during development:
 
 -   "eager": Build and index the app every time the development server starts
 -   "lazy": Build and index the app only if the pagefind bundle isn't present already
 
-### build_command
+_default_: 'lazy'
 
-The command to build and index the project.
+## Types
+
+Apart from the plugin, this package also exposes [the types from pagefind](https://github.com/CloudCannon/pagefind/blob/production-docs/pagefind_web_js/types/index.d.ts) as well as extending them by providing an additional `Pagefind` type:
+
+```ts
+import type { Pagefind } from 'vite-plugin-pagefind/types';
+
+const pagefind: Pagefind = await import('/pagefind/pagefind.js');
+```
 
 ## Examples
 

diff --git a/package.json b/package.json
@@ -14,7 +14,10 @@
 		"access": "public"
 	},
 	"license": "MIT",
-	"main": "dist/index.js",
+	"exports": {
+		".": "./dist/index.js",
+		"./types": "./dist/types.d.ts"
+	},
 	"files": [
 		"dist"
 	],

diff --git a/src/types.ts b/src/types.ts
@@ -0,0 +1,286 @@
+/**
+ * https://github.com/CloudCannon/pagefind/blob/production-docs/pagefind_web_js/types/index.d.ts
+ * Original Author: bglw, CloudCannon
+ */
+
+/** Global index options that can be passed to pagefind.options() */
+export type PagefindIndexOptions = {
+	/** Overrides the URL path that Pagefind uses to load its search bundle */
+	basePath?: string;
+	/** Appends the given baseURL to all search results. May be a path, or a full domain */
+	baseUrl?: string;
+	/** The maximum length of excerpts that Pagefind should generate for search results. Default to 30 */
+	excerptLength?: number;
+	/**
+	 * Multiply all rankings for this index by the given weight.
+	 *
+	 * Only applies in multisite setups, where one site should rank higher or lower than others.
+	 */
+	indexWeight?: number;
+	/**
+	 * Merge this filter object into all search queries in this index.
+	 *
+	 * Only applies in multisite setups.
+	 */
+	mergeFilter?: Object;
+	/**
+	 * If set, will ass the search term as a query parameter under this key, for use with Pagefind's highlighting script.
+	 */
+	highlightParam?: string;
+	language?: string;
+	/**
+	 * Whether an instance of Pagefind is the primary index or not (for multisite).
+	 *
+	 * This is set for you automatically, so it is unlikely you should set this directly.
+	 */
+	primary?: boolean;
+	/**
+	 * Provides the ability to fine tune Pagefind's ranking algorithm to better suit your dataset.
+	 */
+	ranking?: PagefindRankingWeights;
+};
+
+export type PagefindRankingWeights = {
+	/**
+            Controls page ranking based on similarity of terms to the search query (in length).
+            Increasing this number means pages rank higher when they contain words very close to the query,
+            e.g. if searching for `part` then `party` will boost a page higher than one containing `partition`.
+            Minimum value is 0.0, where `party` and `partition` would be viewed equally.
+        */
+	termSimilarity?: Number;
+	/**
+            Controls how much effect the average page length has on ranking.
+            Maximum value is 1.0, where ranking will strongly favour pages that are shorter than the average page on the site.
+            Minimum value is 0.0, where ranking will exclusively look at term frequency, regardless of how long a document is.
+        */
+	pageLength?: Number;
+	/**
+            Controls how quickly a term saturates on the page and reduces impact on the ranking.
+            Maximum value is 2.0, where pages will take a long time to saturate, and pages with very high term frequencies will take over.
+            As this number trends to 0, it does not take many terms to saturate and allow other paramaters to influence the ranking.
+            Minimum value is 0.0, where terms will saturate immediately and results will not distinguish between one term and many.
+        */
+	termSaturation?: Number;
+	/**
+            Controls how much ranking uses term frequency versus raw term count.
+            Maximum value is 1.0, where term frequency fully applies and is the main ranking factor.
+            Minimum value is 0.0, where term frequency does not apply, and pages are ranked based on the raw sum of words and weights.
+            Values between 0.0 and 1.0 will interpolate between the two ranking methods.
+            Reducing this number is a good way to boost longer documents in your search results, as they no longer get penalized for having a low term frequency.
+         */
+	termFrequency?: Number;
+};
+
+/** Options that can be passed to pagefind.search() */
+export type PagefindSearchOptions = {
+	/** If set, this call will load all assets but return before searching. Prefer using pagefind.preload() instead */
+	preload?: boolean;
+	/** Add more verbose console logging for this search query */
+	verbose?: boolean;
+	/** The set of filters to execute with this search. Input type is extremely flexible, see the filtering docs for details */
+	filters?: Object;
+	/** The set of sorts to use for this search, instead of relevancy */
+	sort?: Object;
+};
+
+/** Filter counts returned from pagefind.filters(), and alongside results from pagefind.search() */
+export type PagefindFilterCounts = Record<string, Record<string, number>>;
+
+/** The main results object returned from a call to pagefind.search() */
+export type PagefindSearchResults = {
+	/** All pages that match the search query and filters provided */
+	results: PagefindSearchResult[];
+	/** How many results would there have been if you had omitted the filters */
+	unfilteredResultCount: number;
+	/** Given the query and filters provided, how many remaining results are there under each filter? */
+	filters: PagefindFilterCounts;
+	/** If the searched filters were removed, how many total results for each filter are there? */
+	totalFilters: PagefindFilterCounts;
+	/** Information on how long it took Pagefind to execute this query */
+	timings: {
+		preload: number;
+		search: number;
+		total: number;
+	};
+};
+
+/** A single result from a search query, before actual data has been loaded */
+export type PagefindSearchResult = {
+	/** Pagefind's internal ID for this page, unique across the site */
+	id: string;
+	/** Pagefind's internal score for your query matching this page, that is used when ranking these results */
+	score: number;
+	/** The locations of all matching words in this page */
+	words: number[];
+	/**
+	 * Calling data() loads the final data fragment needed to display this result.
+	 *
+	 * Only call this when you need to display the data, rather than all at once.
+	 * (e.g. one page as a time, or in a scroll listener)
+	 * */
+	data: () => Promise<PagefindSearchFragment>;
+};
+
+/** The useful data Pagefind provides for a search result */
+export type PagefindSearchFragment = {
+	/** Pagefind's processed URL for this page. Will include the baseUrl if configured */
+	url: string;
+	/** Pagefind's unprocessed URL for this page */
+	raw_url?: string;
+	/** The full processed content text of this page */
+	content: string;
+	/** Internal type — ignore for now */
+	raw_content?: string;
+	/** The processed excerpt for this result, with matching terms wrapping in `<mark>` elements */
+	excerpt: string;
+	/**
+	 * What regions of the page matched this search query?
+	 *
+	 * Precalculates based on h1->6 tags with IDs, using the text between each.
+	 */
+	sub_results: PagefindSubResult[];
+	/** How many total words are there on this page? */
+	word_count: number;
+	/** The locations of all matching words in this page */
+	locations: number[];
+	/**
+	 * The locations of all matching words in this page,
+	 * paired with data about their weight and relevance to this query
+	 */
+	weighted_locations: PagefindWordLocation[];
+	/** The filter keys and values this page was tagged with */
+	filters: Record<string, string[]>;
+	/** The metadata keys and values this page was tagged with */
+	meta: Record<string, string>;
+	/**
+	 * The raw anchor data that Pagefind used to generate sub_results.
+	 *
+	 * Contains _all_ elements that had IDs on the page, so can be used to
+	 * implement your own sub result calculations with different semantics.
+	 */
+	anchors: PagefindSearchAnchor[];
+};
+
+/** Data for a matched section within a page */
+export type PagefindSubResult = {
+	/**
+	 * Title of this sub result — derived from the heading content.
+	 *
+	 * If this is a result for the section of the page before any headings with IDs,
+	 * this will be the same as the page's meta.title value.
+	 */
+	title: string;
+	/**
+	 * Direct URL to this sub result, comprised of the page's URL plus the hash string of the heading.
+	 *
+	 * If this is a result for the section of the page before any headings with IDs,
+	 * this will be the same as the page URL.
+	 */
+	url: string;
+	/** The locations of all matching words in this segment */
+	locations: number[];
+	/**
+	 * The locations of all matching words in this segment,
+	 * paired with data about their weight and relevance to this query
+	 */
+	weighted_locations: PagefindWordLocation[];
+	/** The processed excerpt for this segment, with matching terms wrapping in `<mark>` elements */
+	excerpt: string;
+	/**
+	 * Raw data about the anchor element associated with this sub result.
+	 *
+	 * The omission of this field means this sub result is for text found on the page
+	 * before the first heading that had an ID.
+	 */
+	anchor?: PagefindSearchAnchor;
+};
+
+/** Information about a matching word on a page */
+export type PagefindWordLocation = {
+	/** The weight that this word was originally tagged as */
+	weight: number;
+	/**
+	 * An internal score that Pagefind calculated for this word.
+	 *
+	 * The absolute value is somewhat meaningless, but the value can be used
+	 * in comparison to other values in this set of search results to perform custom ranking.
+	 */
+	balanced_score: number;
+	/**
+	 * The index of this word in the result content.
+	 *
+	 * Splitting the content key by whitespacing and indexing by this number
+	 * will yield the correct word.
+	 */
+	location: number;
+};
+
+/** Raw data about elements with IDs that Pagefind encountered when indexing the page */
+export type PagefindSearchAnchor = {
+	/** What element type was this anchor? e.g. `h1`, `div` */
+	element: string;
+	/** The raw id="..." attribute contents of the element */
+	id: string;
+	/**
+	 * The text content of this element.
+	 *
+	 * In order to prevent repeating most of the page data for every anchor,
+	 * Pagefind will only take top level text nodes, or text nodes nested within
+	 * inline elements such as <a> and <span>.
+	 */
+	text?: string;
+	/**
+	 * The position of this anchor in the result content.
+	 * Splitting the content key by whitespacing and indexing by this number
+	 * will yield the first word indexed after this element's ID was found.
+	 */
+	location: number;
+};
+
+/**
+ * The Pagefind API object that is returned when importing the pagefind module.
+ */
+export type Pagefind = {
+	/**
+	 * Searches the Pagefind index for the given term with a debounce.
+	 */
+	debouncedSearch: (
+		query: string,
+		options?: PagefindSearchOptions,
+		duration?: number
+	) => Promise<PagefindSearchResults>;
+	/**
+	 * Destroys the Pagefind instance.
+	 */
+	destroy: () => Promise<void>;
+	/**
+	 * Returns the filter counts for the current index.
+	 */
+	filters: () => Promise<PagefindFilterCounts>;
+	/**
+	 * Initializes the Pagefind instance.
+	 */
+	init: () => Promise<void>;
+	/**
+	 * Merges the given index into the current index.
+	 */
+	mergeIndex: (
+		indexPath: string,
+		options?: Record<string, unknown>
+	) => Promise<void>;
+	/**
+	 * Configures the Pagefind instance with options.
+	 */
+	options: (options: PagefindIndexOptions) => Promise<void>;
+	/**
+	 * Preloads the results for the given term.
+	 */
+	preload: (term: string, options?: PagefindIndexOptions) => Promise<void>;
+	/**
+	 * Searches the Pagefind index for the given term.
+	 */
+	search: (
+		term: string,
+		options?: PagefindSearchOptions
+	) => Promise<PagefindSearchResults>;
+};
diff --git a/src/util/config.ts b/src/util/config.ts
@@ -5,9 +5,9 @@ import { readFileSync } from 'fs';
 const PagefindConfigSchema = v.object({
 	site: v.string(),
 	vite_plugin_pagefind: v.object({
-		assets_dir: v.string(),
-		build_command: v.string(),
-		dev_strategy: v.string()
+		assets_dir: v.optional(v.string(), 'public'),
+		build_command: v.optional(v.string(), 'npm run build'),
+		dev_strategy: v.optional(v.string(), 'lazy')
 	})
 });