feat: Add Omnisearch support for regex search

This commit introduces the option to use Omnisearch as a backend for the regex search functionality, in addition to the existing ripgrep backend.
2025-06-09 09:40:16 +00:00 · 2025-06-09 09:40:16 +00:00 · 350a49cef9
commit 350a49cef9
parent 8915b84b04
8 changed files with 246 additions and 68 deletions
--- a/src/components/chat-view/ChatView.tsx
+++ b/src/components/chat-view/ChatView.tsx
@ -29,7 +29,8 @@ import {
 	LLMBaseUrlNotSetException,
 	LLMModelNotSetException,
 } from '../../core/llm/exception'
-import { regexSearchFiles } from '../../core/ripgrep'
+import { regexSearchFilesWithRipgrep } from '../../core/regex/ripgrep-index'
 import { regexSearchFilesWithOmnisearch } from '../../core/regex/omnisearch-index'
 import { useChatHistory } from '../../hooks/use-chat-history'
 import { useCustomModes } from '../../hooks/use-custom-mode'
 import { t } from '../../lang/helpers'
@ -609,10 +610,16 @@ const Chat = forwardRef<ChatRef, ChatProps>((props, ref) => {
 					}
 				} else if (toolArgs.type === 'regex_search_files') {
 					// @ts-expect-error Obsidian API type mismatch
 					const searchBackend = settings.regexSearchBackend
 					const baseVaultPath = String(app.vault.adapter.getBasePath())
 					const ripgrepPath = settings.ripgrepPath
 					const absolutePath = path.join(baseVaultPath, toolArgs.filepath)
-					const results = await regexSearchFiles(absolutePath, toolArgs.regex, ripgrepPath)
+					let results: string;
 					if (searchBackend === 'omnisearch') {
 						results = await regexSearchFilesWithOmnisearch(absolutePath, toolArgs.regex, app)
 					} else {
 						const ripgrepPath = settings.ripgrepPath
 						results = await regexSearchFilesWithRipgrep(absolutePath, toolArgs.regex, ripgrepPath)
 					}
 					const formattedContent = `[regex_search_files for '${toolArgs.filepath}'] Result:\n${results}\n`;
 					return {
 						type: 'regex_search_files',
--- a/src/core/regex/omnisearch-index.ts
+++ b/src/core/regex/omnisearch-index.ts
@ -0,0 +1,140 @@
 import { App } from "obsidian";
 import {
 	MAX_RESULTS,
 	truncateLine,
 	SearchResult,
 	formatResults,
 } from './regex-common';
 // --- Omnisearch API and Helper Types ---
 // Local declarations describing the object this module reads from `window.omnisearch`.
 // NOTE(review): presumably mirrors the Omnisearch plugin's public API typings — confirm against its docs.

 /** A single match inside a result note. */
 type SearchMatchApi = {
 	// Matched text (not read by this module)
 	match: string;
 	// Position of the match; this module passes it to findLineAndColumnFromOffset
 	// as a character offset into the file text returned by app.vault.adapter.read
 	offset: number;
 };
 /** One entry of the array resolved by `OmnisearchApi.search`. */
 type ResultNoteApi = {
 	score: number;
 	vault: string;
 	// Handed to app.vault.adapter.read, so presumably vault-relative — TODO confirm
 	path: string;
 	basename: string;
 	foundWords: string[];
 	// Entries without matches are skipped by regexSearchFilesWithOmnisearch
 	matches: SearchMatchApi[];
 	excerpt: string;
 };
 /** The subset of the Omnisearch API used by this module. */
 type OmnisearchApi = {
 	search: (query: string) => Promise<ResultNoteApi[]>;
 	// ... other API methods
 };
 declare global {
 	interface Window {
 		// NOTE(review): declared as always present, yet isOmnisearchAvailable() guards
 		// against it being missing at runtime — consider making this optional.
 		omnisearch: OmnisearchApi;
 	}
 }
 /**
  * Checks if the Omnisearch plugin's API is available.
  *
  * Uses optional chaining plus `typeof` so the result is always a strict boolean;
  * an `a && b` check would evaluate to `undefined` when `window.omnisearch` is missing.
  * @returns True if `window.omnisearch.search` is a function, false otherwise.
  */
 function isOmnisearchAvailable(): boolean {
 	return typeof window.omnisearch?.search === "function";
 }
 /**
  * Finds the line number, column number, and content for a given character offset in a file.
  *
  * Line and column numbers are 0-based. An offset that is negative or lies past the
  * end of the text yields the sentinel `{ lineNumber: -1, columnNumber: -1, lineContent: "" }`.
  * @param allLines All lines in the file, as produced by splitting its text on "\n".
  * @param offset The character offset of the match.
  * @returns An object with line number, column number, and the full line content.
  */
 function findLineAndColumnFromOffset(
 	allLines: string[],
 	offset: number
 ): { lineNumber: number; columnNumber: number; lineContent: string } {
 	const notFound = { lineNumber: -1, columnNumber: -1, lineContent: "" };
 	// A negative offset cannot point into the text; without this guard it would be
 	// reported as a hit on line 0 with a negative column.
 	if (offset < 0) {
 		return notFound;
 	}
 	let lineStart = 0;
 	for (let i = 0; i < allLines.length; i++) {
 		const line = allLines[i];
 		// +1 accounts for the "\n" separator removed by the split. For "\r\n" files the
 		// "\r" is still part of `line`, so it is already counted in `line.length`.
 		const nextLineStart = lineStart + line.length + 1;
 		if (offset < nextLineStart) {
 			return { lineNumber: i, columnNumber: offset - lineStart, lineContent: line };
 		}
 		lineStart = nextLineStart;
 	}
 	return notFound;
 }
 /**
  * Searches using Omnisearch and builds one line of context before and after each
  * match, then formats the hits with the same `formatResults` helper the ripgrep backend uses.
  *
  * This function does not reject: every outcome is reported through the returned string.
  * - Plugin missing or inactive: returns the install/enable hint.
  * - No hits: returns "No results found.".
  * - Unexpected failure: logs the error and returns a generic error message.
  *
  * NOTE(review): `result.path` is handed to `app.vault.adapter.read`, so it is presumably
  * vault-relative, while `formatResults` relativizes it against the absolute `vaultPath`.
  * Confirm the displayed paths are correct and whether hits outside the requested
  * directory should be filtered out.
  *
  * @param vaultPath The absolute path of the vault for making relative paths.
  * @param query The search query for Omnisearch. Note: Omnisearch does not support full regex.
  * @param app The Obsidian App instance.
  * @returns A formatted string of search results, or a human-readable status message.
  */
 export async function regexSearchFilesWithOmnisearch(
 	vaultPath: string,
 	query: string,
 	app: App,
 ): Promise<string> {
 	try {
 		if (!isOmnisearchAvailable()) {
 			// Return the actionable message itself; throwing it would only surface
 			// the generic error text from the catch block below.
 			return "Omnisearch plugin not found or not active. Please install and enable it to use this search feature.";
 		}
 		// Omnisearch is not a regex engine. The function name is kept for consistency
 		// but the `query` will be treated as a keyword/fuzzy search by the plugin.
 		const apiResults = await window.omnisearch.search(query);
 		if (!apiResults || apiResults.length === 0) {
 			// An empty result set is a normal outcome, not an error.
 			return "No results found.";
 		}
 		const results: SearchResult[] = [];
 		for (const result of apiResults) {
 			if (results.length >= MAX_RESULTS) {
 				break; // Stop processing new files if we have enough results
 			}
 			if (!result.matches || result.matches.length === 0) continue;
 			let fileContent: string;
 			try {
 				fileContent = await app.vault.adapter.read(result.path);
 			} catch (readError) {
 				// One unreadable file must not discard the hits found in the others.
 				console.warn(`Omnisearch: skipping unreadable file "${result.path}":`, readError);
 				continue;
 			}
 			const allLines = fileContent.split("\n");
 			for (const match of result.matches) {
 				if (results.length >= MAX_RESULTS) {
 					break; // Stop processing matches if we have enough results
 				}
 				const { lineNumber, columnNumber, lineContent } = findLineAndColumnFromOffset(
 					allLines,
 					match.offset
 				);
 				// -1 means the offset did not fall inside the file text that was read.
 				if (lineNumber === -1) continue;
 				const searchResult: SearchResult = {
 					file: result.path,
 					line: lineNumber + 1, // ripgrep is 1-based, so we adjust
 					column: columnNumber + 1,
 					match: truncateLine(lineContent.trimEnd()),
 					beforeContext: lineNumber > 0 ? [truncateLine(allLines[lineNumber - 1].trimEnd())] : [],
 					afterContext:
 						lineNumber < allLines.length - 1
 							? [truncateLine(allLines[lineNumber + 1].trimEnd())]
 							: [],
 				};
 				results.push(searchResult);
 			}
 		}
 		return formatResults(results, vaultPath);
 	} catch (error) {
 		console.error("Error during Omnisearch processing:", error);
 		return "An error occurred during the search.";
 	}
 }
--- a/src/core/regex/regex-common.ts
+++ b/src/core/regex/regex-common.ts
@ -0,0 +1,63 @@
 import * as path from "path"
 // Limits shared by the regex search backends
 export const MAX_RESULTS = 300
 export const MAX_LINE_LENGTH = 500
 /**
  * Caps a line at a maximum number of characters.
  * @param line The text to cap
  * @param maxLength Longest length returned untouched (defaults to MAX_LINE_LENGTH)
  * @returns `line` unchanged when it fits; otherwise its first `maxLength` characters
  * followed by " [truncated...]"
  */
 export function truncateLine(line: string, maxLength: number = MAX_LINE_LENGTH): string {
 	const exceedsLimit = line.length > maxLength
 	if (!exceedsLimit) {
 		return line
 	}
 	const head = line.substring(0, maxLength)
 	return head + " [truncated...]"
 }
 /**
  * One search hit together with the context lines shown around it.
  */
 export interface SearchResult {
 	// Path of the file containing the hit; formatResults relativizes it against its `cwd` argument
 	file: string
 	// Line number of the hit (the Omnisearch backend stores a 1-based value)
 	line: number
 	// Column of the hit, when known (the Omnisearch backend stores a 1-based value)
 	column?: number
 	// Text of the matching line; formatResults prints an empty line when it is absent
 	match?: string
 	// Lines that formatResults prints before `match`
 	beforeContext: string[]
 	// Lines that formatResults prints after `match`
 	afterContext: string[]
 }
 /**
  * Renders search results as text: a summary line, then one section per file
  * listing each hit's before-context, match line and after-context.
  * @param results The hits to render; only the first MAX_RESULTS are printed
  * @param cwd Directory against which each result's `file` is made relative
  * @returns The formatted report with surrounding whitespace trimmed
  */
 export function formatResults(results: SearchResult[], cwd: string): string {
 	// A Map (rather than a plain object) keeps grouping safe for relative paths such as
 	// "constructor" or "__proto__", which collide with Object.prototype members and
 	// would otherwise make the `.push` below throw.
 	const groupedResults = new Map<string, SearchResult[]>()
 	let output = ""
 	if (results.length >= MAX_RESULTS) {
 		output += `Showing first ${MAX_RESULTS} of ${MAX_RESULTS}+ results. Use a more specific search if necessary.\n\n`
 	} else {
 		output += `Found ${results.length === 1 ? "1 result" : `${results.length.toLocaleString()} results`}.\n\n`
 	}
 	// Group results by file name, preserving first-seen order
 	for (const result of results.slice(0, MAX_RESULTS)) {
 		const relativeFilePath = path.relative(cwd, result.file)
 		const group = groupedResults.get(relativeFilePath)
 		if (group) {
 			group.push(result)
 		} else {
 			groupedResults.set(relativeFilePath, [result])
 		}
 	}
 	for (const [filePath, fileResults] of groupedResults) {
 		output += `${filePath.toPosix()}\n│----\n`
 		fileResults.forEach((result, index) => {
 			const allLines = [...result.beforeContext, result.match, ...result.afterContext]
 			allLines.forEach((line) => {
 				// A missing match line is printed as an empty row
 				output += `│${line?.trimEnd() ?? ""}\n`
 			})
 			// Separator between hits of the same file (the closing rule is added below)
 			if (index < fileResults.length - 1) {
 				output += "│----\n"
 			}
 		})
 		output += "│----\n\n"
 	}
 	return output.trim()
 }
--- a/src/core/regex/ripgrep-index.ts
+++ b/src/core/regex/ripgrep-index.ts
@ -3,33 +3,16 @@ import * as childProcess from "child_process"
 import * as fs from "fs"
 import * as path from "path"
 import * as readline from "readline"
 import {
 	MAX_RESULTS,
 	truncateLine,
 	SearchResult,
 	formatResults
 } from './regex-common'
 const isWindows = /^win/.test(process.platform)
 const binName = isWindows ? "rg.exe" : "rg"
 /**
  * One search hit together with the context lines shown around it.
  */
 interface SearchResult {
 	// Path of the file containing the hit; formatResults relativizes it against its `cwd` argument
 	file: string
 	// Line of the hit — presumably as reported by ripgrep; TODO confirm numbering base
 	line: number
 	// Column of the hit — presumably as reported by ripgrep; TODO confirm numbering base
 	column: number
 	// Text of the matching line
 	match: string
 	// Lines that formatResults prints before `match`
 	beforeContext: string[]
 	// Lines that formatResults prints after `match`
 	afterContext: string[]
 }
 // Output limits for search results
 const MAX_RESULTS = 300
 const MAX_LINE_LENGTH = 500
 /**
  * Caps a line at a maximum number of characters.
  * @param line The text to cap
  * @param maxLength Longest length returned untouched (defaults to MAX_LINE_LENGTH)
  * @returns `line` unchanged when it fits; otherwise its first `maxLength` characters
  * followed by " [truncated...]"
  */
 export function truncateLine(line: string, maxLength: number = MAX_LINE_LENGTH): string {
 	const exceedsLimit = line.length > maxLength
 	if (!exceedsLimit) {
 		return line
 	}
 	const head = line.substring(0, maxLength)
 	return head + " [truncated...]"
 }
 async function getBinPath(ripgrepPath: string): Promise<string | undefined> {
 	const binPath = path.join(ripgrepPath, binName)
 	return (await pathExists(binPath)) ? binPath : undefined
@ -83,7 +66,7 @@ async function execRipgrep(bin: string, args: string[]): Promise<string> {
 	})
 }
-export async function regexSearchFiles(
+export async function regexSearchFilesWithRipgrep(
 	directoryPath: string,
 	regex: string,
 	ripgrepPath: string,
@ -162,42 +145,3 @@ export async function regexSearchFiles(
 	return formatResults(results, directoryPath)
 }
 /**
  * Renders search results as text: a summary line, then one section per file
  * listing each hit's before-context, match line and after-context.
  * @param results The hits to render; only the first MAX_RESULTS are printed
  * @param cwd Directory against which each result's `file` is made relative
  * @returns The formatted report with surrounding whitespace trimmed
  */
 function formatResults(results: SearchResult[], cwd: string): string {
 	// A Map (rather than a plain object) keeps grouping safe for relative paths such as
 	// "constructor" or "__proto__", which collide with Object.prototype members and
 	// would otherwise make the `.push` below throw.
 	const groupedResults = new Map<string, SearchResult[]>()
 	let output = ""
 	if (results.length >= MAX_RESULTS) {
 		output += `Showing first ${MAX_RESULTS} of ${MAX_RESULTS}+ results. Use a more specific search if necessary.\n\n`
 	} else {
 		output += `Found ${results.length === 1 ? "1 result" : `${results.length.toLocaleString()} results`}.\n\n`
 	}
 	// Group results by file name, preserving first-seen order
 	for (const result of results.slice(0, MAX_RESULTS)) {
 		const relativeFilePath = path.relative(cwd, result.file)
 		const group = groupedResults.get(relativeFilePath)
 		if (group) {
 			group.push(result)
 		} else {
 			groupedResults.set(relativeFilePath, [result])
 		}
 	}
 	for (const [filePath, fileResults] of groupedResults) {
 		output += `${filePath.toPosix()}\n│----\n`
 		fileResults.forEach((result, index) => {
 			const allLines = [...result.beforeContext, result.match, ...result.afterContext]
 			allLines.forEach((line) => {
 				// A missing match line is printed as an empty row
 				output += `│${line?.trimEnd() ?? ""}\n`
 			})
 			// Separator between hits of the same file (the closing rule is added below)
 			if (index < fileResults.length - 1) {
 				output += "│----\n"
 			}
 		})
 		output += "│----\n\n"
 	}
 	return output.trim()
 }
--- a/src/lang/locale/en.ts
+++ b/src/lang/locale/en.ts
@ -227,8 +227,12 @@ export default {
 			auto: 'Auto',
 			semantic: 'Semantic',
 			regex: 'Regex',
 			regexBackend: 'Regex search backend',
 			regexBackendDescription: 'Choose the backend for regex search method.',
 			ripgrep: 'ripgrep',
 			omnisearch: 'Omnisearch',
 			ripgrepPath: 'ripgrep path',
-			ripgrepPathDescription: 'Path to the ripgrep binary. When using regex search, this is required.',
+			ripgrepPathDescription: 'Path to the ripgrep binary. When using ripgrep regex search, this is required.',
 		},
 		// Chat Behavior Section
--- a/src/lang/locale/zh-cn.ts
+++ b/src/lang/locale/zh-cn.ts
@ -228,8 +228,12 @@ export default {
 			auto: '自动',
 			semantic: '语义',
 			regex: '正则',
 			regexBackend: '正则搜索后端',
 			regexBackendDescription: '选择正则搜索的后端。',
 			ripgrep: 'ripgrep',
 			omnisearch: 'Omnisearch',
 			ripgrepPath: 'ripgrep 路径',
-			ripgrepPathDescription: 'ripgrep 二进制文件的路径。使用正则搜索时需要此项。',
+			ripgrepPathDescription: 'ripgrep 二进制文件的路径。使用 ripgrep 正则搜索时需要此项。',
 		},
 		// 聊天行为部分
--- a/src/settings/SettingTab.tsx
+++ b/src/settings/SettingTab.tsx
@ -163,6 +163,21 @@ export class InfioSettingTab extends PluginSettingTab {
 						})
 					}),
 			)
 			new Setting(containerEl)
 			.setName(t('settings.FilesSearch.regexBackend'))
 			.setDesc(t('settings.FilesSearch.regexBackendDescription'))
 			.addDropdown((dropdown) =>
 				dropdown
 					.addOption('ripgrep', t('settings.FilesSearch.ripgrep'))
 					.addOption('omnisearch', t('settings.FilesSearch.omnisearch'))
 					.setValue(this.plugin.settings.regexSearchBackend)
 					.onChange(async (value) => {
 						await this.plugin.setSettings({
 							...this.plugin.settings,
 							regexSearchBackend: value as 'ripgrep' | 'omnisearch',
 						})
 					}),
 			)
 		new Setting(containerEl)
 			.setName(t('settings.FilesSearch.ripgrepPath'))
 			.setDesc(t('settings.FilesSearch.ripgrepPathDescription'))
--- a/src/types/settings.ts
+++ b/src/types/settings.ts
@ -261,6 +261,7 @@ export const InfioSettingsSchema = z.object({
 	// Files Search
 	filesSearchMethod: z.enum(['regex', 'semantic', 'auto']).catch('auto'),
 	regexSearchBackend: z.enum(['omnisearch', 'ripgrep']).catch('ripgrep'),
 	ripgrepPath: z.string().catch(''),
 	/// [compatible]