update buildin mcp tools

2025-06-08 22:33:01 +08:00
parent 2b571f67a7
commit 4053214078
10 changed files with 996 additions and 91 deletions
--- a/src/utils/prompt-generator.ts
+++ b/src/utils/prompt-generator.ts
@@ -1,4 +1,4 @@
-import { App, MarkdownView, TAbstractFile, TFile, TFolder, Vault, getLanguage, htmlToMarkdown, requestUrl } from 'obsidian'
+import { App, MarkdownView, TAbstractFile, TFile, TFolder, Vault, getLanguage, htmlToMarkdown, normalizePath, requestUrl } from 'obsidian'

 import { editorStateToPlainText } from '../components/chat-view/chat-input/utils/editor-state-to-plain-text'
 import { QueryProgressState } from '../components/chat-view/QueryProgress'
@@ -21,10 +21,8 @@ import { InfioSettings } from '../types/settings'
 import { CustomModePrompts, Mode, ModeConfig, getFullModeDetails } from "../utils/modes"

 import {
-	readTFileContent,
-	readMultipleTFiles,
-	getNestedFiles,
-	parsePdfContent
+	parsePdfContent,
+	readTFileContent
 } from './obsidian'
 import { tokenCount } from './token'
 import { isVideoUrl, isYoutubeUrl } from './video-detector'
@@ -70,7 +68,11 @@ async function getFolderTreeContent(path: TFolder): Promise<string> {
 	}
 }

-async function getFileOrFolderContent(path: TAbstractFile, vault: Vault, app?: App): Promise<string> {
+async function getFileOrFolderContent(
+	path: TAbstractFile,
+	vault: Vault,
+	app?: App
+): Promise<string> {
 	try {
 		if (path instanceof TFile) {
 			if (path.extension === 'pdf') {
@@ -184,7 +186,7 @@ export class PromptGenerator {
 		}
 		const isNewChat = messages.filter(message => message.role === 'user').length === 1

-		const { promptContent, similaritySearchResults } =
+		const { promptContent, similaritySearchResults, fileReadResults, websiteReadResults } =
 			await this.compileUserMessagePrompt({
 				isNewChat,
 				message: lastUserMessage,
@@ -198,6 +200,8 @@ export class PromptGenerator {
 				...lastUserMessage,
 				promptContent,
 				similaritySearchResults,
+				fileReadResults,
+				websiteReadResults,
 			},
 		]

@@ -318,6 +322,8 @@ export class PromptGenerator {
 		similaritySearchResults?: (Omit<SelectVector, 'embedding'> & {
 			similarity: number
 		})[]
+		fileReadResults?: Array<{ path: string, content: string }>
+		websiteReadResults?: Array<{ url: string, content: string }>
 	}> {
 		// Add environment details
 		// const environmentDetails = isNewChat
@@ -349,27 +355,130 @@ export class PromptGenerator {

 		const taskPrompt = isNewChat ? `<task>\n${query}\n</task>` : `<feedback>\n${query}\n</feedback>`

+		// 收集所有读取结果用于显示
+		const allFileReadResults: Array<{ path: string, content: string }> = []
+		const allWebsiteReadResults: Array<{ url: string, content: string }> = []
+
 		// user mention files
 		const files = message.mentionables
 			.filter((m): m is MentionableFile => m.type === 'file')
 			.map((m) => m.file)
-		let fileContentsPrompts = files.length > 0
-			? (await Promise.all(files.map(async (file) => {
-				const content = await getFileOrFolderContent(file, this.app.vault, this.app)
-				return `<file_content path="${file.path}">\n${content}\n</file_content>`
-			}))).join('\n')
-			: undefined
+		let fileContentsPrompts: string | undefined = undefined
+		if (files.length > 0) {
+			// 初始化文件读取进度
+			onQueryProgressChange?.({
+				type: 'reading-files',
+				totalFiles: files.length,
+				completedFiles: 0
+			})
+
+			// 确保UI有时间显示初始状态
+			await new Promise(resolve => setTimeout(resolve, 100))
+
+			const fileContents: string[] = []
+			const fileContentsForProgress: Array<{ path: string, content: string }> = []
+			let completedFiles = 0
+
+			for (const file of files) {
+				// 更新当前正在读取的文件
+				onQueryProgressChange?.({
+					type: 'reading-files',
+					currentFile: file.path,
+					totalFiles: files.length,
+					completedFiles: completedFiles
+				})
+
+				const content = await getFileOrFolderContent(
+					file,
+					this.app.vault,
+					this.app
+				)
+
+				// 创建Markdown文件
+				const markdownFilePath = await this.createMarkdownFileForContent(
+					file.path,
+					content,
+					false
+				)
+
+				completedFiles++
+				fileContents.push(`<file_content path="${file.path}">\n${content}\n</file_content>`)
+				fileContentsForProgress.push({ path: markdownFilePath, content })
+				allFileReadResults.push({ path: markdownFilePath, content })
+			}
+
+			// 文件读取完成
+			onQueryProgressChange?.({
+				type: 'reading-files-done',
+				fileContents: fileContentsForProgress
+			})
+
+			// 让用户看到完成状态
+			await new Promise(resolve => setTimeout(resolve, 200))
+
+			fileContentsPrompts = fileContents.join('\n')
+		}

 		// user mention folders
 		const folders = message.mentionables
 			.filter((m): m is MentionableFolder => m.type === 'folder')
 			.map((m) => m.folder)
-		let folderContentsPrompts = folders.length > 0
-			? (await Promise.all(folders.map(async (folder) => {
-				const content = await getFileOrFolderContent(folder, this.app.vault, this.app)
-				return `<folder_content path="${folder.path}">\n${content}\n</folder_content>`
-			}))).join('\n')
-			: undefined
+		let folderContentsPrompts: string | undefined = undefined
+		if (folders.length > 0) {
+			// 初始化文件夹读取进度（如果之前没有文件需要读取）
+			if (files.length === 0) {
+				onQueryProgressChange?.({
+					type: 'reading-files',
+					totalFiles: folders.length,
+					completedFiles: 0
+				})
+			}
+
+			const folderContents: string[] = []
+			const folderContentsForProgress: Array<{ path: string, content: string }> = []
+			let completedFolders = 0
+
+			for (const folder of folders) {
+				// 更新当前正在读取的文件夹
+				onQueryProgressChange?.({
+					type: 'reading-files',
+					currentFile: folder.path,
+					totalFiles: folders.length,
+					completedFiles: completedFolders
+				})
+
+				const content = await getFileOrFolderContent(
+					folder,
+					this.app.vault,
+					this.app
+				)
+
+				// 为文件夹内容创建Markdown文件
+				const markdownFilePath = await this.createMarkdownFileForContent(
+					`${folder.path}/folder-contents`,
+					content,
+					false
+				)
+
+				completedFolders++
+				folderContents.push(`<folder_content path="${folder.path}">\n${content}\n</folder_content>`)
+				folderContentsForProgress.push({ path: markdownFilePath, content })
+				allFileReadResults.push({ path: markdownFilePath, content })
+			}
+
+			// 文件夹读取完成（如果之前没有文件需要读取）
+			if (files.length === 0) {
+				onQueryProgressChange?.({
+					type: 'reading-files-done',
+					fileContents: folderContentsForProgress
+				})
+
+				// 让用户看到完成状态
+				await new Promise(resolve => setTimeout(resolve, 200))
+			}
+
+			folderContentsPrompts = folderContents.join('\n')
+		}

 		// user mention blocks
 		const blocks = message.mentionables.filter(
@@ -388,16 +497,62 @@ export class PromptGenerator {
 		const urls = message.mentionables.filter(
 			(m): m is MentionableUrl => m.type === 'url',
 		)
-		const urlContents = await Promise.all(
-			urls.map(async ({ url }) => ({
-				url,
-				content: await this.getWebsiteContent(url)
-			}))
-		)
+		const urlContents: Array<{ url: string, content: string }> = []
+		if (urls.length > 0) {
+			// 初始化网页读取进度
+			onQueryProgressChange?.({
+				type: 'reading-websites',
+				totalUrls: urls.length,
+				completedUrls: 0
+			})
+
+			// 确保UI有时间显示初始状态
+			await new Promise(resolve => setTimeout(resolve, 100))
+
+			let completedUrls = 0
+
+			const mcpHub = await this.getMcpHub()
+
+			for (const { url } of urls) {
+				// 更新当前正在读取的网页
+				onQueryProgressChange?.({
+					type: 'reading-websites',
+					currentUrl: url,
+					totalUrls: urls.length,
+					completedUrls: completedUrls
+				})
+
+				const content = await this.getWebsiteContent(url, mcpHub)
+
+				// 从内容中提取标题
+				const websiteTitle = this.extractTitleFromWebsiteContent(content, url)
+
+				// 为网页内容创建Markdown文件
+				const markdownFilePath = await this.createMarkdownFileForContent(
+					url,
+					content,
+					true,
+					websiteTitle
+				)
+
+				completedUrls++
+				urlContents.push({ url: markdownFilePath, content }) // 这里url改为markdownFilePath
+				allWebsiteReadResults.push({ url: markdownFilePath, content }) // 同样这里也改为markdownFilePath
+			}
+
+			// 网页读取完成
+			onQueryProgressChange?.({
+				type: 'reading-websites-done',
+				websiteContents: urlContents
+			})
+
+			// 让用户看到完成状态
+			await new Promise(resolve => setTimeout(resolve, 200))
+		}
 		const urlContentsPrompt = urlContents.length > 0
 			? urlContents
 				.map(({ url, content }) => (
-					`<url_content url="${url}">\n${content}\n</url_content>`
+					`<file_content path="${url}">\n${content}\n</file_content>`
 				))
 				.join('\n') : undefined

@@ -405,9 +560,51 @@ export class PromptGenerator {
 		const currentFile = message.mentionables
 			.filter((m): m is MentionableFile => m.type === 'current-file')
 			.first()
-		const currentFileContent = currentFile && currentFile.file != null
-			? await getFileOrFolderContent(currentFile.file, this.app.vault, this.app)
-			: undefined
+		let currentFileContent: string | undefined = undefined
+		if (currentFile && currentFile.file != null) {
+			// 初始化当前文件读取进度（如果之前没有其他文件或文件夹需要读取）
+			if (files.length === 0 && folders.length === 0) {
+				onQueryProgressChange?.({
+					type: 'reading-files',
+					currentFile: currentFile.file.path,
+					totalFiles: 1,
+					completedFiles: 0
+				})
+			}
+
+			// 如果当前文件不是 md 文件且 mcpHub 存在，使用 MCP 工具转换
+			const mcpHub = await this.getMcpHub?.()
+			if (currentFile.file.extension !== 'md' && mcpHub?.isBuiltInServerAvailable()) {
+				currentFileContent = await this.callMcpToolConvertDocument(currentFile.file, mcpHub)
+			} else {
+				currentFileContent = await getFileOrFolderContent(
+					currentFile.file,
+					this.app.vault,
+					this.app
+				)
+			}
+
+			// 为当前文件创建Markdown文件
+			const currentMarkdownFilePath = await this.createMarkdownFileForContent(
+				currentFile.file.path,
+				currentFileContent,
+				false
+			)
+
+			// 添加当前文件到读取结果中
+			allFileReadResults.push({ path: currentMarkdownFilePath, content: currentFileContent })
+
+			// 当前文件读取完成（如果之前没有其他文件或文件夹需要读取）
+			if (files.length === 0 && folders.length === 0) {
+				onQueryProgressChange?.({
+					type: 'reading-files-done',
+					fileContents: [{ path: currentMarkdownFilePath, content: currentFileContent }]
+				})
+
+				// 让用户看到完成状态
+				await new Promise(resolve => setTimeout(resolve, 200))
+			}
+		}

 		// Check if current file content should be included
 		let shouldIncludeCurrentFile = false
@@ -458,15 +655,19 @@ export class PromptGenerator {
 			fileContentsPrompts = files.map((file) => {
 				return `<file_content path="${file.path}">\n(Content omitted due to token limit. Relevant sections will be provided by semantic search below.)\n</file_content>`
 			}).join('\n')
-			folderContentsPrompts = folders.map(async (folder) => {
+			folderContentsPrompts = (await Promise.all(folders.map(async (folder) => {
 				const tree_content = await getFolderTreeContent(folder)
 				return `<folder_content path="${folder.path}">\n${tree_content}\n(Content omitted due to token limit. Relevant sections will be provided by semantic search below.)\n</folder_content>`
-			}).join('\n')
+			}))).join('\n')
 		}

 		const shouldUseRAG = useVaultSearch || isOverThreshold
 		let similaritySearchContents
 		if (shouldUseRAG) {
+			// 重置进度状态，准备进入RAG阶段
+			onQueryProgressChange?.({
+				type: 'reading-mentionables',
+			})
 			similaritySearchResults = useVaultSearch
 				? await (
 					await this.getRagEngine()
@@ -530,6 +731,8 @@ export class PromptGenerator {
 				)
 			],
 			similaritySearchResults,
+			fileReadResults: allFileReadResults.length > 0 ? allFileReadResults : undefined,
+			websiteReadResults: allWebsiteReadResults.length > 0 ? allWebsiteReadResults : undefined,
 		}
 	}

@@ -773,7 +976,14 @@ When writing out new markdown blocks, remember not to include "line_number|" at
 	 * - filter visually hidden elements
 	 * ...
 	 */
-	private async getWebsiteContent(url: string): Promise<string> {
+	private async getWebsiteContent(url: string, mcpHub: McpHub | null): Promise<string> {
+
+		const mcpHubAvailable = mcpHub?.isBuiltInServerAvailable()
+
+		if (mcpHubAvailable && isVideoUrl(url)) {
+			return this.callMcpToolConvertVideo(url, mcpHub)
+		}
+
 		if (isYoutubeUrl(url)) {
 			// TODO: pass language based on user preferences
 			const { title, transcript } =
@@ -789,25 +999,224 @@ ${transcript.map((t) => `${t.offset}: ${t.text}`).join('\n')}`
 		return htmlToMarkdown(response.text)
 	}

-	private async callMcpToolGetWebsiteContent(url: string, mcpHub: McpHub | null): Promise<string> {
-		if (isVideoUrl(url)) {
-			return this.callMcpToolConvertVideo(url, mcpHub)
+	private async callMcpToolConvertVideo(url: string, mcpHub: McpHub): Promise<string> {
+		const response = await mcpHub.callTool(
+			'infio-builtin-server',
+			'CONVERT_VIDEO',
+			{ url, detect_language: 'en' }
+		)
+
+		// 处理图片内容并获取图片引用
+		const imageReferences = await this.processImagesInResponse(response.content)
+
+		const textContent = response.content.find((c) => c.type === 'text')
+		let result = textContent?.text || ''
+
+		// 在文本内容末尾添加图片引用
+		if (imageReferences.length > 0) {
+			result += '\n\n## 图片内容\n\n'
+			imageReferences.forEach(imagePath => {
+				result += `![](${imagePath})\n\n`
+			})
 		}
-		return this.callMcpToolFetchUrlContent(url, mcpHub)
+
+		return result
 	}

-	private async callMcpToolConvertVideo(url: string, mcpHub: McpHub | null): Promise<string> {
-		// TODO: implement
-		return ''
+	private async callMcpToolConvertDocument(file: TFile, mcpHub: McpHub): Promise<string> {
+		// 读取文件的二进制内容并转换为Base64
+		const fileBuffer = await this.app.vault.readBinary(file)
+
+		// 安全地转换为Base64，避免堆栈溢出
+		const uint8Array = new Uint8Array(fileBuffer)
+		let binaryString = ''
+		const chunkSize = 8192 // 处理块大小
+
+		for (let i = 0; i < uint8Array.length; i += chunkSize) {
+			const chunk = uint8Array.slice(i, i + chunkSize)
+			binaryString += String.fromCharCode.apply(null, Array.from(chunk))
+		}
+
+		const base64Content = btoa(binaryString)
+
+		// 提取文件扩展名（不带点）
+		const fileType = file.extension
+
+		const response = await mcpHub.callTool(
+			'infio-builtin-server',
+			'CONVERT_DOCUMENT',
+			{
+				file_content: base64Content,
+				file_type: fileType
+			}
+		)
+
+		// 处理图片内容并获取图片引用
+		await this.processImagesInResponse(response.content)
+
+		const textContent = response.content.find((c) => c.type === 'text')
+		const result = textContent?.text as string || ''
+
+		return result
 	}

-	private async callMcpToolFetchUrlContent(url: string, mcpHub: McpHub | null): Promise<string> {
-		// TODO: implement
-		return ''
+	/**
+	 * 为文件内容创建Markdown文件
+	 */
+	private async createMarkdownFileForContent(
+		originalPath: string,
+		content: string,
+		isWebsite: boolean = false,
+		websiteTitle?: string
+	): Promise<string> {
+		try {
+			let targetPath: string
+
+			if (isWebsite) {
+				// 网页内容保存到根目录
+				const fileName = this.sanitizeFileName(websiteTitle || 'website')
+				targetPath = `${fileName}.md`
+			} else {
+				// 如果原文件已经是.md文件，直接返回原路径，不重复创建
+				if (originalPath.endsWith('.md')) {
+					return originalPath
+				}
+
+				// 文件内容保存到同路径下的.md文件
+				const pathWithoutExt = originalPath.replace(/\.[^/.]+$/, "")
+				targetPath = `${pathWithoutExt}.md`
+			}
+
+			// 处理文件名冲突
+			targetPath = await this.getUniqueFilePath(targetPath)
+
+			// 创建文件内容
+			let markdownContent = content
+			if (isWebsite) {
+				markdownContent = `# ${websiteTitle || 'Website Content'}\n\n> Source: ${originalPath}\n\n${content}`
+			} else {
+				markdownContent = `# ${originalPath}\n\n${content}`
+			}
+
+			// 创建文件
+			const file = await this.app.vault.create(targetPath, markdownContent)
+
+			// 在新标签页中打开文件
+			this.app.workspace.getLeaf('tab').openFile(file)
+
+			return file.path
+		} catch (error) {
+			console.error('Failed to create markdown file:', error)
+			return originalPath // 如果创建失败，返回原路径
+		}
 	}

-	private async callMcpToolConvertDocument(file: TFile, mcpHub: McpHub | null): Promise<string> {
-		// TODO: implement
-		return ''
+	/**
+	 * 清理文件名，移除不合法字符
+	 */
+	private sanitizeFileName(fileName: string): string {
+		return fileName
+			.replace(/[<>:"/\\|?*]/g, '-') // 替换不合法字符
+			.replace(/\s+/g, '-') // 替换空格
+			.replace(/-+/g, '-') // 合并连续的横线
+			.replace(/^-|-$/g, '') // 移除开头和结尾的横线
+			.substring(0, 100) // 限制长度
+	}
+
+	/**
+	 * 获取唯一的文件路径（处理重名冲突）
+	 */
+	private async getUniqueFilePath(targetPath: string): Promise<string> {
+		const normalizedPath = normalizePath(targetPath)
+
+		if (!this.app.vault.getAbstractFileByPath(normalizedPath)) {
+			return normalizedPath
+		}
+
+		const pathParts = normalizedPath.split('.')
+		const extension = pathParts.pop()
+		const basePath = pathParts.join('.')
+
+		let counter = 1
+		let uniquePath: string
+
+		do {
+			uniquePath = `${basePath}-${counter}.${extension}`
+			counter++
+		} while (this.app.vault.getAbstractFileByPath(uniquePath))
+
+		return uniquePath
+	}
+
+	/**
+	 * 从网页内容中提取标题
+	 */
+	private extractTitleFromWebsiteContent(content: string, url: string): string {
+		// 尝试从内容中提取标题
+		const titleRegex1 = /^#\s+(.+)$/m
+		const titleRegex2 = /Title:\s*(.+)$/m
+		const titleMatch = titleRegex1.exec(content) || titleRegex2.exec(content)
+		if (titleMatch && titleMatch[1]) {
+			return titleMatch[1].trim()
+		}
+
+		// 如果没有找到标题，使用域名
+		try {
+			return new URL(url).hostname
+		} catch {
+			return 'website'
+		}
+	}
+
+	/**
+	 * 处理响应中的图片内容，将base64图片保存到Obsidian资源目录
+	 */
+	private async processImagesInResponse(content: Array<{ type: string, data: string, filename: string, mimeType?: string }>): Promise<string[]> {
+		const savedImagePaths: string[] = []
+
+		for (const item of content) {
+			if (item.type === 'image' && item.data && item.filename) {
+				try {
+					const imagePath = await this.saveImageFromBase64(item.data, item.filename, item.mimeType)
+					savedImagePaths.push(imagePath)
+				} catch (error) {
+					console.error('Failed to save image:', error)
+				}
+			}
+		}
+
+		return savedImagePaths
+	}
+
+	/**
+	 * 将base64图片数据保存为文件到Obsidian资源目录
+	 */
+	private async saveImageFromBase64(base64Data: string, filename: string, mimeType?: string): Promise<string> {
+		// 获取默认资源目录
+		const staticResourceDir = this.app.vault.getConfig("attachmentFolderPath")
+
+		// 构建完整的文件路径
+		const targetPath = staticResourceDir ? normalizePath(`${staticResourceDir}/${filename}`) : filename
+
+		// 处理文件名冲突
+		// const uniquePath = await this.getUniqueFilePath(targetPath)
+
+		try {
+			// 将base64数据转换为ArrayBuffer
+			const binaryString = atob(base64Data)
+			const bytes = new Uint8Array(binaryString.length)
+			for (let i = 0; i < binaryString.length; i++) {
+				bytes[i] = binaryString.charCodeAt(i)
+			}
+
+			// 创建图片文件
+			await this.app.vault.createBinary(targetPath, bytes.buffer)
+
+			console.log(`Image saved: ${targetPath}`)
+			return targetPath
+		} catch (error) {
+			console.error(`Failed to save image to ${targetPath}:`, error)
+			throw error
+		}
 	}
 }