| import { convertPDFToImage, convertPDFToText } from './pdf-processing'; |
| import { isSvgMimeType, svgBase64UrlToPngDataURL } from './svg-to-png'; |
| import { isWebpMimeType, webpBase64UrlToPngDataURL } from './webp-to-png'; |
| import { FileTypeCategory } from '$lib/enums/files'; |
| import { config, settingsStore } from '$lib/stores/settings.svelte'; |
| import { supportsVision } from '$lib/stores/server.svelte'; |
| import { getFileTypeCategory } from '$lib/utils/file-type'; |
| import { readFileAsText, isLikelyTextFile } from './text-files'; |
| import { toast } from 'svelte-sonner'; |
|
|
| function readFileAsBase64(file: File): Promise<string> { |
| return new Promise((resolve, reject) => { |
| const reader = new FileReader(); |
|
|
| reader.onload = () => { |
| |
| const dataUrl = reader.result as string; |
| const base64 = dataUrl.split(',')[1]; |
| resolve(base64); |
| }; |
|
|
| reader.onerror = () => reject(reader.error); |
|
|
| reader.readAsDataURL(file); |
| }); |
| } |
|
|
| export interface FileProcessingResult { |
| extras: DatabaseMessageExtra[]; |
| emptyFiles: string[]; |
| } |
|
|
| export async function parseFilesToMessageExtras( |
| files: ChatUploadedFile[] |
| ): Promise<FileProcessingResult> { |
| const extras: DatabaseMessageExtra[] = []; |
| const emptyFiles: string[] = []; |
|
|
| for (const file of files) { |
| if (getFileTypeCategory(file.type) === FileTypeCategory.IMAGE) { |
| if (file.preview) { |
| let base64Url = file.preview; |
|
|
| if (isSvgMimeType(file.type)) { |
| try { |
| base64Url = await svgBase64UrlToPngDataURL(base64Url); |
| } catch (error) { |
| console.error('Failed to convert SVG to PNG for database storage:', error); |
| } |
| } else if (isWebpMimeType(file.type)) { |
| try { |
| base64Url = await webpBase64UrlToPngDataURL(base64Url); |
| } catch (error) { |
| console.error('Failed to convert WebP to PNG for database storage:', error); |
| } |
| } |
|
|
| extras.push({ |
| type: 'imageFile', |
| name: file.name, |
| base64Url |
| }); |
| } |
| } else if (getFileTypeCategory(file.type) === FileTypeCategory.AUDIO) { |
| |
| try { |
| const base64Data = await readFileAsBase64(file.file); |
|
|
| extras.push({ |
| type: 'audioFile', |
| name: file.name, |
| base64Data: base64Data, |
| mimeType: file.type |
| }); |
| } catch (error) { |
| console.error(`Failed to process audio file ${file.name}:`, error); |
| } |
| } else if (getFileTypeCategory(file.type) === FileTypeCategory.PDF) { |
| try { |
| |
| const base64Data = await readFileAsBase64(file.file); |
| const currentConfig = config(); |
| const hasVisionSupport = supportsVision(); |
|
|
| |
| let shouldProcessAsImages = Boolean(currentConfig.pdfAsImage) && hasVisionSupport; |
|
|
| |
| if (currentConfig.pdfAsImage && !hasVisionSupport) { |
| console.log('Non-vision model detected: forcing PDF-to-text mode and updating settings'); |
|
|
| |
| settingsStore.updateConfig('pdfAsImage', false); |
|
|
| |
| toast.warning( |
| 'PDF setting changed: Non-vision model detected, PDFs will be processed as text instead of images.', |
| { |
| duration: 5000 |
| } |
| ); |
|
|
| shouldProcessAsImages = false; |
| } |
|
|
| if (shouldProcessAsImages) { |
| |
| try { |
| const images = await convertPDFToImage(file.file); |
|
|
| |
| toast.success( |
| `PDF "${file.name}" processed as ${images.length} images for vision model.`, |
| { |
| duration: 3000 |
| } |
| ); |
|
|
| extras.push({ |
| type: 'pdfFile', |
| name: file.name, |
| content: `PDF file with ${images.length} pages`, |
| images: images, |
| processedAsImages: true, |
| base64Data: base64Data |
| }); |
| } catch (imageError) { |
| console.warn( |
| `Failed to process PDF ${file.name} as images, falling back to text:`, |
| imageError |
| ); |
|
|
| |
| const content = await convertPDFToText(file.file); |
|
|
| extras.push({ |
| type: 'pdfFile', |
| name: file.name, |
| content: content, |
| processedAsImages: false, |
| base64Data: base64Data |
| }); |
| } |
| } else { |
| |
| const content = await convertPDFToText(file.file); |
|
|
| |
| toast.success(`PDF "${file.name}" processed as text content.`, { |
| duration: 3000 |
| }); |
|
|
| extras.push({ |
| type: 'pdfFile', |
| name: file.name, |
| content: content, |
| processedAsImages: false, |
| base64Data: base64Data |
| }); |
| } |
| } catch (error) { |
| console.error(`Failed to process PDF file ${file.name}:`, error); |
| } |
| } else { |
| try { |
| const content = await readFileAsText(file.file); |
|
|
| |
| if (content.trim() === '') { |
| console.warn(`File ${file.name} is empty and will be skipped`); |
| emptyFiles.push(file.name); |
| } else if (isLikelyTextFile(content)) { |
| extras.push({ |
| type: 'textFile', |
| name: file.name, |
| content: content |
| }); |
| } else { |
| console.warn(`File ${file.name} appears to be binary and will be skipped`); |
| } |
| } catch (error) { |
| console.error(`Failed to read file ${file.name}:`, error); |
| } |
| } |
| } |
|
|
| return { extras, emptyFiles }; |
| } |
|
|