189 lines
5.5 KiB
TypeScript
189 lines
5.5 KiB
TypeScript
import { convertPDFToImage, convertPDFToText } from './pdf-processing';
|
|
import { isSvgMimeType, svgBase64UrlToPngDataURL } from './svg-to-png';
|
|
import { isWebpMimeType, webpBase64UrlToPngDataURL } from './webp-to-png';
|
|
import { FileTypeCategory, AttachmentType } from '$lib/enums';
|
|
import { config, settingsStore } from '$lib/stores/settings.svelte';
|
|
import { supportsVision } from '$lib/stores/props.svelte';
|
|
import { getFileTypeCategory } from '$lib/utils/file-type';
|
|
import { readFileAsText, isLikelyTextFile } from './text-files';
|
|
import { toast } from 'svelte-sonner';
|
|
|
|
function readFileAsBase64(file: File): Promise<string> {
|
|
return new Promise((resolve, reject) => {
|
|
const reader = new FileReader();
|
|
|
|
reader.onload = () => {
|
|
// Extract base64 data without the data URL prefix
|
|
const dataUrl = reader.result as string;
|
|
const base64 = dataUrl.split(',')[1];
|
|
resolve(base64);
|
|
};
|
|
|
|
reader.onerror = () => reject(reader.error);
|
|
|
|
reader.readAsDataURL(file);
|
|
});
|
|
}
|
|
|
|
export interface FileProcessingResult {
|
|
extras: DatabaseMessageExtra[];
|
|
emptyFiles: string[];
|
|
}
|
|
|
|
export async function parseFilesToMessageExtras(
|
|
files: ChatUploadedFile[]
|
|
): Promise<FileProcessingResult> {
|
|
const extras: DatabaseMessageExtra[] = [];
|
|
const emptyFiles: string[] = [];
|
|
|
|
for (const file of files) {
|
|
if (getFileTypeCategory(file.type) === FileTypeCategory.IMAGE) {
|
|
if (file.preview) {
|
|
let base64Url = file.preview;
|
|
|
|
if (isSvgMimeType(file.type)) {
|
|
try {
|
|
base64Url = await svgBase64UrlToPngDataURL(base64Url);
|
|
} catch (error) {
|
|
console.error('Failed to convert SVG to PNG for database storage:', error);
|
|
}
|
|
} else if (isWebpMimeType(file.type)) {
|
|
try {
|
|
base64Url = await webpBase64UrlToPngDataURL(base64Url);
|
|
} catch (error) {
|
|
console.error('Failed to convert WebP to PNG for database storage:', error);
|
|
}
|
|
}
|
|
|
|
extras.push({
|
|
type: AttachmentType.IMAGE,
|
|
name: file.name,
|
|
base64Url
|
|
});
|
|
}
|
|
} else if (getFileTypeCategory(file.type) === FileTypeCategory.AUDIO) {
|
|
// Process audio files (MP3 and WAV)
|
|
try {
|
|
const base64Data = await readFileAsBase64(file.file);
|
|
|
|
extras.push({
|
|
type: AttachmentType.AUDIO,
|
|
name: file.name,
|
|
base64Data: base64Data,
|
|
mimeType: file.type
|
|
});
|
|
} catch (error) {
|
|
console.error(`Failed to process audio file ${file.name}:`, error);
|
|
}
|
|
} else if (getFileTypeCategory(file.type) === FileTypeCategory.PDF) {
|
|
try {
|
|
// Always get base64 data for preview functionality
|
|
const base64Data = await readFileAsBase64(file.file);
|
|
const currentConfig = config();
|
|
const hasVisionSupport = supportsVision();
|
|
|
|
// Force PDF-to-text for non-vision models
|
|
let shouldProcessAsImages = Boolean(currentConfig.pdfAsImage) && hasVisionSupport;
|
|
|
|
// If user had pdfAsImage enabled but model doesn't support vision, update setting and notify
|
|
if (currentConfig.pdfAsImage && !hasVisionSupport) {
|
|
console.log('Non-vision model detected: forcing PDF-to-text mode and updating settings');
|
|
|
|
// Update the setting in localStorage
|
|
settingsStore.updateConfig('pdfAsImage', false);
|
|
|
|
// Show toast notification to user
|
|
toast.warning(
|
|
'PDF setting changed: Non-vision model detected, PDFs will be processed as text instead of images.',
|
|
{
|
|
duration: 5000
|
|
}
|
|
);
|
|
|
|
shouldProcessAsImages = false;
|
|
}
|
|
|
|
if (shouldProcessAsImages) {
|
|
// Process PDF as images (only for vision models)
|
|
try {
|
|
const images = await convertPDFToImage(file.file);
|
|
|
|
// Show success toast for PDF image processing
|
|
toast.success(
|
|
`PDF "${file.name}" processed as ${images.length} images for vision model.`,
|
|
{
|
|
duration: 3000
|
|
}
|
|
);
|
|
|
|
extras.push({
|
|
type: AttachmentType.PDF,
|
|
name: file.name,
|
|
content: `PDF file with ${images.length} pages`,
|
|
images: images,
|
|
processedAsImages: true,
|
|
base64Data: base64Data
|
|
});
|
|
} catch (imageError) {
|
|
console.warn(
|
|
`Failed to process PDF ${file.name} as images, falling back to text:`,
|
|
imageError
|
|
);
|
|
|
|
// Fallback to text processing
|
|
const content = await convertPDFToText(file.file);
|
|
|
|
extras.push({
|
|
type: AttachmentType.PDF,
|
|
name: file.name,
|
|
content: content,
|
|
processedAsImages: false,
|
|
base64Data: base64Data
|
|
});
|
|
}
|
|
} else {
|
|
// Process PDF as text (default or forced for non-vision models)
|
|
const content = await convertPDFToText(file.file);
|
|
|
|
// Show success toast for PDF text processing
|
|
toast.success(`PDF "${file.name}" processed as text content.`, {
|
|
duration: 3000
|
|
});
|
|
|
|
extras.push({
|
|
type: AttachmentType.PDF,
|
|
name: file.name,
|
|
content: content,
|
|
processedAsImages: false,
|
|
base64Data: base64Data
|
|
});
|
|
}
|
|
} catch (error) {
|
|
console.error(`Failed to process PDF file ${file.name}:`, error);
|
|
}
|
|
} else {
|
|
try {
|
|
const content = await readFileAsText(file.file);
|
|
|
|
// Check if file is empty
|
|
if (content.trim() === '') {
|
|
console.warn(`File ${file.name} is empty and will be skipped`);
|
|
emptyFiles.push(file.name);
|
|
} else if (isLikelyTextFile(content)) {
|
|
extras.push({
|
|
type: AttachmentType.TEXT,
|
|
name: file.name,
|
|
content: content
|
|
});
|
|
} else {
|
|
console.warn(`File ${file.name} appears to be binary and will be skipped`);
|
|
}
|
|
} catch (error) {
|
|
console.error(`Failed to read file ${file.name}:`, error);
|
|
}
|
|
}
|
|
}
|
|
|
|
return { extras, emptyFiles };
|
|
}
|