Features added: - PDF to image conversion with configurable DPI - Multi-page PDF processing with OCR - Export to Markdown, HTML, DOCX, and JSON formats - Automatic image extraction from PDFs - Formula and formatting preservation - Real-time progress tracking for multi-page documents Backend changes: - New /api/process-pdf endpoint for PDF processing - pdf_utils.py: PDF conversion and image extraction utilities - format_converter.py: Document format conversion (MD, HTML, DOCX) - Updated dependencies: PyMuPDF, img2pdf, python-docx, markdown Frontend changes: - File type toggle (Image OCR / PDF Processing) - PDFProcessor component with format selection - Updated ImageUpload to support both images and PDFs - Progress bars for multi-page processing - Download options for converted documents Documentation: - Updated README with PDF processing features - Added API documentation for /api/process-pdf endpoint - Added format conversion examples
234 lines
8.6 KiB
JavaScript
234 lines
8.6 KiB
JavaScript
import { useState, useCallback } from 'react'
|
|
import { motion, AnimatePresence } from 'framer-motion'
|
|
import { FileText, Download, Loader2, CheckCircle2, AlertCircle } from 'lucide-react'
|
|
import axios from 'axios'
|
|
|
|
const API_BASE = import.meta.env.VITE_API_URL || '/api'
|
|
|
|
function PDFProcessor({ pdfFile, mode, prompt, advancedSettings, includeCaption }) {
|
|
const [processing, setProcessing] = useState(false)
|
|
const [progress, setProgress] = useState(0)
|
|
const [result, setResult] = useState(null)
|
|
const [error, setError] = useState(null)
|
|
const [outputFormat, setOutputFormat] = useState('markdown')
|
|
|
|
const formats = [
|
|
{ value: 'markdown', label: 'Markdown', ext: 'md', icon: '📝' },
|
|
{ value: 'html', label: 'HTML', ext: 'html', icon: '🌐' },
|
|
{ value: 'docx', label: 'Word', ext: 'docx', icon: '📄' },
|
|
{ value: 'json', label: 'JSON', ext: 'json', icon: '📊' }
|
|
]
|
|
|
|
const handleProcess = useCallback(async () => {
|
|
if (!pdfFile) return
|
|
|
|
setProcessing(true)
|
|
setError(null)
|
|
setProgress(0)
|
|
|
|
try {
|
|
const formData = new FormData()
|
|
formData.append('pdf_file', pdfFile)
|
|
formData.append('mode', mode)
|
|
formData.append('prompt', prompt)
|
|
formData.append('output_format', outputFormat)
|
|
formData.append('grounding', mode === 'find_ref')
|
|
formData.append('include_caption', includeCaption)
|
|
formData.append('extract_images', true)
|
|
formData.append('dpi', 144)
|
|
formData.append('base_size', advancedSettings.base_size)
|
|
formData.append('image_size', advancedSettings.image_size)
|
|
formData.append('crop_mode', advancedSettings.crop_mode)
|
|
|
|
const response = await axios.post(`${API_BASE}/process-pdf`, formData, {
|
|
headers: {
|
|
'Content-Type': 'multipart/form-data',
|
|
},
|
|
responseType: outputFormat === 'json' ? 'json' : 'blob',
|
|
onUploadProgress: (progressEvent) => {
|
|
const percentCompleted = Math.round((progressEvent.loaded * 100) / progressEvent.total)
|
|
setProgress(percentCompleted)
|
|
}
|
|
})
|
|
|
|
if (outputFormat === 'json') {
|
|
setResult(response.data)
|
|
} else {
|
|
// For file downloads (markdown, html, docx)
|
|
const format = formats.find(f => f.value === outputFormat)
|
|
const blob = new Blob([response.data], {
|
|
type: response.headers['content-type']
|
|
})
|
|
const url = URL.createObjectURL(blob)
|
|
const a = document.createElement('a')
|
|
a.href = url
|
|
a.download = `ocr_result.${format.ext}`
|
|
a.click()
|
|
URL.revokeObjectURL(url)
|
|
|
|
setResult({
|
|
success: true,
|
|
message: `Document downloaded as ${format.label}`,
|
|
format: outputFormat
|
|
})
|
|
}
|
|
|
|
setProgress(100)
|
|
} catch (err) {
|
|
console.error('PDF processing error:', err)
|
|
setError(err.response?.data?.detail || err.message || 'Failed to process PDF')
|
|
} finally {
|
|
setProcessing(false)
|
|
}
|
|
}, [pdfFile, mode, prompt, outputFormat, includeCaption, advancedSettings])
|
|
|
|
const handleDownloadJSON = useCallback(() => {
|
|
if (!result || outputFormat !== 'json') return
|
|
|
|
const blob = new Blob([JSON.stringify(result, null, 2)], { type: 'application/json' })
|
|
const url = URL.createObjectURL(blob)
|
|
const a = document.createElement('a')
|
|
a.href = url
|
|
a.download = 'ocr_result.json'
|
|
a.click()
|
|
URL.revokeObjectURL(url)
|
|
}, [result, outputFormat])
|
|
|
|
return (
|
|
<div className="space-y-4">
|
|
{/* Format Selector */}
|
|
<div className="glass p-6 rounded-2xl space-y-3">
|
|
<label className="block text-sm font-medium text-gray-300 mb-3">
|
|
Output Format
|
|
</label>
|
|
<div className="grid grid-cols-2 gap-2">
|
|
{formats.map((format) => (
|
|
<motion.button
|
|
key={format.value}
|
|
onClick={() => setOutputFormat(format.value)}
|
|
className={`p-3 rounded-xl text-sm font-medium transition-all ${
|
|
outputFormat === format.value
|
|
? 'bg-gradient-to-r from-purple-600 to-cyan-600 text-white'
|
|
: 'glass text-gray-400 hover:bg-white/5'
|
|
}`}
|
|
whileHover={{ scale: 1.02 }}
|
|
whileTap={{ scale: 0.98 }}
|
|
>
|
|
<span className="mr-2">{format.icon}</span>
|
|
{format.label}
|
|
</motion.button>
|
|
))}
|
|
</div>
|
|
</div>
|
|
|
|
{/* Process Button */}
|
|
<motion.button
|
|
onClick={handleProcess}
|
|
disabled={!pdfFile || processing}
|
|
className={`w-full relative overflow-hidden rounded-2xl p-[2px] ${
|
|
!pdfFile || processing ? 'opacity-50 cursor-not-allowed' : ''
|
|
}`}
|
|
whileHover={!processing && pdfFile ? { scale: 1.02 } : {}}
|
|
whileTap={!processing && pdfFile ? { scale: 0.98 } : {}}
|
|
>
|
|
<div className="absolute inset-0 bg-gradient-to-r from-purple-600 via-pink-600 to-cyan-600 animate-gradient" />
|
|
<div className="relative bg-dark-100 px-8 py-4 rounded-2xl flex items-center justify-center gap-3">
|
|
{processing ? (
|
|
<>
|
|
<Loader2 className="w-5 h-5 animate-spin" />
|
|
<span className="font-semibold">Processing PDF...</span>
|
|
</>
|
|
) : (
|
|
<>
|
|
<FileText className="w-5 h-5" />
|
|
<span className="font-semibold">Process PDF</span>
|
|
</>
|
|
)}
|
|
</div>
|
|
</motion.button>
|
|
|
|
{/* Progress Bar */}
|
|
<AnimatePresence>
|
|
{processing && progress > 0 && (
|
|
<motion.div
|
|
initial={{ opacity: 0, height: 0 }}
|
|
animate={{ opacity: 1, height: 'auto' }}
|
|
exit={{ opacity: 0, height: 0 }}
|
|
className="glass p-4 rounded-2xl"
|
|
>
|
|
<div className="flex items-center justify-between mb-2">
|
|
<span className="text-sm text-gray-400">Processing...</span>
|
|
<span className="text-sm font-medium text-purple-400">{progress}%</span>
|
|
</div>
|
|
<div className="h-2 bg-dark-200 rounded-full overflow-hidden">
|
|
<motion.div
|
|
className="h-full bg-gradient-to-r from-purple-600 to-cyan-600"
|
|
initial={{ width: 0 }}
|
|
animate={{ width: `${progress}%` }}
|
|
transition={{ duration: 0.3 }}
|
|
/>
|
|
</div>
|
|
</motion.div>
|
|
)}
|
|
</AnimatePresence>
|
|
|
|
{/* Error Display */}
|
|
<AnimatePresence>
|
|
{error && (
|
|
<motion.div
|
|
initial={{ opacity: 0, y: -10 }}
|
|
animate={{ opacity: 1, y: 0 }}
|
|
exit={{ opacity: 0, y: -10 }}
|
|
className="glass p-4 rounded-2xl border-red-500/50 bg-red-500/10 flex items-start gap-3"
|
|
>
|
|
<AlertCircle className="w-5 h-5 text-red-400 flex-shrink-0 mt-0.5" />
|
|
<div>
|
|
<p className="text-sm font-medium text-red-400">Processing Failed</p>
|
|
<p className="text-xs text-red-300 mt-1">{error}</p>
|
|
</div>
|
|
</motion.div>
|
|
)}
|
|
</AnimatePresence>
|
|
|
|
{/* Success Display */}
|
|
<AnimatePresence>
|
|
{result && !error && (
|
|
<motion.div
|
|
initial={{ opacity: 0, y: -10 }}
|
|
animate={{ opacity: 1, y: 0 }}
|
|
exit={{ opacity: 0, y: -10 }}
|
|
className="glass p-6 rounded-2xl border-green-500/50 bg-green-500/10"
|
|
>
|
|
<div className="flex items-start gap-3">
|
|
<CheckCircle2 className="w-5 h-5 text-green-400 flex-shrink-0 mt-0.5" />
|
|
<div className="flex-1">
|
|
<p className="text-sm font-medium text-green-400">
|
|
{result.message || 'PDF processed successfully!'}
|
|
</p>
|
|
{outputFormat === 'json' && result.pages && (
|
|
<div className="mt-3 space-y-2">
|
|
<p className="text-xs text-gray-400">
|
|
Processed {result.total_pages} page{result.total_pages > 1 ? 's' : ''}
|
|
</p>
|
|
<motion.button
|
|
onClick={handleDownloadJSON}
|
|
className="glass px-4 py-2 rounded-xl text-sm font-medium hover:bg-white/5 transition-colors flex items-center gap-2"
|
|
whileHover={{ scale: 1.02 }}
|
|
whileTap={{ scale: 0.98 }}
|
|
>
|
|
<Download className="w-4 h-4" />
|
|
Download JSON
|
|
</motion.button>
|
|
</div>
|
|
)}
|
|
</div>
|
|
</div>
|
|
</motion.div>
|
|
)}
|
|
</AnimatePresence>
|
|
</div>
|
|
)
|
|
}
|
|
|
|
export default PDFProcessor
|