diff --git a/backend/main.py b/backend/main.py index 573c7c2..945e693 100644 --- a/backend/main.py +++ b/backend/main.py @@ -102,7 +102,7 @@ def build_prompt( instruction = "" if mode == "plain_ocr": - instruction = "Free OCR. Only output the raw text." + instruction = "Free OCR." elif mode == "markdown": instruction = "Convert the document to markdown." elif mode == "tables_csv": diff --git a/frontend/src/App.jsx b/frontend/src/App.jsx index 95d79d7..c0cd6a9 100644 --- a/frontend/src/App.jsx +++ b/frontend/src/App.jsx @@ -1,9 +1,10 @@ import { useState, useCallback } from 'react' import { motion, AnimatePresence } from 'framer-motion' -import { Sparkles, Zap, Loader2 } from 'lucide-react' +import { Sparkles, Zap, Loader2, Settings } from 'lucide-react' import ImageUpload from './components/ImageUpload' import ModeSelector from './components/ModeSelector' import ResultPanel from './components/ResultPanel' +import AdvancedSettings from './components/AdvancedSettings' import axios from 'axios' const API_BASE = import.meta.env.VITE_API_URL || '/api' @@ -15,6 +16,8 @@ function App() { const [result, setResult] = useState(null) const [loading, setLoading] = useState(false) const [error, setError] = useState(null) + const [showAdvanced, setShowAdvanced] = useState(false) + const [includeCaption, setIncludeCaption] = useState(false) // Form state const [prompt, setPrompt] = useState('') @@ -60,7 +63,7 @@ function App() { formData.append('prompt', prompt) // Enable grounding only for find mode formData.append('grounding', mode === 'find_ref') - formData.append('include_caption', false) + formData.append('include_caption', includeCaption) formData.append('find_term', findTerm) formData.append('schema', '') formData.append('base_size', advancedSettings.base_size) @@ -190,6 +193,39 @@ function App() { preview={imagePreview} /> + {/* Advanced Settings Toggle */} + setShowAdvanced(!showAdvanced)} + className="w-full glass px-4 py-3 rounded-2xl flex items-center justify-between hover:bg-white/5 transition-colors" + whileHover={{ scale: 1.01 }} + whileTap={{ scale: 0.99 }} + > +
+ + Advanced Settings +
+ + + + + +
+ + {/* Advanced Settings Panel */} + + {showAdvanced && ( + + )} + + {/* Action Button */}