From 2a1eeeda50e62dab15f398e436112e77a37bfe5a Mon Sep 17 00:00:00 2001
From: perf3ct <jonfuller2012@gmail.com>
Date: Tue, 1 Jul 2025 00:15:48 +0000
Subject: [PATCH] feat(debug): debug page actually works and does something

---
 frontend/src/App.tsx                         |    2 +
 frontend/src/components/Layout/AppLayout.tsx |    2 +
 frontend/src/pages/DebugPage.tsx             | 1057 ++++++++++++++++++
 src/routes/documents.rs                      |  555 +++++++++
 4 files changed, 1616 insertions(+)
 create mode 100644 frontend/src/pages/DebugPage.tsx
diff --git a/frontend/src/App.tsx b/frontend/src/App.tsx
index 3c5de8f..30b0371 100644
--- a/frontend/src/App.tsx
+++ b/frontend/src/App.tsx
@@ -18,6 +18,7 @@ import WatchFolderPage from './pages/WatchFolderPage';
 import DocumentManagementPage from './pages/DocumentManagementPage';
 import LabelsPage from './pages/LabelsPage';
 import IgnoredFilesPage from './pages/IgnoredFilesPage';
+import DebugPage from './pages/DebugPage';
 
 function App(): React.ReactElement {
   const { user, loading } = useAuth();
@@ -77,6 +78,7 @@ function App(): React.ReactElement {
                     <Route path="/settings" element={<SettingsPage />} />
                     <Route path="/documents/management" element={<DocumentManagementPage />} />
                     <Route path="/ignored-files" element={<IgnoredFilesPage />} />
+                    <Route path="/debug" element={<DebugPage />} />
                     <Route path="/profile" element={<div>Profile Page - Coming Soon</div>} />
                   </Routes>
                 </AppLayout>
diff --git a/frontend/src/components/Layout/AppLayout.tsx b/frontend/src/components/Layout/AppLayout.tsx
index 1fb91aa..5855e11 100644
--- a/frontend/src/components/Layout/AppLayout.tsx
+++ b/frontend/src/components/Layout/AppLayout.tsx
@@ -37,6 +37,7 @@ import {
   Block as BlockIcon,
   Api as ApiIcon,
   ManageAccounts as ManageIcon,
+  BugReport as BugReportIcon,
 } from '@mui/icons-material';
 import { useNavigate, useLocation } from 'react-router-dom';
 import { useAuth } from '../../contexts/AuthContext';
@@ -72,6 +73,7 @@ const navigationItems: NavigationItem[] = [
   { text: 'Watch Folder', icon: FolderIcon, path: '/watch' },
   { text: 'Document Management', icon: ManageIcon, path: '/documents/management' },
   { text: 'Ignored Files', icon: BlockIcon, path: '/ignored-files' },
+  { text: 'Debug', icon: BugReportIcon, path: '/debug' },
 ];
 
 const AppLayout: React.FC<AppLayoutProps> = ({ children }) => {
diff --git a/frontend/src/pages/DebugPage.tsx b/frontend/src/pages/DebugPage.tsx
new file mode 100644
index 0000000..790205e
--- /dev/null
+++ b/frontend/src/pages/DebugPage.tsx
@@ -0,0 +1,1057 @@
+import React, { useState, useCallback, useEffect } from 'react';
+import {
+  Box,
+  Card,
+  CardContent,
+  Typography,
+  TextField,
+  Button,
+  Grid,
+  Paper,
+  Stepper,
+  Step,
+  StepLabel,
+  StepContent,
+  Alert,
+  Chip,
+  Table,
+  TableBody,
+  TableCell,
+  TableContainer,
+  TableHead,
+  TableRow,
+  Accordion,
+  AccordionSummary,
+  AccordionDetails,
+  CircularProgress,
+  Container,
+  Tabs,
+  Tab,
+  LinearProgress,
+  Divider,
+} from '@mui/material';
+import {
+  ExpandMore as ExpandMoreIcon,
+  BugReport as BugReportIcon,
+  CheckCircle as CheckCircleIcon,
+  Error as ErrorIcon,
+  Warning as WarningIcon,
+  Pending as PendingIcon,
+  PlayArrow as PlayArrowIcon,
+  CloudUpload as UploadIcon,
+  Search as SearchIcon,
+  Refresh as RefreshIcon,
+  Visibility as PreviewIcon,
+} from '@mui/icons-material';
+import { api } from '../services/api';
+
+interface DebugStep { // One pipeline stage of a document's debug report (element of DebugInfo.pipeline_steps)
+  step: number; // renderStepDetails compares this against 1-4 to choose the detail layout
+  name: string;
+  status: string; // e.g. 'processing', 'completed', 'failed'; getStepIcon lists the values the UI distinguishes
+  details: any; // step-specific payload; its fields differ per step and are not typed here
+  success: boolean; // when true the step is shown as successful unless status is 'processing'
+  error?: string; // rendered in an error Alert above the step details when present
+}
+
+interface DebugInfo { // Body of GET /documents/{id}/debug, stored as-is by fetchDebugInfo
+  document_id: string;
+  filename: string;
+  overall_status: string;
+  pipeline_steps: DebugStep[];
+  failed_document_info?: any; // optional and untyped here
+  user_settings: any; // untyped here
+  debug_timestamp: string;
+}
+
+const DebugPage: React.FC = () => {
+  const [activeTab, setActiveTab] = useState(0); // 0 = upload tab, 1 = search tab, 2 = debug results tab
+  const [documentId, setDocumentId] = useState(''); // id typed into the search field or set after an upload
+  const [debugInfo, setDebugInfo] = useState<DebugInfo | null>(null);
+  const [loading, setLoading] = useState(false);
+  const [error, setError] = useState('');
+
+  // Upload and OCR-monitoring state
+  const [selectedFile, setSelectedFile] = useState<File | null>(null);
+  const [uploading, setUploading] = useState(false);
+  const [uploadProgress, setUploadProgress] = useState(0); // percent, 0-100
+  const [uploadedDocumentId, setUploadedDocumentId] = useState('');
+  const [monitoringInterval, setMonitoringInterval] = useState<NodeJS.Timeout | null>(null); // active poll timer, if any
+  const [processingStatus, setProcessingStatus] = useState(''); // human-readable status line shown in the upload tab
+
+  // Picks the icon for a pipeline step; 'processing' outranks the success flag, unknown statuses get the play arrow.
+  const getStepIcon = (status: string, success: boolean) => {
+    if (status === 'processing') return <CircularProgress size={20} />;
+    if (success || ['completed', 'passed'].includes(status)) return <CheckCircleIcon color="success" />;
+    if (['failed', 'error'].includes(status)) return <ErrorIcon color="error" />;
+    if (['pending', 'not_reached'].includes(status)) return <PendingIcon color="disabled" />;
+    return ['not_queued', 'ocr_disabled'].includes(status) ? <WarningIcon color="warning" /> : <PlayArrowIcon color="primary" />;
+  };
+
+  // Chip color for a pipeline step; 'processing' outranks the success flag, unknown statuses fall back to 'primary'.
+  const getStatusColor = (status: string, success: boolean): "default" | "primary" | "secondary" | "error" | "info" | "success" | "warning" => {
+    if (status === 'processing') return 'info';
+    if (success || ['completed', 'passed'].includes(status)) return 'success';
+    if (['failed', 'error'].includes(status)) return 'error';
+    if (['pending', 'not_reached'].includes(status)) return 'default';
+    return ['not_queued', 'ocr_disabled'].includes(status) ? 'warning' : 'primary';
+  };
+
+  /**
+   * Loads the pipeline debug report for a document into `debugInfo`.
+   * A 404 is retried up to three times (after 1s, 2s and 3s); other errors are reported at once.
+   * @param docId - document to inspect; falls back to the `documentId` state when omitted/empty
+   * @param retryCount - how many 404 retries preceded this attempt (set by the retry timer)
+   */
+  const fetchDebugInfo = useCallback(async (docId?: string, retryCount = 0) => {
+    const targetDocId = docId || documentId;
+    if (!targetDocId.trim()) {
+      setError('Please enter a document ID');
+      return;
+    }
+
+    setLoading(true);
+    if (retryCount === 0) setError(''); // Only clear error on first attempt
+    let retryScheduled = false; // set when a follow-up attempt inherits the loading state
+    try {
+      const response = await api.get(`/documents/${targetDocId}/debug`);
+      setDebugInfo(response.data);
+      setError(''); // Clear any previous errors
+    } catch (err: any) {
+      console.error('Debug fetch error:', err);
+      // If it's a 404 and we haven't retried much, try again after a short delay
+      if (err.response?.status === 404 && retryCount < 3) {
+        console.log(`Document not found, retrying in ${(retryCount + 1) * 1000}ms... (attempt ${retryCount + 1})`);
+        retryScheduled = true;
+        setTimeout(() => fetchDebugInfo(docId, retryCount + 1), (retryCount + 1) * 1000);
+        return;
+      }
+      const errorMessage = err.response?.status === 404
+        ? `Document ${targetDocId} not found. It may still be processing or may have been moved to failed documents.`
+        : err.response?.data?.message || `Failed to fetch debug information: ${err.message}`;
+      setError(errorMessage);
+      setDebugInfo(null);
+    } finally {
+      // Keep the spinner while a retry is pending; the last attempt (success or failure) clears it.
+      if (!retryScheduled) setLoading(false);
+    }
+  }, [documentId]);
+
+  // Stores the first file chosen in the hidden file input and clears the error; does nothing when no file is present.
+  const handleFileSelect = (event: React.ChangeEvent<HTMLInputElement>) => {
+    const picked = event.target.files?.[0];
+    if (!picked) return;
+    setSelectedFile(picked);
+    setError('');
+  };
+
+  /**
+   * Sends `selectedFile` to POST /documents as multipart form data.
+   * While the request runs, upload progress is mirrored into `uploadProgress`; on success the
+   * returned document id is stored and passed to startProcessingMonitor, on failure the error
+   * message from the response (or a generic one) is shown.
+   */
+  const uploadDocument = useCallback(async () => {
+    if (!selectedFile) {
+      setError('Please select a file to upload');
+      return;
+    }
+
+    setError('');
+    setProcessingStatus('Uploading file...');
+    setUploadProgress(0);
+    setUploading(true);
+
+    try {
+      const payload = new FormData();
+      payload.append('file', selectedFile);
+
+      const { data: created } = await api.post('/documents', payload, {
+        headers: { 'Content-Type': 'multipart/form-data' },
+        onUploadProgress: ({ loaded, total }) => {
+          // A falsy `total` (missing or zero) is reported as 0%.
+          setUploadProgress(total ? Math.round((loaded * 100) / total) : 0);
+        },
+      });
+
+      setUploadedDocumentId(created.id);
+      setDocumentId(created.id);
+      setProcessingStatus('Document uploaded successfully. Starting OCR processing...');
+      startProcessingMonitor(created.id); // poll the OCR status of the new document
+    } catch (err: any) {
+      const fallback = 'Failed to upload document';
+      setError(err.response?.data?.message || fallback);
+      setProcessingStatus('Upload failed');
+    } finally {
+      setUploading(false);
+      setUploadProgress(0);
+    }
+  }, [selectedFile]);
+
+  // Timer handles are kept in refs: uploadDocument memoises an older startProcessingMonitor, so closure state can be stale.
+  const pollTimerRef = React.useRef<ReturnType<typeof setInterval> | null>(null);
+  const watchdogTimerRef = React.useRef<ReturnType<typeof setTimeout> | null>(null);
+  // Cancels the poll loop and its 5-minute watchdog without touching React state.
+  const clearMonitorTimers = useCallback(() => {
+    if (pollTimerRef.current) clearInterval(pollTimerRef.current);
+    if (watchdogTimerRef.current) clearTimeout(watchdogTimerRef.current);
+    pollTimerRef.current = null;
+    watchdogTimerRef.current = null;
+  }, []);
+
+  /**
+   * Polls GET /documents/{docId} every 2 seconds and reflects `ocr_status` in `processingStatus`.
+   * Polling ends when the status is 'completed' or 'failed' (the debug report is then fetched
+   * 2 seconds later) or when the 5-minute watchdog fires.
+   */
+  const startProcessingMonitor = useCallback((docId: string) => {
+    clearMonitorTimers(); // Replace any monitor that is still running
+    const interval = setInterval(async () => {
+      try {
+        const response = await api.get(`/documents/${docId}`);
+        if (pollTimerRef.current !== interval) return; // stopped or replaced while the request was in flight
+        const doc = response.data;
+        if (doc.ocr_status === 'completed' || doc.ocr_status === 'failed') {
+          setProcessingStatus(`Processing ${doc.ocr_status}!`);
+          // Cancel the watchdog too, otherwise it would overwrite this status five minutes later.
+          clearMonitorTimers();
+          setMonitoringInterval(null);
+          setTimeout(() => fetchDebugInfo(docId), 2000); // Give it a bit more time to ensure document is saved
+        } else if (doc.ocr_status === 'processing') {
+          setProcessingStatus('OCR processing in progress...');
+        } else if (doc.ocr_status === 'pending') {
+          setProcessingStatus('Document queued for OCR processing...');
+        } else {
+          setProcessingStatus('Checking processing status...');
+        }
+      } catch (err) {
+        console.error('Error monitoring processing:', err);
+      }
+    }, 2000); // Check every 2 seconds
+    pollTimerRef.current = interval;
+    setMonitoringInterval(interval);
+    watchdogTimerRef.current = setTimeout(() => {
+      clearMonitorTimers();
+      setMonitoringInterval(null);
+      setProcessingStatus('Monitoring stopped (timeout)');
+    }, 300000);
+  }, [clearMonitorTimers, fetchDebugInfo]);
+
+  // Cleanup timers on unmount
+  useEffect(() => clearMonitorTimers, [clearMonitorTimers]);
+
+  const renderStepDetails = (step: DebugStep) => {
+    // Detail panel for one pipeline step: step.step (1-4) picks the layout; any step error is shown on top.
+    const details = step.details;
+    return (
+      <Box sx={{ mt: 2 }}>
+        {step.error && (
+          <Alert severity="error" sx={{ mb: 2 }}>
+            {step.error}
+          </Alert>
+        )}
+
+        {step.step === 1 && ( // File Upload & Ingestion
+          <Box>
+            <Grid container spacing={2}>
+              <Grid item xs={12} md={6}>
+                <Paper sx={{ p: 2 }}>
+                  <Typography variant="h6" gutterBottom>File Information</Typography>
+                  <Typography><strong>Filename:</strong> {details.filename}</Typography>
+                  <Typography><strong>Original:</strong> {details.original_filename}</Typography>
+                  <Typography><strong>Size:</strong> {(details.file_size / 1024 / 1024).toFixed(2)} MB</Typography>
+                  <Typography><strong>MIME Type:</strong> {details.mime_type}</Typography>
+                  <Typography><strong>File Exists:</strong> <Chip 
+                    label={details.file_exists ? 'Yes' : 'No'} 
+                    color={details.file_exists ? 'success' : 'error'} 
+                    size="small" 
+                  /></Typography>
+                </Paper>
+              </Grid>
+              <Grid item xs={12} md={6}>
+                <Paper sx={{ p: 2 }}>
+                  <Typography variant="h6" gutterBottom>File Metadata</Typography>
+                  {details.file_metadata ? (
+                    <>
+                      <Typography><strong>Actual Size:</strong> {(details.file_metadata.size / 1024 / 1024).toFixed(2)} MB</Typography>
+                      <Typography><strong>Is File:</strong> {details.file_metadata.is_file ? 'Yes' : 'No'}</Typography>
+                      <Typography><strong>Modified:</strong> {details.file_metadata.modified ? new Date(details.file_metadata.modified.secs_since_epoch * 1000).toLocaleString() : 'Unknown'}</Typography>
+                    </>
+                  ) : (
+                    <Typography color="text.secondary">File metadata not available</Typography>
+                  )}
+                  <Typography><strong>Created:</strong> {new Date(details.created_at).toLocaleString()}</Typography>
+                </Paper>
+              </Grid>
+            </Grid>
+
+            {details.file_analysis && (
+              <Box sx={{ mt: 2 }}>
+                <Typography variant="h6" gutterBottom>Detailed File Analysis</Typography>
+                <Grid container spacing={2}>
+                  <Grid item xs={12} md={6}>
+                    <Paper sx={{ p: 2 }}>
+                      <Typography variant="subtitle1" gutterBottom>Basic Analysis</Typography>
+                      <Typography><strong>File Type:</strong> {details.file_analysis.file_type}</Typography>
+                      <Typography><strong>Size:</strong> {(details.file_analysis.file_size_bytes / 1024 / 1024).toFixed(2)} MB</Typography>
+                      <Typography><strong>Readable:</strong> <Chip 
+                        label={details.file_analysis.is_readable ? 'Yes' : 'No'} 
+                        color={details.file_analysis.is_readable ? 'success' : 'error'} 
+                        size="small" 
+                      /></Typography>
+                      {details.file_analysis.error_details && (
+                        <Alert severity="error" sx={{ mt: 1 }}>
+                          <strong>File Error:</strong> {details.file_analysis.error_details}
+                        </Alert>
+                      )}
+                    </Paper>
+                  </Grid>
+                  <Grid item xs={12} md={6}>
+                    {details.file_analysis.pdf_info ? (
+                      <Paper sx={{ p: 2 }}>
+                        <Typography variant="subtitle1" gutterBottom>PDF Analysis</Typography>
+                        <Typography><strong>Valid PDF:</strong> <Chip 
+                          label={details.file_analysis.pdf_info.is_valid_pdf ? 'Yes' : 'No'} 
+                          color={details.file_analysis.pdf_info.is_valid_pdf ? 'success' : 'error'} 
+                          size="small" 
+                        /></Typography>
+                        <Typography><strong>PDF Version:</strong> {details.file_analysis.pdf_info.pdf_version || 'Unknown'}</Typography>
+                        <Typography><strong>Pages:</strong> {details.file_analysis.pdf_info.page_count || 'Unknown'}</Typography>
+                        <Typography><strong>Has Text:</strong> <Chip 
+                          label={details.file_analysis.pdf_info.has_text_content ? 'Yes' : 'No'} 
+                          color={details.file_analysis.pdf_info.has_text_content ? 'success' : 'warning'} 
+                          size="small" 
+                        /></Typography>
+                        <Typography><strong>Has Images:</strong> <Chip 
+                          label={details.file_analysis.pdf_info.has_images ? 'Yes' : 'No'} 
+                          color={details.file_analysis.pdf_info.has_images ? 'info' : 'default'} 
+                          size="small" 
+                        /></Typography>
+                        <Typography><strong>Encrypted:</strong> <Chip 
+                          label={details.file_analysis.pdf_info.is_encrypted ? 'Yes' : 'No'} 
+                          color={details.file_analysis.pdf_info.is_encrypted ? 'error' : 'success'} 
+                          size="small" 
+                        /></Typography>
+                        <Typography><strong>Font Count:</strong> {details.file_analysis.pdf_info.font_count}</Typography>
+                        <Typography><strong>Text Length:</strong> {details.file_analysis.pdf_info.estimated_text_length} chars</Typography>
+                        {details.file_analysis.pdf_info.text_extraction_error && (
+                          <Alert severity="error" sx={{ mt: 1 }}>
+                            <strong>PDF Text Extraction Error:</strong> {details.file_analysis.pdf_info.text_extraction_error}
+                          </Alert>
+                        )}
+                      </Paper>
+                    ) : details.file_analysis.text_preview ? (
+                      <Paper sx={{ p: 2 }}>
+                        <Typography variant="subtitle1" gutterBottom>Text Preview</Typography>
+                        <Typography variant="body2" sx={{ 
+                          backgroundColor: 'grey.100', 
+                          p: 1, 
+                          borderRadius: 1,
+                          fontFamily: 'monospace',
+                          fontSize: '0.85em'
+                        }}>
+                          {details.file_analysis.text_preview}
+                        </Typography>
+                      </Paper>
+                    ) : (
+                      <Paper sx={{ p: 2 }}>
+                        <Typography variant="subtitle1" gutterBottom>File Content</Typography>
+                        <Typography color="text.secondary">No preview available for this file type</Typography>
+                      </Paper>
+                    )}
+                  </Grid>
+                </Grid>
+              </Box>
+            )}
+          </Box>
+        )}
+
+        {step.step === 2 && ( // OCR Queue Enrollment
+          <Box>
+            <Grid container spacing={2}>
+              <Grid item xs={12} md={6}>
+                <Paper sx={{ p: 2 }}>
+                  <Typography variant="h6" gutterBottom>Queue Status</Typography>
+                  <Typography><strong>User OCR Enabled:</strong> <Chip 
+                    label={details.user_ocr_enabled ? 'Yes' : 'No'} 
+                    color={details.user_ocr_enabled ? 'success' : 'warning'} 
+                    size="small" 
+                  /></Typography>
+                  <Typography sx={{ mt: 1 }}><strong>Queue Entries:</strong> {details.queue_entries_count}</Typography>
+                </Paper>
+              </Grid>
+            </Grid>
+
+            {details.queue_history && details.queue_history.length > 0 && (
+              <Box sx={{ mt: 2 }}>
+                <Typography variant="h6" gutterBottom>Queue History</Typography>
+                <TableContainer component={Paper}>
+                  <Table size="small">
+                    <TableHead>
+                      <TableRow>
+                        <TableCell>Status</TableCell>
+                        <TableCell>Priority</TableCell>
+                        <TableCell>Created</TableCell>
+                        <TableCell>Started</TableCell>
+                        <TableCell>Completed</TableCell>
+                        <TableCell>Attempts</TableCell>
+                        <TableCell>Worker</TableCell>
+                      </TableRow>
+                    </TableHead>
+                    <TableBody>
+                      {details.queue_history.map((entry: any, index: number) => (
+                        <TableRow key={index}>
+                          <TableCell>
+                            <Chip 
+                              label={entry.status} 
+                              color={entry.status === 'completed' ? 'success' : entry.status === 'failed' ? 'error' : 'default'} 
+                              size="small" 
+                            />
+                          </TableCell>
+                          <TableCell>{entry.priority}</TableCell>
+                          <TableCell>{new Date(entry.created_at).toLocaleString()}</TableCell>
+                          <TableCell>{entry.started_at ? new Date(entry.started_at).toLocaleString() : '-'}</TableCell>
+                          <TableCell>{entry.completed_at ? new Date(entry.completed_at).toLocaleString() : '-'}</TableCell>
+                          <TableCell>{entry.attempts}</TableCell>
+                          <TableCell>{entry.worker_id || '-'}</TableCell>
+                        </TableRow>
+                      ))}
+                    </TableBody>
+                  </Table>
+                </TableContainer>
+              </Box>
+            )}
+          </Box>
+        )}
+
+        {step.step === 3 && ( // OCR Processing
+          <Grid container spacing={2}>
+            <Grid item xs={12} md={6}>
+              <Paper sx={{ p: 2 }}>
+                <Typography variant="h6" gutterBottom>OCR Results</Typography>
+                <Typography><strong>Text Length:</strong> {details.ocr_text_length} characters</Typography>
+                <Typography><strong>Confidence:</strong> {details.ocr_confidence != null ? `${details.ocr_confidence.toFixed(1)}%` : 'N/A' /* 0 is a real reading, only null/undefined means missing */}</Typography>
+                <Typography><strong>Word Count:</strong> {details.ocr_word_count || 0}</Typography>
+                <Typography><strong>Processing Time:</strong> {details.ocr_processing_time_ms ? `${details.ocr_processing_time_ms}ms` : 'N/A'}</Typography>
+                <Typography><strong>Completed:</strong> {details.ocr_completed_at ? new Date(details.ocr_completed_at).toLocaleString() : 'Not completed'}</Typography>
+              </Paper>
+            </Grid>
+            <Grid item xs={12} md={6}>
+              <Paper sx={{ p: 2 }}>
+                <Typography variant="h6" gutterBottom>Processing Details</Typography>
+                <Typography><strong>Has Processed Image:</strong> <Chip 
+                  label={details.has_processed_image ? 'Yes' : 'No'} 
+                  color={details.has_processed_image ? 'success' : 'default'} 
+                  size="small" 
+                /></Typography>
+                {details.processed_image_info && (
+                  <>
+                    <Typography sx={{ mt: 1 }}><strong>Image Size:</strong> {details.processed_image_info.image_width}x{details.processed_image_info.image_height}</Typography>
+                    <Typography><strong>File Size:</strong> {(details.processed_image_info.file_size / 1024).toFixed(1)} KB</Typography>
+                    <Typography><strong>Processing Steps:</strong> {details.processed_image_info.processing_steps?.join(', ') || 'None'}</Typography>
+                    {details.processed_image_info.processing_parameters && (
+                      <Typography><strong>Processing Parameters:</strong> {JSON.stringify(details.processed_image_info.processing_parameters)}</Typography>
+                    )}
+                  </>
+                )}
+              </Paper>
+            </Grid>
+          </Grid>
+        )}
+
+        {step.step === 4 && ( // Quality Validation (payload is untyped, so nested objects are read defensively)
+          <Box>
+            <Grid container spacing={2}>
+              <Grid item xs={12} md={6}>
+                <Paper sx={{ p: 2 }}>
+                  <Typography variant="h6" gutterBottom>Quality Thresholds</Typography>
+                  <Typography><strong>Min Confidence:</strong> {details.quality_thresholds?.min_confidence}%</Typography>
+                  <Typography><strong>Brightness:</strong> {details.quality_thresholds?.brightness_threshold}</Typography>
+                  <Typography><strong>Contrast:</strong> {details.quality_thresholds?.contrast_threshold}</Typography>
+                  <Typography><strong>Noise:</strong> {details.quality_thresholds?.noise_threshold}</Typography>
+                  <Typography><strong>Sharpness:</strong> {details.quality_thresholds?.sharpness_threshold}</Typography>
+                </Paper>
+              </Grid>
+              <Grid item xs={12} md={6}>
+                <Paper sx={{ p: 2 }}>
+                  <Typography variant="h6" gutterBottom>Actual Values</Typography>
+                  <Typography><strong>Confidence:</strong> {details.actual_values?.confidence != null ? `${details.actual_values.confidence.toFixed(1)}%` : 'N/A'}</Typography>
+                  <Typography><strong>Word Count:</strong> {details.actual_values?.word_count || 0}</Typography>
+                  <Typography><strong>Processed Image Available:</strong> <Chip 
+                    label={details.actual_values?.processed_image_available ? 'Yes' : 'No'} 
+                    color={details.actual_values?.processed_image_available ? 'success' : 'default'} 
+                    size="small" 
+                  /></Typography>
+                  {details.actual_values?.processing_parameters && (
+                    <Typography><strong>Processing Parameters:</strong> {JSON.stringify(details.actual_values.processing_parameters)}</Typography>
+                  )}
+                </Paper>
+              </Grid>
+            </Grid>
+
+            <Box sx={{ mt: 2 }}>
+              <Typography variant="h6" gutterBottom>Quality Checks</Typography>
+              <Grid container spacing={1}>
+                {Object.entries(details.quality_checks || {}).map(([check, passed]: [string, any]) => (
+                  <Grid item key={check}>
+                    <Chip 
+                      label={check.replace('_check', '').replace(/_/g, ' ') /* every underscore, not only the first */}
+                      color={passed === true ? 'success' : passed === false ? 'error' : 'default'}
+                      size="small"
+                      icon={passed === true ? <CheckCircleIcon /> : passed === false ? <ErrorIcon /> : <WarningIcon />}
+                    />
+                  </Grid>
+                ))}
+              </Grid>
+            </Box>
+          </Box>
+        )}
+      </Box>
+    );
+  };
+
+  // Object URL backing the image preview. It is created once per selected file and revoked when
+  // the file changes or the page unmounts, so blob URLs are not allocated on every render.
+  const [previewUrl, setPreviewUrl] = useState<string | null>(null);
+  useEffect(() => {
+    if (!selectedFile || !selectedFile.type.startsWith('image/')) {
+      setPreviewUrl(null);
+      return;
+    }
+    const objectUrl = URL.createObjectURL(selectedFile);
+    setPreviewUrl(objectUrl);
+    return () => URL.revokeObjectURL(objectUrl);
+  }, [selectedFile]);
+
+  // "Upload & Debug" tab: file picker, upload progress, OCR monitoring status, follow-up actions and image preview.
+  const renderUploadTab = () => (
+    <Box>
+      <Card sx={{ mb: 4 }}>
+        <CardContent>
+          <Typography variant="h6" gutterBottom>
+            Upload Document for Debug Analysis
+          </Typography>
+          <Typography variant="body2" color="text.secondary" sx={{ mb: 3 }}>
+            Upload a PDF or image file to analyze the processing pipeline in real-time.
+          </Typography>
+
+          <Box sx={{ mb: 3 }}>
+            <input
+              accept=".pdf,.png,.jpg,.jpeg,.tiff,.bmp,.txt"
+              style={{ display: 'none' }}
+              id="debug-file-upload"
+              type="file"
+              onChange={handleFileSelect}
+            />
+            <label htmlFor="debug-file-upload">
+              <Button
+                variant="outlined"
+                component="span"
+                startIcon={<UploadIcon />}
+                disabled={uploading}
+                sx={{ mr: 2 }}
+              >
+                Select File
+              </Button>
+            </label>
+
+            {selectedFile && (
+              <Box sx={{ mt: 2 }}>
+                <Typography variant="body2"><strong>Selected:</strong> {selectedFile.name} ({(selectedFile.size / 1024 / 1024).toFixed(2)} MB)</Typography>
+              </Box>
+            )}
+
+            {selectedFile && (
+              <Button
+                variant="contained"
+                onClick={uploadDocument}
+                disabled={uploading}
+                startIcon={uploading ? <CircularProgress size={20} /> : <UploadIcon />}
+                sx={{ mt: 2 }}
+              >
+                {uploading ? 'Uploading...' : 'Upload & Debug'}
+              </Button>
+            )}
+          </Box>
+
+          {uploading && uploadProgress > 0 && (
+            <Box sx={{ mb: 2 }}>
+              <Typography variant="body2" gutterBottom>Upload Progress: {uploadProgress}%</Typography>
+              <LinearProgress variant="determinate" value={uploadProgress} />
+            </Box>
+          )}
+
+          {processingStatus && (
+            <Alert 
+              severity={processingStatus.includes('failed') ? 'error' : 
+                       processingStatus.includes('completed') ? 'success' : 'info'}
+              sx={{ mb: 2 }}
+            >
+              {processingStatus}
+              {monitoringInterval && (
+                <Box sx={{ mt: 1 }}><LinearProgress /></Box>
+              )}
+            </Alert>
+          )}
+
+          {uploadedDocumentId && (
+            <Box sx={{ mt: 2 }}>
+              <Typography variant="body2"><strong>Document ID:</strong> {uploadedDocumentId}</Typography>
+              <Box sx={{ mt: 2 }}>
+                <Button
+                  variant="contained"
+                  size="small"
+                  onClick={() => {
+                    fetchDebugInfo(uploadedDocumentId);
+                    setActiveTab(2); // Switch to debug results tab
+                  }}
+                  startIcon={<BugReportIcon />}
+                  sx={{ mr: 1 }}
+                  color={processingStatus.includes('failed') ? 'error' : 'primary'}
+                >
+                  {processingStatus.includes('failed') ? 'Show Debug Details' : 'Debug Analysis'}
+                </Button>
+                <Button
+                  variant="outlined"
+                  size="small"
+                  onClick={() => fetchDebugInfo(uploadedDocumentId)}
+                  startIcon={<RefreshIcon />}
+                  sx={{ mr: 1 }}
+                >
+                  Refresh Status
+                </Button>
+                {/* noopener: the uploaded document opened in the new tab must not get a window.opener handle to this page */}
+                <Button
+                  variant="outlined"
+                  size="small"
+                  onClick={() => window.open(`/api/documents/${uploadedDocumentId}/view`, '_blank', 'noopener')}
+                  startIcon={<PreviewIcon />}
+                >
+                  View Document
+                </Button>
+              </Box>
+            </Box>
+          )}
+
+          {previewUrl && (
+            <Box sx={{ mt: 3 }}>
+              <Typography variant="h6" gutterBottom>Preview</Typography>
+              <Box 
+                component="img"
+                src={previewUrl}
+                alt="Document preview"
+                sx={{ maxWidth: '100%', maxHeight: '400px', objectFit: 'contain', border: '1px solid', borderColor: 'divider', borderRadius: 1 }}
+              />
+            </Box>
+          )}
+        </CardContent>
+      </Card>
+    </Box>
+  );
+
+  // "Search Existing" tab: a document-id field and a Debug button that loads the report for that id.
+  const renderSearchTab = () => {
+    const cannotSearch = loading || !documentId.trim();
+    const buttonIcon = loading ? <CircularProgress size={20} /> : <SearchIcon />;
+    const lookupError = error ? <Alert severity="error" sx={{ mt: 2 }}>{error}</Alert> : null;
+    return (
+      <Box>
+        <Card sx={{ mb: 4 }}>
+          <CardContent>
+            <Typography variant="h6" gutterBottom>Debug Existing Document</Typography>
+            <Typography variant="body2" color="text.secondary" sx={{ mb: 3 }}>
+              Enter a document ID to analyze the processing pipeline for an existing document.
+            </Typography>
+
+            <Box sx={{ display: 'flex', gap: 2, alignItems: 'center' }}>
+              <TextField
+                label="Document ID"
+                value={documentId}
+                onChange={(changeEvent) => setDocumentId(changeEvent.target.value)}
+                placeholder="e.g., 123e4567-e89b-12d3-a456-426614174000"
+                fullWidth
+                size="small"
+              />
+              <Button
+                variant="contained"
+                onClick={() => fetchDebugInfo()}
+                disabled={cannotSearch}
+                startIcon={buttonIcon}
+              >
+                Debug
+              </Button>
+            </Box>
+
+            {lookupError}
+          </CardContent>
+        </Card>
+      </Box>
+    );
+  };
+
+  return ( // Page shell: heading, tab card, shared error banner, then the results view
+    <Container maxWidth="xl">
+      <Box sx={{ mb: 4 }}>
+        <Typography variant="h4" component="h1" gutterBottom>
+          <BugReportIcon sx={{ mr: 1, verticalAlign: 'middle' }} />
+          Document Processing Debug
+        </Typography>
+        <Typography variant="body1" color="text.secondary">
+          Upload documents or analyze existing ones to troubleshoot OCR processing issues.
+        </Typography>
+      </Box>
+      {/* Tab card: two input tabs; the "Debug Results" tab is only offered once debugInfo exists */}
+      <Card sx={{ mb: 4 }}>
+        <Box sx={{ borderBottom: 1, borderColor: 'divider' }}>
+          <Tabs value={activeTab} onChange={(_, newValue) => setActiveTab(newValue)}>
+            <Tab
+              label="Upload & Debug"
+              icon={<UploadIcon />}
+              iconPosition="start"
+            />
+            <Tab
+              label="Search Existing"
+              icon={<SearchIcon />}
+              iconPosition="start"
+            />
+            {debugInfo && (
+              <Tab
+                label="Debug Results"
+                icon={<PreviewIcon />}
+                iconPosition="start"
+              />
+            )}
+          </Tabs>
+        </Box>
+
+        <CardContent>
+          {activeTab === 0 && renderUploadTab()}
+          {activeTab === 1 && renderSearchTab()}
+        </CardContent>
+      </Card>
+      {/* Shared error banner: not tied to a tab index, so it is shown on every tab */}
+      {error && (
+        <Alert severity="error" sx={{ mb: 4 }}>
+          <Typography variant="h6">Debug Error</Typography>
+          {error}
+        </Alert>
+      )}
+      {/* Results view: rendered below the tab card, only while tab index 2 is selected */}
+      {debugInfo && activeTab === 2 && (
+        <Box>
+          <Card sx={{ mb: 4 }}>
+            <CardContent>
+              <Typography variant="h6" gutterBottom>
+                Document: {debugInfo.filename}
+              </Typography>
+              <Box sx={{ display: 'flex', gap: 2, alignItems: 'center', mb: 2 }}>
+                <Chip
+                  label={`Status: ${debugInfo.overall_status}`}
+                  color={getStatusColor(debugInfo.overall_status, debugInfo.overall_status === 'success')}
+                />
+                <Typography variant="body2" color="text.secondary">
+                  Debug run at: {new Date(debugInfo.debug_timestamp).toLocaleString()}
+                </Typography>
+              </Box>
+            </CardContent>
+          </Card>
+          {/* Pipeline as a vertical stepper; every Step is marked active so its StepContent is shown */}
+          <Card sx={{ mb: 4 }}>
+            <CardContent>
+              <Typography variant="h6" gutterBottom>
+                Processing Pipeline
+              </Typography>
+              <Stepper orientation="vertical">
+                {debugInfo.pipeline_steps.map((step) => (
+                  <Step key={step.step} active={true}>
+                    <StepLabel
+                      icon={getStepIcon(step.status, step.success)}
+                      StepIconProps={{
+                        style: { color: step.success ? '#4caf50' : step.status === 'failed' ? '#f44336' : '#ff9800' }
+                      }}
+                    >
+                      <Box sx={{ display: 'flex', alignItems: 'center', gap: 1 }}>
+                        <Typography variant="subtitle1">{step.name}</Typography>
+                        <Chip
+                          label={step.status}
+                          size="small"
+                          color={getStatusColor(step.status, step.success)}
+                        />
+                      </Box>
+                    </StepLabel>
+                    <StepContent>
+                      {renderStepDetails(step)}
+                    </StepContent>
+                  </Step>
+                ))}
+              </Stepper>
+            </CardContent>
+          </Card>
+          {/* Failure record, when the response carries one; a null OCR confidence is shown as N/A */}
+          {debugInfo.failed_document_info && (
+            <Card sx={{ mb: 4 }}>
+              <CardContent>
+                <Typography variant="h6" gutterBottom color="error">
+                  Failed Document Information
+                </Typography>
+                <Grid container spacing={2}>
+                  <Grid item xs={12} md={6}>
+                    <Paper sx={{ p: 2 }}>
+                      <Typography variant="subtitle1" gutterBottom>Failure Details</Typography>
+                      <Typography><strong>Failure Reason:</strong> {debugInfo.failed_document_info.failure_reason}</Typography>
+                      <Typography><strong>Failure Stage:</strong> {debugInfo.failed_document_info.failure_stage}</Typography>
+                      <Typography><strong>Retry Count:</strong> {debugInfo.failed_document_info.retry_count || 0}</Typography>
+                      <Typography><strong>Created:</strong> {new Date(debugInfo.failed_document_info.created_at).toLocaleString()}</Typography>
+                      {debugInfo.failed_document_info.last_retry_at && (
+                        <Typography><strong>Last Retry:</strong> {new Date(debugInfo.failed_document_info.last_retry_at).toLocaleString()}</Typography>
+                      )}
+                    </Paper>
+                  </Grid>
+                  <Grid item xs={12} md={6}>
+                    <Paper sx={{ p: 2 }}>
+                      <Typography variant="subtitle1" gutterBottom>Failed OCR Results</Typography>
+                      {debugInfo.failed_document_info.failed_ocr_text ? (
+                        <>
+                          <Typography><strong>OCR Text Length:</strong> {debugInfo.failed_document_info.failed_ocr_text.length} chars</Typography>
+                          <Typography><strong>OCR Confidence:</strong> {debugInfo.failed_document_info.failed_ocr_confidence != null ? `${debugInfo.failed_document_info.failed_ocr_confidence.toFixed(1)}%` : 'N/A'}</Typography>
+                          <Typography><strong>Word Count:</strong> {debugInfo.failed_document_info.failed_ocr_word_count || 0}</Typography>
+                          <Typography><strong>Processing Time:</strong> {debugInfo.failed_document_info.failed_ocr_processing_time_ms || 0}ms</Typography>
+                        </>
+                      ) : (
+                        <Typography color="text.secondary">No OCR results available</Typography>
+                      )}
+                    </Paper>
+                  </Grid>
+                  {debugInfo.failed_document_info.error_message && (
+                    <Grid item xs={12}>
+                      <Alert severity="error">
+                        <strong>Error Message:</strong> {debugInfo.failed_document_info.error_message}
+                      </Alert>
+                    </Grid>
+                  )}
+                  {debugInfo.failed_document_info.content_preview && (
+                    <Grid item xs={12}>
+                      <Paper sx={{ p: 2 }}>
+                        <Typography variant="subtitle1" gutterBottom>Content Preview</Typography>
+                        <Typography variant="body2" sx={{
+                          backgroundColor: 'grey.100',
+                          p: 1,
+                          borderRadius: 1,
+                          fontFamily: 'monospace',
+                          fontSize: '0.85em'
+                        }}>
+                          {debugInfo.failed_document_info.content_preview}
+                        </Typography>
+                      </Paper>
+                    </Grid>
+                  )}
+                </Grid>
+              </CardContent>
+            </Card>
+          )}
+          {/* One table row per OCR attempt; missing timings render as '-', a genuine 0 ms is still shown */}
+          {debugInfo.detailed_processing_logs && debugInfo.detailed_processing_logs.length > 0 && (
+            <Card sx={{ mb: 4 }}>
+              <CardContent>
+                <Typography variant="h6" gutterBottom>
+                  Detailed Processing Logs
+                </Typography>
+                <Typography variant="body2" color="text.secondary" sx={{ mb: 2 }}>
+                  Complete history of all OCR processing attempts for this document.
+                </Typography>
+                <TableContainer component={Paper}>
+                  <Table size="small">
+                    <TableHead>
+                      <TableRow>
+                        <TableCell>Attempt</TableCell>
+                        <TableCell>Status</TableCell>
+                        <TableCell>Priority</TableCell>
+                        <TableCell>Created</TableCell>
+                        <TableCell>Started</TableCell>
+                        <TableCell>Completed</TableCell>
+                        <TableCell>Duration</TableCell>
+                        <TableCell>Wait Time</TableCell>
+                        <TableCell>Attempts</TableCell>
+                        <TableCell>Worker</TableCell>
+                        <TableCell>Error</TableCell>
+                      </TableRow>
+                    </TableHead>
+                    <TableBody>
+                      {debugInfo.detailed_processing_logs.map((log: any, index: number) => (
+                        <TableRow key={log.id}>
+                          <TableCell>{index + 1}</TableCell>
+                          <TableCell>
+                            <Chip
+                              label={log.status}
+                              color={log.status === 'completed' ? 'success' : log.status === 'failed' ? 'error' : 'default'}
+                              size="small"
+                            />
+                          </TableCell>
+                          <TableCell>{log.priority}</TableCell>
+                          <TableCell>{new Date(log.created_at).toLocaleString()}</TableCell>
+                          <TableCell>{log.started_at ? new Date(log.started_at).toLocaleString() : '-'}</TableCell>
+                          <TableCell>{log.completed_at ? new Date(log.completed_at).toLocaleString() : '-'}</TableCell>
+                          <TableCell>{log.processing_duration_ms != null ? `${log.processing_duration_ms}ms` : '-'}</TableCell>
+                          <TableCell>{log.queue_wait_time_ms != null ? `${log.queue_wait_time_ms}ms` : '-'}</TableCell>
+                          <TableCell>{log.attempts ?? 0}</TableCell>
+                          <TableCell>{log.worker_id || '-'}</TableCell>
+                          <TableCell>
+                            {log.error_message ? (
+                              <Alert severity="error" sx={{ minWidth: '200px' }}>
+                                {log.error_message}
+                              </Alert>
+                            ) : '-'}
+                          </TableCell>
+                        </TableRow>
+                      ))}
+                    </TableBody>
+                  </Table>
+                </TableContainer>
+              </CardContent>
+            </Card>
+          )}
+          {/* File-level analysis: type, size and readability, plus PDF properties when pdf_info is present */}
+          {debugInfo.file_analysis && (
+            <Card sx={{ mb: 4 }}>
+              <CardContent>
+                <Typography variant="h6" gutterBottom>
+                  File Analysis Summary
+                </Typography>
+                <Grid container spacing={2}>
+                  <Grid item xs={12} md={6}>
+                    <Paper sx={{ p: 2 }}>
+                      <Typography variant="subtitle1" gutterBottom>File Properties</Typography>
+                      <Typography><strong>File Type:</strong> {debugInfo.file_analysis.file_type}</Typography>
+                      <Typography><strong>Size:</strong> {(debugInfo.file_analysis.file_size_bytes / 1024 / 1024).toFixed(2)} MB</Typography>
+                      <Typography><strong>Readable:</strong> <Chip
+                        label={debugInfo.file_analysis.is_readable ? 'Yes' : 'No'}
+                        color={debugInfo.file_analysis.is_readable ? 'success' : 'error'}
+                        size="small"
+                      /></Typography>
+                    </Paper>
+                  </Grid>
+                  <Grid item xs={12} md={6}>
+                    {debugInfo.file_analysis.pdf_info && (
+                      <Paper sx={{ p: 2 }}>
+                        <Typography variant="subtitle1" gutterBottom>PDF Properties</Typography>
+                        <Typography><strong>Valid PDF:</strong> <Chip
+                          label={debugInfo.file_analysis.pdf_info.is_valid_pdf ? 'Yes' : 'No'}
+                          color={debugInfo.file_analysis.pdf_info.is_valid_pdf ? 'success' : 'error'}
+                          size="small"
+                        /></Typography>
+                        <Typography><strong>Has Text Content:</strong> <Chip
+                          label={debugInfo.file_analysis.pdf_info.has_text_content ? 'Yes' : 'No'}
+                          color={debugInfo.file_analysis.pdf_info.has_text_content ? 'success' : 'warning'}
+                          size="small"
+                        /></Typography>
+                        <Typography><strong>Text Length:</strong> {debugInfo.file_analysis.pdf_info.estimated_text_length} chars</Typography>
+                        <Typography><strong>Page Count:</strong> {debugInfo.file_analysis.pdf_info.page_count || 'Unknown'}</Typography>
+                        <Typography><strong>Encrypted:</strong> <Chip
+                          label={debugInfo.file_analysis.pdf_info.is_encrypted ? 'Yes' : 'No'}
+                          color={debugInfo.file_analysis.pdf_info.is_encrypted ? 'error' : 'success'}
+                          size="small"
+                        /></Typography>
+                      </Paper>
+                    )}
+                  </Grid>
+                  {debugInfo.file_analysis.pdf_info?.text_extraction_error && (
+                    <Grid item xs={12}>
+                      <Alert severity="error">
+                        <strong>PDF Text Extraction Issue:</strong> {debugInfo.file_analysis.pdf_info.text_extraction_error}
+                      </Alert>
+                    </Grid>
+                  )}
+                </Grid>
+              </CardContent>
+            </Card>
+          )}
+          {/* Original document next to the OCR input image; shown only when step 3 reports has_processed_image */}
+          {debugInfo.pipeline_steps.some(step => step.step === 3 && step.details.has_processed_image) && (
+            <Card sx={{ mb: 4 }}>
+              <CardContent>
+                <Typography variant="h6" gutterBottom>
+                  Processed Images
+                </Typography>
+                <Grid container spacing={2}>
+                  <Grid item xs={12} md={6}>
+                    <Paper sx={{ p: 2 }}>
+                      <Typography variant="subtitle1" gutterBottom>Original Document</Typography>
+                      <Box component="iframe"
+                        title="Original document"
+                        src={`/api/documents/${debugInfo.document_id}/view`}
+                        sx={{
+                          width: '100%',
+                          height: '300px',
+                          border: '1px solid',
+                          borderColor: 'divider',
+                          borderRadius: 1
+                        }}
+                      />
+                    </Paper>
+                  </Grid>
+                  <Grid item xs={12} md={6}>
+                    <Paper sx={{ p: 2 }}>
+                      <Typography variant="subtitle1" gutterBottom>Processed Image (OCR Input)</Typography>
+                      <Box
+                        component="img"
+                        src={`/api/documents/${debugInfo.document_id}/processed-image`}
+                        alt="Processed image for OCR"
+                        onError={(e) => { // fallback: hide the broken image and append a plain-text notice to its parent
+                          (e.target as HTMLImageElement).style.display = 'none';
+                          (e.target as HTMLImageElement).parentNode?.appendChild(
+                            document.createTextNode('Processed image not available')
+                          );
+                        }}
+                        sx={{
+                          maxWidth: '100%',
+                          maxHeight: '300px',
+                          objectFit: 'contain',
+                          border: '1px solid',
+                          borderColor: 'divider',
+                          borderRadius: 1
+                        }}
+                      />
+                    </Paper>
+                  </Grid>
+                </Grid>
+              </CardContent>
+            </Card>
+          )}
+          {/* User settings carried in the debug response, tucked into an accordion */}
+          <Card>
+            <CardContent>
+              <Accordion>
+                <AccordionSummary expandIcon={<ExpandMoreIcon />}>
+                  <Typography variant="h6">User Settings</Typography>
+                </AccordionSummary>
+                <AccordionDetails>
+                  <Grid container spacing={2}>
+                    <Grid item xs={12} md={6}>
+                      <Paper sx={{ p: 2 }}>
+                        <Typography variant="subtitle1" gutterBottom>OCR Settings</Typography>
+                        <Typography><strong>Background OCR:</strong> {debugInfo.user_settings.enable_background_ocr ? 'Enabled' : 'Disabled'}</Typography>
+                        <Typography><strong>Min Confidence:</strong> {debugInfo.user_settings.ocr_min_confidence}%</Typography>
+                        <Typography><strong>Max File Size:</strong> {debugInfo.user_settings.max_file_size_mb} MB</Typography>
+                      </Paper>
+                    </Grid>
+                    <Grid item xs={12} md={6}>
+                      <Paper sx={{ p: 2 }}>
+                        <Typography variant="subtitle1" gutterBottom>Quality Thresholds</Typography>
+                        <Typography><strong>Brightness:</strong> {debugInfo.user_settings.quality_thresholds.brightness}</Typography>
+                        <Typography><strong>Contrast:</strong> {debugInfo.user_settings.quality_thresholds.contrast}</Typography>
+                        <Typography><strong>Noise:</strong> {debugInfo.user_settings.quality_thresholds.noise}</Typography>
+                        <Typography><strong>Sharpness:</strong> {debugInfo.user_settings.quality_thresholds.sharpness}</Typography>
+                      </Paper>
+                    </Grid>
+                  </Grid>
+                </AccordionDetails>
+              </Accordion>
+            </CardContent>
+          </Card>
+        </Box>
+      )}
+    </Container>
+  );
+};
+
+export default DebugPage;
\ No newline at end of file
diff --git a/src/routes/documents.rs b/src/routes/documents.rs
index f8c5a43..cec3549 100644
--- a/src/routes/documents.rs
+++ b/src/routes/documents.rs
@@ -58,6 +58,7 @@ pub fn router() -> Router<Arc<AppState>> {
         .route("/{id}/ocr", get(get_document_ocr))
         .route("/{id}/processed-image", get(get_processed_image))
         .route("/{id}/retry-ocr", post(retry_ocr))
+        .route("/{id}/debug", get(get_document_debug_info))
         .route("/duplicates", get(get_user_duplicates))
         .route("/failed", get(get_failed_documents))
         .route("/failed/{id}/view", get(view_failed_document))
@@ -645,6 +646,560 @@ async fn retry_ocr(
     }
 }
 
+#[utoipa::path(
+    get,
+    path = "/api/documents/{id}/debug",
+    tag = "documents",
+    security(
+        ("bearer_auth" = [])
+    ),
+    params(
+        ("id" = uuid::Uuid, Path, description = "Document ID")
+    ),
+    responses(
+        (status = 200, description = "Debug information for document processing pipeline", body = String),
+        (status = 404, description = "Document not found"),
+        (status = 401, description = "Unauthorized")
+    )
+)]
+async fn get_document_debug_info(
+    State(state): State<Arc<AppState>>,
+    auth_user: AuthUser,
+    Path(document_id): Path<uuid::Uuid>,
+) -> Result<Json<serde_json::Value>, StatusCode> {
+    tracing::info!("Starting debug analysis for document {} by user {}", document_id, auth_user.user.id);
+    
+    // Get the document
+    let document = match state
+        .db
+        .get_document_by_id(document_id, auth_user.user.id, auth_user.user.role)
+        .await
+    {
+        Ok(Some(doc)) => {
+            tracing::info!("Found document: {} ({})", doc.filename, doc.mime_type);
+            doc
+        }
+        Ok(None) => {
+            tracing::warn!("Document {} not found for user {}", document_id, auth_user.user.id);
+            return Err(StatusCode::NOT_FOUND);
+        }
+        Err(e) => {
+            tracing::error!("Database error fetching document {}: {}", document_id, e);
+            return Err(StatusCode::INTERNAL_SERVER_ERROR);
+        }
+    };
+
+    // Get user settings
+    tracing::info!("Fetching user settings for user {}", auth_user.user.id);
+    let settings = match state
+        .db
+        .get_user_settings(auth_user.user.id)
+        .await
+    {
+        Ok(Some(s)) => {
+            tracing::info!("Found user settings: OCR enabled={}, min_confidence={}", s.enable_background_ocr, s.ocr_min_confidence);
+            s
+        }
+        Ok(None) => {
+            tracing::info!("No user settings found, using defaults");
+            crate::models::Settings::default()
+        }
+        Err(e) => {
+            tracing::error!("Error fetching user settings: {}", e);
+            return Err(StatusCode::INTERNAL_SERVER_ERROR);
+        }
+    };
+
+    // Get OCR queue history for this document
+    tracing::info!("Fetching OCR queue history for document {}", document_id);
+    let queue_history = match sqlx::query(
+        r#"
+        SELECT id, status, priority, created_at, started_at, completed_at, 
+               error_message, attempts, worker_id
+        FROM ocr_queue 
+        WHERE document_id = $1 
+        ORDER BY created_at DESC
+        LIMIT 10
+        "#
+    )
+    .bind(document_id)
+    .fetch_all(state.db.get_pool())
+    .await {
+        Ok(history) => {
+            tracing::info!("Queue history query successful, found {} entries", history.len());
+            history
+        },
+        Err(e) => {
+            tracing::error!("Queue history query error: {}", e);
+            return Err(StatusCode::INTERNAL_SERVER_ERROR);
+        }
+    };
+
+    // Get processed image info if it exists
+    tracing::info!("Fetching processed image for document {}", document_id);
+    let processed_image = match state
+        .db
+        .get_processed_image_by_document_id(document_id, auth_user.user.id)
+        .await {
+        Ok(Some(img)) => {
+            tracing::info!("Found processed image for document {}", document_id);
+            Some(img)
+        },
+        Ok(None) => {
+            tracing::info!("No processed image found for document {}", document_id);
+            None
+        },
+        Err(e) => {
+            tracing::warn!("Error fetching processed image for document {}: {}", document_id, e);
+            None
+        }
+    };
+
+    // Get failed document record if it exists
+    tracing::info!("Fetching failed document record for document {}", document_id);
+    let failed_document = match sqlx::query(
+        r#"
+        SELECT failure_reason, failure_stage, error_message, retry_count, 
+               last_retry_at, created_at, content, ocr_text, ocr_confidence,
+               ocr_word_count, ocr_processing_time_ms
+        FROM failed_documents 
+        WHERE id = $1 OR existing_document_id = $1
+        ORDER BY created_at DESC
+        LIMIT 1
+        "#
+    )
+    .bind(document_id)
+    .fetch_optional(state.db.get_pool())
+    .await {
+        Ok(result) => {
+            tracing::info!("Failed document query successful, found: {}", result.is_some());
+            result
+        },
+        Err(e) => {
+            tracing::error!("Failed document query error: {}", e);
+            return Err(StatusCode::INTERNAL_SERVER_ERROR);
+        }
+    };
+
+    // Get detailed OCR processing logs and attempts
+    tracing::info!("Fetching detailed OCR processing logs for document {}", document_id);
+    let ocr_processing_logs = match sqlx::query(
+        r#"
+        SELECT id, status, priority, created_at, started_at, completed_at,
+               error_message, attempts, worker_id, processing_time_ms, file_size
+        FROM ocr_queue 
+        WHERE document_id = $1 
+        ORDER BY created_at ASC
+        "#
+    )
+    .bind(document_id)
+    .fetch_all(state.db.get_pool())
+    .await {
+        Ok(logs) => {
+            tracing::info!("OCR processing logs query successful, found {} entries", logs.len());
+            logs
+        },
+        Err(e) => {
+            tracing::error!("OCR processing logs query error: {}", e);
+            return Err(StatusCode::INTERNAL_SERVER_ERROR);
+        }
+    };
+
+    // File service for file info
+    let file_service = FileService::new(state.config.upload_path.clone());
+    
+    // Check if file exists
+    let file_exists = tokio::fs::metadata(&document.file_path).await.is_ok();
+    let file_metadata = if file_exists {
+        tokio::fs::metadata(&document.file_path).await.ok()
+    } else {
+        None
+    };
+
+    // Try to analyze file content for additional diagnostic info
+    tracing::info!("Analyzing file content for document {} (exists: {})", document_id, file_exists);
+    let file_analysis = if file_exists {
+        match analyze_file_content(&document.file_path, &document.mime_type).await {
+            Ok(analysis) => {
+                tracing::info!("File analysis successful for document {}", document_id);
+                analysis
+            },
+            Err(e) => {
+                tracing::warn!("Failed to analyze file content for {}: {}", document_id, e);
+                FileAnalysis {
+                    error_details: Some(format!("File analysis failed: {}", e)),
+                    ..Default::default()
+                }
+            }
+        }
+    } else {
+        tracing::warn!("File does not exist for document {}, skipping analysis", document_id);
+        FileAnalysis::default()
+    };
+
+    // Pipeline steps analysis
+    let mut pipeline_steps = Vec::new();
+
+    // Step 1: File Upload & Ingestion
+    pipeline_steps.push(serde_json::json!({
+        "step": 1,
+        "name": "File Upload & Ingestion",
+        "status": "completed", // Document exists if we got this far
+        "details": {
+            "filename": document.filename,
+            "original_filename": document.original_filename,
+            "file_size": document.file_size,
+            "mime_type": document.mime_type,
+            "file_exists": file_exists,
+            "file_path": document.file_path,
+            "created_at": document.created_at,
+            "file_metadata": file_metadata.as_ref().map(|m| serde_json::json!({
+                "size": m.len(),
+                "modified": m.modified().ok(),
+                "is_file": m.is_file(),
+                "is_dir": m.is_dir()
+            })),
+            "file_analysis": file_analysis
+        },
+        "success": true,
+        "error": None::<String>
+    }));
+
+    // Step 2: OCR Queue Enrollment
+    let queue_enrollment_status = if queue_history.is_empty() {
+        if settings.enable_background_ocr {
+            "not_queued"
+        } else {
+            "ocr_disabled"
+        }
+    } else {
+        "queued"
+    };
+
+    pipeline_steps.push(serde_json::json!({
+        "step": 2,
+        "name": "OCR Queue Enrollment",
+        "status": queue_enrollment_status,
+        "details": {
+            "user_ocr_enabled": settings.enable_background_ocr,
+            "queue_entries_count": queue_history.len(),
+            "queue_history": queue_history.iter().map(|row| serde_json::json!({
+                "id": row.get::<uuid::Uuid, _>("id"),
+                "status": row.get::<String, _>("status"),
+                "priority": row.get::<i32, _>("priority"),
+                "created_at": row.get::<chrono::DateTime<chrono::Utc>, _>("created_at"),
+                "started_at": row.get::<Option<chrono::DateTime<chrono::Utc>>, _>("started_at"),
+                "completed_at": row.get::<Option<chrono::DateTime<chrono::Utc>>, _>("completed_at"),
+                "error_message": row.get::<Option<String>, _>("error_message"),
+                "attempts": row.get::<i32, _>("attempts"),
+                "worker_id": row.get::<Option<String>, _>("worker_id")
+            })).collect::<Vec<_>>()
+        },
+        "success": !queue_history.is_empty() || !settings.enable_background_ocr,
+        "error": if !settings.enable_background_ocr && queue_history.is_empty() {
+            Some("OCR processing is disabled in user settings")
+        } else { None }
+    }));
+
+    // Step 3: OCR Processing
+    let ocr_status = document.ocr_status.as_deref().unwrap_or("not_started");
+    let ocr_success = matches!(ocr_status, "completed");
+    
+    pipeline_steps.push(serde_json::json!({
+        "step": 3,
+        "name": "OCR Text Extraction",
+        "status": ocr_status,
+        "details": {
+            "ocr_text_length": document.ocr_text.as_ref().map(|t| t.len()).unwrap_or(0),
+            "ocr_confidence": document.ocr_confidence,
+            "ocr_word_count": document.ocr_word_count,
+            "ocr_processing_time_ms": document.ocr_processing_time_ms,
+            "ocr_completed_at": document.ocr_completed_at,
+            "ocr_error": document.ocr_error,
+            "has_processed_image": processed_image.is_some(),
+            "processed_image_info": processed_image.as_ref().map(|pi| serde_json::json!({
+                "image_path": pi.processed_image_path,
+                "image_width": pi.image_width,
+                "image_height": pi.image_height,
+                "file_size": pi.file_size,
+                "processing_parameters": pi.processing_parameters,
+                "processing_steps": pi.processing_steps,
+                "created_at": pi.created_at
+            }))
+        },
+        "success": ocr_success,
+        "error": document.ocr_error.clone()
+    }));
+
+    // Step 4: Quality Validation
+    let quality_passed = if let Some(confidence) = document.ocr_confidence {
+        confidence >= settings.ocr_min_confidence && document.ocr_word_count.unwrap_or(0) > 0
+    } else {
+        false
+    };
+
+    pipeline_steps.push(serde_json::json!({
+        "step": 4,
+        "name": "OCR Quality Validation",
+        "status": if ocr_success {
+            if quality_passed { "passed" } else { "failed" }
+        } else {
+            "not_reached"
+        },
+        "details": {
+            "quality_thresholds": {
+                "min_confidence": settings.ocr_min_confidence,
+                "brightness_threshold": settings.ocr_quality_threshold_brightness,
+                "contrast_threshold": settings.ocr_quality_threshold_contrast,
+                "noise_threshold": settings.ocr_quality_threshold_noise,
+                "sharpness_threshold": settings.ocr_quality_threshold_sharpness
+            },
+            "actual_values": {
+                "confidence": document.ocr_confidence,
+                "word_count": document.ocr_word_count,
+                "processed_image_available": processed_image.is_some(),
+                "processing_parameters": processed_image.as_ref().map(|pi| &pi.processing_parameters)
+            },
+            "quality_checks": {
+                "confidence_check": document.ocr_confidence.map(|c| c >= settings.ocr_min_confidence),
+                "word_count_check": document.ocr_word_count.map(|w| w > 0),
+                "processed_image_available": processed_image.is_some()
+            }
+        },
+        "success": quality_passed,
+        "error": if !quality_passed && ocr_success {
+            Some(format!("Quality validation failed: confidence {:.1}% (required: {:.1}%), words: {}", 
+                document.ocr_confidence.unwrap_or(0.0),
+                settings.ocr_min_confidence,
+                document.ocr_word_count.unwrap_or(0)
+            ))
+        } else { None }
+    }));
+
+    // Overall summary
+    let overall_status = if quality_passed {
+        "success"
+    } else if matches!(ocr_status, "failed") {
+        "failed"
+    } else if matches!(ocr_status, "processing") {
+        "processing"
+    } else if matches!(ocr_status, "pending") {
+        "pending"
+    } else {
+        "not_started"
+    };
+
+    Ok(Json(serde_json::json!({
+        "document_id": document_id,
+        "filename": document.filename,
+        "overall_status": overall_status,
+        "pipeline_steps": pipeline_steps,
+        "failed_document_info": failed_document.as_ref().map(|row| serde_json::json!({
+            "failure_reason": row.get::<String, _>("failure_reason"),
+            "failure_stage": row.get::<String, _>("failure_stage"),
+            "error_message": row.get::<Option<String>, _>("error_message"),
+            "retry_count": row.get::<Option<i32>, _>("retry_count"),
+            "last_retry_at": row.get::<Option<chrono::DateTime<chrono::Utc>>, _>("last_retry_at"),
+            "created_at": row.get::<chrono::DateTime<chrono::Utc>, _>("created_at"),
+            "content_preview": row.get::<Option<String>, _>("content").map(|c| 
+                c.chars().take(200).collect::<String>()
+            ),
+            "failed_ocr_text": row.get::<Option<String>, _>("ocr_text"),
+            "failed_ocr_confidence": row.get::<Option<f32>, _>("ocr_confidence"),
+            "failed_ocr_word_count": row.get::<Option<i32>, _>("ocr_word_count"),
+            "failed_ocr_processing_time_ms": row.get::<Option<i32>, _>("ocr_processing_time_ms")
+        })),
+        "user_settings": {
+            "enable_background_ocr": settings.enable_background_ocr,
+            "ocr_min_confidence": settings.ocr_min_confidence,
+            "max_file_size_mb": settings.max_file_size_mb,
+            "quality_thresholds": {
+                "brightness": settings.ocr_quality_threshold_brightness,
+                "contrast": settings.ocr_quality_threshold_contrast,
+                "noise": settings.ocr_quality_threshold_noise,
+                "sharpness": settings.ocr_quality_threshold_sharpness
+            }
+        },
+        "debug_timestamp": chrono::Utc::now(),
+        "file_analysis": file_analysis,
+        "detailed_processing_logs": ocr_processing_logs.iter().map(|row| serde_json::json!({
+            "id": row.get::<uuid::Uuid, _>("id"),
+            "status": row.get::<String, _>("status"),
+            "priority": row.get::<i32, _>("priority"),
+            "created_at": row.get::<chrono::DateTime<chrono::Utc>, _>("created_at"),
+            "started_at": row.get::<Option<chrono::DateTime<chrono::Utc>>, _>("started_at"),
+            "completed_at": row.get::<Option<chrono::DateTime<chrono::Utc>>, _>("completed_at"),
+            "error_message": row.get::<Option<String>, _>("error_message"),
+            "attempts": row.get::<i32, _>("attempts"),
+            "worker_id": row.get::<Option<String>, _>("worker_id"),
+            "processing_time_ms": row.get::<Option<i32>, _>("processing_time_ms"),
+            "file_size": row.get::<Option<i64>, _>("file_size"),
+            // Calculate processing duration if both timestamps are available
+            "processing_duration_ms": if let (Some(started), Some(completed)) = (
+                row.get::<Option<chrono::DateTime<chrono::Utc>>, _>("started_at"),
+                row.get::<Option<chrono::DateTime<chrono::Utc>>, _>("completed_at")
+            ) {
+                Some((completed.timestamp_millis() - started.timestamp_millis()) as i32)
+            } else {
+                row.get::<Option<i32>, _>("processing_time_ms")
+            },
+            // Calculate queue wait time
+            "queue_wait_time_ms": if let Some(started) = row.get::<Option<chrono::DateTime<chrono::Utc>>, _>("started_at") {
+                let created = row.get::<chrono::DateTime<chrono::Utc>, _>("created_at");
+                Some((started.timestamp_millis() - created.timestamp_millis()) as i32)
+            } else {
+                None::<i32>
+            }
+        })).collect::<Vec<_>>()
+    })))
+}
+
+/// Result of inspecting a stored document file on disk for the debug endpoint.
+///
+/// Populated by `analyze_file_content`; fields that could not be determined
+/// keep their `Default` values (`0`, `false`, `None`, empty string).
+#[derive(Debug, Default, serde::Serialize)]
+struct FileAnalysis {
+    /// MIME type string the analysis was requested with.
+    file_type: String,
+    /// File length in bytes from filesystem metadata; stays 0 if metadata could not be read.
+    file_size_bytes: u64,
+    /// True when the whole file could be read into memory.
+    is_readable: bool,
+    /// PDF-specific findings; only set when the MIME type contains "pdf".
+    pdf_info: Option<PdfAnalysis>,
+    /// Leading characters of the file; only set for `text/*` files that decode as UTF-8.
+    text_preview: Option<String>,
+    /// Human-readable reason the file could not be read or decoded, if any.
+    error_details: Option<String>,
+}
+
+/// Heuristic facts about a PDF's bytes, produced by `analyze_pdf_content`.
+///
+/// Apart from the text extraction results, every field comes from a rough scan
+/// of the raw file and should be treated as a debugging hint, not as a parse result.
+#[derive(Debug, serde::Serialize)]
+struct PdfAnalysis {
+    /// True when the content is at least 8 bytes long and begins with `%PDF-`.
+    is_valid_pdf: bool,
+    /// Rough page-count estimate from scanning the raw bytes; `None` when no page markers were found.
+    page_count: Option<i32>,
+    /// True when text extraction succeeded and produced non-whitespace text.
+    has_text_content: bool,
+    /// True when an `/Image` or `/XObject` marker appears anywhere in the file.
+    has_images: bool,
+    /// True when an `/Encrypt` marker appears anywhere in the file.
+    is_encrypted: bool,
+    /// Version characters that follow `%PDF-` in the header (for example "1.7").
+    pdf_version: Option<String>,
+    /// Rough count of font markers found by scanning the raw bytes.
+    font_count: usize,
+    /// Why the header check or text extraction failed, or a note that the text held no words.
+    text_extraction_error: Option<String>,
+    /// Length in bytes of the extracted text; 0 when extraction did not succeed.
+    estimated_text_length: usize,
+}
+
+/// Inspects the file at `file_path` and reports what could be learned about it.
+///
+/// * `file_path` - location of the stored document on disk.
+/// * `mime_type` - MIME type recorded for the document; selects the analysis:
+///   anything containing "pdf" gets a `PdfAnalysis`, `text/*` gets a 500-character
+///   preview, every other type only gets size and readability.
+///
+/// This function is best-effort: I/O and decoding problems are reported through
+/// `FileAnalysis::error_details` rather than through the `Err` variant, so the
+/// current implementation always returns `Ok`.
+async fn analyze_file_content(file_path: &str, mime_type: &str) -> Result<FileAnalysis, Box<dyn std::error::Error + Send + Sync>> {
+    let mut analysis = FileAnalysis {
+        file_type: mime_type.to_string(),
+        ..Default::default()
+    };
+
+    // Size comes from metadata so it is still reported when the read below fails.
+    if let Ok(metadata) = tokio::fs::metadata(file_path).await {
+        analysis.file_size_bytes = metadata.len();
+    }
+
+    // Reading the whole file doubles as the readability check.
+    let file_content = match tokio::fs::read(file_path).await {
+        Ok(content) => {
+            analysis.is_readable = true;
+            content
+        }
+        Err(e) => {
+            analysis.error_details = Some(format!("Failed to read file: {}", e));
+            return Ok(analysis);
+        }
+    };
+
+    // Analyze based on file type
+    if mime_type.contains("pdf") {
+        analysis.pdf_info = Some(analyze_pdf_content(&file_content).await);
+    } else if mime_type.starts_with("text/") {
+        // The buffer is not needed after this point, so hand it to `from_utf8`
+        // by value instead of cloning the entire file just to build a preview.
+        match String::from_utf8(file_content) {
+            Ok(text) => {
+                analysis.text_preview = Some(text.chars().take(500).collect());
+            }
+            Err(e) => {
+                analysis.error_details = Some(format!("Failed to decode text file: {}", e));
+            }
+        }
+    }
+
+    Ok(analysis)
+}
+
+/// Runs lightweight, best-effort diagnostics over the raw bytes of a PDF.
+///
+/// * `content` - the complete file contents.
+///
+/// Returns a `PdfAnalysis`. If the header check fails, the result is returned
+/// early with `is_valid_pdf == false` and the reason in `text_extraction_error`.
+/// Otherwise text extraction is attempted with `pdf_extract` (panics are caught
+/// and reported as an error string) and the bytes are scanned for a handful of
+/// structural markers. The structural values are heuristics: objects stored in
+/// compressed object streams are not visible to a raw byte scan.
+async fn analyze_pdf_content(content: &[u8]) -> PdfAnalysis {
+    use std::panic;
+
+    /// Returns true when `needle` occurs anywhere in `haystack`.
+    fn contains_bytes(haystack: &[u8], needle: &[u8]) -> bool {
+        !needle.is_empty() && haystack.windows(needle.len()).any(|window| window == needle)
+    }
+
+    /// Counts `/Type /<name>` dictionary entries in `data`.
+    ///
+    /// Any amount of PDF whitespace (including none) may separate the key from
+    /// the value, and the name must end where it is matched, so `Page` does not
+    /// count `/Pages` and `Font` does not count `/FontDescriptor`.
+    fn count_type_entries(data: &[u8], name: &[u8]) -> usize {
+        const KEY: &[u8] = b"/Type";
+        let mut count = 0;
+        let mut pos = 0;
+        while pos + KEY.len() <= data.len() {
+            if &data[pos..pos + KEY.len()] != KEY {
+                pos += 1;
+                continue;
+            }
+            // Skip the optional whitespace between the key and its value.
+            let mut cursor = pos + KEY.len();
+            while cursor < data.len()
+                && matches!(data[cursor], b' ' | b'\t' | b'\r' | b'\n' | 0x0c | 0x00)
+            {
+                cursor += 1;
+            }
+            let rest = &data[cursor..];
+            if rest.first() == Some(&b'/') && rest[1..].starts_with(name) {
+                // A following letter or digit means this is a longer name.
+                let continues = rest
+                    .get(1 + name.len())
+                    .map_or(false, |byte| byte.is_ascii_alphanumeric());
+                if !continues {
+                    count += 1;
+                }
+            }
+            // "/Type" cannot overlap itself, so jump past the whole key.
+            pos += KEY.len();
+        }
+        count
+    }
+
+    let mut analysis = PdfAnalysis {
+        is_valid_pdf: false,
+        page_count: None,
+        has_text_content: false,
+        has_images: false,
+        is_encrypted: false,
+        pdf_version: None,
+        font_count: 0,
+        text_extraction_error: None,
+        estimated_text_length: 0,
+    };
+
+    // Check PDF header ("%PDF-" plus a three-character version such as "1.7").
+    if content.len() < 8 {
+        analysis.text_extraction_error = Some("File too small to be a valid PDF".to_string());
+        return analysis;
+    }
+
+    if !content.starts_with(b"%PDF-") {
+        analysis.text_extraction_error = Some("File does not start with PDF header".to_string());
+        return analysis;
+    }
+
+    analysis.is_valid_pdf = true;
+
+    // The length check above guarantees bytes 5..8 exist; they hold the version.
+    analysis.pdf_version = std::str::from_utf8(&content[5..8])
+        .ok()
+        .map(|version| version.to_string());
+
+    // Try to extract text using pdf_extract (same as the main OCR pipeline).
+    // Panics are caught so that a malformed file yields a diagnostic string
+    // instead of unwinding out of this function.
+    // NOTE(review): this is synchronous work inside an async fn; consider
+    // `spawn_blocking` if large PDFs are found to stall the runtime.
+    let text_result = panic::catch_unwind(|| {
+        pdf_extract::extract_text_from_mem(content)
+    });
+
+    match text_result {
+        Ok(Ok(text)) => {
+            analysis.has_text_content = !text.trim().is_empty();
+            analysis.estimated_text_length = text.len();
+
+            // Non-empty output that splits into zero words is whitespace only.
+            let word_count = text.split_whitespace().count();
+            if word_count == 0 && !text.is_empty() {
+                analysis.text_extraction_error = Some("PDF contains characters but no extractable words".to_string());
+            }
+        }
+        Ok(Err(e)) => {
+            analysis.text_extraction_error = Some(format!("PDF text extraction failed: {}", e));
+        }
+        Err(_) => {
+            analysis.text_extraction_error = Some("PDF text extraction panicked (likely corrupted PDF)".to_string());
+        }
+    }
+
+    // Basic PDF structure analysis. The markers are pure ASCII, so the raw bytes
+    // are searched directly rather than through a lossy UTF-8 copy of the file.
+
+    // Check for encryption
+    analysis.is_encrypted = contains_bytes(content, b"/Encrypt");
+
+    // Check for images
+    analysis.has_images = contains_bytes(content, b"/Image") || contains_bytes(content, b"/XObject");
+
+    // Estimate page count (rough): leaf page objects only, not page-tree nodes.
+    let page_matches = count_type_entries(content, b"Page");
+    if page_matches > 0 {
+        analysis.page_count = Some(i32::try_from(page_matches).unwrap_or(i32::MAX));
+    }
+
+    // Count fonts (rough): font dictionaries only, not font descriptors.
+    analysis.font_count = count_type_entries(content, b"Font");
+
+    analysis
+}
+
 #[utoipa::path(
     get,
     path = "/api/documents/failed-ocr",