diff --git a/frontend/src/components/__tests__/FileIntegrityDisplay.test.tsx b/frontend/src/components/__tests__/FileIntegrityDisplay.test.tsx
deleted file mode 100644
index 060ef67..0000000
--- a/frontend/src/components/__tests__/FileIntegrityDisplay.test.tsx
+++ /dev/null
@@ -1,79 +0,0 @@
-import React from 'react';
-import { render, screen } from '@testing-library/react';
-import { ThemeProvider } from '@mui/material/styles';
-import theme from '../../theme';
-import FileIntegrityDisplay from '../FileIntegrityDisplay';
-
-const renderWithTheme = (component: React.ReactElement) => {
- return render(
-
- {component}
-
- );
-};
-
-describe('FileIntegrityDisplay', () => {
- const mockProps = {
- fileHash: 'a1b2c3d4e5f6789012345678901234567890123456789012345678901234567890',
- fileName: 'test-document.pdf',
- fileSize: 1048576, // 1MB
- mimeType: 'application/pdf',
- createdAt: '2024-01-01T12:00:00Z',
- updatedAt: '2024-01-01T12:00:00Z',
- userId: 'user-123-456-789',
- };
-
- it('renders file integrity information', () => {
- renderWithTheme(
-
- );
-
- expect(screen.getByText('File Integrity & Verification')).toBeInTheDocument();
- expect(screen.getByText('SHA256 Hash')).toBeInTheDocument();
- expect(screen.getByText('File Properties')).toBeInTheDocument();
- });
-
- it('displays file hash correctly', () => {
- renderWithTheme(
-
- );
-
- // Should show the full hash in expanded view
- expect(screen.getByText(mockProps.fileHash)).toBeInTheDocument();
- });
-
- it('shows compact view when compact prop is true', () => {
- renderWithTheme(
-
- );
-
- expect(screen.getByText('File Integrity')).toBeInTheDocument();
- // Should show abbreviated hash in compact view
- expect(screen.getByText('a1b2c3d4...34567890')).toBeInTheDocument();
- });
-
- it('handles missing file hash gracefully', () => {
- renderWithTheme(
-
- );
-
- expect(screen.getByText('Hash not available')).toBeInTheDocument();
- expect(screen.getByText('File hash not available. Enable hash generation in upload settings.')).toBeInTheDocument();
- });
-
- it('formats file size correctly', () => {
- renderWithTheme(
-
- );
-
- expect(screen.getByText('1 MB')).toBeInTheDocument();
- });
-
- it('displays user information', () => {
- renderWithTheme(
-
- );
-
- expect(screen.getByText('User: user-123...')).toBeInTheDocument();
- });
-});
\ No newline at end of file
diff --git a/frontend/src/components/__tests__/ProcessingTimeline.test.tsx b/frontend/src/components/__tests__/ProcessingTimeline.test.tsx
deleted file mode 100644
index 38f8924..0000000
--- a/frontend/src/components/__tests__/ProcessingTimeline.test.tsx
+++ /dev/null
@@ -1,90 +0,0 @@
-import React from 'react';
-import { render, screen } from '@testing-library/react';
-import { ThemeProvider } from '@mui/material/styles';
-import theme from '../../theme';
-import ProcessingTimeline from '../ProcessingTimeline';
-
-const renderWithTheme = (component: React.ReactElement) => {
- return render(
-
- {component}
-
- );
-};
-
-describe('ProcessingTimeline', () => {
- const mockProps = {
- documentId: 'doc-123',
- fileName: 'test-document.pdf',
- createdAt: '2024-01-01T12:00:00Z',
- updatedAt: '2024-01-01T12:30:00Z',
- userId: 'user-123',
- ocrStatus: 'completed',
- ocrCompletedAt: '2024-01-01T12:15:00Z',
- ocrRetryCount: 0,
- };
-
- it('renders processing timeline', () => {
- renderWithTheme(
-
- );
-
- expect(screen.getByText('Processing Timeline')).toBeInTheDocument();
- expect(screen.getByText('Document Uploaded')).toBeInTheDocument();
- expect(screen.getByText('OCR Processing Completed')).toBeInTheDocument();
- });
-
- it('shows retry information when retries exist', () => {
- renderWithTheme(
-
- );
-
- expect(screen.getByText('2 retries')).toBeInTheDocument();
- expect(screen.getByText('Detailed Retry History')).toBeInTheDocument();
- });
-
- it('renders compact view correctly', () => {
- renderWithTheme(
-
- );
-
- expect(screen.getByText('Processing Timeline')).toBeInTheDocument();
- expect(screen.getByText('View Full Timeline')).toBeInTheDocument();
- });
-
- it('handles OCR error status', () => {
- renderWithTheme(
-
- );
-
- expect(screen.getByText('OCR Processing Failed')).toBeInTheDocument();
- });
-
- it('shows pending OCR status', () => {
- renderWithTheme(
-
- );
-
- expect(screen.getByText('OCR Processing Started')).toBeInTheDocument();
- });
-
- it('displays event count', () => {
- renderWithTheme(
-
- );
-
- // Should show at least 2 events (upload + OCR completion)
- expect(screen.getByText(/\d+ events/)).toBeInTheDocument();
- });
-});
\ No newline at end of file
diff --git a/src/bin/test_metadata.rs b/src/bin/test_metadata.rs
new file mode 100644
index 0000000..e31fa19
--- /dev/null
+++ b/src/bin/test_metadata.rs
@@ -0,0 +1,62 @@
+use std::fs;
+use readur::metadata_extraction::extract_content_metadata;
+
+#[tokio::main]
+async fn main() -> Result<(), Box> {
+ println!("Testing metadata extraction...");
+
+ // Test image metadata
+ if let Ok(image_data) = fs::read("test_files/portrait_100x200.png") {
+ println!("\n=== Testing Image (portrait_100x200.png) ===");
+ match extract_content_metadata(&image_data, "image/png", "portrait_100x200.png").await {
+ Ok(Some(metadata)) => {
+ println!("Metadata extracted:");
+ println!("{:#}", serde_json::to_string_pretty(&metadata)?);
+ }
+ Ok(None) => println!("No metadata extracted"),
+ Err(e) => println!("Error: {}", e),
+ }
+ }
+
+ // Test PDF metadata
+ if let Ok(pdf_data) = fs::read("test_files/single_page_v14.pdf") {
+ println!("\n=== Testing PDF (single_page_v14.pdf) ===");
+ match extract_content_metadata(&pdf_data, "application/pdf", "single_page_v14.pdf").await {
+ Ok(Some(metadata)) => {
+ println!("Metadata extracted:");
+ println!("{:#}", serde_json::to_string_pretty(&metadata)?);
+ }
+ Ok(None) => println!("No metadata extracted"),
+ Err(e) => println!("Error: {}", e),
+ }
+ }
+
+ // Test text metadata
+ if let Ok(text_data) = fs::read("test_files/comprehensive_text.txt") {
+ println!("\n=== Testing Text (comprehensive_text.txt) ===");
+ match extract_content_metadata(&text_data, "text/plain", "comprehensive_text.txt").await {
+ Ok(Some(metadata)) => {
+ println!("Metadata extracted:");
+ println!("{:#}", serde_json::to_string_pretty(&metadata)?);
+ }
+ Ok(None) => println!("No metadata extracted"),
+ Err(e) => println!("Error: {}", e),
+ }
+ }
+
+ // Test JSON format detection
+ if let Ok(json_data) = fs::read("test_files/test_format.json") {
+ println!("\n=== Testing JSON Format (test_format.json) ===");
+ match extract_content_metadata(&json_data, "text/plain", "test_format.json").await {
+ Ok(Some(metadata)) => {
+ println!("Metadata extracted:");
+ println!("{:#}", serde_json::to_string_pretty(&metadata)?);
+ }
+ Ok(None) => println!("No metadata extracted"),
+ Err(e) => println!("Error: {}", e),
+ }
+ }
+
+ println!("\nMetadata extraction testing complete!");
+ Ok(())
+}
\ No newline at end of file
diff --git a/src/tests/document_response_serialization_tests.rs b/src/tests/document_response_serialization_tests.rs
index b0a6fcc..c873d46 100644
--- a/src/tests/document_response_serialization_tests.rs
+++ b/src/tests/document_response_serialization_tests.rs
@@ -12,11 +12,14 @@ mod tests {
"id": "550e8400-e29b-41d4-a716-446655440000",
"filename": "test.pdf",
"original_filename": "test.pdf",
+ "file_path": "/storage/test.pdf",
"file_size": 1024,
"mime_type": "application/pdf",
"tags": [],
"labels": [],
"created_at": "2024-01-01T12:00:00Z",
+ "updated_at": "2024-01-01T12:00:00Z",
+ "user_id": "550e8400-e29b-41d4-a716-446655440001",
"has_ocr_text": false,
"ocr_confidence": null,
"ocr_word_count": null,
@@ -43,11 +46,14 @@ mod tests {
"id": "550e8400-e29b-41d4-a716-446655440000",
"filename": "test.pdf",
"original_filename": "test.pdf",
+ "file_path": "/storage/test.pdf",
"file_size": 1024,
"mime_type": "application/pdf",
"tags": [],
"labels": [],
"created_at": "2024-01-01T12:00:00Z",
+ "updated_at": "2024-01-01T12:00:00Z",
+ "user_id": "550e8400-e29b-41d4-a716-446655440001",
"has_ocr_text": false,
"ocr_confidence": null,
"ocr_word_count": null,