M3-AP-006: Fehlerklassifikation vereinfacht und Logging auf korrekte
Ergebnisfälle ausgerichtet
This commit is contained in:
@@ -0,0 +1,195 @@
|
||||
package de.gecheckt.pdf.umbenenner.application.service;
|
||||
|
||||
import de.gecheckt.pdf.umbenenner.application.config.StartConfiguration;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.M3DocumentProcessingOutcome;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.M3PreCheckFailed;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.M3PreCheckPassed;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.M3TechnicalDocumentError;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.PdfExtractionContentError;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.PdfExtractionSuccess;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.PdfExtractionTechnicalError;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.PdfPageCount;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.SourceDocumentCandidate;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.SourceDocumentLocator;
|
||||
|
||||
import org.junit.jupiter.api.BeforeEach;
|
||||
import org.junit.jupiter.api.Test;
|
||||
import org.junit.jupiter.api.io.TempDir;
|
||||
|
||||
import java.net.URI;
|
||||
import java.nio.file.Files;
|
||||
import java.nio.file.Path;
|
||||
|
||||
import static org.junit.jupiter.api.Assertions.*;
|
||||
|
||||
/**
|
||||
* Tests for {@link M3DocumentProcessingService}.
|
||||
* <p>
|
||||
* Verifies that all four M3 document processing outcomes are correctly classified.
|
||||
*/
|
||||
class M3DocumentProcessingServiceTest {
|
||||
|
||||
@TempDir
|
||||
Path tempDir;
|
||||
|
||||
private SourceDocumentCandidate candidate;
|
||||
private StartConfiguration configuration;
|
||||
|
||||
@BeforeEach
|
||||
void setUp() throws Exception {
|
||||
// Create test PDF file
|
||||
Path pdfFile = tempDir.resolve("document.pdf");
|
||||
Files.createFile(pdfFile);
|
||||
SourceDocumentLocator locator = new SourceDocumentLocator(pdfFile.toString());
|
||||
candidate = new SourceDocumentCandidate("document.pdf", 2048L, locator);
|
||||
|
||||
// Create directories and files for configuration
|
||||
Path sourceDir = Files.createDirectories(tempDir.resolve("source"));
|
||||
Path targetDir = Files.createDirectories(tempDir.resolve("target"));
|
||||
Path dbFile = tempDir.resolve("db.sqlite");
|
||||
Files.createFile(dbFile);
|
||||
Path promptFile = tempDir.resolve("prompt.txt");
|
||||
Files.createFile(promptFile);
|
||||
|
||||
configuration = new StartConfiguration(
|
||||
sourceDir,
|
||||
targetDir,
|
||||
dbFile,
|
||||
URI.create("http://localhost:8000"),
|
||||
"gpt-4",
|
||||
30,
|
||||
3,
|
||||
10,
|
||||
5000,
|
||||
promptFile,
|
||||
tempDir.resolve("lock"),
|
||||
tempDir.resolve("logs"),
|
||||
"INFO",
|
||||
"test-key"
|
||||
);
|
||||
}
|
||||
|
||||
@Test
|
||||
void testProcessDocument_WithSuccessfulExtraction_AndPassedPreChecks() {
|
||||
// Arrange: Successful extraction with valid text
|
||||
var extraction = new PdfExtractionSuccess("This is valid PDF text", new PdfPageCount(5));
|
||||
|
||||
// Act
|
||||
M3DocumentProcessingOutcome outcome = M3DocumentProcessingService.processDocument(
|
||||
candidate, extraction, configuration);
|
||||
|
||||
// Assert: Should produce M3PreCheckPassed
|
||||
assertInstanceOf(M3PreCheckPassed.class, outcome);
|
||||
M3PreCheckPassed passed = (M3PreCheckPassed) outcome;
|
||||
assertEquals(candidate, passed.candidate());
|
||||
assertEquals(extraction, passed.extraction());
|
||||
}
|
||||
|
||||
@Test
|
||||
void testProcessDocument_WithSuccessfulExtraction_AndFailedPreCheck_NoUsableText() {
|
||||
// Arrange: Successful extraction but with only whitespace
|
||||
var extraction = new PdfExtractionSuccess(" \n \t ", new PdfPageCount(1));
|
||||
|
||||
// Act
|
||||
M3DocumentProcessingOutcome outcome = M3DocumentProcessingService.processDocument(
|
||||
candidate, extraction, configuration);
|
||||
|
||||
// Assert: Should produce M3PreCheckFailed with appropriate reason
|
||||
assertInstanceOf(M3PreCheckFailed.class, outcome);
|
||||
M3PreCheckFailed failed = (M3PreCheckFailed) outcome;
|
||||
assertEquals(candidate, failed.candidate());
|
||||
assertTrue(failed.failureReason().toLowerCase().contains("usable"));
|
||||
}
|
||||
|
||||
@Test
|
||||
void testProcessDocument_WithSuccessfulExtraction_AndFailedPreCheck_PageLimitExceeded() {
|
||||
// Arrange: Successful extraction but exceeds page limit
|
||||
var extraction = new PdfExtractionSuccess("Valid text content", new PdfPageCount(50));
|
||||
|
||||
// Act
|
||||
M3DocumentProcessingOutcome outcome = M3DocumentProcessingService.processDocument(
|
||||
candidate, extraction, configuration);
|
||||
|
||||
// Assert: Should produce M3PreCheckFailed with page limit reason
|
||||
assertInstanceOf(M3PreCheckFailed.class, outcome);
|
||||
M3PreCheckFailed failed = (M3PreCheckFailed) outcome;
|
||||
assertEquals(candidate, failed.candidate());
|
||||
assertTrue(failed.failureReason().toLowerCase().contains("page"));
|
||||
}
|
||||
|
||||
@Test
|
||||
void testProcessDocument_WithContentError() {
|
||||
// Arrange: PDF content not extractable (classified as technical document error in M3)
|
||||
var contentError = new PdfExtractionContentError("PDF is corrupted");
|
||||
|
||||
// Act
|
||||
M3DocumentProcessingOutcome outcome = M3DocumentProcessingService.processDocument(
|
||||
candidate, contentError, configuration);
|
||||
|
||||
// Assert: Should produce M3TechnicalDocumentError
|
||||
assertInstanceOf(M3TechnicalDocumentError.class, outcome);
|
||||
M3TechnicalDocumentError result = (M3TechnicalDocumentError) outcome;
|
||||
assertEquals(candidate, result.candidate());
|
||||
assertTrue(result.errorMessage().contains("PDF is corrupted"));
|
||||
}
|
||||
|
||||
@Test
|
||||
void testProcessDocument_WithTechnicalError() {
|
||||
// Arrange: Technical error during extraction
|
||||
var technicalError = new PdfExtractionTechnicalError("I/O error reading file",
|
||||
new RuntimeException("File not found"));
|
||||
|
||||
// Act
|
||||
M3DocumentProcessingOutcome outcome = M3DocumentProcessingService.processDocument(
|
||||
candidate, technicalError, configuration);
|
||||
|
||||
// Assert: Should produce M3TechnicalDocumentError
|
||||
assertInstanceOf(M3TechnicalDocumentError.class, outcome);
|
||||
M3TechnicalDocumentError result = (M3TechnicalDocumentError) outcome;
|
||||
assertEquals(candidate, result.candidate());
|
||||
assertEquals("I/O error reading file", result.errorMessage());
|
||||
assertNotNull(result.cause());
|
||||
}
|
||||
|
||||
@Test
|
||||
void testProcessDocument_WithTechnicalError_WithoutCause() {
|
||||
// Arrange: Technical error without underlying exception
|
||||
var technicalError = new PdfExtractionTechnicalError("Unknown error", null);
|
||||
|
||||
// Act
|
||||
M3DocumentProcessingOutcome outcome = M3DocumentProcessingService.processDocument(
|
||||
candidate, technicalError, configuration);
|
||||
|
||||
// Assert
|
||||
assertInstanceOf(M3TechnicalDocumentError.class, outcome);
|
||||
M3TechnicalDocumentError result = (M3TechnicalDocumentError) outcome;
|
||||
assertNull(result.cause());
|
||||
}
|
||||
|
||||
@Test
|
||||
void testProcessDocument_WithNullCandidate_ThrowsException() {
|
||||
// Arrange
|
||||
var extraction = new PdfExtractionSuccess("Text", new PdfPageCount(1));
|
||||
|
||||
// Act & Assert
|
||||
assertThrows(NullPointerException.class,
|
||||
() -> M3DocumentProcessingService.processDocument(null, extraction, configuration));
|
||||
}
|
||||
|
||||
@Test
|
||||
void testProcessDocument_WithNullExtractionResult_ThrowsException() {
|
||||
// Act & Assert
|
||||
assertThrows(NullPointerException.class,
|
||||
() -> M3DocumentProcessingService.processDocument(candidate, null, configuration));
|
||||
}
|
||||
|
||||
@Test
|
||||
void testProcessDocument_WithNullConfiguration_ThrowsException() {
|
||||
// Arrange
|
||||
var extraction = new PdfExtractionSuccess("Text", new PdfPageCount(1));
|
||||
|
||||
// Act & Assert
|
||||
assertThrows(NullPointerException.class,
|
||||
() -> M3DocumentProcessingService.processDocument(candidate, extraction, null));
|
||||
}
|
||||
}
|
||||
@@ -1,10 +1,10 @@
|
||||
package de.gecheckt.pdf.umbenenner.application.service;
|
||||
|
||||
import de.gecheckt.pdf.umbenenner.application.config.StartConfiguration;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.M3DocumentProcessingOutcome;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.M3PreCheckFailed;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.M3PreCheckFailureReason;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.M3PreCheckPassed;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.M3ProcessingDecision;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.PdfExtractionSuccess;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.PdfPageCount;
|
||||
import de.gecheckt.pdf.umbenenner.domain.model.SourceDocumentCandidate;
|
||||
@@ -35,7 +35,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess("Some meaningful text", new PdfPageCount(5));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckPassed, "Should pass when text is usable and page count is valid");
|
||||
M3PreCheckPassed passed = (M3PreCheckPassed) result;
|
||||
@@ -49,7 +49,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess("", new PdfPageCount(1));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckFailed, "Should fail with empty text");
|
||||
M3PreCheckFailed failed = (M3PreCheckFailed) result;
|
||||
@@ -62,7 +62,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess(" \n\t \r\n ", new PdfPageCount(1));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckFailed, "Should fail with whitespace-only text");
|
||||
M3PreCheckFailed failed = (M3PreCheckFailed) result;
|
||||
@@ -75,7 +75,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess("!@#$%^&*()_+-=[]{}|;:',.<>?/", new PdfPageCount(1));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckFailed, "Should fail with special characters only");
|
||||
M3PreCheckFailed failed = (M3PreCheckFailed) result;
|
||||
@@ -88,7 +88,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess("a", new PdfPageCount(1));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckPassed, "Should pass with single letter");
|
||||
}
|
||||
@@ -99,7 +99,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess("5", new PdfPageCount(1));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckPassed, "Should pass with single digit");
|
||||
}
|
||||
@@ -110,7 +110,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess("!@#a$%^&*", new PdfPageCount(1));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckPassed, "Should pass when letters/digits are present among special chars");
|
||||
}
|
||||
@@ -121,7 +121,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess(" meaningful text ", new PdfPageCount(1));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckPassed, "Should pass when text has meaningful content despite whitespace");
|
||||
}
|
||||
@@ -132,7 +132,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess("Valid text", new PdfPageCount(5));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckPassed, "Should pass when page count equals limit (not exceeded)");
|
||||
}
|
||||
@@ -143,7 +143,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess("Valid text", new PdfPageCount(6));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckFailed, "Should fail when page count exceeds limit");
|
||||
M3PreCheckFailed failed = (M3PreCheckFailed) result;
|
||||
@@ -156,7 +156,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess("Excellent meaningful text with lots of content", new PdfPageCount(100));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckFailed, "Should fail with page limit exceeded even if text is good");
|
||||
M3PreCheckFailed failed = (M3PreCheckFailed) result;
|
||||
@@ -171,7 +171,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess("", new PdfPageCount(10));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckFailed, "Should fail when both checks fail");
|
||||
// The specific order of checks doesn't matter for M3; just verify one reason is returned
|
||||
@@ -216,7 +216,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess("Äußerst äöüß Großes", new PdfPageCount(1));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckPassed, "Should pass with German umlauts (ÄÖÜß)");
|
||||
}
|
||||
@@ -227,7 +227,7 @@ class M3PreCheckEvaluatorTest {
|
||||
SourceDocumentCandidate candidate = buildCandidate();
|
||||
PdfExtractionSuccess extraction = new PdfExtractionSuccess("Αβγδ 中文 καλημέρα", new PdfPageCount(1));
|
||||
|
||||
M3ProcessingDecision result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
M3DocumentProcessingOutcome result = M3PreCheckEvaluator.evaluate(candidate, extraction, config);
|
||||
|
||||
assertTrue(result instanceof M3PreCheckPassed, "Should pass with Greek, Chinese, and other Unicode letters");
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user