Skip to content

Commit 3db2caf

Browse files
committed
Do not accept empty OCRmyPDF results and fix log #79
Signed-off-by: Robin Windey <[email protected]>
1 parent 05e2509 commit 3db2caf

File tree

2 files changed

+45
-7
lines changed

2 files changed

+45
-7
lines changed

lib/OcrProcessors/PdfOcrProcessor.php

+13-7
Original file line numberDiff line numberDiff line change
@@ -50,15 +50,21 @@ public function ocrFile(string $fileContent): string {
5050
$stdErr = $this->command->getStdErr();
5151
$exitCode = $this->command->getExitCode();
5252

53-
if ($success) {
54-
if ($stdErr !== '' || $errorOutput !== '') {
55-
// Log warning if ocrmypdf wrote a warning to the stderr
56-
$this->logger->warning('OCRmyPDF succeeded with warning(s): {stdErr}, {errorOutput}', [$stdErr, $errorOutput]);
57-
}
53+
if (!$success) {
54+
throw new OcrNotPossibleException('OCRmyPDF exited abnormally with exit-code ' . $exitCode . '. Message: ' . $errorOutput . ' ' . $stdErr);
55+
}
56+
57+
if ($stdErr !== '' || $errorOutput !== '') {
58+
// Log warning if ocrmypdf wrote a warning to the stderr
59+
$this->logger->warning('OCRmyPDF succeeded with warning(s): {stdErr}, {errorOutput}', [$stdErr, $errorOutput]);
60+
}
61+
62+
$ocrOutput = $this->command->getOutput();
5863

59-
return $this->command->getOutput();
64+
if (!$ocrOutput) {
65+
throw new OcrNotPossibleException('OCRmyPDF did not produce any output');
6066
}
6167

62-
throw new OcrNotPossibleException('OCRmyPDF exited abnormally with exit-code ' . $exitCode . '. Message: ' . $errorOutput . ' ' . $stdErr);
68+
return $ocrOutput;
6369
}
6470
}

tests/Unit/OcrProcessors/PdfOcrProcessorTest.php

+32
Original file line numberDiff line numberDiff line change
@@ -111,6 +111,9 @@ public function testLogsWarningIfOcrMyPdfSucceedsWithWarningOutput() {
111111
$this->command->expects($this->once())
112112
->method('getStdErr')
113113
->willReturn('stdErr');
114+
$this->command->expects($this->once())
115+
->method('getOutput')
116+
->willReturn('someOcrFileContent');
114117
$this->logger->expects($this->once())
115118
->method('warning')
116119
->with(
@@ -125,4 +128,33 @@ public function testLogsWarningIfOcrMyPdfSucceedsWithWarningOutput() {
125128
$processor = new PdfOcrProcessor($this->command, $this->logger);
126129
$processor->ocrFile('someContent');
127130
}
131+
132+
public function testThrowsErrorIfOcrFileWasEmpty() {
133+
$this->command->expects($this->once())
134+
->method('execute')
135+
->willReturn(true);
136+
$this->command->expects($this->once())
137+
->method('getError')
138+
->willReturn('error');
139+
$this->command->expects($this->once())
140+
->method('getStdErr')
141+
->willReturn('stdErr');
142+
$this->command->expects($this->once())
143+
->method('getOutput')
144+
->willReturn('');
145+
146+
147+
$thrown = false;
148+
$processor = new PdfOcrProcessor($this->command, $this->logger);
149+
150+
try {
151+
$processor->ocrFile('someContent');
152+
} catch (\Throwable $t) {
153+
$thrown = true;
154+
$this->assertInstanceOf(OcrNotPossibleException::class, $t);
155+
$this->assertEquals('OCRmyPDF did not produce any output', $t->getMessage());
156+
}
157+
158+
$this->assertTrue($thrown);
159+
}
128160
}

0 commit comments

Comments
 (0)