PHP code example of ahmedghanem00 / tesseract-ocr

1. Go to this page and download the library: Download ahmedghanem00/tesseract-ocr library. Choose the download type require.

2. Extract the ZIP file and open the index.php.

3. Add this code to the index.php.
    
        
<?php
require_once('vendor/autoload.php');

/* Start to develop here. Best regards https://php-download.com/ */

    

ahmedghanem00 / tesseract-ocr example snippets


$tesseract = new \ahmedghanem00\TesseractOCR\Tesseract();

$tesseract = new \ahmedghanem00\TesseractOCR\Tesseract("path/to/binary/location");
# OR, If you already have an initiated instance 
$tesseract->setBinaryPath("path/to/binary/location");

$tesseract = new \ahmedghanem00\TesseractOCR\Tesseract(processTimeout: 3);
# OR
$tesseract->setProcessTimeout(2.5);

$tesseract->setTessDataDirPath("path/to/data/dir")

$tesseract->resetTessDataDirPath();

$version = $tesseract->getVersion();

$languages = $tesseract->getSupportedLanguages();

$result = $tesseract->recognize("test.png");
## OR
$result = $tesseract->recognize("https://example.com/test.png");
## etc.

$result = $tesseract->recognize("test.png", langs: ["eng", "ara"]);

use ahmedghanem00\TesseractOCR\Enum\PSM;

# using PSM enum
$result = $tesseract->recognize("test.png", psm: PSM::SINGLE_BLOCK);
# OR by using id directly
$result = $tesseract->recognize("test.png", psm: 3);

use ahmedghanem00\TesseractOCR\Enum\OEM;

# using OEM enum
$result = $tesseract->recognize("test.png", oem: OEM::LEGACY_WITH_LSTM);
# OR by using id directly
$result = $tesseract->recognize("test.png", oem: 3);

$result = $tesseract->recognize("test.png", dpi: 200);

$pdfBinaryData = $tesseract->recognize("test.png", outputAsPDF: true);

file_put_contents("result.pdf", $pdfBinaryData)

$result = $tesseract->recognize("test.png", wordsFilePath: "/path/to/file");
# OR
$result = $tesseract->recognize("test.png", patternsFilePath: "/path/to/file");

use ahmedghanem00\TesseractOCR\ConfigBag;

$config = ConfigBag::new()
    ->setParameter("tessedit_char_whitelist", "abcrety")
    ->setParameter("textord_pitch_range", 3);

$result = $tesseract->recognize("test.png", config: $config);