BCL easyConverter SDK HTML
easyConverter SDK Usermanual
PDF-to-HTML Programming API  |  Download Free Trial  |  Contact Us to Purchase

OcrOption Property

Sets the option for handling OCR'ed documents.

This property does not work when AbsolutePositioning is set to True.

optOcr OcrOption { set; }
Property OcrOption As optOcr
def setOcrOption(self, newVal)
void setOcrOption(optOcr newVal) throws PDF2HTMLException
function setOcrOption($newVal)
BclHtoptOcr OcrOption;
Sub OcrOption(newVal As Long)
beconvh.exe -ocred image+text|text|image|image+hiddenText

Parameters

newVal

One of the optOcr values:

OPT_OCR_TEXT_IMAGE = 0,
OPT_OCR_TEXTONLY = 1,
OPT_OCR_IMAGEONLY = 2,
OPT_OCR_IMAGE_HIDDEN_TEXT = 3

Exception Handling

Please refer to the list of return exceptions.

Example Usage

using BCL.easyConverter.HTML;
...
// Create the converter, choose how OCR'ed documents are handled, then convert.
PDF2HTML pdf2html = new PDF2HTML();
try
{
   // OcrOption is the property this page documents; it takes an optOcr value.
   pdf2html.OcrOption = optOcr.OPT_OCR_IMAGE_HIDDEN_TEXT; // Set option for handling OCR'ed documents
   pdf2html.ConvertToHTML(@"c:\temp\input.pdf", @"c:\temp\output.html");
}
catch(PDF2HTMLException ex)
{
   // Report the conversion failure to the console.
   Console.WriteLine(ex.Message);
}
finally
{
   // Always release the converter, whether or not the conversion succeeded.
   pdf2html.Dispose();
}
Imports BCL.easyConverter.HTML
...
' Create the converter, choose how OCR'ed documents are handled, then convert.
Dim pdf2html As New PDF2HTML()
Try
   ' OcrOption is the property this page documents; it takes an optOcr value.
   pdf2html.OcrOption = optOcr.OPT_OCR_IMAGE_HIDDEN_TEXT ' Set option for handling OCR'ed documents
   pdf2html.ConvertToHTML("c:\test\input.pdf", "c:\test\output.html")
Catch ex As PDF2HTMLException
   ' Report the conversion failure to the console.
   System.Console.WriteLine(ex.Message)
Finally
   ' Always release the converter, whether or not the conversion succeeded.
   pdf2html.Dispose()
End Try
import PDF2HTML
# Create the converter, choose how OCR'ed documents are handled, then convert.
pdf2html = PDF2HTML.PDF2HTML()
try:
   # setOcrOption is the setter this page documents; it takes an optOcr value.
   pdf2html.setOcrOption(PDF2HTML.optOcr.OPT_OCR_IMAGE_HIDDEN_TEXT) # Set option for handling OCR'ed documents
   pdf2html.ConvertToHTML("c:\\test\\input.pdf", "c:\\test\\output.html")
except PDF2HTML.PDF2HTMLException as ex:
   # Report the conversion failure.
   print(ex)
// Create the converter, choose how OCR'ed documents are handled, then convert.
PDF2HTML pdf2html = new PDF2HTML();
try
{
   // setOcrOption is the setter this page documents; it takes an optOcr value.
   pdf2html.setOcrOption(optOcr.OPT_OCR_IMAGE_HIDDEN_TEXT); // Set option for handling OCR'ed documents
   pdf2html.ConvertToHTML("c:\\temp\\input.pdf", "c:\\temp\\output.html", "", 0, -1);
}
catch(PDF2HTMLException e)
{
   // Report the conversion failure to standard output.
   System.out.println(e);
}
finally
{
   // Always release the converter, whether or not the conversion succeeded.
   pdf2html.dispose();
}
<?php
require("PDF2HTML.php");
// Create the converter, choose how OCR'ed documents are handled, then convert.
$pdf2html = new BCL\easyConverter\HTML\PDF2HTML();
try
{
   // setOcrOption is the setter this page documents; it takes an optOcr value.
   $pdf2html->setOcrOption(BCL\easyConverter\HTML\optOcr::OPT_OCR_IMAGE_HIDDEN_TEXT); // Set option for handling OCR'ed documents
   $pdf2html->ConvertToHTML("c:\\test\\input.pdf", "c:\\test\\output.html");
}
catch(BCL\easyConverter\HTML\PDF2HTMLException $ex)
{
   // Report the conversion failure.
   echo $ex->getMessage(), "\n";
}
?>
#include <stdio.h>
#include <windows.h>
#include "easyConverterHTML.h"

/*
 * Loads the easyConverter HTML DLL, creates a converter, sets its OcrOption
 * and converts one PDF file to HTML.
 *
 * Returns 0 on success and 1 if the DLL cannot be loaded, the converter
 * cannot be created, or the conversion reports an error.
 */
int main()
{
   BclWdhrError error;
   BclPDF2HTML* pPdf2Html;
   HMODULE hPdf2HtmlDll = LoadLibraryW(L"C:\\Program Files\\BCL Technologies\\easyConverter SDK 5\\Html\\easyConverterHTML.dll");
   if(!hPdf2HtmlDll)
   {
      printf("easyConverter could not be loaded.\n");
      return 1;
   }

   pPdf2Html = CreatePDF2HTML(hPdf2HtmlDll);
   if(!pPdf2Html)
   {
      printf("easyConverter could not be initialized.\n");
      FreeLibrary(hPdf2HtmlDll);
      return 1;
   }

   pPdf2Html->OcrOption = BCL_HT_OPT_OCR_IMAGE_HIDDEN_TEXT; // Set option for handling OCR'ed documents
   error = pPdf2Html->ConvertToHTML(pPdf2Html, L"c:\\test\\input.pdf", L"c:\\test\\output.html", L"", 0, -1);

   /* Release the converter before unloading the DLL on BOTH the success and
      the failure path, so a failed conversion does not leak the converter. */
   pPdf2Html->Dispose(pPdf2Html);
   FreeLibrary(hPdf2HtmlDll);

   if(error)
   {
      printf("Conversion failed with error %d.\n", error);
      return 1;
   }
   return 0;
}
' Create the converter COM object. Object references must be assigned with Set.
Set oConverter = CreateObject("EasyConverter.PDF2HTML.5")
' Set option for handling OCR'ed documents
' NOTE(review): assumes OPT_OCR_IMAGE_HIDDEN_TEXT (value 3 in the optOcr list) is
' already defined, e.g. by a referenced type library - confirm for late-bound scripts.
oConverter.OcrOption = OPT_OCR_IMAGE_HIDDEN_TEXT
' inFileName and outFileName are expected to be supplied by the surrounding script.
Call oConverter.ConvertToHTML(inFileName, outFileName)
REM Store the quoted path of the command-line converter in the beconvh variable
set beconvh="C:\Program Files\BCL Technologies\easyConverter SDK 5\Html\beconvh.exe"
REM Set option for handling OCR'ed documents
REM -ocred accepts image+text, text, image or image+hiddenText; -i is the input PDF, -o the output HTML
%beconvh% -ocred image+hiddenText -i "c:\test\input.pdf" -o "c:\test\output.html"