[SerializableAttribute()] public struct OcrAutoRecognizeJobData
Use this structure to specify the input data for an OCR job. After creating an instance of OcrAutoRecognizeJobData with the data, pass it to IOcrAutoRecognizeManager.CreateJob to create an IOcrAutoRecognizeJob object. Then use the IOcrAutoRecognizeJob object with the IOcrAutoRecognizeManager.RunJob and IOcrAutoRecognizeManager.RunJobAsync methods to run and monitor an OCR job.
The OcrAutoRecognizeJobData structure contains the following members:
| Member | Description | 
|---|---|
| ImageFileName and ImageStream | 
             The name of the file or the .NET stream containing the source image. This can be any single or multipage image file format supported by LEADTOOLS. One of these must not be null. If ImageFileName is not null, then it must contain the name of a file currently existing on disk.  | 
    
| FirstPageNumber | 
             1-based index of the first page number in ImageFileName or ImageStream to recognize. Use this and LastPageNumber to recognize only a certain range of pages in the source file. This member must be greater than or equal to 1 (first page in the file).  | 
    
| LastPageNumber | 
             1-based index of the last page number in ImageFileName or ImageStream to recognize. Use this and FirstPageNumber to recognize only a certain range of pages in the source file. Use a value of -1 to indicate "up to last page in the file"; otherwise, this member must be a value greater than or equal to FirstPageNumber, up to the maximum number of pages in the source file.  | 
    
| ZonesFileName | 
             Optional name of prepared multipage zone file. This member can be a null (Nothing in Visual Basic) reference. When no zone file is specified, the IOcrAutoRecognizeManager will auto-detect the zones for each page using IOcrPage.AutoZone.  | 
    
| Format | 
             The output document format, which can be any of the supported DocumentFormats such as PDF, DOC and TEXT. If this member is DocumentFormat.User, then the document is saved using the native engine format set in IOcrDocumentManager.EngineFormat if the engine used supports native formats; otherwise, an exception will be thrown.  | 
    
| DocumentFileName and DocumentStream | 
             The name of the output document file or the .NET stream to use for output. When recognition is completed, this file will be created on disk. One of these must not be null.  | 
    
| JobName | 
             Optional job name. If tracing is enabled with IOcrAutoRecognizeManager.EnableTrace, then the engine will use its value in the trace messages. If this member is a null reference (Nothing in Visual Basic), then the trace will show the generic [Untitled] name next to the trace messages.  | 
    
| UserData | 
             Optional user data associated with the job. Use this value to store any extra information required by your application. The IOcrAutoRecognizeJob will contain the same object used here in its IOcrAutoRecognizeJob.JobData member.  | 
    
using System;
using System.IO;
using System.Threading;

using Leadtools;
using Leadtools.Codecs;
using Leadtools.Ocr;
using Leadtools.Document.Writer;
using Leadtools.Forms.Common;
using Leadtools.WinForms;

/// <summary>
/// Example: OCR every TIF file in the LEADTOOLS images directory to PDF, running one
/// <see cref="IOcrAutoRecognizeJob"/> per file on the .NET thread pool and blocking the
/// caller until every document has been accounted for.
/// </summary>
public class RunJobExample
{
    // Number of documents that are pending
    private int _documentsPending;

    // Event to trigger when all documents are finished
    private AutoResetEvent _allDocumentsFinishedEvent;

    /// <summary>
    /// Starts the OCR engine, queues one job per TIF file and waits for all of them to finish.
    /// Returns immediately (after printing a message) when there are no TIF files to process.
    /// </summary>
    public void Start()
    {
        string imagesDirectory = LEAD_VARS.ImagesDir;
        string documentsDirectory = Path.Combine(LEAD_VARS.ImagesDir, "RunJobExample");

        // Create the output (documents) directory
        if (!Directory.Exists(documentsDirectory))
        {
            Directory.CreateDirectory(documentsDirectory);
        }

        // Get all TIF files in input (images) directory
        string[] imageFileNames = Directory.GetFiles(imagesDirectory, "*.tif");
        if (imageFileNames.Length == 0)
        {
            Console.WriteLine("No images to OCR");
            return;
        }

        // Create a new OCR engine instance
        OcrEngineType engineType = OcrEngineType.LEAD;
        Console.WriteLine("Starting up {0} engine", engineType);

        using (IOcrEngine ocrEngine = OcrEngineManager.CreateEngine(engineType))
        {
            ocrEngine.Startup(null, null, null, LEAD_VARS.OcrLEADRuntimeDir);

            // Setup document PDF save options: Image/Text with CCITT G4 encoding for B/W.
            // A direct cast is used so that an unexpected options type fails right here
            // with an InvalidCastException instead of a later NullReferenceException.
            DocumentWriter docWriter = ocrEngine.DocumentWriterInstance;
            PdfDocumentOptions pdfOptions = (PdfDocumentOptions)docWriter.GetOptions(DocumentFormat.Pdf);
            pdfOptions.ImageOverText = true;
            pdfOptions.DocumentType = PdfDocumentType.Pdf;
            pdfOptions.FontEmbedMode = DocumentFontEmbedMode.None;
            pdfOptions.OneBitImageCompression = OneBitImageCompressionType.FaxG4;
            docWriter.SetOptions(DocumentFormat.Pdf, pdfOptions);

            // We are going to use multiple-threads, so disable threading in
            // IOcrAutoRecognizeManager
            IOcrAutoRecognizeManager autoRecognizeManager = ocrEngine.AutoRecognizeManager;
            autoRecognizeManager.MaximumThreadsPerJob = 1;

            // Tell the recognize manager to continue on errors
            autoRecognizeManager.JobErrorMode = OcrAutoRecognizeManagerJobErrorMode.Continue;

            // Instead of using one event per document to trigger when it is done,
            // we will use the JobCompleted events of IOcrAutoRecognizeManager
            // to decrement a counter and trigger one event when the counter reaches 0
            autoRecognizeManager.JobStarted += new EventHandler<OcrAutoRecognizeRunJobEventArgs>(autoRecognizeManager_JobStarted);
            autoRecognizeManager.JobCompleted += new EventHandler<OcrAutoRecognizeRunJobEventArgs>(autoRecognizeManager_JobCompleted);

            int count = imageFileNames.Length;
            _documentsPending = count;
            _allDocumentsFinishedEvent = new AutoResetEvent(false);

            for (int i = 0; i < count; i++)
            {
                // Create the job data
                string imageFileName = imageFileNames[i];
                string name = "Document " + (i + 1).ToString();
                Console.WriteLine("Queuing {0} file {1}", name, imageFileName);

                JobData data = new JobData();
                data.AutoRecognizeManager = autoRecognizeManager;
                data.ImageFileName = imageFileName;
                data.DocumentFileName = Path.Combine(documentsDirectory, Path.GetFileNameWithoutExtension(imageFileName) + ".pdf");
                data.JobName = name;

                // Queue this job
                ThreadPool.QueueUserWorkItem(new WaitCallback(RunJob), data);
            }

            // Wait for all documents to finish
            _allDocumentsFinishedEvent.WaitOne();
            _allDocumentsFinishedEvent.Close();

            autoRecognizeManager.JobStarted -= new EventHandler<OcrAutoRecognizeRunJobEventArgs>(autoRecognizeManager_JobStarted);
            autoRecognizeManager.JobCompleted -= new EventHandler<OcrAutoRecognizeRunJobEventArgs>(autoRecognizeManager_JobCompleted);

            Console.WriteLine("All documents finished, check the result files in {0}", documentsDirectory);
        }
    }

    /// <summary>
    /// JobStarted handler: reports the job name and aborts all jobs when
    /// <see cref="AbortJobs"/> requests it.
    /// </summary>
    private void autoRecognizeManager_JobStarted(object sender, OcrAutoRecognizeRunJobEventArgs e)
    {
        // This is not strictly needed in this example, we will
        // use it to show information
        Console.WriteLine("{0} started...", e.Job.JobData.JobName);

        // Check if we need to abort
        if (AbortJobs(e.Job))
        {
            // Yes, abort all jobs
            e.Job.AutoRecognizeManager.AbortAllJobs();
        }
    }

    /// <summary>
    /// JobCompleted handler: reports the outcome, writes any job errors to a
    /// "*_errors.txt" file next to the output document, and counts the document as finished.
    /// </summary>
    private void autoRecognizeManager_JobCompleted(object sender, OcrAutoRecognizeRunJobEventArgs e)
    {
        IOcrAutoRecognizeJob job = e.Job;

        try
        {
            string message = string.Format("{0} completed ", job.JobData.JobName);

            // Show any errors
            if (job.Errors.Count == 0)
            {
                message += "successfully...";
            }
            else
            {
                message += "with errors, first error is " + job.Errors[0].Exception.Message;

                // And save the errors to a text file in the document directory
                string documentFileName = job.JobData.DocumentFileName;
                string textPathName = Path.Combine(Path.GetDirectoryName(documentFileName), Path.GetFileNameWithoutExtension(documentFileName) + "_errors.txt");

                using (StreamWriter writer = File.CreateText(textPathName))
                {
                    writer.WriteLine(job.JobData.JobName);
                    writer.WriteLine("Data:");
                    writer.WriteLine(" Image file name: " + job.JobData.ImageFileName);
                    writer.WriteLine(" First page number: " + job.JobData.FirstPageNumber);
                    writer.WriteLine(" Last page number: " + job.JobData.LastPageNumber);
                    writer.WriteLine(" Format:" + job.JobData.Format);
                    writer.WriteLine(" Document file name: " + job.JobData.DocumentFileName);
                    writer.WriteLine("Errors:");

                    foreach (OcrAutoRecognizeManagerJobError error in job.Errors)
                    {
                        writer.WriteLine(" Page: {0} during {1}. Error: {2}", error.ImagePageNumber, error.Operation, error.Exception.Message);
                    }
                }
            }

            Console.WriteLine(message);
        }
        finally
        {
            // Count the document even when reporting above failed (for example the
            // error file could not be created); otherwise Start() would never wake up.
            // UserData is the JobData instance that RunJob attached to this job.
            MarkDocumentFinished(job.JobData.UserData as JobData);
        }
    }

    /// <summary>
    /// Decrements the pending-documents counter exactly once per document and wakes up
    /// the main thread when the last document has been counted.
    /// </summary>
    /// <param name="data">
    /// The per-document state, or null when it is not available; a null value is
    /// counted unconditionally.
    /// </param>
    private void MarkDocumentFinished(JobData data)
    {
        // Both the JobCompleted handler and RunJob report completion; the flag makes
        // sure the same document is never counted twice.
        if (data != null && Interlocked.Exchange(ref data.Finished, 1) != 0)
        {
            return;
        }

        // Decrement the documents count, when we reach 0, we are done
        // Since this will be called from multiple threads, we need
        // to use a thread-safety procedure
        int pending = Interlocked.Decrement(ref _documentsPending);

        // If we are the last document, wake up main thread
        if (pending == 0)
        {
            _allDocumentsFinishedEvent.Set();
        }
    }

    /// <summary>Per-document state handed to the thread-pool work item.</summary>
    private sealed class JobData
    {
        public IOcrAutoRecognizeManager AutoRecognizeManager;
        public string ImageFileName;
        public string DocumentFileName;
        public string JobName;

        // 0 until this document has been counted as finished, 1 afterwards
        public int Finished;
    }

    /// <summary>
    /// Thread-pool entry point: creates and runs the OCR job for one document.
    /// </summary>
    /// <param name="state">The <see cref="JobData"/> instance queued by <see cref="Start"/>.</param>
    private void RunJob(object state)
    {
        JobData data = (JobData)state;

        try
        {
            Console.WriteLine("Running {0}", data.JobName);

            // Run it
            OcrAutoRecognizeJobData jobData = new OcrAutoRecognizeJobData(data.ImageFileName, DocumentFormat.Pdf, data.DocumentFileName);
            jobData.JobName = data.JobName;

            // Let the JobCompleted handler find our per-document state again
            jobData.UserData = data;

            IOcrAutoRecognizeJob job = data.AutoRecognizeManager.CreateJob(jobData);
            data.AutoRecognizeManager.RunJob(job);
        }
        catch (Exception ex)
        {
            // An unhandled exception on a thread-pool thread would terminate the process;
            // report the failure for this document and let the other documents continue.
            Console.WriteLine("{0} failed: {1}", data.JobName, ex.Message);
        }
        finally
        {
            // If the job failed before JobCompleted could count it, count it here so
            // that Start() is not left waiting forever. This is a no-op when the
            // document has already been counted.
            MarkDocumentFinished(data);
        }
    }

    /// <summary>
    /// Decides whether all current and pending jobs should be aborted. Always returns
    /// false in this example.
    /// </summary>
    private bool AbortJobs(IOcrAutoRecognizeJob ocrJob)
    {
        // In your application, you can check if abortion is required, for example, if the user
        // has pressed the Cancel button on a progress bar or if your service is shutting down.
        // In this example, we will never abort, but you can change this code to return true
        // upon any condition (or when a specific job is about to start)
        // and the engine will abort all current and pending jobs
        return false;
    }
}

/// <summary>Installation-specific paths used by the example.</summary>
static class LEAD_VARS
{
    public const string ImagesDir = @"C:\LEADTOOLS23\Resources\Images";
    public const string OcrLEADRuntimeDir = @"C:\LEADTOOLS23\Bin\Common\OcrLEADRuntime";
}