Hi Team,
I'm using version 17.3.0.0 of Aspose.OCR for .NET.
The OCR does not recognize all the words in the image; it also produces lots of symbols in place of words.
I have attached the source TIFF and the generated text file.
How can I get good-quality text from the image? After retrieving the text, I will be searching it for specific words.
The following is the code snippet I use:
p.p1 {margin: 0.0px 0.0px 0.0px 0.0px; font: 10.5px Consolas}
p.p2 {margin: 0.0px 0.0px 0.0px 0.0px; font: 10.5px Consolas; color: #33a2bd}
p.p3 {margin: 0.0px 0.0px 0.0px 0.0px; font: 10.5px Consolas; min-height: 13.0px}
p.p4 {margin: 0.0px 0.0px 0.0px 0.0px; font: 10.5px Consolas; color: #008f00}
span.s1 {color: #33a2bd}
span.s2 {color: #0433ff}
span.s3 {color: #000000}
span.s4 {color: #b4261a}
// Runs OCR on the TIFF, saves the recognized text of all pages to one file,
// and reports each page whose text contains the search term.
Aspose.OCR.OcrEngine ocrEngine = new Aspose.OCR.OcrEngine();
ocrEngine.Image = ImageStream.FromFile(@"C:\GAImages\1.Tiff");
ocrEngine.ClearNotifies();
ocrEngine.ProcessAllPages = true;
ocrEngine.Config.DetectTextRegions = false;
if (ocrEngine.Process())
{
    // Collect every page's text first: calling File.WriteAllText inside the loop
    // would overwrite the file on each iteration and keep only the last page.
    var allText = new System.Text.StringBuilder();
    foreach (Aspose.OCR.Page page in ocrEngine.Pages)
    {
        var pageText = page.PageText.ToString();
        allText.AppendLine(pageText);

        // The search must happen inside the loop, where pageText is in scope.
        if (pageText.Contains("abc"))
        {
            Console.WriteLine("It's the required page");
        }
    }

    File.WriteAllText(@"C:\Images\1.txt", allText.ToString());
}