module Asposeocrjava::RecognizeWhiteListedCharacters
Public Class Methods
new()
click to toggle source
# File lib/asposeocrjava/OCR/recognizewhitelistedcharacters.rb, line 3 def initialize() data_dir = File.dirname(File.dirname(File.dirname(File.dirname(__FILE__)))) + '/data/' # Initialize an instance of OcrEngine ocr_engine = Rjb::import('com.aspose.ocr.OcrEngine').new # Retrieve the OcrConfig of the OcrEngine object ocr_config = ocr_engine.getConfig() # Set the Whitelist property to recognize numbers only #ocr_config.setWhitelist(['1', '2', '3', '4', '5', '6', '7', '8', '9', '0']) # Set the Image property by loading the image from file path location ocr_engine.setImage(Rjb::import('com.aspose.ocr.ImageStream').fromFile(data_dir + 'ocr.png')) # Set the RemoveNonText to true ocr_engine.getConfig().setRemoveNonText(true) # Process the image if ocr_engine.process() text = ocr_engine.getText() puts "Text: " + text.to_string expression = "(\\d+)" # Create a Pattern object pattern = Rjb::import('java.util.regex.Pattern').compile(expression) # Now create matcher object matcher = pattern.matcher(text.toString()) if matcher.find() puts "Found value: " + matcher.group(0).to_string end end end