Module: Asposeocrjava::RecognizeWhiteListedCharacters

Defined in:
lib/asposeocrjava/OCR/recognizewhitelistedcharacters.rb

Instance Method Summary collapse

Instance Method Details

#initializeObject



3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
# File 'lib/asposeocrjava/OCR/recognizewhitelistedcharacters.rb', line 3

def initialize()
    data_dir = File.dirname(File.dirname(File.dirname(File.dirname(__FILE__)))) + '/data/'
            
    # Initialize an instance of OcrEngine
    ocr_engine = Rjb::import('com.aspose.ocr.OcrEngine').new

    # Retrieve the OcrConfig of the OcrEngine object
    ocr_config = ocr_engine.getConfig()

    # Set the Whitelist property to recognize numbers only
    #ocr_config.setWhitelist(['1', '2', '3', '4', '5', '6', '7', '8', '9', '0'])

    # Set the Image property by loading the image from file path location
    ocr_engine.setImage(Rjb::import('com.aspose.ocr.ImageStream').fromFile(data_dir + 'ocr.png'))

    # Set the RemoveNonText to true
    ocr_engine.getConfig().setRemoveNonText(true)

    # Process the image
    if ocr_engine.process()
        text = ocr_engine.getText()
        puts "Text: " + text.to_string
         
        expression = "(\\d+)"
        # Create a Pattern object
        pattern = Rjb::import('java.util.regex.Pattern').compile(expression)

        # Now create matcher object
        matcher = pattern.matcher(text.toString())
        if matcher.find()
            puts "Found value: " + matcher.group(0).to_string
        end
    end
end