Method: PDFextract#extract_with_ocr

Defined in:
lib/pdf_extract.rb

#extract_with_ocr(page_path, dimensions) ⇒ Object



180
181
182
183
184
185
186
187
# File 'lib/pdf_extract.rb', line 180

# Runs Tesseract OCR (English) over a fixed region of the page image and
# returns the recognized text with surrounding whitespace stripped.
#
# The recognized text is also written into +dimensions+ under the
# +:result+ key, so the caller's hash is mutated. Nothing is read from
# +dimensions+ here.
#
# @param page_path [Object] image handed to +Tesseract::Engine#image=+
#   (presumably a file path String - confirm against callers)
# @param dimensions [Hash] receives the OCR output under +:result+
# @return [String] the stripped OCR text (same object stored in +dimensions+)
def extract_with_ocr(page_path, dimensions)
  ocr = Tesseract::Engine.new(language: :eng)
  ocr.image = page_path
  # Hard-coded recognition rectangle.
  # NOTE(review): presumably x, y, width, height - confirm against the
  # tesseract-ocr gem's Engine#select documentation.
  ocr.select(1, 34, 59, 281)
  # An index assignment evaluates to the assigned value, so this both
  # stores the text and serves as the method's return value.
  dimensions[:result] = ocr.text.strip
end