lib/ocr-file/document.rb in ocr-file-0.0.2 vs lib/ocr-file/document.rb in ocr-file-0.0.3
- old
+ new
@@ -20,10 +20,10 @@
image_annotator: nil, # Needed for Cloud-Vision
type_of_ocr: OcrFile::OcrEngines::CloudVision::DOCUMENT_TEXT_DETECTION,
ocr_engine: 'tesseract', # 'cloud-vision'
# Image Pre-Processing
image_preprocess: true,
- effects: ['despeckle', 'deskew', 'enhance', 'sharpen', 'bw'],
+ effects: ['despeckle', 'deskew', 'enhance', 'sharpen', 'remove_shadow', 'bw'],
# PDF to Image Processing
optimise_pdf: true,
extract_pdf_images: true, # if false will screenshot each PDF page
temp_filename_prefix: 'image',
# Console Output