From 9b772c120dc78617b3e58c47aaf799c9b79b5d66 Mon Sep 17 00:00:00 2001 From: Micah Lee Date: Thu, 12 Dec 2013 14:23:50 -0800 Subject: [PATCH] Fixes #1, so this runs in Ubuntu. --- README.md | 7 +++++++ docs2csv.rb | 2 +- 2 files changed, 8 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index 43494a2..9e3324b 100644 --- a/README.md +++ b/README.md @@ -22,6 +22,13 @@ JPGs will allways be OCRd. Without Tesseract installed, you'll still be able to extract text from documents, but you won't be able to automatically OCR them. + - Ruby 1.9.x + + Ubuntu comes with Ruby 1.8. You can install Ruby 1.9.1 like this: + + ```sudo apt-get install ruby1.9.1``` + ```sudo update-alternatives --set ruby /usr/bin/ruby1.9.1``` + **Typical usage** ruby docs2csv.rb -r -o directory-to-scan output.csv diff --git a/docs2csv.rb b/docs2csv.rb index dd17c9e..1a40c9b 100644 --- a/docs2csv.rb +++ b/docs2csv.rb @@ -8,7 +8,7 @@ # Requires tesseract and poppler for OCR functionality require 'rubygems' -require 'Digest' +require 'digest' require 'tmpdir' require 'ostruct' require 'optparse'