homebrew-core/Formula/tesseract.rb

112 lines
3.7 KiB
Ruby

class Tesseract < Formula
desc "OCR (Optical Character Recognition) engine"
homepage "https://github.com/tesseract-ocr/"
url "https://github.com/tesseract-ocr/tesseract/archive/3.05.01.tar.gz"
sha256 "05898f93c5d057fada49b9a116fc86ad9310ff1726a0f499c3e5211b3af47ec1"
bottle do
sha256 "60437cd40788761462c432ac924d2c7658ddbb8f40a11b0356f4647c8420a652" => :high_sierra
sha256 "6b3a0e12659b57344a67bfde229353593ba06b4fe26b7eb1eb9e585f8906a032" => :sierra
sha256 "788a83d200ba3aa34140fa0d2dbc2ecbf6cfb2a3eeb412417cbbf68dfc4678b4" => :el_capitan
sha256 "8798858e2d3846eb7b10335cb08c349fd18bb040a2e8b5e9bb3737d1bf2071d5" => :yosemite
end
head do
url "https://github.com/tesseract-ocr/tesseract.git"
resource "tessdata-head" do
url "https://github.com/tesseract-ocr/tessdata.git"
end
end
option "with-all-languages", "Install recognition data for all languages"
option "with-training-tools", "Install OCR training tools"
option "with-opencl", "Enable OpenCL support"
option "with-serial-num-pack", "Install serial number recognition pack"
deprecated_option "all-languages" => "with-all-languages"
depends_on "autoconf" => :build
depends_on "autoconf-archive" => :build
depends_on "automake" => :build
depends_on "libtool" => :build
depends_on "pkg-config" => :build
depends_on "leptonica"
depends_on "libtiff"
if build.with? "training-tools"
depends_on "libtool" => :build
depends_on "icu4c"
depends_on "glib"
depends_on "cairo"
depends_on "pango"
depends_on :x11
end
needs :cxx11
resource "tessdata" do
url "https://github.com/tesseract-ocr/tessdata/archive/3.04.00.tar.gz"
sha256 "5dcb37198336b6953843b461ee535df1401b41008d550fc9e43d0edabca7adb1"
end
resource "eng" do
url "https://github.com/tesseract-ocr/tessdata/raw/3.04.00/eng.traineddata"
sha256 "c0515c9f1e0c79e1069fcc05c2b2f6a6841fb5e1082d695db160333c1154f06d"
end
resource "osd" do
url "https://github.com/tesseract-ocr/tessdata/raw/3.04.00/osd.traineddata"
sha256 "9cf5d576fcc47564f11265841e5ca839001e7e6f38ff7f7aacf46d15a96b00ff"
end
resource "snum" do
url "https://github.com/USCDataScience/counterfeit-electronics-tesseract/raw/319a6eeacff181dad5c02f3e7a3aff804eaadeca/Training%20Tesseract/snum.traineddata"
sha256 "36f772980ff17c66a767f584a0d80bf2302a1afa585c01a226c1863afcea1392"
end
def install
if build.with? "training-tools"
icu4c = Formula["icu4c"]
ENV.append "CFLAGS", "-I#{icu4c.opt_include}"
ENV.append "LDFLAGS", "-L#{icu4c.opt_lib}"
end
# explicitly state leptonica header location, as the makefile defaults to /usr/local/include,
# which doesn't work for non-default homebrew location
ENV["LIBLEPT_HEADERSDIR"] = HOMEBREW_PREFIX/"include"
ENV.cxx11
system "./autogen.sh"
args = %W[
--disable-dependency-tracking
--prefix=#{prefix}
]
args << "--enable-opencl" if build.with? "opencl"
system "./configure", *args
system "make", "install"
if build.with? "serial-num-pack"
resource("snum").stage { mv "snum.traineddata", share/"tessdata" }
end
if build.with? "training-tools"
system "make", "training"
system "make", "training-install"
end
if build.head?
resource("tessdata-head").stage { mv Dir["*"], share/"tessdata" }
elsif build.with? "all-languages"
resource("tessdata").stage { mv Dir["*"], share/"tessdata" }
else
resource("eng").stage { mv "eng.traineddata", share/"tessdata" }
resource("osd").stage { mv "osd.traineddata", share/"tessdata" }
end
end
test do
assert_match version.to_s, shell_output("#{bin}/tesseract -v 2>&1")
end
end