File tesseract-ocr.spec of Package tesseract-ocr
#
# spec file for package tesseract-ocr
#
# Copyright (c) 2020 SUSE LLC
#
# All modifications and additions to the file contributed by third parties
# remain the property of their copyright owners, unless otherwise agreed
# upon. The license for this file, and modifications and additions to the
# file, is the same license as for the pristine package itself (unless the
# license for the pristine package is not an Open Source License, in which
# case the license is the MIT License). An "Open Source License" is a
# license that conforms to the Open Source Definition (Version 1.9)
# published by the Open Source Initiative.
# Please submit bugfixes or comments via https://bugs.opensuse.org/
#
%define so_ver 4
Name: tesseract-ocr
Version: 4.1.1
Release: 0
Summary: Open Source OCR Engine
License: Apache-2.0 AND GPL-2.0-or-later
URL: https://github.com/tesseract-ocr/tesseract
Source0: https://github.com/tesseract-ocr/tesseract/archive/%{version}.tar.gz#/%{name}-%{version}.tar.gz
# PATCH-FIX-OPENSUSE -- boo#1159231
Patch0: tesseract-ocr-no-cpudetection.patch
BuildRequires: asciidoc
BuildRequires: autoconf
BuildRequires: automake
BuildRequires: doxygen
BuildRequires: fdupes
BuildRequires: gcc-c++
BuildRequires: libtool
BuildRequires: libxslt-tools
BuildRequires: opencl-headers
BuildRequires: pkgconfig >= 0.9.0
BuildRequires: pkgconfig(OpenCL)
BuildRequires: pkgconfig(cairo)
BuildRequires: pkgconfig(fontconfig)
BuildRequires: pkgconfig(icu-i18n) >= 52.1
BuildRequires: pkgconfig(icu-uc) >= 52.1
BuildRequires: pkgconfig(lept) >= 1.74
BuildRequires: pkgconfig(libarchive)
BuildRequires: pkgconfig(pango) >= 1.22.0
BuildRequires: pkgconfig(pangocairo) >= 1.22.0
BuildRequires: pkgconfig(pangoft2) >= 1.22.0
Recommends: tesseract-ocr-traineddata-english
%description
A commercial quality OCR engine originally developed at HP between 1985 and
1995. In 1995, this engine was among the top 3 evaluated by UNLV. It was
open-sourced by HP and UNLV in 2005. From 2007 it is developed by Google.
%package devel
Summary: Tesseract Open Source OCR Engine Development files
Requires: libtesseract%{so_ver} = %{version}
Requires: pkgconfig(lept) >= 1.74
Requires: pkgconfig(libarchive)
%description devel
This package contains development files for the Tesseract Open Source OCR
Engine.
%package -n libtesseract%{so_ver}
Summary: Open Source OCR Engine
%description -n libtesseract%{so_ver}
A commercial quality OCR engine originally developed at HP between 1985 and
1995. In 1995, this engine was among the top 3 evaluated by UNLV. It was
open-sourced by HP and UNLV in 2005. From 2007 it is developed by Google.
%prep
%autosetup -n tesseract-%{version} -p1
%build
autoreconf -fiv
%configure \
--enable-opencl \
--disable-static
%make_build all training doc
%install
%make_install all training-install
# Remove libtool config files
rm -f %{buildroot}%{_libdir}/libtesseract.la
# Manually install the devel docs in order to fix rpmlint warnings "files-duplicate" and "doc-file-dependency"
mkdir -p %{buildroot}%{_defaultdocdir}/%{name}-devel
cp -a doc/html/ %{buildroot}%{_defaultdocdir}/%{name}-devel/
# Fix rpmlint warning "doc-file-dependency"
rm -f %{buildroot}%{_defaultdocdir}/%{name}-devel/html/installdox
# Fix rpmlint warning "non-executable-in-bin"
chmod 0755 %{buildroot}%{_bindir}/tesstrain_utils.sh
# Fix rpmlint warning "files-duplicate"
%fdupes -s %{buildroot}
%post -n libtesseract%{so_ver} -p /sbin/ldconfig
%postun -n libtesseract%{so_ver} -p /sbin/ldconfig
%files
%doc AUTHORS ChangeLog README.md
%license LICENSE
%{_bindir}/*
%dir %{_datadir}/tessdata
%{_datadir}/tessdata/configs/
%{_datadir}/tessdata/tessconfigs/
%{_datadir}/tessdata/pdf.ttf
%{_mandir}/man1/*.1%{?ext_man}
%{_mandir}/man5/*.5%{?ext_man}
%files devel
%doc %{_defaultdocdir}/tesseract-ocr-devel/
%{_includedir}/tesseract/
%{_libdir}/libtesseract*.so
%{_libdir}/pkgconfig/*.pc
%files -n libtesseract%{so_ver}
%{_libdir}/libtesseract.so.%{so_ver}*
%changelog