File python-ocrmypdf.spec of Package python-ocrmypdf
#
# spec file for package python-ocrmypdf
#
# Copyright (c) 2024 SUSE LLC
#
# All modifications and additions to the file contributed by third parties
# remain the property of their copyright owners, unless otherwise agreed
# upon. The license for this file, and modifications and additions to the
# file, is the same license as for the pristine package itself (unless the
# license for the pristine package is not an Open Source License, in which
# case the license is the MIT License). An "Open Source License" is a
# license that conforms to the Open Source Definition (Version 1.9)
# published by the Open Source Initiative.
# Please submit bugfixes or comments via https://bugs.opensuse.org/
#
%define skip_python39 1
%{?sle15_python_module_pythons}
Name: python-ocrmypdf
Version: 16.6.0
Release: 0
Summary: OCRmyPDF adds an OCR text layer to scanned PDF files
License: MPL-2.0
Group: Development/Languages/Python
URL: https://github.com/ocrmypdf/OCRmyPDF
Source: https://files.pythonhosted.org/packages/source/o/ocrmypdf/ocrmypdf-%{version}.tar.gz
BuildRequires: %{python_module base >= 3.10}
BuildRequires: %{python_module hatch-vcs}
BuildRequires: %{python_module hatchling}
BuildRequires: %{python_module pip}
BuildRequires: %{python_module wheel}
BuildRequires: fdupes
BuildRequires: python-rpm-macros
# upstream use Requires: ghostscript >= 10.01.2
Requires: ghostscript >= 9.55
Requires: python-Pillow >= 10.0.1
Requires: python-deprecation >= 2.1.0
Requires: python-img2pdf >= 0.5
Requires: python-packaging >= 20
Requires: python-pdfminer.six >= 20220319
Requires: python-pikepdf >= 8.10.1
Requires: python-pluggy >= 1
Requires: python-reportlab >= 3.6.8
Requires: python-rich >= 13
Requires: tesseract-ocr >= 5.3.2
Requires: tesseract-ocr-traineddata-deu >= 4.1.0
Requires: tesseract-ocr-traineddata-eng >= 4.1.0
Requires(post): update-alternatives
Requires(postun): update-alternatives
Suggests: python-Flask >= 2.0.1
Suggests: python-PyMuPDF >= 1.19.1
Suggests: python-python-dotenv
Suggests: python-sphinx
Suggests: python-sphinx-issues
Suggests: python-sphinx-rtd-theme
Suggests: python-typer
Suggests: python-watchdog >= 1.0.2
BuildArch: noarch
# SECTION test requirements
BuildRequires: %{python_module Pillow >= 10.0.1}
BuildRequires: %{python_module deprecation >= 2.1.0}
BuildRequires: %{python_module hypothesis >= 6.36.0}
BuildRequires: %{python_module img2pdf >= 0.5}
BuildRequires: %{python_module packaging >= 20}
BuildRequires: %{python_module pdfminer.six >= 20220319}
BuildRequires: %{python_module pikepdf >= 8.10.1}
BuildRequires: %{python_module pluggy >= 1}
BuildRequires: %{python_module pytest >= 6.2.5}
BuildRequires: %{python_module python-xmp-toolkit == 2.0.1}
BuildRequires: %{python_module reportlab >= 3.6.8}
BuildRequires: %{python_module rich >= 13}
BuildRequires: %{python_module types-Pillow}
BuildRequires: %{python_module types-humanfriendly}
# upstream use BuildRequires: ghostscript >= 10.02.1
BuildRequires: ghostscript >= 9.55
BuildRequires: tesseract-ocr >= 5.3.2
BuildRequires: tesseract-ocr-traineddata-eng >= 4.1.0
# /SECTION
%python_subpackages
%description
OCRmyPDF adds an OCR text layer to scanned PDF files, allowing them to be searched
%prep
%autosetup -p1 -n ocrmypdf-%{version}
# rpmlintrc
# Cleanup shebang and executable bits.
for f in src/ocrmypdf/*.py src/ocrmypdf/*/*.py; do
sed -e '1{\@^#!%{_bindir}/env python@d}' $f > $f.new &&
touch -r $f $f.new &&
mv $f.new $f
chmod -x $f
done
# Switch off parallelization of testing in the config file
# and getting coverage for our tests (useless for packaging)
sed -i -e '/addopts = "-n auto"/d' \
-e '/^\[tool.coverage\./,/^[[:blank:]]*$/d' \
pyproject.toml
%build
%pyproject_wheel
%install
%pyproject_install
%python_clone -a %{buildroot}%{_bindir}/ocrmypdf
%python_expand %fdupes %{buildroot}%{$python_sitelib}
%check
donttest="test_acroform_and_redo"
donttest+=" or test_blank_input_pdf"
donttest+=" or test_decompression_bomb_error"
donttest+=" or test_force_ocr"
donttest+=" or test_graft"
donttest+=" or test_image_input"
donttest+=" or test_input_file_not_found"
donttest+=" or test_input_file_not_readable"
donttest+=" or test_invalid_input_pdf"
donttest+=" or test_jbig2_passthrough"
donttest+=" or test_maximum_options"
donttest+=" or test_ocr_timeout"
donttest+=" or test_oversample"
donttest+=" or test_pagesegmode"
donttest+=" or test_pagesize_consistency"
donttest+=" or test_pdfa"
donttest+=" or test_quick"
donttest+=" or test_redo_ocr"
donttest+=" or test_repeat_ocr"
donttest+=" or test_rotate_deskew_ocr_timeout"
donttest+=" or test_sidecar_nonempty"
donttest+=" or test_sidecar_pagecount"
donttest+=" or test_skip_big"
donttest+=" or test_skip_ocr"
donttest+=" or test_tesseract_config_valid"
donttest+=" or test_tesseract_crash_autorotate"
donttest+=" or test_tesseract_crash"
donttest+=" or test_tesseract_oem"
donttest+=" or test_tesseract_thresholding"
donttest+=" or test_user_words_ocr"
donttest+=" or test_very_high_dpi"
# gh#ocrmypdf/OCRmyPDF#1423
donttest+=" or test_malformed_docinfo"
%pytest -k "not ($donttest)"
%post
%python_install_alternative ocrmypdf
%postun
%python_uninstall_alternative ocrmypdf
%files %{python_files}
%doc README.md
%license LICENSE LICENSES
%{python_sitelib}/ocrmypdf
%{python_sitelib}/ocrmypdf-%{version}.dist-info
%python_alternative %{_bindir}/ocrmypdf
%changelog