Unverified Commit 4ca42ad0 authored by Daniel Albert's avatar Daniel Albert
Browse files

invoice2data: 0.3.6 -> 0.4.2

Update invoice2data to v0.4.2, [released on 2023-02-11](https://github.com/invoice-x/invoice2data/releases/tag/v0.4.2).

This change also:
* Installs `ghostscript`, which is used to convert PDFs to images that serve as input for Tesseract
* Uses Tesseract 5 instead of Tesseract 3
* Switches from `xpdf` (which is marked as insecure) to `poppler_utils`, which is the recommended provider of `pdftotext` according to the `invoice2data` repo.
parent 68bfdaec
Loading
Loading
Loading
Loading
+10 −9
Original line number Diff line number Diff line
{ lib
, fetchFromGitHub
, ghostscript
, imagemagick
, poppler_utils
, python3
, tesseract
, xpdf
, tesseract5
}:

python3.pkgs.buildPythonApplication rec {
  pname = "invoice2data";
  version = "0.3.6";
  version = "0.4.2";
  format = "setuptools";

  src = fetchFromGitHub {
    owner = "invoice-x";
    repo = pname;
    rev = "v${version}";
    sha256 = "sha256-t1jgLyKtQsLINlnkCdSbVfTM6B/EiD1yGtx9UHjyZVE=";
    sha256 = "sha256-ss2h8cg0sga+lzJyQHckrZB/Eb63Oj3FkqmGqWCzCQ8=";
  };

  nativeBuildInputs = with python3.pkgs; [
    setuptools-git
  ];
  buildInputs = with python3.pkgs; [ setuptools-git ];

  propagatedBuildInputs = with python3.pkgs; [
    chardet
@@ -28,6 +27,7 @@ python3.pkgs.buildPythonApplication rec {
    pdfminer-six
    pillow
    pyyaml
    setuptools
    unidecode
  ];

@@ -37,9 +37,10 @@ python3.pkgs.buildPythonApplication rec {
  '';

  makeWrapperArgs = ["--prefix" "PATH" ":" (lib.makeBinPath [
    ghostscript
    imagemagick
    tesseract
    xpdf
    tesseract5
    poppler_utils
  ])];

  # Tests fail even when run manually on my Ubuntu machine!