Unverified Commit 61fcc28b authored by xanderio's avatar xanderio Committed by GitHub
Browse files

markitdown: unstable-2024-12-18 -> 0.1.1 (#401090)

parents c47b4cf7 73873af8
Loading
Loading
Loading
Loading
+17 −4
Original line number Diff line number Diff line
@@ -5,6 +5,7 @@
  hatchling,
  beautifulsoup4,
  ffmpeg-headless,
  magika,
  mammoth,
  markdownify,
  numpy,
@@ -19,30 +20,38 @@
  requests,
  speechrecognition,
  youtube-transcript-api,
  olefile,
  xlrd,
  lxml,
  pytestCheckHook,
  gitUpdater,
}:

buildPythonPackage {
buildPythonPackage rec {
  pname = "markitdown";
  version = "unstable-2024-12-18";
  version = "0.1.1";
  pyproject = true;

  src = fetchFromGitHub {
    owner = "microsoft";
    repo = "markitdown";
    rev = "3ce21a47abed0e4db162de1088d661887ae076ff";
    hash = "sha256-5YafFL8OHNcGgB/qH6CmX0rTith1ZSRNIa+ktl4Ffvg=";
    tag = "v${version}";
    hash = "sha256-siXam2a+ryyLBbciQgjd9k6zC8r46LbzjPMoc1dG0wk=";
  };

  sourceRoot = "${src.name}/packages/markitdown";

  build-system = [ hatchling ];

  dependencies = [
    beautifulsoup4
    ffmpeg-headless
    lxml
    magika
    mammoth
    markdownify
    numpy
    olefile
    openai
    openpyxl
    pandas
@@ -53,6 +62,7 @@ buildPythonPackage {
    python-pptx
    requests
    speechrecognition
    xlrd
    youtube-transcript-api
  ];

@@ -63,6 +73,9 @@ buildPythonPackage {
  disabledTests = [
    # Require network access
    "test_markitdown_remote"
    "test_module_vectors"
    "test_cli_vectors"
    "test_module_misc"
  ];

  passthru.updateScripts = gitUpdater { };