Unverified commit 5138eb3f, authored by Gaétan Lepage, committed by GitHub
Browse files

python3Packages.mlcroissant: 1.0.22 -> 1.1.0 (#511707)

parents 0412aed9 25f11f8e
Loading
Loading
Loading
Loading
+8 −7
Original line number Diff line number Diff line
@@ -29,19 +29,20 @@
  writableTmpDirAsHomeHook,
}:

buildPythonPackage rec {
buildPythonPackage (finalAttrs: {
  pname = "mlcroissant";
  version = "1.0.22";
  version = "1.1.0";
  pyproject = true;
  __structuredAttrs = true;

  src = fetchFromGitHub {
    owner = "mlcommons";
    repo = "croissant";
    tag = "v${version}";
    hash = "sha256-uJOxKNrK3eN2wyPFEQr2J4+vZeSK1KPyFDag2jcyWZw=";
    tag = "v${finalAttrs.version}";
    hash = "sha256-IaRlmNQjOSIT3/b6AM68eRmweZEI5yjo6I9ievQIIsE=";
  };

  sourceRoot = "${src.name}/python/mlcroissant";
  sourceRoot = "${finalAttrs.src.name}/python/mlcroissant";

  build-system = [
    setuptools
@@ -91,10 +92,10 @@ buildPythonPackage rec {
  meta = {
    description = "High-level format for machine learning datasets that brings together four rich layers";
    homepage = "https://github.com/mlcommons/croissant";
    changelog = "https://github.com/mlcommons/croissant/releases/tag/${src.tag}";
    changelog = "https://github.com/mlcommons/croissant/releases/tag/${finalAttrs.src.tag}";
    license = lib.licenses.asl20;
    maintainers = with lib.maintainers; [ GaetanLepage ];
    platforms = lib.platforms.all;
    mainProgram = "mlcroissant";
  };
}
})
+10 −0
Original line number Diff line number Diff line
@@ -93,6 +93,16 @@ buildPythonPackage (finalAttrs: {
          "elif field.label == field.LABEL_REPEATED:" \
          "elif hasattr(field_value, 'extend'):"
    ''
    # mlcroissant 1.1.0 requires leaf fields to define `source` or `value`
    + ''
      substituteInPlace tensorflow_datasets/core/utils/croissant_utils_test.py \
        --replace-fail \
          "references=mlc.Source(field='splits/name')," \
          "references=mlc.Source(field='splits/name'), source=mlc.Source(field='splits/name')," \
        --replace-fail \
          "references=mlc.Source(field='labels/label')," \
          "references=mlc.Source(field='labels/label'), source=mlc.Source(field='labels/label'),"
    ''
    # TypeError: only 0-dimensional arrays can be converted to Python scalars
    + ''
      substituteInPlace tensorflow_datasets/datasets/smallnorb/smallnorb_dataset_builder.py \