Unverified Commit c13ff346 authored by Peder Bergebakken Sundt's avatar Peder Bergebakken Sundt Committed by GitHub
Browse files

Merge pull request #258261 from pacien/translatelocally-models

translatelocally: update, fix aarch64, add model pkgs
parents adc2612d a6515b40
Loading
Loading
Loading
Loading
+22 −6
Original line number Diff line number Diff line
{ lib, stdenv, fetchFromGitHub
, cmake, qt6, libarchive, pcre2, protobuf, gperftools, blas
, runCommand, translatelocally, translatelocally-models
}:

let
  rev = "f8a2dba0a63989c6b3a7be36f736ed478cad1dd2";
  rev = "a210037760ca3ca9016ca1831c97531318df70fe";

in stdenv.mkDerivation (finalAttrs: {
  pname = "translatelocally";
  version = "unstable-2023-08-25";
  version = "unstable-2023-09-20";

  src = fetchFromGitHub {
    owner = "XapaJIaMnu";
    repo = "translateLocally";
    inherit rev;
    hash = "sha256-uUdDi0CwCR/FQjw5D2s088d/Tp7NQOI0ia30oOhlGoc=";
    hash = "sha256-T7cZdR09yDrPTwYxvDIaKTdV4mrB+gTHYVfch5BQ+PE=";
    fetchSubmodules = true;
  };

@@ -26,6 +27,11 @@ in stdenv.mkDerivation (finalAttrs: {
      3rd_party/bergamot-translator/3rd_party/marian-dev/src/common/git_revision.h
  '';

  # https://github.com/XapaJIaMnu/translateLocally/blob/81ed8b9/.github/workflows/build.yml#L330
  postConfigure = lib.optionalString stdenv.isAarch64 ''
    bash ../cmake/fix_ruy_build.sh .. .
  '';

  nativeBuildInputs = [
    cmake
    protobuf
@@ -48,6 +54,19 @@ in stdenv.mkDerivation (finalAttrs: {
    "-DCBLAS_LIBRARIES=-lcblas"
  ];

  passthru.tests = {
    cli-translate = runCommand "${finalAttrs.pname}-test-cli-translate" {
      nativeBuildInputs = [
        translatelocally
        translatelocally-models.fr-en-tiny
      ];
    } ''
      export LC_ALL="C.UTF-8"
      echo "Bonjour" | translateLocally -m fr-en-tiny > $out
      diff "$out" <(echo "Hello")
    '';
  };

  meta = with lib; {
    mainProgram = "translateLocally";
    homepage = "https://translatelocally.com/";
@@ -55,8 +74,5 @@ in stdenv.mkDerivation (finalAttrs: {
    license = licenses.mit;
    maintainers = with maintainers; [ pacien ];
    platforms = platforms.linux;

    # https://github.com/XapaJIaMnu/translateLocally/issues/150
    broken = stdenv.isAarch64;
  };
})
+43 −0
Original line number Diff line number Diff line
{ lib, stdenvNoCC, fetchurl }:

let
  modelSpecs = (builtins.fromJSON (builtins.readFile ./models.json));
  withCodeAsKey = f: { code, ... }@attrs: lib.nameValuePair code (f attrs);
  mkModelPackage = { name, code, version, url, checksum }:
    stdenvNoCC.mkDerivation {
      pname = "translatelocally-model-${code}";
      version = toString version;

      src = fetchurl {
        inherit url;
        sha256 = checksum;
      };
      dontUnpack = true;

      installPhase = ''
        TARGET="$out/share/translateLocally/models"
        mkdir -p "$TARGET"
        tar -xzf "$src" -C "$TARGET"

        # avoid patching shebangs in inconsistently executable extra files
        find "$out" -type f -exec chmod -x {} +
      '';

      meta = {
        description = "translateLocally model - ${name}";
        homepage = "https://translatelocally.com/";
        # https://github.com/browsermt/students/blob/master/LICENSE.md
        license = lib.licenses.cc-by-sa-40;
      };
    };
  allModelPkgs =
    lib.listToAttrs (map (withCodeAsKey mkModelPackage) modelSpecs);

in allModelPkgs // {
  is-en-tiny = allModelPkgs.is-en-tiny.overrideAttrs (super: {
    # missing model https://github.com/XapaJIaMnu/translateLocally/issues/147
    meta = super.meta // { broken = true; };
  });
} // {
  passthru.updateScript = ./update.sh;
}
+149 −0
Original line number Diff line number Diff line
[
  {
    "version": 1,
    "checksum": "3714539160d5b4dce3ce0d829939315e3daffeaff53647249cc6336d745c09f2",
    "url": "https://data.statmt.org/bergamot/models/csen/csen.student.base.tar.gz",
    "name": "Czech-English base",
    "code": "cs-en-base"
  },
  {
    "version": 1,
    "checksum": "693aa14ecb86275169ad4b01cbca294f3bd38d8d9bc1fad8dd89fa7e937e7d2c",
    "url": "https://data.statmt.org/bergamot/models/csen/csen.student.tiny11.tar.gz",
    "name": "Czech-English tiny",
    "code": "cs-en-tiny"
  },
  {
    "version": 1,
    "checksum": "7a57b4e3a11a2c5e03fc6855ffc2b8f61ce3f1a68aeefa4592577a9eebe25031",
    "url": "https://data.statmt.org/bergamot/models/csen/encs.student.base.tar.gz",
    "name": "English-Czech base",
    "code": "en-cs-base"
  },
  {
    "version": 1,
    "checksum": "f999d6511bdb4f1ff246b0563fdf9b71d836e1c3037fe5306a61836d3b5b8d19",
    "url": "https://data.statmt.org/bergamot/models/csen/encs.student.tiny11.tar.gz",
    "name": "English-Czech tiny",
    "code": "en-cs-tiny"
  },
  {
    "version": 2,
    "checksum": "e7362faa83c4f61e552adf8fbd4bc528fe706746eb9fc1c286ec9af7566e3daf",
    "url": "https://data.statmt.org/bergamot/models/deen/deen.student.base.tar.gz",
    "name": "German-English base",
    "code": "de-en-base"
  },
  {
    "version": 2,
    "checksum": "5c11b6ccfa0533fd5632b3cbccbb054972076266e2d1d989d3babb0ec0b10e28",
    "url": "https://data.statmt.org/bergamot/models/deen/deen.student.tiny11.tar.gz",
    "name": "German-English tiny",
    "code": "de-en-tiny"
  },
  {
    "version": 2,
    "checksum": "cf9ab5a41ce359672ab47579686f9af50fc1fe040552c375ca86912f0fce7827",
    "url": "https://data.statmt.org/bergamot/models/deen/ende.student.base.tar.gz",
    "name": "English-German base",
    "code": "en-de-base"
  },
  {
    "version": 2,
    "checksum": "0e85d1d7ee4f8a3ec12680696ffc11fa97d67a54d068ceafcf390a87df94877f",
    "url": "https://data.statmt.org/bergamot/models/deen/ende.student.tiny11.tar.gz",
    "name": "English-German tiny",
    "code": "en-de-tiny"
  },
  {
    "version": 1,
    "checksum": "adf49d0e2f21b82414bc353ae1f0904d93360caa92203ae9f2fc209a83882d81",
    "url": "https://data.statmt.org/bergamot/models/esen/esen.student.tiny11.tar.gz",
    "name": "Spanish-English tiny",
    "code": "es-en-tiny"
  },
  {
    "version": 1,
    "checksum": "6594dda2a4f5d333969c30f8356f4a9f3fe15a9f8a5fd018b0d85b9d9ad2abb0",
    "url": "https://data.statmt.org/bergamot/models/esen/enes.student.tiny11.tar.gz",
    "name": "English-Spanish tiny",
    "code": "en-es-tiny"
  },
  {
    "version": 1,
    "checksum": "05c6525549c9c621e348f8de74533764ad7696aba8245fc9a504116f8ef4053c",
    "url": "https://data.statmt.org/bergamot/models/eten/eten.student.tiny11.tar.gz",
    "name": "Estonian-English tiny",
    "code": "et-en-tiny"
  },
  {
    "version": 1,
    "checksum": "afce6c566270abdd4db332e8dcf4fe22057ada3b2a1171aab04d0d4817396fb5",
    "url": "https://data.statmt.org/bergamot/models/eten/enet.student.tiny11.tar.gz",
    "name": "English-Estonian tiny",
    "code": "en-et-tiny"
  },
  {
    "version": 1,
    "checksum": "5c1696747590d1a75bef67348dce96bcd3889eb5a06a0f670c3d7232ed79f60e",
    "url": "https://data.statmt.org/bergamot/models/isen/isen.student.tiny11.tar.gz",
    "name": "Icelandic-English tiny",
    "code": "is-en-tiny"
  },
  {
    "version": 1,
    "checksum": "9f5dde2f4f87438c24c9561990636e624c53b527ddc8505f822b22b073069de8",
    "url": "https://data.statmt.org/bergamot/models/nben/nben.student.tiny11.tar.gz",
    "name": "Norwegian (Bokmål)-English tiny",
    "code": "nb-en-tiny"
  },
  {
    "version": 1,
    "checksum": "0bb4b83560caaffae95940574d939999092800a7803fae4c79a97e6481887a4f",
    "url": "https://data.statmt.org/bergamot/models/nnen/nnen.student.tiny11.tar.gz",
    "name": "Norwegian (Nynorsk)-English tiny",
    "code": "nn-en-tiny"
  },
  {
    "version": 1,
    "checksum": "ecfe9c2b0be3406c0205ad2da58f4005893a4ae969e81dd9c523093cf5c7abc3",
    "url": "https://data.statmt.org/bergamot/models/bgen/bgen.student.tiny11.tar.gz",
    "name": "Bulgarian-English tiny",
    "code": "bg-en-tiny"
  },
  {
    "version": 1,
    "checksum": "eb9a7511ae9c89fb91ab6da1e9d5061946ad752e5801351f39c8eddca9705c74",
    "url": "https://data.statmt.org/bergamot/models/bgen/enbg.student.tiny11.tar.gz",
    "name": "English-Bulgarian tiny",
    "code": "en-bg-tiny"
  },
  {
    "version": 1,
    "checksum": "87148203cbda28421d76fffbd7d3cd6c1fc0d6dae2843c248870274d6512a388",
    "url": "https://data.statmt.org/bergamot/models/plen/plen.student.tiny11.tar.gz",
    "name": "Polish-English tiny",
    "code": "pl-en-tiny"
  },
  {
    "version": 1,
    "checksum": "c33219daa12e7872cf7ac8a1b86a2f3e0592ebadd7e756bf11d16d9a7725cf9b",
    "url": "https://data.statmt.org/bergamot/models/plen/enpl.student.tiny11.tar.gz",
    "name": "English-Polish tiny",
    "code": "en-pl-tiny"
  },
  {
    "version": 1,
    "checksum": "817a45ed9ec3228bfb797e5e14781ab7fe9f388fe1e834e280031f05089809f8",
    "url": "https://data.statmt.org/bergamot/models/fren/fren.student.tiny11.tar.gz",
    "name": "French-English tiny",
    "code": "fr-en-tiny"
  },
  {
    "version": 1,
    "checksum": "28deea86d2a02102a7fedf19391a7628386f01f1f532d430306a9728dc5ec2d6",
    "url": "https://data.statmt.org/bergamot/models/fren/enfr.student.tiny11.tar.gz",
    "name": "English-French tiny",
    "code": "en-fr-tiny"
  }
]
+14 −0
Original line number Diff line number Diff line
#!/usr/bin/env nix-shell
#! nix-shell -i bash -p curl -p jq

set -eu -o pipefail

curl https://translatelocally.com/models.json \
  | jq '.models | map(with_entries(select([.key] | inside([
      "name",
      "code",
      "version",
      "url",
      "checksum"
    ]))))' \
  > "$(dirname "$0")/models.json"
+2 −0
Original line number Diff line number Diff line
@@ -14105,6 +14105,8 @@ with pkgs;
  translatelocally = callPackage ../applications/misc/translatelocally { };
  translatelocally-models = recurseIntoAttrs (callPackages ../misc/translatelocally-models { });
  translate-shell = callPackage ../applications/misc/translate-shell { };
  translatepy = with python3.pkgs; toPythonApplication translatepy;