about summary refs log tree commit diff
path: root/nixpkgs/pkgs/development/python-modules/spacy/models.nix
blob: c34bbdfb83d85c1cc048e68a85c6f29cff208bed (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
{ lib
, buildPythonPackage
, fetchurl
, jieba
, pymorphy2
, sentencepiece
, spacy
, spacy-pkuseg
, spacy-transformers }:
let
  buildModelPackage = { pname, version, sha256, license }:
  let
    lang = builtins.substring 0 2 pname;
  in buildPythonPackage {
    inherit pname version;

    src = fetchurl {
      url = "https://github.com/explosion/spacy-models/releases/download/${pname}-${version}/${pname}-${version}.tar.gz";
      inherit sha256;
    };

    propagatedBuildInputs = [ spacy ]
      ++ lib.optionals (lang == "zh") [ jieba spacy-pkuseg ]
      ++ lib.optionals (lib.hasSuffix "_trf" pname) [ spacy-transformers ]
      ++ lib.optionals (lang == "ru") [ pymorphy2 ]
      ++ lib.optionals (pname == "fr_dep_news_trf") [ sentencepiece ];

    postPatch = lib.optionals (pname == "fr_dep_news_trf") ''
      substituteInPlace meta.json \
        --replace "sentencepiece==0.1.91" "sentencepiece>=0.1.91"
    '';

    pythonImportsCheck = [ pname ];

    meta = with lib; {
      description = "Models for the spaCy NLP library";
      homepage    = "https://github.com/explosion/spacy-models";
      license     = licenses.${license};
      maintainers = with maintainers; [ rvl ];
    };
  };

  makeModelSet = models: with lib; listToAttrs (map (m: nameValuePair m.pname (buildModelPackage m)) models);

in makeModelSet (lib.importJSON ./models.json)

# cat models.json | jq -r '.[] | @uri "https://github.com/explosion/spacy-models/releases/download/\(.pname)-\(.version)/\(.pname)-\(.version).tar.gz"' | xargs -n1 nix-prefetch-url