blob: 0c40f67c21ee503bb4da604af5779205f7feab08 (
plain) (
blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
|
# Package expression for Google's SentencePiece tokenizer, built with CMake.
#
# Arguments:
#   lib, fetchFromGitHub, stdenv, cmake, gperftools - supplied by the package set.
#   withGPerfTools - when true (the default), gperftools is added to buildInputs;
#                    when false, the package is built without it.
{ lib
, fetchFromGitHub
, stdenv
, cmake
, gperftools
, withGPerfTools ? true
}:

stdenv.mkDerivation rec {
  pname = "sentencepiece";
  version = "0.2.0";

  src = fetchFromGitHub {
    owner = "google";
    repo = "sentencepiece";
    rev = "refs/tags/v${version}";
    # SRI-formatted hashes belong in `hash`; the value itself is unchanged.
    hash = "sha256-tMt6UBDqpdjAhxAJlVOFFlE3RC36/t8K0gBAzbesnsg=";
  };

  nativeBuildInputs = [ cmake ];
  buildInputs = lib.optionals withGPerfTools [ gperftools ];

  outputs = [ "bin" "dev" "out" ];

  # https://github.com/google/sentencepiece/issues/754
  #
  # Rewrite the literal `\${exec_prefix}/${CMAKE_INSTALL_LIBDIR}` and
  # `\${prefix}/${CMAKE_INSTALL_INCLUDEDIR}` strings in CMakeLists.txt to the
  # corresponding CMAKE_INSTALL_FULL_* variables.
  # NOTE(review): presumably needed because the install dirs are absolute
  # paths with split outputs - confirm against the linked issue.
  #
  # The '$' / '\$' shell quoting keeps `$` and `{` apart so that Nix does not
  # treat the sequence as string interpolation.
  #
  # `--replace-fail` is used instead of the deprecated `--replace` so that the
  # build fails loudly if upstream changes these lines and the patterns stop
  # matching, rather than silently skipping the workaround.
  postPatch = ''
    substituteInPlace CMakeLists.txt \
      --replace-fail '\$'{exec_prefix}/'$'{CMAKE_INSTALL_LIBDIR} '$'{CMAKE_INSTALL_FULL_LIBDIR} \
      --replace-fail '\$'{prefix}/'$'{CMAKE_INSTALL_INCLUDEDIR} '$'{CMAKE_INSTALL_FULL_INCLUDEDIR}
  '';

  # Explicit `lib.` references instead of a blanket `with lib;` scope.
  meta = {
    homepage = "https://github.com/google/sentencepiece";
    description = "Unsupervised text tokenizer for Neural Network-based text generation";
    license = lib.licenses.asl20;
    platforms = lib.platforms.unix;
    maintainers = with lib.maintainers; [ pashashocky ];
  };
}
|