2020-02-25 16:06:24 +01:00
|
|
|
# Package expression for SentencePiece, built with CMake from a tagged
# GitHub source snapshot.
#
# Arguments:
#   lib, stdenv, fetchFromGitHub, cmake, gperftools
#       Supplied by the calling package set.
#   withGPerfTools (default: true)
#       When true, gperftools is added to the build inputs; pass false to
#       build without it.
{ lib
, fetchFromGitHub
, stdenv
, cmake
, gperftools
, withGPerfTools ? true
}:

stdenv.mkDerivation rec {
  pname = "sentencepiece";
  version = "0.1.93";

  src = fetchFromGitHub {
    owner = "google";
    repo = pname;
    # The fetched revision is the version string prefixed with "v".
    rev = "v${version}";
    sha256 = "0h9c1xs0sab23labh8m3ar6kvzfldv2id2f17icja61ihyw06nrd";
  };

  # Only tools that run on the build machine belong here.
  nativeBuildInputs = [ cmake ];

  # gperftools is a library for the host platform rather than a build-time
  # tool, so it is listed in buildInputs; this keeps cross-compilation and
  # strictDeps builds correct.
  # NOTE(review): presumably upstream's CMake links against it when it is
  # found -- confirm against the upstream build files.
  buildInputs = lib.optional withGPerfTools gperftools;

  outputs = [ "bin" "dev" "out" ];

  # Use the `lib` argument directly instead of the deprecated `stdenv.lib`
  # alias.
  meta = with lib; {
    homepage = "https://github.com/google/sentencepiece";
    description = "Unsupervised text tokenizer for Neural Network-based text generation";
    license = licenses.asl20;
    platforms = platforms.unix;
    maintainers = with maintainers; [ danieldk pashashocky ];
  };
}
|