# Package definition for SoMaJo, a tokenizer and sentence splitter for
# German and English web texts.
#
# Arguments are supplied by the enclosing Python package set:
#   lib, stdenv          - nixpkgs library functions and platform information
#   fetchFromGitHub      - source fetcher
#   buildPythonPackage   - Python package builder
#   isPy3k               - true when building for a Python 3 interpreter
#   regex                - the Python `regex` package (runtime dependency)
{ lib, stdenv, fetchFromGitHub, buildPythonPackage, isPy3k, regex }:

buildPythonPackage rec {
  pname = "SoMaJo";
  version = "2.1.3";

  # Only built for Python 3 interpreters.
  disabled = !isPy3k;

  # The source is the GitHub tag named "v" followed by the version.
  src = fetchFromGitHub {
    owner = "tsproisl";
    repo = pname;
    rev = "v${version}";
    sha256 = "07jkkg5ph5m47xf8w5asy5930qcpy6p11j0admll2y6yjynd2b47";
  };

  propagatedBuildInputs = [ regex ];

  # The check phase loops forever on Darwin, so it is only run on other
  # platforms.
  doCheck = !stdenv.isDarwin;

  meta = with lib; {
    description = "Tokenizer and sentence splitter for German and English web texts";
    homepage = "https://github.com/tsproisl/SoMaJo";
    license = licenses.gpl3Plus;
    maintainers = with maintainers; [ danieldk ];
  };
}