Some checks failed
Periodic Merges (6h) / master → staging-nixos (push) Failing after 12m50s
Periodic Merges (6h) / master → staging-next (push) Failing after 12m54s
Periodic Merges (24h) / merge-base(master,staging) → haskell-updates (push) Failing after 11m54s
Periodic Merges (6h) / staging-next → staging (push) Failing after 12m13s
Periodic Merges (24h) / staging-next-25.05 → staging-25.05 (push) Failing after 13m24s
Periodic Merges (24h) / release-25.05 → staging-next-25.05 (push) Failing after 14m28s
71 lines
1.7 KiB
Nix
71 lines
1.7 KiB
Nix
# Package expression for mbt ("Memory Based Tagger").
#
# Takes its build inputs as function arguments and returns a
# stdenv.mkDerivation built from the LanguageMachines/mbt GitHub repository
# at the tag "v<version>". `frog` is only referenced from passthru.tests and
# is not a build input of this derivation.
{
  lib,
  stdenv,
  fetchFromGitHub,
  gitUpdater,
  autoreconfHook,
  bzip2,
  libtar,
  libtool,
  pkg-config,
  autoconf-archive,
  libxml2,
  ticcutils,
  timbl,
  frog,
}:

stdenv.mkDerivation (finalAttrs: {
  pname = "mbt";
  version = "3.2.16";

  src = fetchFromGitHub {
    owner = "LanguageMachines";
    repo = "mbt";
    # The tag is derived from `version`, so overriding `version` also
    # changes which tag is fetched (the hash must then be updated too).
    tag = "v${finalAttrs.version}";
    hash = "sha256-O/LhLWgLwDctkRYjds+AM9fGMIRX3eCnJhRIXyVrJ04=";
  };

  nativeBuildInputs = [
    pkg-config
    autoreconfHook
  ];
  buildInputs = [
    bzip2
    libtar
    libtool
    autoconf-archive
    libxml2
    ticcutils
    timbl
  ];
  # NOTE(review): judging by its file name, this patch adds the libxml2
  # dependency to the upstream build; the patch itself is not visible here.
  patches = [ ./mbt-add-libxml2-dep.patch ];

  passthru = {
    # Looks for new upstream tags carrying the same "v" prefix used in `src.tag`.
    updateScript = gitUpdater { rev-prefix = "v"; };
    tests = {
      /**
        Reverse dependencies. Does not respect overrides.
      */
      reverseDependencies = lib.recurseIntoAttrs {
        inherit frog;
      };
    };
  };

  # Attributes are referenced through explicit `lib.` prefixes rather than a
  # blanket `with lib;`, so every name in this set has an obvious origin.
  meta = {
    description = "Memory Based Tagger";
    homepage = "https://languagemachines.github.io/mbt/";
    # `gpl3Only` is the explicit spelling of the version-ambiguous `gpl3`
    # alias (same SPDX meaning, GPL-3.0).
    # NOTE(review): confirm against the upstream source headers whether
    # "or any later version" applies, in which case this should be `gpl3Plus`.
    license = lib.licenses.gpl3Only;
    platforms = lib.platforms.all;
    maintainers = with lib.maintainers; [ roberth ];

    longDescription = ''
      MBT is a memory-based tagger-generator and tagger in one. The tagger-generator part can generate a sequence tagger on the basis of a training set of tagged sequences; the tagger part can tag new sequences. MBT can, for instance, be used to generate part-of-speech taggers or chunkers for natural language processing. It has also been used for named-entity recognition, information extraction in domain-specific texts, and disfluency chunking in transcribed speech.

      Mbt is used by Frog for Dutch tagging.
    '';
  };
})
|