nixpkgs-suyu/pkgs/development/libraries/languagemachines/frog.nix

# Package expression for Frog.
#
# The version, download URL and sha256 are not hard-coded here; they are read
# from ./release-info/LanguageMachines-frog.json.
{ stdenv, fetchurl
, automake, autoconf, bzip2, libtar, libtool, pkgconfig, autoconf-archive
, libxml2, icu
, languageMachines
}:

let
  # Attribute set parsed from the JSON file; this expression uses its
  # `version`, `url` and `sha256` fields.
  release = builtins.fromJSON (builtins.readFile ./release-info/LanguageMachines-frog.json);
in

stdenv.mkDerivation {
  name = "frog-${release.version}";
  version = release.version;

  src = fetchurl {
    inherit (release) url sha256;
    # Give the downloaded tarball a stable, versioned store name.
    name = "frog-v${release.version}.tar.gz";
  };

  nativeBuildInputs = [ pkgconfig ];
  buildInputs = [
    automake autoconf bzip2 libtar libtool autoconf-archive
    libxml2 icu
    languageMachines.ticcutils
    languageMachines.timbl
    languageMachines.mbt
    languageMachines.libfolia
    languageMachines.ucto
    languageMachines.frogdata
  ];

  # Run the source tree's bootstrap script before the configure phase.
  preConfigure = ''
    sh bootstrap.sh
  '';

  postInstall = ''
    # frog expects the data files installed in the same prefix
    mkdir -p "$out/share/frog"
    for f in ${languageMachines.frogdata}/share/frog/*; do
      ln -s "$f" "$out/share/frog/"
    done
  '';

  # Run `make check` after installation rather than in the regular check
  # phase, i.e. once the frogdata files have been linked into $out
  # (presumably the test suite needs them there -- confirm before moving it).
  # Using the installCheck phase keeps the tests switchable via doInstallCheck.
  doInstallCheck = true;
  installCheckTarget = "check";

  meta = with stdenv.lib; {
    description = "A Tagger-Lemmatizer-Morphological-Analyzer-Dependency-Parser for Dutch";
    homepage    = "https://languagemachines.github.io/frog";
    license     = licenses.gpl3;
    platforms   = platforms.all;
    maintainers = with maintainers; [ roberth ];

    longDescription = ''
      Frog is an integration of memory-based natural language processing (NLP) modules developed for Dutch. All NLP modules are based on Timbl, the Tilburg memory-based learning software package. Most modules were created in the 1990s at the ILK Research Group (Tilburg University, the Netherlands) and the CLiPS Research Centre (University of Antwerp, Belgium). Over the years they have been integrated into a single text processing tool, which is currently maintained and developed by the Language Machines Research Group and the Centre for Language and Speech Technology at Radboud University Nijmegen. A dependency parser, a base phrase chunker, and a named-entity recognizer module were added more recently. Where possible, Frog makes use of multi-processor support to run subtasks in parallel.

      Various (re)programming rounds have been made possible through funding by NWO, the Netherlands Organisation for Scientific Research, particularly under the CGN project, the IMIX programme, the Implicit Linguistics project, the CLARIN-NL programme and the CLARIAH programme.
    '';
  };

}
frog: init at v0.13.7 2017-08-08 11:34:09 +02:00			`{ stdenv, fetchurl`
languagemachines: fix darwin build 2018-03-11 07:39:04 +01:00			`, automake, autoconf, bzip2, libtar, libtool, pkgconfig, autoconf-archive`
frog: init at v0.13.7 2017-08-08 11:34:09 +02:00			`, libxml2, icu`
			`, languageMachines`
			`}:`

			`let`
			`release = builtins.fromJSON (builtins.readFile ./release-info/LanguageMachines-frog.json);`
			`in`

			`stdenv.mkDerivation {`
treewide: add version to packages Lots of packages are missing versions in their name. This adds them where appropriate. These were found with this command: $ nix-env -qa -f. \| grep -v '\-[0-9A-Za-z.-_+]*$' \| grep -v '^hook$' See issue #41007. 2018-05-24 06:37:33 +02:00			`name = "frog-${release.version}";`
frog: init at v0.13.7 2017-08-08 11:34:09 +02:00			`version = release.version;`
			`src = fetchurl { inherit (release) url sha256;`
frog: adhere to version schema convention see issue #43717 2018-07-20 23:04:39 +02:00			`name = "frog-v${release.version}.tar.gz"; };`
misc pkgs: Basic sed to get fix `pkgconfig` and `autoreconfHook` `buildInputs` Only acts on one-line dependency lists. 2017-09-05 23:26:13 +02:00			`nativeBuildInputs = [ pkgconfig ];`
languagemachines: fix darwin build 2018-03-11 07:39:04 +01:00			`buildInputs = [ automake autoconf bzip2 libtar libtool autoconf-archive`
frog: init at v0.13.7 2017-08-08 11:34:09 +02:00			`libxml2 icu`
			`languageMachines.ticcutils`
			`languageMachines.timbl`
			`languageMachines.mbt`
			`languageMachines.libfolia`
			`languageMachines.ucto`
			`languageMachines.frogdata`
			`];`

			`preConfigure = ''`
			`sh bootstrap.sh`
			`'';`
			`postInstall = ''`
			`# frog expects the data files installed in the same prefix`
			`mkdir -p $out/share/frog/;`
			`for f in ${languageMachines.frogdata}/share/frog/*; do`
			`ln -s $f $out/share/frog/;`
			`done;`

			`make check`
			`'';`

			`meta = with stdenv.lib; {`
			`description = "A Tagger-Lemmatizer-Morphological-Analyzer-Dependency-Parser for Dutch";`
			`homepage = https://languagemachines.github.io/frog;`
			`license = licenses.gpl3;`
			`platforms = platforms.all;`
			`maintainers = with maintainers; [ roberth ];`

			`longDescription = ''`
			Frog is an integration of memory-based natural language processing (NLP) modules developed for Dutch. All NLP modules are based on Timbl, the Tilburg memory-based learning software package. Most modules were created in the 1990s at the ILK Research Group (Tilburg University, the Netherlands) and the CLiPS Research Centre (University of Antwerp, Belgium). Over the years they have been integrated into a single text processing tool, which is currently maintained and developed by the Language Machines Research Group and the Centre for Language and Speech Technology at Radboud University Nijmegen. A dependency parser, a base phrase chunker, and a named-entity recognizer module were added more recently. Where possible, Frog makes use of multi-processor support to run subtasks in parallel.

			`Various (re)programming rounds have been made possible through funding by NWO, the Netherlands Organisation for Scientific Research, particularly under the CGN project, the IMIX programme, the Implicit Linguistics project, the CLARIN-NL programme and the CLARIAH programme.`
			`'';`
			`};`

			`}`