Add mecab and wp2txt
mecab-variable-param.patch unknown status 1
1 | + | From 2396e90056706ef897acab3aaa081289c7336483 Mon Sep 17 00:00:00 2001 | |
2 | + | From: LEPILLER Julien <julien.lepiller@irisa.fr> | |
3 | + | Date: Fri, 19 Apr 2019 11:48:39 +0200 | |
4 | + | Subject: [PATCH] Allow variable parameters | |
5 | + | ||
6 | + | --- | |
7 | + | src/param.cpp | 6 +++++- | |
8 | + | 1 file changed, 5 insertions(+), 1 deletion(-) | |
9 | + | ||
10 | + | diff --git a/src/param.cpp b/src/param.cpp | |
11 | + | index 65328a2..006b1b5 100644 | |
12 | + | --- a/src/param.cpp | |
13 | + | +++ b/src/param.cpp | |
14 | + | @@ -79,8 +79,12 @@ bool Param::load(const char *filename) { | |
15 | + | size_t s1, s2; | |
16 | + | for (s1 = pos+1; s1 < line.size() && isspace(line[s1]); s1++); | |
17 | + | for (s2 = pos-1; static_cast<long>(s2) >= 0 && isspace(line[s2]); s2--); | |
18 | + | - const std::string value = line.substr(s1, line.size() - s1); | |
19 | + | + std::string value = line.substr(s1, line.size() - s1); | |
20 | + | const std::string key = line.substr(0, s2 + 1); | |
21 | + | + | |
22 | + | + if(value.find('$') == 0) { | |
23 | + | + value = std::getenv(value.substr(1).c_str()); | |
24 | + | + } | |
25 | + | set<std::string>(key.c_str(), value, false); | |
26 | + | } | |
27 | + | ||
28 | + | -- | |
29 | + | 2.20.1 | |
30 | + |
more/packages/games.scm
353 | 353 | lightweight & fast actor implementations, pattern matching for messages, | |
354 | 354 | network transparent messaging, and more.") | |
355 | 355 | (license (list license:boost1.0 license:bsd-3)))) | |
356 | + | ||
357 | + | (define-public mecab | |
358 | + | (package | |
359 | + | (name "mecab") | |
360 | + | (version "0.996") | |
361 | + | (source (origin | |
362 | + | (method url-fetch) | |
363 | + | (uri "https://drive.google.com/uc?export=download&id=0B4y35FiV1wh7cENtOXlicTFaRUE") | |
364 | + | (file-name (string-append name "-" version ".tar.gz")) | |
365 | + | (sha256 | |
366 | + | (base32 | |
367 | + | "0ncwlqxl1hdn1x4v4kr2sn1sbbcgnhdphp0lcvk74nqkhdbk4wz0")) | |
368 | + | (patches | |
369 | + | (search-patches | |
370 | + | "mecab-variable-param.patch")))) | |
371 | + | (build-system gnu-build-system) | |
372 | + | (search-paths | |
373 | + | (list (search-path-specification | |
374 | + | (variable "MECAB_DICDIR") | |
375 | + | (separator #f) | |
376 | + | (files '("lib/mecab/dic"))))) | |
377 | + | (arguments | |
378 | + | `(#:phases | |
379 | + | (modify-phases %standard-phases | |
380 | + | (add-before 'build 'add-mecab-dicdir-variable | |
381 | + | (lambda _ | |
382 | + | (substitute* "mecabrc.in" | |
383 | + | (("dicdir = .*") | |
384 | + | "dicdir = $MECAB_DICDIR")) | |
385 | + | (substitute* "mecab-config.in" | |
386 | + | (("echo @libdir@/mecab/dic") | |
387 | + | "if [ -z \"$MECAB_DICDIR\" ]; then | |
388 | + | echo @libdir@/mecab/dic | |
389 | + | else | |
390 | + | echo \"$MECAB_DICDIR\" | |
391 | + | fi")) | |
392 | + | #t))))) | |
393 | + | (inputs | |
394 | + | `(("libiconv" ,libiconv))) | |
395 | + | (home-page "https://taku910.github.io/mecab") | |
396 | + | (synopsis "Morphological analysis engine for texts") | |
397 | + | (description "Mecab is a morphological analysis engine developped as a | |
398 | + | collaboration between the Kyoto university and Nippon Telegraph and Telephone | |
399 | + | Corporation. The engine is independent of any language, dictionary or corpus. | |
400 | + | ") | |
401 | + | (license (list license:gpl2+ license:lgpl2.1+ license:bsd-3)))) | |
402 | + | ||
403 | + | (define-public mecab-ipadic | |
404 | + | (package | |
405 | + | (name "mecab-ipadic") | |
406 | + | (version "2.7.0") | |
407 | + | (source (origin | |
408 | + | (method url-fetch) | |
409 | + | (uri "https://drive.google.com/uc?export=download&id=0B4y35FiV1wh7MWVlSDBCSXZMTXM") | |
410 | + | (file-name (string-append name "-" version ".tar.gz")) | |
411 | + | (sha256 | |
412 | + | (base32 | |
413 | + | "08rmkvj0f0x6jq0axrjw2y5nam0mavv6x77dp9v4al0wi1ym4bxn")))) | |
414 | + | (build-system gnu-build-system) | |
415 | + | (arguments | |
416 | + | `(#:configure-flags | |
417 | + | (list (string-append "--with-dicdir=" (assoc-ref %outputs "out") | |
418 | + | "/lib/mecab/dic") | |
419 | + | "--with-charset=utf8") | |
420 | + | #:phases | |
421 | + | (modify-phases %standard-phases | |
422 | + | (add-before 'configure 'set-mecab-dir | |
423 | + | (lambda* (#:key outputs #:allow-other-keys) | |
424 | + | (setenv "MECAB_DICDIR" (string-append (assoc-ref outputs "out") | |
425 | + | "/lib/mecab/dic")) | |
426 | + | #t))))) | |
427 | + | (native-inputs | |
428 | + | `(("mecab" ,mecab))); for mecab-config | |
429 | + | (home-page "") | |
430 | + | (synopsis "") | |
431 | + | (description "") | |
432 | + | (license (license:non-copyleft "COPYING")))) |
more/packages/ruby.scm
552 | 552 | ") | |
553 | 553 | (home-page "http://www.rubocop.org/") | |
554 | 554 | (license license:expat))) | |
555 | + | ||
556 | + | (define-public ruby-trollop | |
557 | + | (package | |
558 | + | (name "ruby-trollop") | |
559 | + | (version "2.9.9") | |
560 | + | (source | |
561 | + | (origin | |
562 | + | (method url-fetch) | |
563 | + | (uri (rubygems-uri "trollop" version)) | |
564 | + | (sha256 | |
565 | + | (base32 | |
566 | + | "074h7lns72kg1dl5gvz5apl3xz1i0axbnbc01pf2kbw4q0lkpnp4")))) | |
567 | + | (build-system ruby-build-system) | |
568 | + | (arguments | |
569 | + | `(#:tests? #f)) | |
570 | + | (synopsis | |
571 | + | "Trollop is a commandline option parser for Ruby that just gets out of your way.") | |
572 | + | (description | |
573 | + | "Trollop is a commandline option parser for Ruby that just gets out of your way.") | |
574 | + | (home-page "") | |
575 | + | (license license:expat))) | |
576 | + | ||
577 | + | (define-public ruby-htmlentities | |
578 | + | (package | |
579 | + | (name "ruby-htmlentities") | |
580 | + | (version "4.3.4") | |
581 | + | (source | |
582 | + | (origin | |
583 | + | (method url-fetch) | |
584 | + | (uri (rubygems-uri "htmlentities" version)) | |
585 | + | (sha256 | |
586 | + | (base32 | |
587 | + | "1nkklqsn8ir8wizzlakncfv42i32wc0w9hxp00hvdlgjr7376nhj")))) | |
588 | + | (build-system ruby-build-system) | |
589 | + | (arguments | |
590 | + | `(#:tests? #f)) | |
591 | + | (synopsis | |
592 | + | "A module for encoding and decoding (X)HTML entities.") | |
593 | + | (description | |
594 | + | "This package provides a module for encoding and decoding (X)HTML entities.") | |
595 | + | (home-page | |
596 | + | "https://github.com/threedaymonk/htmlentities") | |
597 | + | (license license:expat))) | |
598 | + | ||
599 | + | (define-public ruby-wp2txt | |
600 | + | (package | |
601 | + | (name "ruby-wp2txt") | |
602 | + | (version "0.9.1") | |
603 | + | (source | |
604 | + | (origin | |
605 | + | (method url-fetch) | |
606 | + | (uri (rubygems-uri "wp2txt" version)) | |
607 | + | (sha256 | |
608 | + | (base32 | |
609 | + | "01l0r83ma3fp9zb94km4lqasvxpml2azd4dj36qzpm71c2pyhng4")))) | |
610 | + | (build-system ruby-build-system) | |
611 | + | (arguments | |
612 | + | `(#:tests? #f)) | |
613 | + | (propagated-inputs | |
614 | + | `(("ruby-htmlentities" ,ruby-htmlentities) | |
615 | + | ("ruby-nokogiri" ,ruby-nokogiri) | |
616 | + | ("ruby-parallel" ,ruby-parallel) | |
617 | + | ("ruby-trollop" ,ruby-trollop))) | |
618 | + | (synopsis | |
619 | + | "WP2TXT extracts plain text data from Wikipedia dump file (encoded in XML/compressed with Bzip2) stripping all the MediaWiki markups and other metadata.") | |
620 | + | (description | |
621 | + | "WP2TXT extracts plain text data from Wikipedia dump file (encoded in XML/compressed with Bzip2) stripping all the MediaWiki markups and other metadata.") | |
622 | + | (home-page "http://github.com/yohasebe/wp2txt") | |
623 | + | (license #f))) |