52058a1144
* gnu/packages/search.scm (searx): New variable. Signed-off-by: Ludovic Courtès <ludo@gnu.org>
527 lines
22 KiB
Scheme
527 lines
22 KiB
Scheme
;;; GNU Guix --- Functional package management for GNU
|
|
;;; Copyright © 2014 Mark H Weaver <mhw@netris.org>
|
|
;;; Copyright © 2015, 2016 Eric Bavier <bavier@member.fsf.org>
|
|
;;; Copyright © 2017 Thomas Danckaert <post@thomasdanckaert.be>
|
|
;;; Copyright © 2017 Ricardo Wurmus <rekado@elephly.net>
|
|
;;; Copyright © 2018, 2020, 2021 Tobias Geerinckx-Rice <me@tobias.gr>
|
|
;;; Copyright © 2018 Adam Massmann <massmannak@gmail.com>
|
|
;;; Copyright © 2020 Hartmut Goebel <h.goebel@crazy-compilers.com>
|
|
;;; Copyright © 2021 Vinicius Monego <monego@posteo.net>
|
|
;;;
|
|
;;; This file is part of GNU Guix.
|
|
;;;
|
|
;;; GNU Guix is free software; you can redistribute it and/or modify it
|
|
;;; under the terms of the GNU General Public License as published by
|
|
;;; the Free Software Foundation; either version 3 of the License, or (at
|
|
;;; your option) any later version.
|
|
;;;
|
|
;;; GNU Guix is distributed in the hope that it will be useful, but
|
|
;;; WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
;;; GNU General Public License for more details.
|
|
;;;
|
|
;;; You should have received a copy of the GNU General Public License
|
|
;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
(define-module (gnu packages search)
|
|
#:use-module ((guix licenses)
|
|
#:select (gpl2 gpl2+ gpl3+ agpl3+ lgpl2.1+ bsd-3 x11 perl-license))
|
|
#:use-module (guix packages)
|
|
#:use-module (guix download)
|
|
#:use-module (guix git-download)
|
|
#:use-module (guix utils)
|
|
#:use-module (guix build-system gnu)
|
|
#:use-module (guix build-system perl)
|
|
#:use-module (guix build-system python)
|
|
#:use-module (gnu packages)
|
|
#:use-module (gnu packages compression)
|
|
#:use-module (gnu packages check)
|
|
#:use-module (gnu packages databases)
|
|
#:use-module (gnu packages freedesktop)
|
|
#:use-module (gnu packages less)
|
|
#:use-module (gnu packages linux)
|
|
#:use-module (gnu packages pcre)
|
|
#:use-module (gnu packages perl)
|
|
#:use-module (gnu packages pdf)
|
|
#:use-module (gnu packages python)
|
|
#:use-module (gnu packages python-crypto)
|
|
#:use-module (gnu packages python-web)
|
|
#:use-module (gnu packages python-xyz)
|
|
#:use-module (gnu packages sphinx)
|
|
#:use-module (gnu packages time)
|
|
#:use-module (gnu packages web)
|
|
#:use-module (gnu packages xdisorg)
|
|
#:use-module (gnu packages xml))
|
|
|
|
(define-public xapian
|
|
(package
|
|
(name "xapian")
|
|
(version "1.4.18")
|
|
;; Note: When updating Xapian, remember to update xapian-bindings below.
|
|
(source (origin
|
|
(method url-fetch)
|
|
(uri (string-append "https://oligarchy.co.uk/xapian/" version
|
|
"/xapian-core-" version ".tar.xz"))
|
|
(sha256
|
|
(base32 "0xsb4ihf3p767f0zx9p4janwni6r9sg5j6lry0002i8hmnsdnv8r"))))
|
|
(build-system gnu-build-system)
|
|
(inputs `(("zlib" ,zlib)
|
|
("util-linux" ,util-linux "lib")))
|
|
(arguments
|
|
`(#:phases
|
|
(modify-phases %standard-phases
|
|
(replace 'check
|
|
;; As of Xapian 1.3.3, the TCP server implementation uses
|
|
;; getaddrinfo(). This does not work in the build environment,
|
|
;; so exclude those tests. See HACKING for the list of targets.
|
|
(lambda _
|
|
(invoke "make"
|
|
"check-inmemory"
|
|
"check-remoteprog"
|
|
;"check-remotetcp"
|
|
"check-multi"
|
|
"check-glass"
|
|
"check-chert"))))))
|
|
(synopsis "Search Engine Library")
|
|
(description
|
|
"Xapian is a highly adaptable toolkit which allows developers to easily
|
|
add advanced indexing and search facilities to their own applications. It
|
|
supports the Probabilistic Information Retrieval model and also supports a
|
|
rich set of boolean query operators.")
|
|
(home-page "https://xapian.org/")
|
|
(license (list gpl2+ bsd-3 x11))))
|
|
|
|
(define-public python-xapian-bindings
|
|
(package (inherit xapian)
|
|
(name "python-xapian-bindings")
|
|
(version (package-version xapian))
|
|
(source (origin
|
|
(method url-fetch)
|
|
(uri (string-append "https://oligarchy.co.uk/xapian/" version
|
|
"/xapian-bindings-" version ".tar.xz"))
|
|
(sha256
|
|
(base32
|
|
"13ziql8027glgihgvnbsa75vkcn82g83mbihj60zf0njj170clpy"))))
|
|
(build-system gnu-build-system)
|
|
(arguments
|
|
`(#:configure-flags '("--with-python3")
|
|
#:make-flags
|
|
(list (string-append "pkgpylibdir="
|
|
(assoc-ref %outputs "out")
|
|
"/lib/python" ,(version-major+minor
|
|
(package-version python))
|
|
"/site-packages/xapian"))))
|
|
(native-inputs
|
|
`(("python-sphinx" ,python-sphinx))) ;for documentation
|
|
(inputs
|
|
`(("python" ,python)
|
|
("xapian" ,xapian)
|
|
("zlib" ,zlib)))
|
|
(synopsis "Python bindings for the Xapian search engine library")
|
|
(license gpl2+)))
|
|
|
|
(define-public perl-search-xapian
|
|
(package
|
|
(name "perl-search-xapian")
|
|
(version "1.2.25.4")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://cpan/authors/id/O/OL/OLLY/"
|
|
"Search-Xapian-" version ".tar.gz"))
|
|
(sha256
|
|
(base32 "1pbl8pbgmbs3i8yik4p63g4pd9bhn0dp3d7l667dkvw0kccl66c7"))))
|
|
(build-system perl-build-system)
|
|
(native-inputs
|
|
`(("perl-devel-leak" ,perl-devel-leak)))
|
|
(inputs
|
|
`(("xapian" ,xapian)))
|
|
(home-page "https://metacpan.org/release/Search-Xapian")
|
|
(synopsis "Perl XS frontend to the Xapian C++ search library")
|
|
(description
|
|
"Search::Xapian wraps most methods of most Xapian classes. The missing
|
|
classes and methods should be added in the future. It also provides a
|
|
simplified, more 'perlish' interface to some common operations.")
|
|
(license perl-license)))
|
|
|
|
(define-public libtocc
|
|
(package
|
|
(name "libtocc")
|
|
(version "1.0.1")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "https://github.com/aidin36/tocc/releases/download/"
|
|
"v" version "/tocc-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"1kd2jd74m8ksc8s7hh0haz0q0c3n0mr39bbky262kk4l58f1g068"))))
|
|
(build-system gnu-build-system)
|
|
(native-inputs `(("catch" ,catch-framework)))
|
|
(inputs `(("unqlite" ,unqlite)))
|
|
(arguments
|
|
`(#:phases (modify-phases %standard-phases
|
|
(add-before 'configure 'chdir-source
|
|
(lambda _
|
|
(chdir "libtocc/src")
|
|
#t))
|
|
(replace 'check
|
|
(lambda _
|
|
(with-directory-excursion "../tests"
|
|
(invoke "./configure"
|
|
(string-append "CONFIG_SHELL="
|
|
(which "sh"))
|
|
(string-append "SHELL="
|
|
(which "sh"))
|
|
"CPPFLAGS=-I../src"
|
|
(string-append
|
|
"LDFLAGS=-L../src/.libs "
|
|
"-Wl,-rpath=../src/.libs"))
|
|
(invoke "make")
|
|
(invoke "./libtocctests")))))))
|
|
(home-page "https://t-o-c-c.com/")
|
|
(synopsis "Tool for Obsessive Compulsive Classifiers")
|
|
(description
|
|
"libtocc is the engine of the Tocc project, a tag-based file management
|
|
system. The goal of Tocc is to provide a better system for classifying files
|
|
that is more flexible than classic file systems that are based on a tree of
|
|
files and directories.")
|
|
(license gpl3+)))
|
|
|
|
(define-public tocc
|
|
(package
|
|
(name "tocc")
|
|
(version (package-version libtocc))
|
|
(source (package-source libtocc))
|
|
(build-system gnu-build-system)
|
|
(inputs
|
|
`(("libtocc" ,libtocc)
|
|
("unqlite" ,unqlite)))
|
|
(arguments
|
|
`(#:tests? #f ;No tests
|
|
#:phases (modify-phases %standard-phases
|
|
(add-after
|
|
'unpack 'chdir-source
|
|
(lambda _ (chdir "cli/src"))))))
|
|
(home-page "https://t-o-c-c.com/")
|
|
(synopsis "Command-line interface to libtocc")
|
|
(description
|
|
"Tocc is a tag-based file management system. This package contains the
|
|
command line tool for interacting with libtocc.")
|
|
(license gpl3+)))
|
|
|
|
(define-public searx
|
|
(package
|
|
(name "searx")
|
|
(version "1.0.0")
|
|
(source
|
|
(origin
|
|
(method git-fetch)
|
|
(uri (git-reference
|
|
(url "https://github.com/searx/searx")
|
|
(commit version)))
|
|
(file-name (git-file-name name version))
|
|
(sha256
|
|
(base32 "0ghkx8g8jnh8yd46p4mlbjn2zm12nx27v7qflr4c8xhlgi0px0mh"))))
|
|
(build-system python-build-system)
|
|
(arguments
|
|
`(#:tests? #f ;what tests do is make online requests to each engine
|
|
#:phases
|
|
(modify-phases %standard-phases
|
|
(add-after 'unpack 'relax-requirements
|
|
(lambda _
|
|
;; These packages are outdated in Guix at the time of packaging.
|
|
;; When they are updated, remove corresponding substitutions.
|
|
;; Tests can run after build with 'searx-checker' tool in /bin.
|
|
(substitute* "requirements.txt"
|
|
(("flask-babel==2.0.0") "flask-babel>=1.0.0")
|
|
(("jinja2==2.11.3") "jinja2>=2.11.2")
|
|
(("lxml==4.6.3") "lxml>=4.4.2")
|
|
(("pygments==2.8.0") "pygments>=2.7.3")
|
|
(("requests\\[socks\\]==2.25.1") "requests>=2.25")
|
|
(("==") ">=")))))))
|
|
(propagated-inputs
|
|
`(("python-babel" ,python-babel)
|
|
("python-certifi" ,python-certifi)
|
|
("python-dateutil" ,python-dateutil)
|
|
("python-flask" ,python-flask)
|
|
("python-flask-babel" ,python-flask-babel)
|
|
("python-idna" ,python-idna)
|
|
("python-jinja2" ,python-jinja2)
|
|
("python-langdetect" ,python-langdetect)
|
|
("python-lxml" ,python-lxml)
|
|
("python-pygments" ,python-pygments)
|
|
("python-pyyaml" ,python-pyyaml)
|
|
("python-requests" ,python-requests)))
|
|
(home-page "https://searx.github.io/searx/")
|
|
(synopsis "Privacy-respecting metasearch engine")
|
|
(description "Searx is a privacy-respecting, hackable metasearch engine.")
|
|
(license agpl3+)))
|
|
|
|
(define-public bool
|
|
(package
|
|
(name "bool")
|
|
(version "0.2.2")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://gnu/bool/bool-"
|
|
version ".tar.xz"))
|
|
(sha256
|
|
(base32
|
|
"1frdmgrmb509fxbdpsxxw3lvvwv7xm1pavqrqgm4jg698iix6xfw"))))
|
|
(build-system gnu-build-system)
|
|
(home-page "https://www.gnu.org/software/bool/")
|
|
(synopsis "Finding text and HTML files that match boolean expressions")
|
|
(description
|
|
"GNU Bool is a utility to perform text searches on files using Boolean
|
|
expressions. For example, a search for \"hello AND world\" would return a
|
|
file containing the phrase \"Hello, world!\". It supports both AND and OR
|
|
statements, as well as the NEAR statement to search for the occurrence of
|
|
words in close proximity to each other. It handles context gracefully,
|
|
accounting for new lines and paragraph changes. It also has robust support
|
|
for parsing HTML files.")
|
|
(license gpl3+)))
|
|
|
|
(define-public hyperestraier
|
|
(package
|
|
(name "hyperestraier")
|
|
(version "1.4.13")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append "http://fallabs.com/" name "/"
|
|
name "-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"1qk3pxgzyrpcz5qfyd5xs2hw9q1cbb7j5zd4kp1diq501wcj2vs9"))))
|
|
(inputs
|
|
`(("qdbm" ,qdbm)
|
|
("zlib" ,zlib)))
|
|
(build-system gnu-build-system)
|
|
(arguments
|
|
`(#:configure-flags (list (string-append "LDFLAGS=-Wl,-rpath="
|
|
(assoc-ref %outputs "out")
|
|
"/lib"))))
|
|
(home-page "https://fallabs.com/hyperestraier")
|
|
(synopsis "Full-text search system")
|
|
(description "Hyper Estraier can be used to integrate full-text
|
|
search into applications, using either the provided command line and CGI
|
|
interfaces, or a C API.")
|
|
(license lgpl2.1+)))
|
|
|
|
(define-public mlocate
|
|
(package
|
|
(name "mlocate")
|
|
(version "0.26")
|
|
(source (origin
|
|
(method url-fetch)
|
|
(uri (string-append "http://releases.pagure.org/mlocate/"
|
|
"mlocate-" version ".tar.xz"))
|
|
(sha256
|
|
(base32
|
|
"0gi6y52gkakhhlnzy0p6izc36nqhyfx5830qirhvk3qrzrwxyqrh"))))
|
|
(build-system gnu-build-system)
|
|
(home-page "https://pagure.io/mlocate")
|
|
(synopsis "Locate files on the file system")
|
|
(description
|
|
"mlocate is a locate/updatedb implementation. The @code{m} stands for
|
|
\"merging\": @code{updatedb} reuses the existing database to avoid rereading
|
|
most of the file system, which makes it faster and does not trash the system
|
|
caches as much. The locate(1) utility is intended to be completely compatible
|
|
with slocate, and attempts to be compatible to GNU locate when it does not
|
|
conflict with slocate compatibility.")
|
|
(license gpl2)))
|
|
|
|
(define-public swish-e
|
|
(package
|
|
(name "swish-e")
|
|
(version "2.4.7")
|
|
(source (origin
|
|
(method url-fetch)
|
|
(uri (list (string-append
|
|
"https://web.archive.org/web/20160730145202/"
|
|
"http://swish-e.org/distribution/"
|
|
"swish-e-" version ".tar.gz")
|
|
(string-append "http://http.debian.net/debian/pool/"
|
|
"main/s/swish-e/swish-e_" version
|
|
".orig.tar.gz")))
|
|
(file-name (string-append name "-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"0qkrk7z25yp9hynj21vxkyn7yi8gcagcfxnass5cgczcz0gm9pax"))
|
|
(patches (search-patches "swish-e-search.patch"
|
|
"swish-e-format-security.patch"))))
|
|
(build-system gnu-build-system)
|
|
;; Several other packages and perl modules may be installed alongside
|
|
;; swish-e to extend its features at runtime, but are not required for
|
|
;; building: xpdf, catdoc, MP3::Tag, Spreadsheet::ParseExcel,
|
|
;; HTML::Entities.
|
|
(inputs
|
|
`(("perl" ,perl)
|
|
("perl-uri" ,perl-uri)
|
|
("perl-html-parser" ,perl-html-parser)
|
|
("perl-html-tagset" ,perl-html-tagset)
|
|
("perl-mime-types" ,perl-mime-types)))
|
|
(arguments
|
|
`(;; XXX: This fails to build with zlib (API mismatch) and tests fail
|
|
;; with libxml2, so disable both.
|
|
#:configure-flags (list (string-append "--without-zlib")
|
|
(string-append "--without-libxml2"))
|
|
#:phases (modify-phases %standard-phases
|
|
(add-after 'install 'wrap-programs
|
|
(lambda* (#:key inputs outputs #:allow-other-keys)
|
|
(let* ((out (assoc-ref outputs "out")))
|
|
(for-each
|
|
(lambda (program)
|
|
(wrap-program program
|
|
`("PERL5LIB" ":" prefix
|
|
,(map (lambda (i)
|
|
(string-append (assoc-ref inputs i)
|
|
"/lib/perl5/site_perl"))
|
|
;; These perl modules have no propagated
|
|
;; inputs, so no further analysis needed.
|
|
'("perl-uri"
|
|
"perl-html-parser"
|
|
"perl-html-tagset"
|
|
"perl-mime-types")))))
|
|
(list (string-append out "/lib/swish-e/swishspider")
|
|
(string-append out "/bin/swish-filter-test")))
|
|
#t))))))
|
|
(home-page (string-append "https://web.archive.org/web/20160730145202/"
|
|
"http://swish-e.org"))
|
|
(synopsis "Web indexing system")
|
|
(description
|
|
"Swish-e is Simple Web Indexing System for Humans - Enhanced. Swish-e
|
|
can quickly and easily index directories of files or remote web sites and
|
|
search the generated indexes.")
|
|
(license gpl2+))) ;with exception
|
|
|
|
(define-public xapers
|
|
(package
|
|
(name "xapers")
|
|
(version "0.8.2")
|
|
(source
|
|
(origin
|
|
(method url-fetch)
|
|
(uri (string-append
|
|
"https://finestructure.net/xapers/releases/xapers-"
|
|
version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"0ykz6hn3qj46w3c99d6q0pi5ncq2894simcl7vapv047zm3cylmd"))))
|
|
(build-system python-build-system)
|
|
(propagated-inputs
|
|
`(("poppler" ,poppler)
|
|
("python-urwid" ,python-urwid)
|
|
("xclip" ,xclip)
|
|
("xdg-utils" ,xdg-utils)))
|
|
(inputs
|
|
`(("python-latexcodec" ,python-latexcodec)
|
|
("python-pybtex" ,python-pybtex)
|
|
("python-pycurl" ,python-pycurl)
|
|
("python-pyyaml" ,python-pyyaml)
|
|
("python-six" ,python-six)
|
|
("python-xapian-bindings" ,python-xapian-bindings)))
|
|
(arguments
|
|
`(#:modules ((ice-9 rdelim)
|
|
(guix build python-build-system)
|
|
(guix build utils))
|
|
#:phases
|
|
(modify-phases %standard-phases
|
|
(add-after 'install 'install-doc
|
|
(lambda* (#:key inputs outputs #:allow-other-keys)
|
|
(define (purge-term-support input output)
|
|
(let loop ((line (read-line input)))
|
|
(if (string-prefix? "if [[ \"$term\"" line)
|
|
(begin (display "eval \"$cmd\"\n" output)
|
|
#t)
|
|
(begin (display (string-append line "\n") output)
|
|
(loop (read-line input))))))
|
|
(let* ((out (assoc-ref outputs "out"))
|
|
(bin (string-append out "/bin"))
|
|
(adder-out (string-append bin "/xapers-adder"))
|
|
(man1 (string-append out "/share/man/man1")))
|
|
(install-file "man/man1/xapers.1" man1)
|
|
(install-file "man/man1/xapers-adder.1" man1)
|
|
;; below is equivalent to setting --no-term option
|
|
;; permanently on; this is desirable to avoid imposing
|
|
;; an x-terminal installation on the user but breaks
|
|
;; some potential xapers-adder uses like auto browser
|
|
;; pdf handler, but user could instead still use
|
|
;; e.g. "xterm -e xapers-adder %F" for same use.
|
|
;; alternatively we could propagate xterm as an input
|
|
;; and replace 'x-terminal-emulator' with 'xterm'
|
|
(call-with-input-file "bin/xapers-adder"
|
|
(lambda (input)
|
|
(call-with-output-file adder-out
|
|
(lambda (output)
|
|
(purge-term-support input output)))))
|
|
(chmod adder-out #o555)))))))
|
|
(home-page "https://finestructure.net/xapers/")
|
|
(synopsis "Personal document indexing system")
|
|
(description
|
|
"Xapers is a personal document indexing system,
|
|
geared towards academic journal articles build on the Xapian search engine.
|
|
Think of it as your own personal document search engine, or a local cache of
|
|
online libraries. It provides fast search of document text and
|
|
bibliographic data and simple document and bibtex retrieval.")
|
|
(license gpl3+)))
|
|
|
|
(define-public ugrep
|
|
(package
|
|
(name "ugrep")
|
|
(version "3.1.12")
|
|
(source (origin
|
|
(method git-fetch)
|
|
(uri (git-reference
|
|
(url "https://github.com/Genivia/ugrep")
|
|
(commit (string-append "v" version))))
|
|
(sha256
|
|
(base32 "06y61sf2ywjaix4nss11wwkxipj8cc9ccx6bsmdm31h8d8wd2s0j"))
|
|
(file-name (git-file-name name version))
|
|
(modules '((guix build utils)))
|
|
(snippet
|
|
'(begin
|
|
(delete-file-recursively "bin") ; pre-built executables
|
|
(for-each delete-file (find-files "tests" "^archive\\..*"))
|
|
(for-each delete-file (find-files "tests" "^.*\\.pdf$"))
|
|
(for-each delete-file (find-files "tests" "^.*\\.class$"))
|
|
#t))))
|
|
(build-system gnu-build-system)
|
|
(inputs
|
|
`(("bzip2" ,bzip2)
|
|
("less" ,less)
|
|
("lz4" ,lz4)
|
|
("lzip" ,lzip) ;; lzma
|
|
("pcre2" ,pcre2)
|
|
("zlib" ,zlib)))
|
|
(arguments
|
|
`(#:tests? #f ; no way to rebuild the binary input files
|
|
#:test-target "test"
|
|
#:phases
|
|
(modify-phases %standard-phases
|
|
(add-before 'check 'check-setup
|
|
(lambda _
|
|
;; Unpatch shebangs in tests.
|
|
(substitute* '("tests/Hello.bat"
|
|
"tests/Hello.sh")
|
|
(("#!/gnu/store/.*/bin/sh") "#!/bin/sh")))))))
|
|
(home-page "https://github.com/Genivia/ugrep/")
|
|
(synopsis "Faster grep with an interactive query UI")
|
|
(description "Ugrep is a ultra fast searcher of file systems, text
|
|
and binary files, source code, archives, compressed files, documents, and
|
|
more.
|
|
|
|
While still being compatible with the standard GNU/BSD grep command-line
|
|
options, ugrep supports fuzzy search as well as structured and (adjustable)
|
|
colored output, piped through \"less\" for pagination. An interactive query
|
|
UI allows refinement and has a built-in help (press F1). Ugrep implements
|
|
multi-threaded and other techniques to speed up search, pattern-matching and
|
|
decompression. Many pre-defined regexps ease searching e.g. C typdefs or XML
|
|
attributes. Results can be output in several structured or self-defined
|
|
formats.")
|
|
(license bsd-3)))
|
|
|
|
;;; search.scm ends here
|