From 042280b96b67cb863ceb7bb2195b6b271fbd6170 Mon Sep 17 00:00:00 2001 From: merdely Date: Tue, 11 Sep 2007 20:52:49 +0000 Subject: [PATCH] Swish-e is a fast, flexible, and free open source system for indexing collections of Web pages or other files. Swish-e is ideally suited for collections of a million documents or smaller. Using the GNOME libxml2 parser and a collection of filters, Swish-e can index plain text, e-mail, PDF, HTML, XML, Microsoft Word/PowerPoint/Excel and just about any file that can be converted to XML or HTML text. Swish-e is also often used to supplement databases like the MySQL DBMS for very fast full-text searching. help from simon, ok steven@, sturm@ --- textproc/swish-e/Makefile | 38 ++++++ textproc/swish-e/distinfo | 5 + .../swish-e/patches/patch-conf_Makefile_in | 12 ++ .../patches/patch-filter-bin_Makefile_in | 12 ++ .../swish-e/patches/patch-filters_Makefile_in | 12 ++ .../patches/patch-prog-bin_Makefile_in | 12 ++ textproc/swish-e/patches/patch-src_filter_c | 12 ++ textproc/swish-e/pkg/DESCR | 8 ++ textproc/swish-e/pkg/MESSAGE | 8 ++ textproc/swish-e/pkg/PFRAG.shared | 2 + textproc/swish-e/pkg/PLIST | 122 ++++++++++++++++++ 11 files changed, 243 insertions(+) create mode 100644 textproc/swish-e/Makefile create mode 100644 textproc/swish-e/distinfo create mode 100644 textproc/swish-e/patches/patch-conf_Makefile_in create mode 100644 textproc/swish-e/patches/patch-filter-bin_Makefile_in create mode 100644 textproc/swish-e/patches/patch-filters_Makefile_in create mode 100644 textproc/swish-e/patches/patch-prog-bin_Makefile_in create mode 100644 textproc/swish-e/patches/patch-src_filter_c create mode 100644 textproc/swish-e/pkg/DESCR create mode 100644 textproc/swish-e/pkg/MESSAGE create mode 100644 textproc/swish-e/pkg/PFRAG.shared create mode 100644 textproc/swish-e/pkg/PLIST diff --git a/textproc/swish-e/Makefile b/textproc/swish-e/Makefile new file mode 100644 index 00000000000..65704b66751 --- /dev/null +++ b/textproc/swish-e/Makefile 
@@ -0,0 +1,38 @@ +# $OpenBSD: Makefile,v 1.1.1.1 2007/09/11 20:52:49 merdely Exp $ + +COMMENT= web/text search engine + +DISTNAME= swish-e-2.4.5 +SHARED_LIBS= swish-e 2.0 +CATEGORIES= textproc www + +HOMEPAGE= http://swish-e.org/ +MASTER_SITES= ${HOMEPAGE}distribution/ + +MAINTAINER= Michael Erdely <merdely@openbsd.org> + +# GPLv2 +PERMIT_PACKAGE_CDROM= Yes +PERMIT_PACKAGE_FTP= Yes +PERMIT_DISTFILES_CDROM= Yes +PERMIT_DISTFILES_FTP= Yes + +MODULES= converters/libiconv +WANTLIB= c m z + +LIB_DEPENDS= pcreposix,pcre::devel/pcre \ + xml2::textproc/libxml + +RUN_DEPENDS= ::www/p5-URI \ + ::www/p5-libwww \ + ::www/p5-HTML-Parser \ + :p5-HTML-Tagset->=3:www/p5-HTML-Tagset \ + ::mail/p5-MIME-Types \ + ::www/p5-HTML-FillInForm \ + ::www/p5-HTML-Template + +USE_LIBTOOL= Yes +CONFIGURE_STYLE= gnu +CONFIGURE_ARGS+= --with-pcre + +.include <bsd.port.mk> diff --git a/textproc/swish-e/distinfo b/textproc/swish-e/distinfo new file mode 100644 index 00000000000..a9a21eacb15 --- /dev/null +++ b/textproc/swish-e/distinfo @@ -0,0 +1,5 @@ +MD5 (swish-e-2.4.5.tar.gz) = /q5cofX0NSGQFWtUoZwBUw== +RMD160 (swish-e-2.4.5.tar.gz) = uJ2MyNj4UNLd8LUrWDocscDzwbM= +SHA1 (swish-e-2.4.5.tar.gz) = npNYDvdcNy6yMrwKSUDOdvQah/Y= +SHA256 (swish-e-2.4.5.tar.gz) = H+lr+hiz5je9M/OjemY39eDP1v87YkQOrBvtPn76lgA= +SIZE (swish-e-2.4.5.tar.gz) = 1474881 diff --git a/textproc/swish-e/patches/patch-conf_Makefile_in b/textproc/swish-e/patches/patch-conf_Makefile_in new file mode 100644 index 00000000000..458a5de010d --- /dev/null +++ b/textproc/swish-e/patches/patch-conf_Makefile_in @@ -0,0 +1,12 @@ +$OpenBSD: patch-conf_Makefile_in,v 1.1.1.1 2007/09/11 20:52:49 merdely Exp $ +--- conf/Makefile.in.orig Sat Apr 14 19:26:45 2007 ++++ conf/Makefile.in Sat Apr 14 19:27:09 2007 +@@ -185,7 +185,7 @@ sbindir = @sbindir@ + sharedstatedir = @sharedstatedir@ + sysconfdir = @sysconfdir@ + target_alias = @target_alias@ +-exampledir = $(datadir)/doc/$(PACKAGE)/examples/conf ++exampledir = $(datadir)/examples/$(PACKAGE)/conf + conf_dir = \ + stopwords/dutch.txt \ 
+ stopwords/english.txt \ diff --git a/textproc/swish-e/patches/patch-filter-bin_Makefile_in b/textproc/swish-e/patches/patch-filter-bin_Makefile_in new file mode 100644 index 00000000000..9002a68efe6 --- /dev/null +++ b/textproc/swish-e/patches/patch-filter-bin_Makefile_in @@ -0,0 +1,12 @@ +$OpenBSD: patch-filter-bin_Makefile_in,v 1.1.1.1 2007/09/11 20:52:49 merdely Exp $ +--- filter-bin/Makefile.in.orig Sat Apr 14 19:28:20 2007 ++++ filter-bin/Makefile.in Sat Apr 14 19:28:47 2007 +@@ -185,7 +185,7 @@ sbindir = @sbindir@ + sharedstatedir = @sharedstatedir@ + sysconfdir = @sysconfdir@ + target_alias = @target_alias@ +-exampledir = $(datadir)/doc/$(PACKAGE)/examples/filter-bin ++exampledir = $(datadir)/examples/$(PACKAGE)/filter-bin + example_DATA = \ + README \ + swish_filter.pl \ diff --git a/textproc/swish-e/patches/patch-filters_Makefile_in b/textproc/swish-e/patches/patch-filters_Makefile_in new file mode 100644 index 00000000000..2f74793d064 --- /dev/null +++ b/textproc/swish-e/patches/patch-filters_Makefile_in @@ -0,0 +1,12 @@ +$OpenBSD: patch-filters_Makefile_in,v 1.1.1.1 2007/09/11 20:52:49 merdely Exp $ +--- filters/Makefile.in.orig Sat Apr 14 19:28:59 2007 ++++ filters/Makefile.in Sat Apr 14 19:29:13 2007 +@@ -198,7 +198,7 @@ sharedstatedir = @sharedstatedir@ + sysconfdir = @sysconfdir@ + target_alias = @target_alias@ + SUBDIRS = SWISH +-exampledir = $(datadir)/doc/$(PACKAGE)/examples/filters ++exampledir = $(datadir)/examples/$(PACKAGE)/filters + bin_SCRIPTS = swish-filter-test + example_DATA = README + CLEANFILES = swish-filter-test diff --git a/textproc/swish-e/patches/patch-prog-bin_Makefile_in b/textproc/swish-e/patches/patch-prog-bin_Makefile_in new file mode 100644 index 00000000000..5cbdc232b49 --- /dev/null +++ b/textproc/swish-e/patches/patch-prog-bin_Makefile_in @@ -0,0 +1,12 @@ +$OpenBSD: patch-prog-bin_Makefile_in,v 1.1.1.1 2007/09/11 20:52:49 merdely Exp $ +--- prog-bin/Makefile.in.orig Sat Apr 14 19:29:29 2007 ++++ prog-bin/Makefile.in Sat 
Apr 14 19:29:47 2007 +@@ -191,7 +191,7 @@ sharedstatedir = @sharedstatedir@ + sysconfdir = @sysconfdir@ + target_alias = @target_alias@ + perlmoduledir = $(libexecdir)/perl +-exampledir = $(datadir)/doc/$(PACKAGE)/examples/prog-bin ++exampledir = $(datadir)/examples/$(PACKAGE)/prog-bin + libexec_SCRIPTS = spider.pl DirTree.pl + + # These are really out dated diff --git a/textproc/swish-e/patches/patch-src_filter_c b/textproc/swish-e/patches/patch-src_filter_c new file mode 100644 index 00000000000..ef8b6786f98 --- /dev/null +++ b/textproc/swish-e/patches/patch-src_filter_c @@ -0,0 +1,12 @@ +$OpenBSD: patch-src_filter_c,v 1.1.1.1 2007/09/11 20:52:49 merdely Exp $ +--- src/filter.c.orig Tue Sep 11 10:07:02 2007 ++++ src/filter.c Tue Sep 11 10:07:13 2007 +@@ -51,7 +51,7 @@ $Id: filter.c,v 1.35 2007/01/05 22:14:10 whmoseley Exp + #endif /* HAVE_SYS_WAIT_H */ + #endif /* HAVE_WORKING_FORK */ + +- ++#include + + + diff --git a/textproc/swish-e/pkg/DESCR b/textproc/swish-e/pkg/DESCR new file mode 100644 index 00000000000..eae6f4e8e7c --- /dev/null +++ b/textproc/swish-e/pkg/DESCR @@ -0,0 +1,8 @@ +Swish-e is a fast, flexible, and free open source system for indexing +collections of Web pages or other files. Swish-e is ideally suited for +collections of a million documents or smaller. Using the GNOME libxml2 +parser and a collection of filters, Swish-e can index plain text, +e-mail, PDF, HTML, XML, Microsoft Word/PowerPoint/Excel and just about +any file that can be converted to XML or HTML text. Swish-e is also +often used to supplement databases like the MySQL DBMS for very fast +full-text searching. diff --git a/textproc/swish-e/pkg/MESSAGE b/textproc/swish-e/pkg/MESSAGE new file mode 100644 index 00000000000..1a19de9f338 --- /dev/null +++ b/textproc/swish-e/pkg/MESSAGE @@ -0,0 +1,8 @@ +See ${PREFIX}/share/doc/swish-e/INSTALL for more setup information. + +Additional indexing functionality: +* For PDF Documents, install xpdf package. 
+* For MS Word Documents, install catdoc package. +* For MP3 ID3 Tags, install p5-MP3-Tag package. +* For MS Excel Files, install p5-Spreadsheet-ParseExcel package. + diff --git a/textproc/swish-e/pkg/PFRAG.shared b/textproc/swish-e/pkg/PFRAG.shared new file mode 100644 index 00000000000..be13019e36b --- /dev/null +++ b/textproc/swish-e/pkg/PFRAG.shared @@ -0,0 +1,2 @@ +@comment $OpenBSD: PFRAG.shared,v 1.1.1.1 2007/09/11 20:52:49 merdely Exp $ +@lib lib/libswish-e.so.${LIBswish-e_VERSION} diff --git a/textproc/swish-e/pkg/PLIST b/textproc/swish-e/pkg/PLIST new file mode 100644 index 00000000000..90a681b7dd2 --- /dev/null +++ b/textproc/swish-e/pkg/PLIST @@ -0,0 +1,122 @@ +@comment $OpenBSD: PLIST,v 1.1.1.1 2007/09/11 20:52:49 merdely Exp $ +%%SHARED%% +bin/swish-config +bin/swish-e +bin/swish-filter-test +include/swish-e.h +lib/libswish-e.a +lib/libswish-e.la +lib/pkgconfig/ +lib/pkgconfig/swish-e.pc +lib/swish-e/ +lib/swish-e/DirTree.pl +lib/swish-e/perl/ +lib/swish-e/perl/SWISH/ +lib/swish-e/perl/SWISH/DateRanges.pm +lib/swish-e/perl/SWISH/DefaultHighlight.pm +lib/swish-e/perl/SWISH/Filter.pm +lib/swish-e/perl/SWISH/Filters/ +lib/swish-e/perl/SWISH/Filters/Doc2html.pm +lib/swish-e/perl/SWISH/Filters/Doc2txt.pm +lib/swish-e/perl/SWISH/Filters/ID3toHTML.pm +lib/swish-e/perl/SWISH/Filters/Pdf2HTML.pm +lib/swish-e/perl/SWISH/Filters/XLtoHTML.pm +lib/swish-e/perl/SWISH/Filters/pp2html.pm +lib/swish-e/perl/SWISH/ParseQuery.pm +lib/swish-e/perl/SWISH/PhraseHighlight.pm +lib/swish-e/perl/SWISH/SimpleHighlight.pm +lib/swish-e/perl/SWISH/TemplateDefault.pm +lib/swish-e/perl/SWISH/TemplateDumper.pm +lib/swish-e/perl/SWISH/TemplateFrame.pm +lib/swish-e/perl/SWISH/TemplateHTMLTemplate.pm +lib/swish-e/perl/SWISH/TemplateToolkit.pm +lib/swish-e/perl/doc2txt.pm +lib/swish-e/perl/pdf2html.pm +lib/swish-e/perl/pdf2xml.pm +lib/swish-e/search.cgi +lib/swish-e/spider.pl +lib/swish-e/swish.cgi +lib/swish-e/swishspider +@man man/man1/SWISH-CONFIG.1 +@man man/man1/SWISH-FAQ.1 +@man 
man/man1/SWISH-LIBRARY.1 +@man man/man1/SWISH-RUN.1 +@man man/man1/swish-e.1 +share/doc/swish-e/ +share/doc/swish-e/INSTALL +share/doc/swish-e/README +share/doc/swish-e/README.cvs +share/doc/swish-e/html/ +share/doc/swish-e/html/api.html +share/doc/swish-e/html/changes.html +share/doc/swish-e/html/filter.html +share/doc/swish-e/html/index.html +share/doc/swish-e/html/install.html +share/doc/swish-e/html/readme.html +share/doc/swish-e/html/search.cgi.html +share/doc/swish-e/html/spider.html +share/doc/swish-e/html/swish-3.0.html +share/doc/swish-e/html/swish-bugs.html +share/doc/swish-e/html/swish-config.html +share/doc/swish-e/html/swish-faq.html +share/doc/swish-e/html/swish-library.html +share/doc/swish-e/html/swish-run.html +share/doc/swish-e/html/swish-search.html +share/doc/swish-e/html/swish.cgi.html +share/doc/swish-e/html/swish.css +share/doc/swish-e/pod/ +share/doc/swish-e/pod/CHANGES.pod +share/doc/swish-e/pod/INSTALL.pod +share/doc/swish-e/pod/README.pod +share/doc/swish-e/pod/SWISH-3.0.pod +share/doc/swish-e/pod/SWISH-BUGS.pod +share/doc/swish-e/pod/SWISH-CONFIG.pod +share/doc/swish-e/pod/SWISH-FAQ.pod +share/doc/swish-e/pod/SWISH-LIBRARY.pod +share/doc/swish-e/pod/SWISH-RUN.pod +share/doc/swish-e/pod/SWISH-SEARCH.pod +share/doc/swish-e/pod/swish-e.pod +share/examples/swish-e/ +share/examples/swish-e/conf/ +share/examples/swish-e/conf/README +share/examples/swish-e/conf/example1.config +share/examples/swish-e/conf/example2.config +share/examples/swish-e/conf/example3.config +share/examples/swish-e/conf/example4.config +share/examples/swish-e/conf/example5.config +share/examples/swish-e/conf/example6.config +share/examples/swish-e/conf/example7.config +share/examples/swish-e/conf/example8.config +share/examples/swish-e/conf/example9.config +share/examples/swish-e/conf/example9.pl +share/examples/swish-e/conf/stopwords/ +share/examples/swish-e/conf/stopwords/dutch.txt +share/examples/swish-e/conf/stopwords/english.txt 
+share/examples/swish-e/conf/stopwords/german.txt +share/examples/swish-e/conf/stopwords/spanish.txt +share/examples/swish-e/filter-bin/ +share/examples/swish-e/filter-bin/README +share/examples/swish-e/filter-bin/_binfilter.sh +share/examples/swish-e/filter-bin/_pdf2html.pl +share/examples/swish-e/filter-bin/swish_filter.pl +share/examples/swish-e/filters/ +share/examples/swish-e/filters/README +share/examples/swish-e/prog-bin/ +share/examples/swish-e/prog-bin/MySQL.pl +share/examples/swish-e/prog-bin/README +share/examples/swish-e/prog-bin/SwishSpiderConfig.pl +share/examples/swish-e/prog-bin/doc2txt.pm +share/examples/swish-e/prog-bin/file.pl +share/examples/swish-e/prog-bin/index_hypermail.pl +share/examples/swish-e/prog-bin/pdf2html.pm +share/examples/swish-e/prog-bin/pdf2xml.pm +share/swish-e/ +share/swish-e/swish.tmpl +share/swish-e/swish.tt +share/swish-e/templates/ +share/swish-e/templates/common_footer +share/swish-e/templates/common_header +share/swish-e/templates/markup.css +share/swish-e/templates/page_layout +share/swish-e/templates/search.tt +share/swish-e/templates/style.css