From a54a1a593b1b5b5bf836f709cfa401e2249fdbbf Mon Sep 17 00:00:00 2001
From: Daniel Berteaud
Date: Thu, 3 Oct 2013 18:38:50 +0200
Subject: [PATCH] Add indexing support using the lucene engine

---
Notes (reviewer; this section is ignored by git am):
    - What the patch does: enables the "index.lucene" plugin on every
      share repository (050repo), adds its global plugin settings
      (10All), and adds /usr/bin/ajxppdftotext, the command configured
      as PDFTOTEXT, which runs Ghostscript's ps2ascii.ps on the file
      given as its first argument and discards stderr.
    - ajxppdftotext passes the input path as "$1" so that file names
      containing spaces or glob characters reach gs as one argument.
      The blob id on that file's index line was computed before this
      quoting change.
    - Line breaks and indentation were reconstructed from a
      whitespace-collapsed copy of this patch; if context lines do not
      match the target tree, apply with whitespace-insensitive matching
      (e.g. git apply --ignore-whitespace).
    - NOTE(review): ajxppdftotext is created with mode 100644 although
      it is used as a command; confirm the packaging makes it executable.

 .../ajaxplorer/bootstrap_repositories.php/050repo  |  4 ++++
 .../plugins/conf.serial/plugins_configs.ser/10All  | 13 +++++++++++++
 root/usr/bin/ajxppdftotext                         |  2 ++
 3 files changed, 19 insertions(+)
 create mode 100644 root/usr/bin/ajxppdftotext

diff --git a/root/etc/e-smith/templates/etc/ajaxplorer/bootstrap_repositories.php/050repo b/root/etc/e-smith/templates/etc/ajaxplorer/bootstrap_repositories.php/050repo
index 03cc66a..a6519f5 100644
--- a/root/etc/e-smith/templates/etc/ajaxplorer/bootstrap_repositories.php/050repo
+++ b/root/etc/e-smith/templates/etc/ajaxplorer/bootstrap_repositories.php/050repo
@@ -68,6 +68,10 @@ foreach my $share ($a->get_all_by_prop(type=>'share')){
                 ),
                 "meta.filehasher" => array(),
                 "meta.watch" => array(),
+                "index.lucene" => array(
+                    "index_content" => true,
+                    "index_meta_fields" => 'tags,anything_area'
+                )
             )
         ),
     );
diff --git a/root/etc/e-smith/templates/var/lib/ajaxplorer/plugins/conf.serial/plugins_configs.ser/10All b/root/etc/e-smith/templates/var/lib/ajaxplorer/plugins/conf.serial/plugins_configs.ser/10All
index e808a0d..c2f57ec 100644
--- a/root/etc/e-smith/templates/var/lib/ajaxplorer/plugins/conf.serial/plugins_configs.ser/10All
+++ b/root/etc/e-smith/templates/var/lib/ajaxplorer/plugins/conf.serial/plugins_configs.ser/10All
@@ -50,6 +50,19 @@ $data->{'action.powerfs'} = {
     'AJXP_PLUGIN_ENABLED' => '1'
 };
 
+$data->{'index.lucene'} = {
+    'QUERY_ANALYSER' => 'utf8num_insensitive',
+    'AJXP_PLUGIN_ENABLED' => '__true__',
+    'WILDCARD_LIMITATION' => '0',
+    'PDFTOTEXT' => '/usr/bin/ajxppdftotext',
+    'PARSE_CONTENT_HTML' => 'html,htm',
+    'PARSE_CONTENT_TXT' => 'txt',
+    'PARSE_CONTENT_MAX_SIZE' => '20000000',
+    'UNOCONV' => '/usr/bin/unoconv --server 127.0.0.1',
+    'index_content' => '__true__'
+};
+
+
 $data = serialize($data);
 # PHP::Serialization has now way to
 # represent a boolean, so lets replace __true__
diff --git a/root/usr/bin/ajxppdftotext b/root/usr/bin/ajxppdftotext
new file mode 100644
index 0000000..6b6de45
--- /dev/null
+++ b/root/usr/bin/ajxppdftotext
@@ -0,0 +1,2 @@
+#!/bin/bash
+gs -q -dNODISPLAY -dSAFER -dDELAYBIND -dWRITESYSTEMDICT -dSIMPLE -c save -f ps2ascii.ps "$1" -c quit 2>/dev/null