Error using Tika as meta extractor with solr

Davide davide.marchi at mail.cgilfe.it
Thu Nov 13 08:49:18 UTC 2014


Hi all, I have a Dovecot 2.2.15 installation which uses Tika and Solr 
for indexing and metadata extraction from messages.
This is my doveconf -n output:

# 2.2.15: /usr/local/etc/dovecot/dovecot.conf
# OS: Linux 2.6.32-5-amd64 x86_64 Debian 6.0.10
auth_cache_negative_ttl = 10 mins
auth_cache_size = 8 M
auth_cache_ttl = 20 mins
debug_log_path = /var/log/dovecot/dovecot-debug.log
first_valid_gid = 89
first_valid_uid = 89
info_log_path = /var/log/dovecot/dovecot.log
last_valid_gid = 89
last_valid_uid = 89
lda_mailbox_autocreate = yes
lda_mailbox_autosubscribe = yes
listen = 127.0.0.1
log_path = /var/log/dovecot/dovecot-err.log
log_timestamp = "%Y-%m-%d %H:%M:%S "
mail_fsync = never
mail_gid = 89
mail_location = maildir:~/Maildir:INDEX=/mnt/ramdisk/%u
mail_plugins = " notify zlib quota fts fts_solr"
mail_uid = 89
mailbox_list_index = yes
maildir_very_dirty_syncs = yes
managesieve_notify_capability = mailto
managesieve_sieve_capability = fileinto reject envelope encoded-character vacation subaddress comparator-i;ascii-numeric relational regex imap4flags copy include variables body enotify environment mailbox date ihave duplicate
mmap_disable = yes
namespace {
   inbox = yes
   location =
   prefix =
   separator = /
   type = private
}
namespace {
   list = children
   location = maildir:/var/mail/public
   prefix = Public/
   separator = /
   subscriptions = no
   type = public
}
passdb {
   args = webmail=127.0.0.1 cache_key=%u%s
   driver = vpopmail
}
plugin {
   antispam_backend = crm114
   antispam_crm_args = -u;/opt/crm114;--fileprefix=/opt/crm114/;--config=/usr/share/crm114/mailfilter.cf
   antispam_crm_binary = /usr/share/crm114/mailreaver.crm
   antispam_crm_notspam_arg = --good
   antispam_crm_spam_arg = --spam
   antispam_signature = X-CRM114-CacheID
   antispam_spam_pattern_ignorecase = crm-spam*
   antispam_trash_pattern_ignorecase = Trash*
   antispam_unsure_pattern_ignorecase = crm-unsure*
   fts = solr
   fts_solr = url=http://192.168.119.5:8983/solr/ break-imap-search
   fts_tika = http://192.168.119.5:9998/tika/
   mail_log_events = delete undelete expunge copy
   mail_log_fields = uid box msgid size
   mail_log_group_events =
   quota = dict:::redis:host=127.0.0.1:prefix=user/
   quota_rule2 = Trash:storage=+20%%
   quota_warning = storage=95%% quota-warning 95 %u
   quota_warning2 = storage=80%% quota-warning 80 %u
   sieve = ~/.dovecot.sieve
   sieve_before = /usr/local/lib/dovecot/sieve/default.sieve
   sieve_default = /usr/local/lib/dovecot/sieve/default.sieve
   sieve_dir = ~/sieve
   sieve_global_dir = /usr/local/lib/dovecot/sieve/
   zlib_save = gz
   zlib_save_level = 9
}
protocols = imap sieve
service auth {
   unix_listener auth-master {
     group = vchkpw
     mode = 0600
     user = vpopmail
   }
   unix_listener auth-userdb {
     group = vchkpw
     mode = 0600
     user = vpopmail
   }
}
service decode2text {
   executable = script /usr/local/libexec/dovecot/decode2text.sh
   unix_listener decode2text {
     mode = 0666
     user = dovecot
   }
}
service imap-login {
   executable = /usr/local/libexec/dovecot/imap-login
   inet_listener imaps {
     address = 192.168.10.50
   }
   process_limit = 500
   process_min_avail = 2
   service_count = 0
}
service imap {
   executable = /usr/local/libexec/dovecot/imap
}
service managesieve-login {
   executable = managesieve-login
   inet_listener sieve {
     address = 127.0.0.1
     port = 4190
   }
   process_min_avail = 2
   service_count = 0
}
service managesieve {
   process_limit = 10
}
service quota-warning {
   executable = script /usr/local/libexec/dovecot/quota-warning
   unix_listener quota-warning {
     mode = 0660
     user = vpopmail
   }
   user = vpopmail
}
ssl_cert = </var/qmail/control/servercert.pem
ssl_key = </var/qmail/control/servercert.pem
ssl_protocols = !SSLv2 !SSLv3
userdb {
   args = username_format=%u /usr/local/etc/dovecot/users
   driver = passwd-file
}
userdb {
   args = quota_template=quota_rule=*:storage=100M
   driver = vpopmail
}
protocol sieve {
   info_log_path = /var/log/dovecot/dovecot-sieve.log
   log_path = /var/log/dovecot/dovecot-sieve-error.log
   managesieve_implementation_string = Dovecot Pigeonhole
   managesieve_logout_format = bytes=%i/%o
   managesieve_max_line_length = 65536
}
protocol imap {
   imap_client_workarounds = delay-newmail tb-extra-mailbox-sep tb-lsub-flags
   imap_max_line_length = 64 k
   mail_plugin_dir = /usr/local/lib/dovecot
   mail_plugins = " notify zlib quota fts fts_solr imap_quota mail_log antispam imap_zlib"
}
protocol lda {
   auth_socket_path = /usr/local/var/run/dovecot/auth-userdb
   deliver_log_format = msgid=<%f>-<%s>-%m: %$
   hostname = mail.cgilfe.it
   info_log_path = /var/log/dovecot/dovecot-deliver.log
   log_path = /var/log/dovecot/dovecot-deliver.log
   mail_fsync = optimized
   mail_plugin_dir = /usr/local/lib/dovecot
   mail_plugins = " notify zlib quota fts fts_solr mail_log sieve"
   postmaster_address = postmaster at mail.cgilfe.it
   rejection_reason = Il messaggio destinato a <%t> è stato automaticamente rifiutato:%n%r
   rejection_subject = Messaggio Rifiutato: %s
   submission_host = 127.0.0.1
}

If I run a command like this:
doveadm -Dv index -u davide.marchi at mail.cgilfe.it INBOX
I receive the error that I have attached to this message.
Any idea about the cause of the error and how I can resolve it?
-- 
*Davide Marchi
Teorema Ferrara Srl**

**Via Spronello, 7 - Ferrara - 44121
0532783161 / 0532783368
davide.marchi at mail.cgilfe.it
davide.marchi73
Web: http://www.cgilfe.it*
*
CONFIDENZIALITA'*
*Ai sensi del D.Lgs. 196/2003 si precisa che le informazioni contenute 
in questo messaggio sono riservate ed a uso esclusivo del 
destinatario/dei destinatari. Qualora il messaggio in parola Le fosse 
pervenuto per errore, La invitiamo ad eliminarlo senza copiarlo e a non 
inoltrarlo a terzi, dandocene gentilmente comunicazione.*
*Per favore, pensa all'ambiente. Stampa questa email solo se necessario.*
-------------- next part --------------
A non-text attachment was scrubbed...
Name: footer_location_12_tran.png
Type: image/png
Size: 492 bytes
Desc: not available
URL: <http://dovecot.org/pipermail/dovecot/attachments/20141113/bda3e47b/attachment-0005.png>
-------------- next part --------------
A non-text attachment was scrubbed...
Name: footer_phone_12_tran.png
Type: image/png
Size: 409 bytes
Desc: not available
URL: <http://dovecot.org/pipermail/dovecot/attachments/20141113/bda3e47b/attachment-0006.png>
-------------- next part --------------
A non-text attachment was scrubbed...
Name: fax.png
Type: image/png
Size: 872 bytes
Desc: not available
URL: <http://dovecot.org/pipermail/dovecot/attachments/20141113/bda3e47b/attachment-0007.png>
-------------- next part --------------
A non-text attachment was scrubbed...
Name: footer_mail_12_tran.png
Type: image/png
Size: 375 bytes
Desc: not available
URL: <http://dovecot.org/pipermail/dovecot/attachments/20141113/bda3e47b/attachment-0008.png>
-------------- next part --------------
A non-text attachment was scrubbed...
Name: footer_skype_12_tran.png
Type: image/png
Size: 407 bytes
Desc: not available
URL: <http://dovecot.org/pipermail/dovecot/attachments/20141113/bda3e47b/attachment-0009.png>
-------------- next part --------------
A non-text attachment was scrubbed...
Name: error_tika.7z
Type: application/octet-stream
Size: 2756 bytes
Desc: not available
URL: <http://dovecot.org/pipermail/dovecot/attachments/20141113/bda3e47b/attachment-0001.obj>


More information about the dovecot mailing list