2009-11-25 21:55:06 +01:00
|
|
|
/*
|
2010-01-01 14:56:45 +01:00
|
|
|
** Copyright (C) 2010 Dirk-Jan C. Binnema <djcb@djcbsoftware.nl>
|
2009-11-25 21:55:06 +01:00
|
|
|
**
|
|
|
|
** This program is free software; you can redistribute it and/or modify
|
|
|
|
** it under the terms of the GNU General Public License as published by
|
|
|
|
** the Free Software Foundation; either version 3 of the License, or
|
|
|
|
** (at your option) any later version.
|
|
|
|
**
|
|
|
|
** This program is distributed in the hope that it will be useful,
|
|
|
|
** but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
** MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
** GNU General Public License for more details.
|
|
|
|
**
|
|
|
|
** You should have received a copy of the GNU General Public License
|
|
|
|
** along with this program; if not, write to the Free Software Foundation,
|
|
|
|
** Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
|
|
|
**
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <xapian.h>
|
|
|
|
#include <glib/gstdio.h>
|
|
|
|
#include <string.h>
|
|
|
|
#include <string>
|
|
|
|
|
|
|
|
#include "mu-query-xapian.h"
|
|
|
|
|
2010-01-23 22:34:27 +01:00
|
|
|
#include "mu-msg-iter-xapian.h"
|
|
|
|
#include "mu-msg-iter-xapian-priv.hh"
|
2009-11-25 21:55:06 +01:00
|
|
|
|
2010-01-05 07:32:23 +01:00
|
|
|
#include "mu-util.h"
|
2010-01-23 19:50:06 +01:00
|
|
|
#include "mu-util-xapian.h"
|
2010-01-05 07:32:23 +01:00
|
|
|
|
|
|
|
|
2010-01-23 13:13:04 +01:00
|
|
|
static void add_prefix (const MuMsgField* field,
|
|
|
|
Xapian::QueryParser* qparser);
|
2009-12-05 19:10:58 +01:00
|
|
|
|
2009-12-08 23:01:49 +01:00
|
|
|
struct _MuQueryXapian {
|
|
|
|
Xapian::Database* _db;
|
|
|
|
Xapian::QueryParser* _qparser;
|
|
|
|
Xapian::Sorter* _sorters[MU_MSG_FIELD_TYPE_NUM];
|
|
|
|
};
|
2009-12-05 19:10:58 +01:00
|
|
|
|
2009-12-08 23:01:49 +01:00
|
|
|
gboolean
|
2010-01-15 21:15:09 +01:00
|
|
|
init_mu_query_xapian (MuQueryXapian *mqx, const char* dbpath)
|
2009-12-08 23:01:49 +01:00
|
|
|
{
|
|
|
|
mqx->_db = 0;
|
|
|
|
mqx->_qparser = 0;
|
|
|
|
|
|
|
|
try {
|
|
|
|
mqx->_db = new Xapian::Database(dbpath);
|
|
|
|
mqx->_qparser = new Xapian::QueryParser;
|
2009-12-05 19:10:58 +01:00
|
|
|
|
2009-12-08 23:01:49 +01:00
|
|
|
mqx->_qparser->set_database(*mqx->_db);
|
|
|
|
mqx->_qparser->set_default_op(Xapian::Query::OP_OR);
|
2010-01-05 07:32:23 +01:00
|
|
|
mqx->_qparser->set_stemming_strategy
|
|
|
|
(Xapian::QueryParser::STEM_SOME);
|
2009-12-08 23:01:49 +01:00
|
|
|
|
|
|
|
memset (mqx->_sorters, 0, sizeof(mqx->_sorters));
|
2009-12-05 19:10:58 +01:00
|
|
|
mu_msg_field_foreach ((MuMsgFieldForEachFunc)add_prefix,
|
2009-12-08 23:01:49 +01:00
|
|
|
(gpointer)mqx->_qparser);
|
2010-01-05 07:32:23 +01:00
|
|
|
return TRUE;
|
2009-12-23 23:39:49 +01:00
|
|
|
|
2010-01-06 00:30:45 +01:00
|
|
|
} MU_XAPIAN_CATCH_BLOCK;
|
2010-01-05 07:32:23 +01:00
|
|
|
|
2010-01-08 19:49:55 +01:00
|
|
|
try {
|
|
|
|
delete mqx->_db;
|
|
|
|
delete mqx->_qparser;
|
|
|
|
|
|
|
|
} MU_XAPIAN_CATCH_BLOCK;
|
|
|
|
|
2010-01-05 07:32:23 +01:00
|
|
|
return FALSE;
|
2009-12-08 23:01:49 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static void
|
2010-01-15 21:15:09 +01:00
|
|
|
uninit_mu_query_xapian (MuQueryXapian *mqx)
|
2009-12-08 23:01:49 +01:00
|
|
|
{
|
|
|
|
try {
|
|
|
|
delete mqx->_db;
|
|
|
|
delete mqx->_qparser;
|
2009-12-05 19:10:58 +01:00
|
|
|
|
2009-12-08 23:01:49 +01:00
|
|
|
for (int i = 0; i != MU_MSG_FIELD_TYPE_NUM; ++i)
|
|
|
|
delete mqx->_sorters[i];
|
|
|
|
|
2010-01-06 00:30:45 +01:00
|
|
|
} MU_XAPIAN_CATCH_BLOCK;
|
2009-12-08 23:01:49 +01:00
|
|
|
}
|
2009-12-23 23:39:49 +01:00
|
|
|
|
2009-12-08 23:01:49 +01:00
|
|
|
static Xapian::Query
|
2010-01-15 21:15:09 +01:00
|
|
|
get_query (MuQueryXapian * mqx, const char* searchexpr, int *err = 0) {
|
2009-12-05 15:05:15 +01:00
|
|
|
|
2009-12-08 23:01:49 +01:00
|
|
|
try {
|
|
|
|
return mqx->_qparser->parse_query
|
2009-12-05 19:10:58 +01:00
|
|
|
(searchexpr,
|
|
|
|
Xapian::QueryParser::FLAG_BOOLEAN |
|
|
|
|
Xapian::QueryParser::FLAG_PHRASE |
|
2010-01-15 21:11:51 +01:00
|
|
|
// Xapian::QueryParser::FLAG_LOVEHATE |
|
|
|
|
// Xapian::QueryParser::FLAG_BOOLEAN_ANY_CASE |
|
2009-12-05 19:10:58 +01:00
|
|
|
Xapian::QueryParser::FLAG_WILDCARD |
|
|
|
|
Xapian::QueryParser::FLAG_PURE_NOT |
|
|
|
|
Xapian::QueryParser::FLAG_PARTIAL);
|
2009-12-23 23:39:49 +01:00
|
|
|
|
2010-01-06 00:30:45 +01:00
|
|
|
} MU_XAPIAN_CATCH_BLOCK;
|
2009-12-23 23:39:49 +01:00
|
|
|
|
2009-12-11 21:06:49 +01:00
|
|
|
if (err)
|
|
|
|
*err = 1;
|
|
|
|
|
|
|
|
return Xapian::Query();
|
2009-12-08 23:01:49 +01:00
|
|
|
}
|
2009-11-25 21:55:06 +01:00
|
|
|
|
|
|
|
static void
|
|
|
|
add_prefix (const MuMsgField* field, Xapian::QueryParser* qparser)
|
|
|
|
{
|
|
|
|
if (!mu_msg_field_is_xapian_enabled(field))
|
|
|
|
return;
|
|
|
|
|
|
|
|
const std::string prefix (mu_msg_field_xapian_prefix(field));
|
2009-12-08 23:01:49 +01:00
|
|
|
|
2009-11-25 21:55:06 +01:00
|
|
|
qparser->add_boolean_prefix(std::string(mu_msg_field_name(field)),
|
|
|
|
prefix);
|
|
|
|
qparser->add_boolean_prefix(std::string(mu_msg_field_shortcut(field)),
|
2009-12-08 23:01:49 +01:00
|
|
|
prefix);
|
2009-11-25 21:55:06 +01:00
|
|
|
|
|
|
|
/* make the empty string match this field too*/
|
|
|
|
qparser->add_prefix ("", prefix);
|
|
|
|
}
|
|
|
|
|
|
|
|
MuQueryXapian*
|
2010-01-06 00:30:45 +01:00
|
|
|
mu_query_xapian_new (const char* xpath)
|
2009-11-25 21:55:06 +01:00
|
|
|
{
|
2009-12-08 23:01:49 +01:00
|
|
|
MuQueryXapian *mqx;
|
2009-11-25 21:55:06 +01:00
|
|
|
|
2010-01-06 00:30:45 +01:00
|
|
|
g_return_val_if_fail (xpath, NULL);
|
|
|
|
|
|
|
|
if (!mu_util_check_dir (xpath, TRUE, FALSE)) {
|
2010-01-23 19:50:06 +01:00
|
|
|
g_warning ("'%s' is not a readable xapian dir", xpath);
|
2009-11-25 21:55:06 +01:00
|
|
|
return NULL;
|
|
|
|
}
|
2009-12-08 23:01:49 +01:00
|
|
|
|
2010-01-23 19:50:06 +01:00
|
|
|
if (!mu_util_xapian_db_version_up_to_date (xpath)) {
|
|
|
|
g_warning ("%s is not up-to-date, needs full reindex",
|
|
|
|
xpath);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
2009-12-08 23:01:49 +01:00
|
|
|
mqx = g_new (MuQueryXapian, 1);
|
2010-01-06 00:30:45 +01:00
|
|
|
|
2010-01-15 21:15:09 +01:00
|
|
|
if (!init_mu_query_xapian (mqx, xpath)) {
|
2010-01-08 19:49:55 +01:00
|
|
|
g_warning ("failed to initalize xapian query");
|
2010-01-05 07:32:23 +01:00
|
|
|
g_free (mqx);
|
2010-01-08 19:49:55 +01:00
|
|
|
return NULL;
|
2010-01-05 07:32:23 +01:00
|
|
|
}
|
2010-01-08 19:49:55 +01:00
|
|
|
|
2009-12-08 23:01:49 +01:00
|
|
|
return mqx;
|
2009-11-25 21:55:06 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2010-01-23 19:50:06 +01:00
|
|
|
|
2009-11-25 21:55:06 +01:00
|
|
|
void
|
|
|
|
mu_query_xapian_destroy (MuQueryXapian *self)
|
|
|
|
{
|
2009-12-11 18:44:05 +01:00
|
|
|
if (!self)
|
|
|
|
return;
|
|
|
|
|
2010-01-15 21:15:09 +01:00
|
|
|
uninit_mu_query_xapian (self);
|
2009-12-11 18:44:05 +01:00
|
|
|
g_free (self);
|
2009-11-25 21:55:06 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
|
2010-01-23 22:34:27 +01:00
|
|
|
MuMsgIterXapian*
|
2009-11-25 21:55:06 +01:00
|
|
|
mu_query_xapian_run (MuQueryXapian *self, const char* searchexpr,
|
|
|
|
const MuMsgField* sortfield, gboolean ascending)
|
|
|
|
{
|
|
|
|
g_return_val_if_fail (self, NULL);
|
|
|
|
g_return_val_if_fail (searchexpr, NULL);
|
|
|
|
|
|
|
|
try {
|
2010-01-23 19:50:06 +01:00
|
|
|
|
2010-01-15 21:15:09 +01:00
|
|
|
Xapian::Query q(get_query(self, searchexpr));
|
2009-12-08 23:01:49 +01:00
|
|
|
Xapian::Enquire enq (*self->_db);
|
2009-11-25 21:55:06 +01:00
|
|
|
|
|
|
|
if (sortfield)
|
|
|
|
enq.set_sort_by_value (
|
|
|
|
(Xapian::valueno)mu_msg_field_id(sortfield),
|
|
|
|
ascending);
|
|
|
|
|
|
|
|
enq.set_query (q);
|
|
|
|
enq.set_cutoff (0,0);
|
|
|
|
|
2010-01-23 22:34:27 +01:00
|
|
|
return mu_msg_iter_xapian_new (enq, 10000); /* FIXME */
|
2009-11-25 21:55:06 +01:00
|
|
|
|
2010-01-08 19:49:55 +01:00
|
|
|
} MU_XAPIAN_CATCH_BLOCK_RETURN(NULL);
|
2009-11-25 21:55:06 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
char*
|
|
|
|
mu_query_xapian_as_string (MuQueryXapian *self, const char* searchexpr)
|
|
|
|
{
|
|
|
|
g_return_val_if_fail (self, NULL);
|
|
|
|
g_return_val_if_fail (searchexpr, NULL);
|
|
|
|
|
|
|
|
try {
|
2010-01-15 21:15:09 +01:00
|
|
|
Xapian::Query q(get_query(self, searchexpr));
|
2009-11-25 21:55:06 +01:00
|
|
|
return g_strdup(q.get_description().c_str());
|
|
|
|
|
2010-01-06 00:30:45 +01:00
|
|
|
} MU_XAPIAN_CATCH_BLOCK_RETURN(NULL);
|
2009-11-25 21:55:06 +01:00
|
|
|
}
|
|
|
|
|
2010-01-02 13:44:26 +01:00
|
|
|
|
2010-01-13 21:35:16 +01:00
|
|
|
static gboolean
|
2010-01-15 21:15:09 +01:00
|
|
|
needs_quotes (const char* str)
|
2010-01-13 21:35:16 +01:00
|
|
|
{
|
|
|
|
int i;
|
|
|
|
const char *keywords[] = {
|
|
|
|
"ANO", "OR", "NOT", "NEAR", "ADJ"
|
|
|
|
};
|
|
|
|
|
|
|
|
for (i = 0; i != G_N_ELEMENTS(keywords); ++i)
|
|
|
|
if (g_strcasecmp (str, keywords[i]) == 0)
|
|
|
|
return TRUE;
|
|
|
|
|
|
|
|
return FALSE;
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2009-11-25 21:55:06 +01:00
|
|
|
char*
|
2010-01-02 13:44:26 +01:00
|
|
|
mu_query_xapian_combine (const gchar **params, gboolean connect_or)
|
2009-11-25 21:55:06 +01:00
|
|
|
{
|
|
|
|
GString *str;
|
2009-12-11 21:06:49 +01:00
|
|
|
int i;
|
|
|
|
|
|
|
|
g_return_val_if_fail (params && params[0], NULL);
|
2009-11-25 21:55:06 +01:00
|
|
|
|
|
|
|
str = g_string_sized_new (64); /* just a guess */
|
2009-12-11 21:06:49 +01:00
|
|
|
|
|
|
|
for (i = 0; params && params[i]; ++i) {
|
|
|
|
|
2009-12-06 23:22:42 +01:00
|
|
|
const char* elm;
|
2009-11-25 21:55:06 +01:00
|
|
|
const char* cnx = "";
|
2009-12-06 23:22:42 +01:00
|
|
|
gboolean do_quote;
|
|
|
|
|
2009-12-11 21:06:49 +01:00
|
|
|
elm = (const gchar*)params[i];
|
2009-12-06 23:22:42 +01:00
|
|
|
if (!elm) /* shouldn't happen */
|
|
|
|
break;
|
|
|
|
|
2009-12-11 21:06:49 +01:00
|
|
|
if (params[i + 1])
|
2009-11-25 21:55:06 +01:00
|
|
|
cnx = connect_or ? " OR " : " AND ";
|
|
|
|
|
2010-01-15 21:15:09 +01:00
|
|
|
do_quote = needs_quotes (elm);
|
2009-12-06 23:22:42 +01:00
|
|
|
g_string_append_printf (str, "%s%s%s%s",
|
|
|
|
do_quote ? "\"" : "",
|
2009-12-11 21:06:49 +01:00
|
|
|
elm,
|
2009-12-06 23:22:42 +01:00
|
|
|
do_quote ? "\"" : "",
|
|
|
|
cnx);
|
2009-11-25 21:55:06 +01:00
|
|
|
}
|
2010-01-08 19:49:55 +01:00
|
|
|
|
2009-11-25 21:55:06 +01:00
|
|
|
return g_string_free (str, FALSE);
|
2009-12-05 19:10:58 +01:00
|
|
|
}
|
2010-01-03 22:53:49 +01:00
|
|
|
|
|
|
|
|