118 lines
3.8 KiB
C++
118 lines
3.8 KiB
C++
/* Copyright (C) 2007 J.F.Dockes
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the
|
|
* Free Software Foundation, Inc.,
|
|
* 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
|
|
*/
|
|
#ifndef _rclquery_p_h_included_
|
|
#define _rclquery_p_h_included_
|
|
|
|
#include <map>
|
|
#include <vector>
|
|
#include <string>
|
|
#include <unordered_set>
|
|
|
|
#include <xapian.h>
|
|
#include "rclquery.h"
|
|
|
|
class Chrono;
|
|
|
|
namespace Rcl {
|
|
|
|
class Query::Native {
|
|
public:
|
|
// The query I belong to
|
|
Query *m_q;
|
|
// query descriptor: terms and subqueries joined by operators
|
|
// (or/and etc...)
|
|
Xapian::Query xquery;
|
|
// Open query descriptor.
|
|
Xapian::Enquire *xenquire;
|
|
// Partial result set
|
|
Xapian::MSet xmset;
|
|
// Term frequencies for current query. See makeAbstract, setQuery
|
|
std::map<std::string, double> termfreqs;
|
|
|
|
Native(Query *q)
|
|
: m_q(q), xenquire(0) { }
|
|
~Native() {
|
|
clear();
|
|
}
|
|
void clear() {
|
|
delete xenquire; xenquire = 0;
|
|
termfreqs.clear();
|
|
}
|
|
/** Return a list of terms which matched for a specific result document */
|
|
bool getMatchTerms(unsigned long xdocid, std::vector<std::string>& terms);
|
|
int makeAbstract(Xapian::docid id, std::vector<Snippet>&,
|
|
int maxoccs = -1, int ctxwords = -1);
|
|
int getFirstMatchPage(Xapian::docid docid, std::string& term);
|
|
void setDbWideQTermsFreqs();
|
|
double qualityTerms(Xapian::docid docid,
|
|
const std::vector<std::string>& terms,
|
|
std::multimap<double, std::vector<std::string> >& byQ);
|
|
void abstractPopulateQTerm(
|
|
Xapian::Database& xrdb,
|
|
Xapian::docid docid,
|
|
const string& qterm,
|
|
int qtrmwrdcnt,
|
|
int ctxwords,
|
|
unsigned int maxgrpoccs,
|
|
unsigned int maxtotaloccs,
|
|
std::map<unsigned int, std::string>& sparseDoc,
|
|
std::unordered_set<unsigned int>& searchTermPositions,
|
|
unsigned int& maxpos,
|
|
unsigned int& totaloccs,
|
|
unsigned int& grpoccs,
|
|
int& ret
|
|
);
|
|
void abstractPopulateContextTerms(
|
|
Xapian::Database& xrdb,
|
|
Xapian::docid docid,
|
|
unsigned int maxpos,
|
|
std::map<unsigned int, std::string>& sparseDoc,
|
|
int& ret
|
|
);
|
|
void abstractCreateSnippetsVector(
|
|
Db::Native *ndb,
|
|
std::map<unsigned int, std::string>& sparseDoc,
|
|
std::unordered_set<unsigned int>& searchTermPositions,
|
|
std::vector<int>& vpbreaks,
|
|
std::vector<Snippet>& vabs);
|
|
int abstractFromIndex(
|
|
Rcl::Db::Native *ndb,
|
|
Xapian::docid docid,
|
|
const std::vector<std::string>& matchTerms,
|
|
const std::multimap<double, std::vector<std::string>> byQ,
|
|
double totalweight,
|
|
int ctxwords,
|
|
unsigned int maxtotaloccs,
|
|
std::vector<Snippet>& vabs,
|
|
Chrono& chron
|
|
);
|
|
int abstractFromText(
|
|
Rcl::Db::Native *ndb,
|
|
Xapian::docid docid,
|
|
const std::vector<std::string>& matchTerms,
|
|
const std::multimap<double, std::vector<std::string>> byQ,
|
|
double totalweight,
|
|
int ctxwords,
|
|
unsigned int maxtotaloccs,
|
|
vector<Snippet>& vabs,
|
|
Chrono& chron
|
|
);
|
|
};
|
|
|
|
}
|
|
#endif /* _rclquery_p_h_included_ */
|