Files
GoldenCheetah/deprecated/Lucene.cpp
Mark Liversedge 804f30502e Reorg tidy src directory
.. move the fluff that has collected into the src directory
   to somewhere more appropriate.
2016-02-26 09:28:28 +00:00

228 lines
6.1 KiB
C++

/*
* Copyright (c) 2012 Mark Liversedge (liversedge@gmail.com)
*
* This program is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License as published by the Free
* Software Foundation; either version 2 of the License, or (at your option)
* any later version.
*
* This program is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for
* more details.
*
* You should have received a copy of the GNU General Public License along
* with this program; if not, write to the Free Software Foundation, Inc., 51
* Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
*/
#include "Lucene.h"
#include "Context.h"
#include "Athlete.h"
#include "RideItem.h"
// stdc strings
using namespace std;
// here we go
using namespace lucene::analysis;
using namespace lucene::index;
using namespace lucene::document;
using namespace lucene::queryParser;
using namespace lucene::search;
using namespace lucene::store;
Lucene::Lucene(QObject *parent, Context *context) : QObject(parent), context(context)
{
// create the directory if needed
context->athlete->home->cache().mkdir("index");
// make index directory if needed
dir = QDir(context->athlete->home->cache().canonicalPath() + "/index");
try {
// set lock timeout to a bit longer
bool indexExists = IndexReader::indexExists(dir.canonicalPath().toLocal8Bit().data());
// clear any locks
if (indexExists && IndexReader::isLocked(dir.canonicalPath().toLocal8Bit().data()))
IndexReader::unlock(dir.canonicalPath().toLocal8Bit().data());
if (!indexExists) {
// ridecache will need to build the index !
context->athlete->emptyindex = true;
IndexWriter *create = new IndexWriter(dir.canonicalPath().toLocal8Bit().data(), &analyzer, true);
// lets flush to disk and reopen
create->close();
delete create;
}
} catch (CLuceneError &e) {
//qDebug()<<"clucene error!"<<e.what();
}
}
Lucene::~Lucene()
{
}
bool Lucene::importRide(RideFile *ride)
{
QMutexLocker locker(&mutex);
// create a document
Document doc;
// add Filename special field (unique)
std::wstring cname = ride->getTag("Filename","").toStdWString();
Field *fadd = new Field(_T("Filename"), cname.c_str(), Field::STORE_YES | Field::INDEX_UNTOKENIZED);
doc.add(*fadd);
QString alltexts;
// And all the metadata texts individually
QMapIterator<QString,QString> iterate(ride->tags());
while (iterate.hasNext()) {
iterate.next();
std::wstring name = iterate.key().toStdWString();
std::wstring value = iterate.value().toStdWString();
alltexts += iterate.value() + " ";
Field *add = new Field(name.c_str(), value.c_str(), Field::STORE_YES | Field::INDEX_TOKENIZED);
doc.add( *add );
}
// add a catchall text which is concat of all text fields
std::wstring value = alltexts.toStdWString();
Field *cadd = new Field(_T("contents"), value.c_str(), Field::STORE_YES | Field::INDEX_TOKENIZED);
doc.add( *cadd );
// now add to index
IndexWriter *writer = NULL;
try {
// now lets open using a mnodifier since the API is much simpler
writer = new IndexWriter(dir.canonicalPath().toLocal8Bit().data(), &analyzer, false); // for updates
writer->addDocument(&doc);
doc.clear();
} catch (CLuceneError &e) {
qDebug()<<"add document clucene error!"<<e.what();
}
if (writer) {
writer->close();
delete writer;
}
return true;
}
bool Lucene::deleteRide(QString name)
{
QMutexLocker locker(&mutex);
std::wstring cname = name.toStdWString();
try {
IndexReader *reader = IndexReader::open(dir.canonicalPath().toLocal8Bit().data());
Term del = Term(_T("Filename"), cname.c_str());
reader->deleteDocuments(&del);
reader->close();
delete reader;
} catch (CLuceneError &e) {
qDebug()<<"deleteDocuments clucene error!"<<e.what();
}
return true;
}
bool Lucene::exists(QString name)
{
bool returning = false;
std::wstring cname = name.toStdWString();
try {
IndexReader *reader = IndexReader::open(dir.canonicalPath().toLocal8Bit().data());
Term check = Term(_T("Filename"), cname.c_str());
TermDocs *td = reader->termDocs(&check);
if (td->next()) returning = true;
td->close();
delete td;
reader->close();
delete reader;
} catch (CLuceneError &e) {
qDebug()<<"termDocs clucene error!"<<e.what();
}
return returning;
}
void Lucene::optimise()
{
try {
IndexWriter *writer = new IndexWriter(dir.canonicalPath().toLocal8Bit().data(), &analyzer, false); // for updates
writer->optimize();
writer->close();
delete writer;
} catch(CLuceneError &e) {
qDebug()<<"optimise clucene error!"<<e.what();
}
}
QList<QString> Lucene::search(QString query)
{
filenames.clear();
try {
// parse query
QueryParser parser(_T("contents"), &analyzer);
parser.setPhraseSlop(4);
std::wstring querystring = query.toStdWString();
Query* lquery = parser.parse(querystring.c_str());
if (lquery == NULL) return filenames;
IndexReader *reader = IndexReader::open(dir.canonicalPath().toLocal8Bit().data());
IndexSearcher *searcher = new IndexSearcher(reader); // to perform searches
// go find hits
hits = searcher->search(lquery);
for (size_t i=0; i< hits->length(); i++) {
Document *d = &hits->doc(i);
filenames << QString::fromWCharArray(d->get(_T("Filename")));
}
searcher->close();
reader->close();
delete hits;
delete lquery;
delete searcher;
delete reader;
} catch (CLuceneError &e) {
//qDebug()<<"clucene error:"<<e.what();
return filenames;
}
emit results(filenames);
return filenames;
}