You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
234 lines
7.3 KiB
234 lines
7.3 KiB
/***************************************************************************
|
|
copyright : (C) 2008 by Robby Stephenson
|
|
email : robby@periapsis.org
|
|
***************************************************************************/
|
|
|
|
/***************************************************************************
|
|
* *
|
|
* This program is free software; you can redistribute it and/or modify *
|
|
* it under the terms of version 2 of the GNU General Public License as *
|
|
* published by the Free Software Foundation; *
|
|
* *
|
|
***************************************************************************/
|
|
|
|
#include "googlescholarfetcher.h"
|
|
#include "messagehandler.h"
|
|
#include "../filehandler.h"
|
|
#include "../translators/bibteximporter.h"
|
|
#include "../collection.h"
|
|
#include "../entry.h"
|
|
#include "../tellico_kernel.h"
|
|
#include "../tellico_debug.h"
|
|
|
|
#include <klocale.h>
|
|
#include <kconfig.h>
|
|
#include <kio/job.h>
|
|
|
|
#include <tqlabel.h>
|
|
#include <tqlayout.h>
|
|
|
|
namespace {
|
|
static const int GOOGLE_MAX_RETURNS_TOTAL = 20;
|
|
static const char* SCHOLAR_BASE_URL = "http://scholar.google.com/scholar";
|
|
}
|
|
|
|
using Tellico::Fetch::GoogleScholarFetcher;
|
|
|
|
GoogleScholarFetcher::GoogleScholarFetcher(TQObject* parent_, const char* name_)
|
|
: Fetcher(parent_, name_),
|
|
m_limit(GOOGLE_MAX_RETURNS_TOTAL), m_start(0), m_job(0), m_started(false),
|
|
m_cookieIsSet(false) {
|
|
m_bibtexRx = TQRegExp(TQString::fromLatin1("<a\\s.*href\\s*=\\s*\"([^>]*scholar\\.bib[^>]*)\""));
|
|
m_bibtexRx.setMinimal(true);
|
|
}
|
|
|
|
GoogleScholarFetcher::~GoogleScholarFetcher() {
|
|
}
|
|
|
|
TQString GoogleScholarFetcher::defaultName() {
|
|
// no i18n
|
|
return TQString::fromLatin1("Google Scholar");
|
|
}
|
|
|
|
TQString GoogleScholarFetcher::source() const {
|
|
return m_name.isEmpty() ? defaultName() : m_name;
|
|
}
|
|
|
|
bool GoogleScholarFetcher::canFetch(int type) const {
|
|
return type == Data::Collection::Bibtex;
|
|
}
|
|
|
|
void GoogleScholarFetcher::readConfigHook(const KConfigGroup& config_) {
|
|
Q_UNUSED(config_);
|
|
}
|
|
|
|
void GoogleScholarFetcher::search(FetchKey key_, const TQString& value_) {
|
|
if(!m_cookieIsSet) {
|
|
// have to set preferences to have bibtex output
|
|
FileHandler::readTextFile(TQString::fromLatin1("http://scholar.google.com/scholar_setprefs?num=100&scis=yes&scisf=4&submit=Save+Preferences"), true);
|
|
m_cookieIsSet = true;
|
|
}
|
|
m_key = key_;
|
|
m_value = value_;
|
|
m_started = true;
|
|
m_start = 0;
|
|
m_total = -1;
|
|
doSearch();
|
|
}
|
|
|
|
void GoogleScholarFetcher::continueSearch() {
|
|
m_started = true;
|
|
doSearch();
|
|
}
|
|
|
|
void GoogleScholarFetcher::doSearch() {
|
|
// myDebug() << "GoogleScholarFetcher::search() - value = " << value_ << endl;
|
|
|
|
if(!canFetch(Kernel::self()->collectionType())) {
|
|
message(i18n("%1 does not allow searching for this collection type.").tqarg(source()), MessageHandler::Warning);
|
|
stop();
|
|
return;
|
|
}
|
|
|
|
KURL u(TQString::fromLatin1(SCHOLAR_BASE_URL));
|
|
u.addQueryItem(TQString::fromLatin1("start"), TQString::number(m_start));
|
|
|
|
switch(m_key) {
|
|
case Title:
|
|
u.addQueryItem(TQString::fromLatin1("q"), TQString::fromLatin1("allintitle:%1").tqarg(m_value));
|
|
break;
|
|
|
|
case Keyword:
|
|
u.addQueryItem(TQString::fromLatin1("q"), m_value);
|
|
break;
|
|
|
|
case Person:
|
|
u.addQueryItem(TQString::fromLatin1("q"), TQString::fromLatin1("author:%1").tqarg(m_value));
|
|
break;
|
|
|
|
default:
|
|
kdWarning() << "GoogleScholarFetcher::search() - key not recognized: " << m_key << endl;
|
|
stop();
|
|
return;
|
|
}
|
|
// myDebug() << "GoogleScholarFetcher::search() - url: " << u.url() << endl;
|
|
|
|
m_job = KIO::get(u, false, false);
|
|
connect(m_job, TQT_SIGNAL(data(KIO::Job*, const TQByteArray&)),
|
|
TQT_SLOT(slotData(KIO::Job*, const TQByteArray&)));
|
|
connect(m_job, TQT_SIGNAL(result(KIO::Job*)),
|
|
TQT_SLOT(slotComplete(KIO::Job*)));
|
|
}
|
|
|
|
void GoogleScholarFetcher::stop() {
|
|
if(!m_started) {
|
|
return;
|
|
}
|
|
if(m_job) {
|
|
m_job->kill();
|
|
m_job = 0;
|
|
}
|
|
m_data.truncate(0);
|
|
m_started = false;
|
|
emit signalDone(this);
|
|
}
|
|
|
|
void GoogleScholarFetcher::slotData(KIO::Job*, const TQByteArray& data_) {
|
|
TQDataStream stream(m_data, IO_WriteOnly | IO_Append);
|
|
stream.writeRawBytes(data_.data(), data_.size());
|
|
}
|
|
|
|
void GoogleScholarFetcher::slotComplete(KIO::Job* job_) {
|
|
// myDebug() << "GoogleScholarFetcher::slotComplete()" << endl;
|
|
// since the fetch is done, don't worry about holding the job pointer
|
|
m_job = 0;
|
|
|
|
if(job_->error()) {
|
|
job_->showErrorDialog(Kernel::self()->widget());
|
|
stop();
|
|
return;
|
|
}
|
|
|
|
if(m_data.isEmpty()) {
|
|
myDebug() << "GoogleScholarFetcher::slotComplete() - no data" << endl;
|
|
stop();
|
|
return;
|
|
}
|
|
|
|
TQString text = TQString::fromUtf8(m_data, m_data.size());
|
|
TQString bibtex;
|
|
int count = 0;
|
|
for(int pos = text.find(m_bibtexRx); count < m_limit && pos > -1; pos = text.find(m_bibtexRx, pos+m_bibtexRx.matchedLength()), ++count) {
|
|
KURL bibtexUrl(TQString::fromLatin1(SCHOLAR_BASE_URL), m_bibtexRx.cap(1));
|
|
// myDebug() << bibtexUrl << endl;
|
|
bibtex += FileHandler::readTextFile(bibtexUrl, true);
|
|
}
|
|
|
|
Import::BibtexImporter imp(bibtex);
|
|
Data::CollPtr coll = imp.collection();
|
|
if(!coll) {
|
|
myDebug() << "GoogleScholarFetcher::slotComplete() - no collection pointer" << endl;
|
|
stop();
|
|
return;
|
|
}
|
|
|
|
count = 0;
|
|
Data::EntryVec entries = coll->entries();
|
|
for(Data::EntryVec::Iterator entry = entries.begin(); count < m_limit && entry != entries.end(); ++entry, ++count) {
|
|
if(!m_started) {
|
|
// might get aborted
|
|
break;
|
|
}
|
|
TQString desc = entry->field(TQString::fromLatin1("author"))
|
|
+ TQChar('/') + entry->field(TQString::fromLatin1("publisher"));
|
|
if(!entry->field(TQString::fromLatin1("year")).isEmpty()) {
|
|
desc += TQChar('/') + entry->field(TQString::fromLatin1("year"));
|
|
}
|
|
|
|
SearchResult* r = new SearchResult(this, entry->title(), desc, entry->field(TQString::fromLatin1("isbn")));
|
|
m_entries.insert(r->uid, Data::EntryPtr(entry));
|
|
emit signalResultFound(r);
|
|
}
|
|
m_start = m_entries.count();
|
|
// m_hasMoreResults = m_start <= m_total;
|
|
m_hasMoreResults = false; // for now, no continued searches
|
|
|
|
stop(); // required
|
|
}
|
|
|
|
Tellico::Data::EntryPtr GoogleScholarFetcher::fetchEntry(uint uid_) {
|
|
return m_entries[uid_];
|
|
}
|
|
|
|
void GoogleScholarFetcher::updateEntry(Data::EntryPtr entry_) {
|
|
// myDebug() << "GoogleScholarFetcher::updateEntry()" << endl;
|
|
// limit to top 5 results
|
|
m_limit = 5;
|
|
|
|
TQString title = entry_->field(TQString::fromLatin1("title"));
|
|
if(!title.isEmpty()) {
|
|
search(Title, title);
|
|
return;
|
|
}
|
|
|
|
myDebug() << "GoogleScholarFetcher::updateEntry() - insufficient info to search" << endl;
|
|
emit signalDone(this); // always need to emit this if not continuing with the search
|
|
}
|
|
|
|
Tellico::Fetch::ConfigWidget* GoogleScholarFetcher::configWidget(TQWidget* parent_) const {
|
|
return new GoogleScholarFetcher::ConfigWidget(parent_, this);
|
|
}
|
|
|
|
GoogleScholarFetcher::ConfigWidget::ConfigWidget(TQWidget* parent_, const GoogleScholarFetcher*/*=0*/)
|
|
: Fetch::ConfigWidget(parent_) {
|
|
TQVBoxLayout* l = new TQVBoxLayout(optionsWidget());
|
|
l->addWidget(new TQLabel(i18n("This source has no options."), optionsWidget()));
|
|
l->addStretch();
|
|
}
|
|
|
|
TQString GoogleScholarFetcher::ConfigWidget::preferredName() const {
|
|
return GoogleScholarFetcher::defaultName();
|
|
}
|
|
|
|
#include "googlescholarfetcher.moc"
|