/*************************************************************************** copyright : (C) 2008 by Robby Stephenson email : robby@periapsis.org ***************************************************************************/ /*************************************************************************** * * * This program is free software; you can redistribute it and/or modify * * it under the terms of version 2 of the GNU General Public License as * * published by the Free Software Foundation; * * * ***************************************************************************/ #include "googlescholarfetcher.h" #include "messagehandler.h" #include "../filehandler.h" #include "../translators/bibteximporter.h" #include "../collection.h" #include "../entry.h" #include "../tellico_kernel.h" #include "../tellico_debug.h" #include #include #include #include #include namespace { static const size_t GOOGLE_MAX_RETURNS_TOTAL = 20; static const char* SCHOLAR_BASE_URL = "http://scholar.google.com/scholar"; } using Tellico::Fetch::GoogleScholarFetcher; GoogleScholarFetcher::GoogleScholarFetcher(TQObject* parent_, const char* name_) : Fetcher(parent_, name_), m_limit(GOOGLE_MAX_RETURNS_TOTAL), m_start(0), m_job(0), m_started(false), m_cookieIsSet(false) { m_bibtexRx = TQRegExp(TQString::fromLatin1("]*scholar\\.bib[^>]*)\"")); m_bibtexRx.setMinimal(true); } GoogleScholarFetcher::~GoogleScholarFetcher() { } TQString GoogleScholarFetcher::defaultName() { // no i18n return TQString::fromLatin1("Google Scholar"); } TQString GoogleScholarFetcher::source() const { return m_name.isEmpty() ? defaultName() : m_name; } bool GoogleScholarFetcher::canFetch(int type) const { return type == Data::Collection::Bibtex; } void GoogleScholarFetcher::readConfigHook(const TDEConfigGroup& config_) { Q_UNUSED(config_); } void GoogleScholarFetcher::search(FetchKey key_, const TQString& value_) { if(!m_cookieIsSet) { // have to set preferences to have bibtex output FileHandler::readTextFile(TQString::fromLatin1("http://scholar.google.com/scholar_setprefs?num=100&scis=yes&scisf=4&submit=Save+Preferences"), true); m_cookieIsSet = true; } m_key = key_; m_value = value_; m_started = true; m_start = 0; m_total = -1; doSearch(); } void GoogleScholarFetcher::continueSearch() { m_started = true; doSearch(); } void GoogleScholarFetcher::doSearch() { // myDebug() << "GoogleScholarFetcher::search() - value = " << value_ << endl; if(!canFetch(Kernel::self()->collectionType())) { message(i18n("%1 does not allow searching for this collection type.").arg(source()), MessageHandler::Warning); stop(); return; } KURL u(TQString::fromLatin1(SCHOLAR_BASE_URL)); u.addQueryItem(TQString::fromLatin1("start"), TQString::number(m_start)); switch(m_key) { case Title: u.addQueryItem(TQString::fromLatin1("q"), TQString::fromLatin1("allintitle:%1").arg(m_value)); break; case Keyword: u.addQueryItem(TQString::fromLatin1("q"), m_value); break; case Person: u.addQueryItem(TQString::fromLatin1("q"), TQString::fromLatin1("author:%1").arg(m_value)); break; default: kdWarning() << "GoogleScholarFetcher::search() - key not recognized: " << m_key << endl; stop(); return; } // myDebug() << "GoogleScholarFetcher::search() - url: " << u.url() << endl; m_job = TDEIO::get(u, false, false); connect(m_job, TQ_SIGNAL(data(TDEIO::Job*, const TQByteArray&)), TQ_SLOT(slotData(TDEIO::Job*, const TQByteArray&))); connect(m_job, TQ_SIGNAL(result(TDEIO::Job*)), TQ_SLOT(slotComplete(TDEIO::Job*))); } void GoogleScholarFetcher::stop() { if(!m_started) { return; } if(m_job) { m_job->kill(); m_job = 0; } m_data.truncate(0); m_started = false; emit signalDone(this); } void GoogleScholarFetcher::slotData(TDEIO::Job*, const TQByteArray& data_) { TQDataStream stream(m_data, IO_WriteOnly | IO_Append); stream.writeRawBytes(data_.data(), data_.size()); } void GoogleScholarFetcher::slotComplete(TDEIO::Job* job_) { // myDebug() << "GoogleScholarFetcher::slotComplete()" << endl; // since the fetch is done, don't worry about holding the job pointer m_job = 0; if(job_->error()) { job_->showErrorDialog(Kernel::self()->widget()); stop(); return; } if(m_data.isEmpty()) { myDebug() << "GoogleScholarFetcher::slotComplete() - no data" << endl; stop(); return; } TQString text = TQString::fromUtf8(m_data, m_data.size()); TQString bibtex; size_t count = 0; for(int pos = text.find(m_bibtexRx); count < m_limit && pos > -1; pos = text.find(m_bibtexRx, pos+m_bibtexRx.matchedLength()), ++count) { KURL bibtexUrl(TQString::fromLatin1(SCHOLAR_BASE_URL), m_bibtexRx.cap(1)); // myDebug() << bibtexUrl << endl; bibtex += FileHandler::readTextFile(bibtexUrl, true); } Import::BibtexImporter imp(bibtex); Data::CollPtr coll = imp.collection(); if(!coll) { myDebug() << "GoogleScholarFetcher::slotComplete() - no collection pointer" << endl; stop(); return; } count = 0; Data::EntryVec entries = coll->entries(); for(Data::EntryVec::Iterator entry = entries.begin(); count < m_limit && entry != entries.end(); ++entry, ++count) { if(!m_started) { // might get aborted break; } TQString desc = entry->field(TQString::fromLatin1("author")) + TQChar('/') + entry->field(TQString::fromLatin1("publisher")); if(!entry->field(TQString::fromLatin1("year")).isEmpty()) { desc += TQChar('/') + entry->field(TQString::fromLatin1("year")); } SearchResult* r = new SearchResult(this, entry->title(), desc, entry->field(TQString::fromLatin1("isbn"))); m_entries.insert(r->uid, Data::EntryPtr(entry)); emit signalResultFound(r); } m_start = m_entries.count(); // m_hasMoreResults = m_start <= m_total; m_hasMoreResults = false; // for now, no continued searches stop(); // required } Tellico::Data::EntryPtr GoogleScholarFetcher::fetchEntry(uint uid_) { return m_entries[uid_]; } void GoogleScholarFetcher::updateEntry(Data::EntryPtr entry_) { // myDebug() << "GoogleScholarFetcher::updateEntry()" << endl; // limit to top 5 results m_limit = 5; TQString title = entry_->field(TQString::fromLatin1("title")); if(!title.isEmpty()) { search(Title, title); return; } myDebug() << "GoogleScholarFetcher::updateEntry() - insufficient info to search" << endl; emit signalDone(this); // always need to emit this if not continuing with the search } Tellico::Fetch::ConfigWidget* GoogleScholarFetcher::configWidget(TQWidget* parent_) const { return new GoogleScholarFetcher::ConfigWidget(parent_, this); } GoogleScholarFetcher::ConfigWidget::ConfigWidget(TQWidget* parent_, const GoogleScholarFetcher*/*=0*/) : Fetch::ConfigWidget(parent_) { TQVBoxLayout* l = new TQVBoxLayout(optionsWidget()); l->addWidget(new TQLabel(i18n("This source has no options."), optionsWidget())); l->addStretch(); } TQString GoogleScholarFetcher::ConfigWidget::preferredName() const { return GoogleScholarFetcher::defaultName(); } #include "googlescholarfetcher.moc"