You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.
tdewebdev/klinkstatus/src/engine/linkchecker.h

130 lines
4.2 KiB

/***************************************************************************
* Copyright (C) 2004 by Paulo Moura Guedes *
* moura@tdewebdev.org *
* *
* This program is free software; you can redistribute it and/or modify *
* it under the terms of the GNU General Public License as published by *
* the Free Software Foundation; either version 2 of the License, or *
* (at your option) any later version. *
* *
* This program is distributed in the hope that it will be useful, *
* but WITHOUT ANY WARRANTY; without even the implied warranty of *
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the *
* GNU General Public License for more details. *
* *
* You should have received a copy of the GNU General Public License *
* along with this program; if not, write to the *
* Free Software Foundation, Inc., *
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA. *
***************************************************************************/
#ifndef LINKCHECKER_H
#define LINKCHECKER_H
#include <tqobject.h>
#include <tqthread.h>
#include <tqstring.h>
#include <kio/jobclasses.h>
class KHTMLPart;
#include "../parser/http.h"
#include "linkstatus.h"
class SearchManager;
#include <iostream>
using namespace std;
/**
 * Checker bound to one LinktqStatus (the link handed to the constructor).
 * The check is started with check() and its outcome is announced through
 * the transactionFinished() / jobFinnished() signals.
 *
 * NOTE(review): the slots below receive KIO::Job callbacks and the class
 * keeps a KIO::TransferJob pointer, so the check presumably runs as an
 * asynchronous KIO transfer -- confirm in linkchecker.cpp.
 *
 * @author Paulo Moura Guedes
 */
class LinkChecker : public TQObject
{
    Q_OBJECT
    TQ_OBJECT

public:
    /**
     * Declared explicit so that a bare LinktqStatus* is never implicitly
     * converted into a temporary LinkChecker.
     *
     * @param linkstatus the link this checker works on.
     *        NOTE(review): ownership is not visible from this header.
     * @param time_out timeout used for the check (defaults to 50).
     *        NOTE(review): the unit is presumably seconds -- confirm.
     * @param parent presumably forwarded to TQObject as the parent object.
     * @param name presumably forwarded to TQObject as the object name.
     */
    explicit LinkChecker(LinktqStatus* linkstatus, int time_out = 50,
                         TQObject *parent = 0, const char *name = 0);
    ~LinkChecker();

    //virtual void run();

    /** Entry point of the check. */
    void check();

    /** Sets the SearchManager used by this checker (see search_manager_). */
    void setSearchManager(SearchManager* search_manager);

    /** @return the LinktqStatus this checker was constructed with (read-only). */
    LinktqStatus const* linktqStatus() const;

    /**
     * @param html_part document to look into.
     * @param anchor anchor to look for.
     * @return presumably true when @p anchor exists in @p html_part -- confirm
     *         against the implementation.
     */
    static bool hasAnchor(KHTMLPart* html_part, TQString const& anchor);

signals:
    /** Carries the link status together with the checker that emitted it. */
    void transactionFinished(const LinktqStatus * linkstatus,
                             LinkChecker * checker);

    /** Carries the checker that emitted it. */
    void jobFinnished(LinkChecker * checker);

protected slots:
    // Receivers for KIO job notifications.
    // NOTE(review): presumably connected to t_job_ -- confirm in the .cpp.
    void slotData(KIO::Job *, const TQByteArray &data);
    void slotRedirection (KIO::Job *, const KURL &url);
    void slotMimetype(KIO::Job *, const TQString &type);
    void slotResult(KIO::Job* job);

    // NOTE(review): presumably fired once time_out_ has elapsed -- confirm.
    void slotTimeOut();

protected:
    void finnish();
    HttpResponseHeader getHttpHeader(KIO::Job* job, bool remember_check = true);
    void checkRef(); // #... (presumably the "#anchor" part of a URL -- confirm)

private:
    LinktqStatus::tqStatus getHttptqStatus() const;
    void checkRef(LinktqStatus const* linkstatus_parent);
    void checkRef(KURL const& url);
    void killJob();

    /**
     * @param url
     * @return false if the redirection was already checked by the search manager
     */
    bool processRedirection(KURL const& url);

    void findDocumentCharset(TQString const& data);

private:
    // The declaration order of the data members is kept unchanged on purpose:
    // it determines their initialization order.
    SearchManager* search_manager_;
    LinktqStatus* const linkstatus_; // the pointer itself is const, the pointee is not
    KIO::TransferJob* t_job_;
    int time_out_;
    LinkChecker* checker_;
    TQString document_charset_;

    /* A redirection has happened, with the current URL. Several redirections
       can happen until the final URL is reached. */
    bool redirection_;
    KURL redirection_url_;

    TQString doc_html_;
    bool header_checked_;
    bool finnished_;
    bool parsing_;

    /**
     * Whether the charset of the document is already checked.
     * (e.g. <meta http-equiv="Content-Type" content="text/html; charset=utf-8"/>)
     */
    bool is_charset_checked_;

    /**
     * Whether the page defines the encoding (latin1, utf8, etc).
     * According to the spec (http://www.w3.org/TR/html4/charset.html),
     * the server response is checked first and then the info in the html
     * meta element.
     */
    bool has_defined_charset_;

    static int count_; // debug attribute that counts how many links were checked
};
/**
 * Read-only accessor for the LinktqStatus pointer held in linkstatus_.
 */
inline LinktqStatus const* LinkChecker::linktqStatus() const
{
    LinktqStatus const* const status = this->linkstatus_;
    return status;
}
#endif