/* -*- C++ -*- */
//=============================================================================
/**
* @file Web_Crawler.h
*
* $Id: Web_Crawler.h 93639 2011-03-24 13:32:13Z johnnyw $
*
* @author Douglas C. Schmidt <schmidt@cs.wustl.edu>
*/
//=============================================================================
#ifndef _WEB_CRAWLER_H
#define _WEB_CRAWLER_H
#include "URL_Addr.h"
#include "HTTP_URL.h"
#if !defined (ACE_LACKS_PRAGMA_ONCE)
#pragma once
#endif /* ACE_LACKS_PRAGMA_ONCE */
// Forward declaration.
class URL_Visitor_Factory;
/**
 * @class Web_Crawler
 *
 * @brief Facade for running a web crawl.
 *
 * Organizes the other classes in the solution: it holds a
 * URL_Visitor_Factory, the factory creates a visitor, and the
 * visitor embodies the appropriate visitation strategy.
 *
 * NOTE(review): the class declares a destructor and stores a raw
 * pointer but declares no copy constructor or assignment operator.
 * Whether the factory is owned (and so whether copying is unsafe)
 * cannot be determined from this header -- confirm against the
 * implementation file.
 */
class Web_Crawler
{
public:
  // = Initialization and termination methods.

  /// Default constructor.
  Web_Crawler ();

  /// Destructor.
  ~Web_Crawler ();

  /**
   * Parse the command-line options and initialize the
   * URL_Visitor_Factory.
   *
   * @param argc  Command-line argument count.
   * @param argv  Command-line argument vector.
   */
  int open (int argc, ACE_TCHAR *argv[]);

  /**
   * Run the Web Crawler, carrying out whatever visitation strategy
   * has been configured.
   *
   * @return 0 on success, -1 on failure.
   */
  int run ();

private:
  /**
   * Factory that creates the visitors which explore URLs and perform
   * various tasks.  The concrete subclass of URL_Visitor_Factory
   * determines what happens during a visitation.
   */
  URL_Visitor_Factory *url_visitor_factory_;
};
#endif /* _WEB_CRAWLER_H */