blob: 78acb845102f719a4cd7afed83f1ce23781d3a98 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
|
/* -*- C++ -*- */
// $Id$
// ============================================================================
//
// = LIBRARY
// examples/Web_Crawler
//
// = FILENAME
// Web_Crawler.h
//
// = AUTHOR
// Douglas C. Schmidt <schmidt@cs.wustl.edu>
//
// ============================================================================
#ifndef _WEB_CRAWLER_H
#define _WEB_CRAWLER_H
#include "URL_Addr.h"
#include "HTTP_URL.h"
// Use "#pragma once" in addition to the include guard whenever the
// build has not flagged the compiler as lacking it.
// ACE_LACKS_PRAGMA_ONCE is only tested here and must never be defined
// by this header: defining it would switch the pragma off in every
// header included afterwards that uses the same guard.
#if !defined (ACE_LACKS_PRAGMA_ONCE)
# pragma once
#endif /* ACE_LACKS_PRAGMA_ONCE */
// Forward declaration; the class below only stores a pointer to the
// factory.
class URL_Visitor_Factory;

class Web_Crawler
{
  // = TITLE
  //     Facade for the Web Crawler example.
  //
  // = DESCRIPTION
  //     Organizes the other classes in the solution: a factory
  //     creates a visitor, and that visitor embodies the appropriate
  //     visitation strategy.
public:
  // = Initialization and termination methods.

  Web_Crawler ();
  // Constructor.

  ~Web_Crawler ();
  // Destructor.

  int open (int argc, char *argv[]);
  // Parses the command-line options given in <argc>/<argv> and
  // initializes the <URL_Visitor_Factory>.

  int run ();
  // Runs the Web Crawler, carrying out whatever visitation strategy
  // is configured.  Returns 0 on success and -1 on failure.

private:
  URL_Visitor_Factory *url_visitor_factory_;
  // Factory that creates the visitors which explore URLs and perform
  // various tasks.  The concrete subclass of <URL_Visitor_Factory>
  // determines what happens during a visitation.
};
#endif /* _WEB_CRAWLER_H */
|