comparison src/scanner.h @ 76:81f1e400e8ab

start coding on new config syntax
author carl
date Sat, 16 Jul 2005 13:47:19 -0700
parents 1142e46be550
children aa07452e641b
comparison
equal deleted inserted replaced
75:1142e46be550 76:81f1e400e8ab
15 int bad_html_tags; 15 int bad_html_tags;
16 int binary_tags; 16 int binary_tags;
17 17
18 public: 18 public:
19 recorder(mlfiPriv *priv_, string_set &html_tags_, string_set &tlds_); 19 recorder(mlfiPriv *priv_, string_set &html_tags_, string_set &tlds_);
20 ~recorder(); 20 ~recorder() { empty(); };
21 void empty(); 21 void empty();
22 void new_url(char *host); 22 void new_url(char *host);
23 void new_tag(char *tag); 23 void new_tag(char *tag);
24 void binary(); 24 void binary();
25 mlfiPriv *get_priv() {return priv; }; 25 mlfiPriv *get_priv() { return priv; };
26 string_set *get_tlds() {return tlds; }; 26 string_set *get_tlds() { return tlds; };
27 string_set &get_hosts() {return hosts; }; 27 string_set &get_hosts() { return hosts; };
28 bool excessive_bad_tags(int limit) {return (limit > 0) && (bad_html_tags > limit) && (bad_html_tags > 3*binary_tags); }; 28 bool excessive_bad_tags(int limit) { return (limit > 0) && (bad_html_tags > limit) && (bad_html_tags > 3*binary_tags); };
29 bool excessive_hosts(int limit) {return (limit > 0) && (hosts.size() > limit); }; 29 bool excessive_hosts(int limit) { return (limit > 0) && (hosts.size() > limit); };
30 }; 30 };
31 31
32 32
33 //////////////////////////////////////////////// 33 ////////////////////////////////////////////////
34 // the content scanner 34 // the content scanner