annotate src/scanner.cpp @ 23:06de5ab6a232

add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
author carl
date Wed, 12 May 2004 13:23:22 -0700
parents b8f5fa3dd5b8
children 2e23b7184d2b
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
1 /*
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
2
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
3 Copyright (c) 2004 Carl Byington - 510 Software Group, released under
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
4 the GPL version 2 or any later version at your choice available at
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
5 http://www.fsf.org/licenses/gpl.txt
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
6
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
7 */
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
8
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
9 static char* scanner_version="$Id$";
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
10
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
11 using namespace std;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
12
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
13 enum state {// host name recognizer states
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
14 h_init,
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
15 h_host,
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
17 // html tag discarder states
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
18 t_init,
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
19 t_disc,
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
20
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
21 // url recognizer states
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
22 u_init,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
23 u_http,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
24 u_sla,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
25 u_url,
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
26
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
27 // url decoder states %xx
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
28 d_init,
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
29 d_pcnt,
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
30 d_1,
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
31
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
32 // html entity decoder states &#nnn;
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
33 e_init,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
34 e_amp,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
35 e_num,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
36
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
37 // mime decoder states =xx
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
38 m_init,
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
39 m_eq,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
40 m_1,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
41
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
42 // base64 decoder states
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
43 b_init,
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
44 b_lf,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
45 b_lf2,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
46 b_64,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
47
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
48 // counter for number of columns in the table
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
49 end_state,
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
50
19
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
51 // temporary states
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
52 h_end,
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
53 t_end,
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
54 u_reco,
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
55 d_2,
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
56 e_semi,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
57 m_2,
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
58 m_cr,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
59 m_nl,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
60 b_cr,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
61 };
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
62
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
63 typedef state PARSE[end_state];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
64
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
65 static PARSE parse_table[256] = {
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
66 // h_init, h_host, t_init, t_disc, u_init, u_http, u_sla , u_url, d_init, d_pcnt, d_1, e_init, e_amp, e_num, m_init, m_eq, m_1, b_init, b_lf, b_lf2, b_64
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
67
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
68 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x00
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
69 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x01
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
70 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x02
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
71 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x03
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
72 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x04
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
73 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x05
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
74 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x06
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
75 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x07
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
76 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x08
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
77 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x09 <tab>
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
78 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_nl, m_init, b_lf, b_init, b_lf2, b_init, }, // 0x0a <lf>
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
79 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x0b
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
80 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x0c
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
81 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_cr, m_init, b_init, b_init, b_init, b_cr, }, // 0x0d <cr>
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
82 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x0e
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
83 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x0f
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
84 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x10
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
85 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x11 xon char
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
86 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x12
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
87 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x13 xoff char
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
88 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x14
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
89 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x15
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
90 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x16
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
91 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x17
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
92 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x18
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
93 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x19
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
94 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x1a
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
95 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x1b
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
96 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x1c
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
97 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x1d
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
98 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x1e
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
99 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x1f
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
100 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x20 space
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
101 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x21 !
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
102 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x22 ""
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
103 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_num, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x23 #
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
104 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x24 $
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
105 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_pcnt, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x25 %
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
106 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_amp, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x26 &
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
107 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x27 '
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
108 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x28 (
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
109 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x29 )
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
110 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x2A *
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
111 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x2B +
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
112 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x2C ,
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
113 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x2D -
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
114 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x2E .
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
115 {h_init, h_end, t_init, t_disc, u_init, u_sla, u_sla, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x2F /
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
116 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x30 0
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
117 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x31 1
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
118 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x32 2
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
119 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x33 3
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
120 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x34 4
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
121 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x35 5
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
122 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x36 6
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
123 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x37 7
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
124 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x38 8
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
125 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x39 9
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
126 {h_init, h_end, t_init, t_disc, u_http, u_http, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x3A :
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
127 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_semi, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x3B ;
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
128 {h_init, h_end, t_disc, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x3C <
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
129 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_eq, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x3D =
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
130 {h_init, h_end, t_init, t_end, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x3E >
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
131 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x3F ?
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
132 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x40 @
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
133 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x41 A
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
134 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x42 B
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
135 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x43 C
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
136 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x44 D
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
137 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x45 E
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
138 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x46 F
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
139 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x47 G
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
140 {h_host, h_host, t_init, t_disc, u_http, u_http, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x48 H
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
141 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x49 I
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
142 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x4A J
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
143 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x4B K
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
144 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x4C L
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
145 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x4D M
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
146 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x4E N
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
147 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x4F O
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
148 {h_host, h_host, t_init, t_disc, u_http, u_http, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x50 P
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
149 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x51 Q
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
150 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x52 R
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
151 {h_host, h_host, t_init, t_disc, u_http, u_http, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x53 S
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
152 {h_host, h_host, t_init, t_disc, u_http, u_http, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x54 T
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
153 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x55 U
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
154 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x56 V
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
155 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x57 W
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
156 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x58 X
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
157 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x59 Y
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
158 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x5A Z
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
159 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x5B [
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
160 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x5C brace
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
161 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x5D ]
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
162 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x5E ^
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
163 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x5F _
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
164 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x60 `
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
165 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x61 a
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
166 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x62 b
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
167 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x63 c
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
168 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x64 d
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
169 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x65 e
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
170 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_1, d_2, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x66 f
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
171 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x67 g
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
172 {h_host, h_host, t_init, t_disc, u_http, u_http, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x68 h
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
173 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x69 i
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
174 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x6A j
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
175 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x6B k
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
176 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x6C l
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
177 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x6D m
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
178 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x6E n
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
179 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x6F o
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
180 {h_host, h_host, t_init, t_disc, u_http, u_http, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x70 p
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
181 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x71 q
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
182 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x72 r
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
183 {h_host, h_host, t_init, t_disc, u_http, u_http, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x73 s
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
184 {h_host, h_host, t_init, t_disc, u_http, u_http, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x74 t
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
185 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x75 u
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
186 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x76 v
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
187 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x77 w
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
188 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x78 x
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
189 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x79 y
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
190 {h_host, h_host, t_init, t_disc, u_init, u_init, u_url, u_url, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x7A z
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
191 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x7B {
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
192 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x7C |
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
193 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x7D }
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
194 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x7E ~
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
195 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x7f
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
196 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x80
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
197 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x81
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
198 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x82
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
199 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x83
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
200 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x84
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
201 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x85
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
202 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x86
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
203 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x87
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
204 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x88
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
205 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x89
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
206 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x8a
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
207 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x8b
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
208 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x8c
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
209 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x8d
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
210 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x8e
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
211 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x8f
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
212 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x90
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
213 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x91
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
214 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x92
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
215 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x93
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
216 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x94
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
217 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x95
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
218 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x96
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
219 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x97
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
220 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x98
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
221 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x99
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
222 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x9a
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
223 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x9b
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
224 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x9c
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
225 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x9d
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
226 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x9e
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
227 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x9f
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
228 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa0
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
229 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa1
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
230 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa2
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
231 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa3
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
232 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa4
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
233 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa5
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
234 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa6
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
235 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa7
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
236 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa8
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
237 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa9
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
238 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xaa
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
239 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xab
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
240 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xac
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
241 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xad
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
242 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xae
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
243 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xaf
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
244 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb0
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
245 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb1
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
246 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb2
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
247 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb3
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
248 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb4
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
249 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb5
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
250 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb6
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
251 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb7
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
252 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb8
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
253 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb9
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
254 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xba
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
255 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xbb
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
256 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xbc
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
257 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xbd
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
258 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xbe
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
259 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xbf
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
260 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc0
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
261 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc1
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
262 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc2
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
263 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc3
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
264 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc4
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
265 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc5
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
266 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc6
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
267 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc7
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
268 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc8
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
269 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc9
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
270 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xca
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
271 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xcb
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
272 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xcc
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
273 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xcd
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
274 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xce
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
275 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xcf
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
276 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd0
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
277 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd1
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
278 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd2
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
279 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd3
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
280 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd4
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
281 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd5
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
282 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd6
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
283 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd7
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
284 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd8
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
285 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd9
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
286 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xda
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
287 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xdb
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
288 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xdc
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
289 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xdd
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
290 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xde
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
291 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xdf
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
292 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe0
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
293 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe1
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
294 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe2
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
295 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe3
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
296 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe4
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
297 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe5
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
298 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe6
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
299 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe7
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
300 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe8
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
301 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe9
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
302 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xea
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
303 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xeb
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
304 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xec
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
305 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xed
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
306 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xee
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
307 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xef
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
308 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf0
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
309 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf1
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
310 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf2
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
311 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf3
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
312 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf4
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
313 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf5
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
314 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf6
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
315 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf7
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
316 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf8
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
317 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf9
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
318 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xfa
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
319 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xfb
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
320 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xfc
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
321 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xfd
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
322 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xfe
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
323 {h_init, h_end, t_init, t_disc, u_init, u_init, u_init, u_reco, d_init, d_init, d_init, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xff
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
324 };
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
325
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
326
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
327 char *tlds[] = {
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
328 ".com",
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
329 ".net",
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
330 ".org",
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
331 ".biz",
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
332 NULL
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
333 };
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
334
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
335 u_char hex_decode[256] = {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
336 0, // 0x00
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
337 0, // 0x01
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
338 0, // 0x02
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
339 0, // 0x03
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
340 0, // 0x04
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
341 0, // 0x05
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
342 0, // 0x06
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
343 0, // 0x07
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
344 0, // 0x08
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
345 0, // 0x09 <tab>
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
346 0, // 0x0a <lf>
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
347 0, // 0x0b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
348 0, // 0x0c
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
349 0, // 0x0d <cr>
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
350 0, // 0x0e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
351 0, // 0x0f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
352 0, // 0x10
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
353 0, // 0x11 xon char
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
354 0, // 0x12
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
355 0, // 0x13 xoff char
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
356 0, // 0x14
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
357 0, // 0x15
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
358 0, // 0x16
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
359 0, // 0x17
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
360 0, // 0x18
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
361 0, // 0x19
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
362 0, // 0x1a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
363 0, // 0x1b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
364 0, // 0x1c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
365 0, // 0x1d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
366 0, // 0x1e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
367 0, // 0x1f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
368 0, // 0x20 space
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
369 0, // 0x21 !
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
370 0, // 0x22 ""
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
371 0, // 0x23 #
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
372 0, // 0x24 $
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
373 0, // 0x25 %
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
374 0, // 0x26 &
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
375 0, // 0x27 '
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
376 0, // 0x28 (
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
377 0, // 0x29 )
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
378 0, // 0x2A *
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
379 0, // 0x2B +
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
380 0, // 0x2C ,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
381 0, // 0x2D -
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
382 0, // 0x2E .
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
383 0, // 0x2F /
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
384 0, // 0x30 0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
385 1, // 0x31 1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
386 2, // 0x32 2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
387 3, // 0x33 3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
388 4, // 0x34 4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
389 5, // 0x35 5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
390 6, // 0x36 6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
391 7, // 0x37 7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
392 8, // 0x38 8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
393 9, // 0x39 9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
394 0, // 0x3A :
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
395 0, // 0x3B ;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
396 0, // 0x3C <
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
397 0, // 0x3D =
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
398 0, // 0x3E >
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
399 0, // 0x3F ?
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
400 0, // 0x40 @
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
401 10, // 0x41 A
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
402 11, // 0x42 B
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
403 12, // 0x43 C
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
404 13, // 0x44 D
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
405 14, // 0x45 E
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
406 15, // 0x46 F
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
407 0, // 0x47 G
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
408 0, // 0x48 H
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
409 0, // 0x49 I
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
410 0, // 0x4A J
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
411 0, // 0x4B K
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
412 0, // 0x4C L
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
413 0, // 0x4D M
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
414 0, // 0x4E N
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
415 0, // 0x4F O
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
416 0, // 0x50 P
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
417 0, // 0x51 Q
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
418 0, // 0x52 R
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
419 0, // 0x53 S
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
420 0, // 0x54 T
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
421 0, // 0x55 U
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
422 0, // 0x56 V
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
423 0, // 0x57 W
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
424 0, // 0x58 X
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
425 0, // 0x59 Y
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
426 0, // 0x5A Z
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
427 0, // 0x5B [
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
428 0, // 0x5C brace
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
429 0, // 0x5D ]
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
430 0, // 0x5E ^
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
431 0, // 0x5F _
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
432 0, // 0x60 `
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
433 10, // 0x61 a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
434 11, // 0x62 b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
435 12, // 0x63 c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
436 13, // 0x64 d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
437 14, // 0x65 e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
438 15, // 0x66 f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
439 0, // 0x67 g
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
440 0, // 0x68 h
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
441 0, // 0x69 i
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
442 0, // 0x6A j
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
443 0, // 0x6B k
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
444 0, // 0x6C l
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
445 0, // 0x6D m
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
446 0, // 0x6E n
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
447 0, // 0x6F o
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
448 0, // 0x70 p
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
449 0, // 0x71 q
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
450 0, // 0x72 r
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
451 0, // 0x73 s
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
452 0, // 0x74 t
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
453 0, // 0x75 u
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
454 0, // 0x76 v
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
455 0, // 0x77 w
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
456 0, // 0x78 x
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
457 0, // 0x79 y
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
458 0, // 0x7A z
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
459 0, // 0x7B {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
460 0, // 0x7C |
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
461 0, // 0x7D }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
462 0, // 0x7E ~
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
463 0, // 0x7f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
464 0, // 0x80
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
465 0, // 0x81
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
466 0, // 0x82
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
467 0, // 0x83
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
468 0, // 0x84
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
469 0, // 0x85
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
470 0, // 0x86
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
471 0, // 0x87
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
472 0, // 0x88
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
473 0, // 0x89
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
474 0, // 0x8a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
475 0, // 0x8b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
476 0, // 0x8c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
477 0, // 0x8d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
478 0, // 0x8e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
479 0, // 0x8f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
480 0, // 0x90
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
481 0, // 0x91
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
482 0, // 0x92
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
483 0, // 0x93
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
484 0, // 0x94
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
485 0, // 0x95
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
486 0, // 0x96
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
487 0, // 0x97
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
488 0, // 0x98
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
489 0, // 0x99
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
490 0, // 0x9a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
491 0, // 0x9b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
492 0, // 0x9c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
493 0, // 0x9d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
494 0, // 0x9e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
495 0, // 0x9f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
496 0, // 0xa0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
497 0, // 0xa1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
498 0, // 0xa2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
499 0, // 0xa3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
500 0, // 0xa4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
501 0, // 0xa5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
502 0, // 0xa6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
503 0, // 0xa7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
504 0, // 0xa8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
505 0, // 0xa9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
506 0, // 0xaa
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
507 0, // 0xab
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
508 0, // 0xac
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
509 0, // 0xad
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
510 0, // 0xae
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
511 0, // 0xaf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
512 0, // 0xb0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
513 0, // 0xb1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
514 0, // 0xb2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
515 0, // 0xb3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
516 0, // 0xb4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
517 0, // 0xb5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
518 0, // 0xb6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
519 0, // 0xb7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
520 0, // 0xb8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
521 0, // 0xb9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
522 0, // 0xba
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
523 0, // 0xbb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
524 0, // 0xbc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
525 0, // 0xbd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
526 0, // 0xbe
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
527 0, // 0xbf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
528 0, // 0xc0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
529 0, // 0xc1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
530 0, // 0xc2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
531 0, // 0xc3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
532 0, // 0xc4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
533 0, // 0xc5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
534 0, // 0xc6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
535 0, // 0xc7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
536 0, // 0xc8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
537 0, // 0xc9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
538 0, // 0xca
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
539 0, // 0xcb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
540 0, // 0xcc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
541 0, // 0xcd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
542 0, // 0xce
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
543 0, // 0xcf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
544 0, // 0xd0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
545 0, // 0xd1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
546 0, // 0xd2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
547 0, // 0xd3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
548 0, // 0xd4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
549 0, // 0xd5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
550 0, // 0xd6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
551 0, // 0xd7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
552 0, // 0xd8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
553 0, // 0xd9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
554 0, // 0xda
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
555 0, // 0xdb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
556 0, // 0xdc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
557 0, // 0xdd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
558 0, // 0xde
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
559 0, // 0xdf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
560 0, // 0xe0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
561 0, // 0xe1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
562 0, // 0xe2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
563 0, // 0xe3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
564 0, // 0xe4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
565 0, // 0xe5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
566 0, // 0xe6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
567 0, // 0xe7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
568 0, // 0xe8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
569 0, // 0xe9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
570 0, // 0xea
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
571 0, // 0xeb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
572 0, // 0xec
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
573 0, // 0xed
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
574 0, // 0xee
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
575 0, // 0xef
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
576 0, // 0xf0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
577 0, // 0xf1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
578 0, // 0xf2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
579 0, // 0xf3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
580 0, // 0xf4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
581 0, // 0xf5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
582 0, // 0xf6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
583 0, // 0xf7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
584 0, // 0xf8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
585 0, // 0xf9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
586 0, // 0xfa
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
587 0, // 0xfb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
588 0, // 0xfc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
589 0, // 0xfd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
590 0, // 0xfe
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
591 0, // 0xff
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
592 };
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
593
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
594 u_char b64_decode[256] = {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
595 0, // 0x00
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
596 0, // 0x01
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
597 0, // 0x02
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
598 0, // 0x03
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
599 0, // 0x04
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
600 0, // 0x05
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
601 0, // 0x06
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
602 0, // 0x07
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
603 0, // 0x08
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
604 0, // 0x09 <tab>
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
605 0, // 0x0a <lf>
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
606 0, // 0x0b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
607 0, // 0x0c
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
608 0, // 0x0d <cr>
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
609 0, // 0x0e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
610 0, // 0x0f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
611 0, // 0x10
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
612 0, // 0x11 xon char
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
613 0, // 0x12
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
614 0, // 0x13 xoff char
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
615 0, // 0x14
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
616 0, // 0x15
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
617 0, // 0x16
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
618 0, // 0x17
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
619 0, // 0x18
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
620 0, // 0x19
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
621 0, // 0x1a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
622 0, // 0x1b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
623 0, // 0x1c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
624 0, // 0x1d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
625 0, // 0x1e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
626 0, // 0x1f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
627 0, // 0x20 space
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
628 0, // 0x21 !
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
629 0, // 0x22 ""
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
630 0, // 0x23 #
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
631 0, // 0x24 $
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
632 0, // 0x25 %
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
633 0, // 0x26 &
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
634 0, // 0x27 '
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
635 0, // 0x28 (
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
636 0, // 0x29 )
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
637 0, // 0x2A *
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
638 62, // 0x2B +
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
639 0, // 0x2C ,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
640 0, // 0x2D -
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
641 0, // 0x2E .
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
642 63, // 0x2F /
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
643 52, // 0x30 0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
644 53, // 0x31 1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
645 54, // 0x32 2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
646 55, // 0x33 3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
647 56, // 0x34 4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
648 57, // 0x35 5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
649 58, // 0x36 6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
650 59, // 0x37 7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
651 60, // 0x38 8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
652 61, // 0x39 9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
653 0, // 0x3A :
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
654 0, // 0x3B ;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
655 0, // 0x3C <
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
656 0, // 0x3D =
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
657 0, // 0x3E >
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
658 0, // 0x3F ?
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
659 0, // 0x40 @
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
660 0, // 0x41 A
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
661 1, // 0x42 B
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
662 2, // 0x43 C
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
663 3, // 0x44 D
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
664 4, // 0x45 E
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
665 5, // 0x46 F
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
666 6, // 0x47 G
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
667 7, // 0x48 H
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
668 8, // 0x49 I
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
669 9, // 0x4A J
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
670 10, // 0x4B K
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
671 11, // 0x4C L
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
672 12, // 0x4D M
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
673 13, // 0x4E N
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
674 14, // 0x4F O
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
675 15, // 0x50 P
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
676 16, // 0x51 Q
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
677 17, // 0x52 R
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
678 18, // 0x53 S
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
679 19, // 0x54 T
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
680 20, // 0x55 U
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
681 21, // 0x56 V
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
682 22, // 0x57 W
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
683 23, // 0x58 X
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
684 24, // 0x59 Y
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
685 25, // 0x5A Z
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
686 0, // 0x5B [
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
687 0, // 0x5C brace
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
688 0, // 0x5D ]
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
689 0, // 0x5E ^
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
690 0, // 0x5F _
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
691 0, // 0x60 `
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
692 26, // 0x61 a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
693 27, // 0x62 b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
694 28, // 0x63 c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
695 29, // 0x64 d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
696 30, // 0x65 e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
697 31, // 0x66 f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
698 32, // 0x67 g
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
699 33, // 0x68 h
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
700 34, // 0x69 i
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
701 35, // 0x6A j
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
702 36, // 0x6B k
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
703 37, // 0x6C l
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
704 38, // 0x6D m
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
705 39, // 0x6E n
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
706 40, // 0x6F o
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
707 41, // 0x70 p
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
708 42, // 0x71 q
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
709 43, // 0x72 r
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
710 44, // 0x73 s
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
711 45, // 0x74 t
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
712 46, // 0x75 u
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
713 47, // 0x76 v
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
714 48, // 0x77 w
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
715 49, // 0x78 x
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
716 50, // 0x79 y
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
717 51, // 0x7A z
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
718 0, // 0x7B {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
719 0, // 0x7C |
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
720 0, // 0x7D }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
721 0, // 0x7E ~
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
722 0, // 0x7f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
723 0, // 0x80
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
724 0, // 0x81
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
725 0, // 0x82
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
726 0, // 0x83
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
727 0, // 0x84
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
728 0, // 0x85
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
729 0, // 0x86
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
730 0, // 0x87
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
731 0, // 0x88
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
732 0, // 0x89
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
733 0, // 0x8a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
734 0, // 0x8b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
735 0, // 0x8c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
736 0, // 0x8d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
737 0, // 0x8e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
738 0, // 0x8f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
739 0, // 0x90
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
740 0, // 0x91
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
741 0, // 0x92
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
742 0, // 0x93
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
743 0, // 0x94
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
744 0, // 0x95
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
745 0, // 0x96
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
746 0, // 0x97
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
747 0, // 0x98
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
748 0, // 0x99
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
749 0, // 0x9a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
750 0, // 0x9b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
751 0, // 0x9c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
752 0, // 0x9d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
753 0, // 0x9e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
754 0, // 0x9f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
755 0, // 0xa0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
756 0, // 0xa1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
757 0, // 0xa2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
758 0, // 0xa3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
759 0, // 0xa4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
760 0, // 0xa5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
761 0, // 0xa6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
762 0, // 0xa7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
763 0, // 0xa8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
764 0, // 0xa9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
765 0, // 0xaa
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
766 0, // 0xab
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
767 0, // 0xac
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
768 0, // 0xad
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
769 0, // 0xae
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
770 0, // 0xaf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
771 0, // 0xb0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
772 0, // 0xb1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
773 0, // 0xb2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
774 0, // 0xb3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
775 0, // 0xb4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
776 0, // 0xb5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
777 0, // 0xb6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
778 0, // 0xb7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
779 0, // 0xb8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
780 0, // 0xb9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
781 0, // 0xba
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
782 0, // 0xbb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
783 0, // 0xbc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
784 0, // 0xbd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
785 0, // 0xbe
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
786 0, // 0xbf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
787 0, // 0xc0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
788 0, // 0xc1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
789 0, // 0xc2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
790 0, // 0xc3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
791 0, // 0xc4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
792 0, // 0xc5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
793 0, // 0xc6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
794 0, // 0xc7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
795 0, // 0xc8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
796 0, // 0xc9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
797 0, // 0xca
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
798 0, // 0xcb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
799 0, // 0xcc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
800 0, // 0xcd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
801 0, // 0xce
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
802 0, // 0xcf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
803 0, // 0xd0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
804 0, // 0xd1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
805 0, // 0xd2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
806 0, // 0xd3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
807 0, // 0xd4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
808 0, // 0xd5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
809 0, // 0xd6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
810 0, // 0xd7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
811 0, // 0xd8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
812 0, // 0xd9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
813 0, // 0xda
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
814 0, // 0xdb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
815 0, // 0xdc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
816 0, // 0xdd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
817 0, // 0xde
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
818 0, // 0xdf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
819 0, // 0xe0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
820 0, // 0xe1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
821 0, // 0xe2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
822 0, // 0xe3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
823 0, // 0xe4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
824 0, // 0xe5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
825 0, // 0xe6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
826 0, // 0xe7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
827 0, // 0xe8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
828 0, // 0xe9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
829 0, // 0xea
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
830 0, // 0xeb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
831 0, // 0xec
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
832 0, // 0xed
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
833 0, // 0xee
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
834 0, // 0xef
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
835 0, // 0xf0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
836 0, // 0xf1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
837 0, // 0xf2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
838 0, // 0xf3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
839 0, // 0xf4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
840 0, // 0xf5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
841 0, // 0xf6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
842 0, // 0xf7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
843 0, // 0xf8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
844 0, // 0xf9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
845 0, // 0xfa
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
846 0, // 0xfb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
847 0, // 0xfc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
848 0, // 0xfd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
849 0, // 0xfe
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
850 0, // 0xff
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
851 };
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
852
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
853 #define PENDING_LIMIT 100
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
854 struct fsa {
12
6ac6d6b822ce fix memory leak with duplicate url host names,
carl
parents: 11
diff changeset
855 u_char pending[PENDING_LIMIT];
6ac6d6b822ce fix memory leak with duplicate url host names,
carl
parents: 11
diff changeset
856 int count;
6ac6d6b822ce fix memory leak with duplicate url host names,
carl
parents: 11
diff changeset
857 state st;
6ac6d6b822ce fix memory leak with duplicate url host names,
carl
parents: 11
diff changeset
858 state init;
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
859 fsa* next1;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
860 fsa* next2;
12
6ac6d6b822ce fix memory leak with duplicate url host names,
carl
parents: 11
diff changeset
861 string_set *hosts;
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
862
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
863 fsa(state init, fsa* next1_, fsa* next2_, string_set *hosts_);
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
864 void push(u_char *buf, int len);
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
865 void pusher();
19
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
866 void error(char *err);
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
867 };
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
868
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
869 fsa::fsa(state init_, fsa *next1_, fsa *next2_, string_set *hosts_) {
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
870 count = 0;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
871 st = init_;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
872 init = init_;
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
873 next1 = next1_;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
874 next2 = next2_;
12
6ac6d6b822ce fix memory leak with duplicate url host names,
carl
parents: 11
diff changeset
875 hosts = hosts_;
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
876 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
877
19
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
878 void fsa::error(char *err) {
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
879 count = 0;
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
880 st = init;
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
881 if (err) my_syslog(err);
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
882 }
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
883
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
884 void fsa::pusher() {
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
885 if (next1) next1->push(pending, count);
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
886 if (next2) next2->push(pending, count);
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
887 count = 0;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
888 }
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
889
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
890 void fsa::push(u_char *buf, int len) {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
891 for (int i=0; i<len; i++) {
19
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
892 if (count == (PENDING_LIMIT-1)) error(NULL);
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
893 if (st >= end_state) error("finite state machine impossible state");
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
894 u_char c = buf[i];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
895 pending[count++] = c;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
896 st = parse_table[c][st];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
897 switch (st) {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
898
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
899 //////////////////////////////
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
900 // host name recognizer
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
901 case h_end: {
18
041ea016b684 add scanning for bare hostnames
carl
parents: 17
diff changeset
902 pending[--count] = '\0'; // null terminate host name by overwriting the terminator
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
903 char *tld;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
904 for (int i=0; (tld = tlds[i]); i++) {
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
905 int n = strlen(tld);
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
906 if (count > n) {
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
907 if (strncasecmp((const char *)(pending+count-n), tld, n) == 0) {
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
908 register_string(*hosts, (char*)pending);
17
b6a4b72bb96e add scanning for bare hostnames
carl
parents: 16
diff changeset
909 break;
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
910 }
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
911 }
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
912 }
19
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
913 st = h_init;
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
914 } // fall thru
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
915
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
916 case h_init: {
18
041ea016b684 add scanning for bare hostnames
carl
parents: 17
diff changeset
917 count = 0;
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
918 } break;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
919
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
920
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
921 //////////////////////////////
18
041ea016b684 add scanning for bare hostnames
carl
parents: 17
diff changeset
922 // html tag discarder
041ea016b684 add scanning for bare hostnames
carl
parents: 17
diff changeset
923 case t_end: {
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
924 st = t_init;
18
041ea016b684 add scanning for bare hostnames
carl
parents: 17
diff changeset
925 } // fall thru
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
926
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
927 case t_disc: {
18
041ea016b684 add scanning for bare hostnames
carl
parents: 17
diff changeset
928 count = 0; // discard all characters
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
929 } break;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
930
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
931 case t_init: {
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
932 pusher();
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
933 } break;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
934
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
935
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
936 //////////////////////////////
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
937 // url recognizer
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
938 case u_reco: {
19
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
939 if (count > 13) { // need some minimal length host name after the protocol
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
940 pending[--count] = '\0'; // null terminate host name by overwriting the terminator
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
941 char *p = strrchr((const char *)pending, '/');
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
942 if (p && // have a leading /
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
943 strchr(p, '.') && // require at least one . in a dns name
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
944 (strncasecmp((const char *)pending, "http", 4) == 0)) { // must start with protocol
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
945 register_string(*hosts, ++p); // we seem to have a host name, skip the last /
9
8c65411cd7ab integration work on url scanner
carl
parents: 8
diff changeset
946 }
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
947 }
19
b8f5fa3dd5b8 fix problems in the state transitions causing impossible states
carl
parents: 18
diff changeset
948 st = u_init;
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
949 } // fall thru
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
950
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
951 case u_init: {
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
952 count = 0; // discard all characters
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
953 } break;
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
954
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
955
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
956 //////////////////////////////
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
957 // url decoder %xx
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
958 case d_2: {
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
959 pending[0] = hex_decode[pending[1]] * 16 + hex_decode[pending[2]];
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
960 count = 1;
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
961 st = d_init;
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
962 } // fall thru
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
963
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
964 case d_init: {
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
965 pusher();
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
966 } break;
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
967
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
968
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
969 //////////////////////////////
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
970 // html entity decoder &#nnn;
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
971 case e_semi: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
972 pending[--count] = '\0'; // null terminate the digit string by overwriting the semicolon
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
973 pending[0] = atoi((const char *)pending+2);
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
974 count = 1;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
975 st = e_init;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
976 } // fall thru
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
977
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
978 case e_init: {
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
979 pusher();
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
980 } break;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
981
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
982
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
983 //////////////////////////////
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
984 // mime decoder =xx
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
985 case m_2: {
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
986 pending[0] = hex_decode[pending[1]] * 16 + hex_decode[pending[2]];
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
987 count = 1;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
988 st = m_init;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
989 } // fall thru
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
990
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
991 case m_init: {
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
992 pusher();
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
993 } break;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
994
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
995 case m_cr: {
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
996 count = 1;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
997 st = m_eq;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
998 } break;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
999
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
1000 case m_nl: {
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1001 count = 0;
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
1002 st = m_init;
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1003 } break;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1004
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
1005
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1006 //////////////////////////////
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1007 // base64 decoder
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1008 case b_lf2: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1009 count--;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1010 } break;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1011
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1012 case b_cr: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1013 int cnt = 0;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1014 if ((count % 4) == 1) {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1015 count--;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1016 // might have proper b64 data
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1017 for (int i=0; i<count; i+=4) {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1018 unsigned long a1 = b64_decode[pending[i]];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1019 unsigned long a2 = b64_decode[pending[i+1]];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1020 unsigned long a3 = b64_decode[pending[i+2]];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1021 unsigned long a4 = b64_decode[pending[i+3]];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1022 unsigned long a = (a1 << 18) | (a2 << 12) | (a3 << 6) | a4;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1023 pending[cnt++] = (a & 0x00ff0000) >> 16;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1024 pending[cnt++] = (a & 0x0000ff00) >> 8;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1025 pending[cnt++] = (a & 0x000000ff);
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1026 if ((char)pending[i+3] == '=') cnt--;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1027 if ((char)pending[i+2] == '=') cnt--;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1028 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1029 count = cnt;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1030 st = b_lf2;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1031 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1032 else st = b_init;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1033 } // fall thru
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1034
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1035 case b_lf:
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1036 case b_init: {
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
1037 pusher();
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1038 } break;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1039
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
1040
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1041 //////////////////////////////
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1042 // states that just accumulate characters in the pending buffer
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
1043 case h_host:
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
1044 case u_http:
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
1045 case u_url:
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
1046 case u_sla:
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
1047 case d_pcnt:
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
1048 case d_1:
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1049 case e_amp:
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1050 case e_num:
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1051 case m_eq:
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1052 case m_1:
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
1053 case b_64:
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1054 default: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1055 } break;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1056 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1057 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1058 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1059
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1060 struct url_scanner {
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
1061 fsa *host_parser;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
1062 fsa *tags_parser;
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1063 fsa *urls_parser;
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
1064 fsa *urld_parser;
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1065 fsa *html_parser;
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1066 fsa *mime_parser;
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1067 fsa *b64_parser;
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1068
12
6ac6d6b822ce fix memory leak with duplicate url host names,
carl
parents: 11
diff changeset
1069 url_scanner(string_set *hosts);
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1070 ~url_scanner();
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1071 void scan(u_char *buffer, size_t length);
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1072 };
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1073
12
6ac6d6b822ce fix memory leak with duplicate url host names,
carl
parents: 11
diff changeset
1074 url_scanner::url_scanner(string_set *hosts) {
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
1075 host_parser = new fsa(h_init, NULL, NULL, hosts);
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
1076 tags_parser = new fsa(t_init, host_parser, NULL, NULL);
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
1077 urls_parser = new fsa(u_init, NULL, NULL, hosts);
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
1078 urld_parser = new fsa(d_init, urls_parser, tags_parser, NULL);
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
1079 html_parser = new fsa(e_init, urld_parser, NULL, NULL);
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
1080 mime_parser = new fsa(m_init, html_parser, NULL, NULL);
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
1081 b64_parser = new fsa(b_init, mime_parser, NULL, NULL);
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1082 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1083
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1084 url_scanner::~url_scanner() {
16
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
1085 delete host_parser;
2ae8d953f1d0 add scanning for bare hostnames
carl
parents: 12
diff changeset
1086 delete tags_parser;
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1087 delete urls_parser;
23
06de5ab6a232 add url decoding stage, allow http:/ single / in yahoo redirector, allow ip address hostnames
carl
parents: 19
diff changeset
1088 delete urld_parser;
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1089 delete html_parser;
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1090 delete mime_parser;
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1091 delete b64_parser;
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1092 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1093
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1094 void url_scanner::scan(u_char *buffer, size_t length) {
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1095 b64_parser->push(buffer, length);
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1096 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
1097