annotate src/scanner.cpp @ 11:2c206836b4cc

integration work on url scanner
author carl
date Thu, 22 Apr 2004 20:19:01 -0700
parents 8c65411cd7ab
children 6ac6d6b822ce
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
1 static char* scanner_version="$Id$";
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
3 using namespace std;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
4
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
5 enum state {// url decoder states
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
6 u_init,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
7 u_http,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
8 u_sla,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
9 u_url,
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
10
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
11 // html entity decoder states
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
12 e_init,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
13 e_amp,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
14 e_num,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
15
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
16 // mime decoder states
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
17 m_init,
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
18 m_eq,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
19 m_1,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
20
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
21 // base64 decoder states
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
22 b_init,
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
23 b_lf,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
24 b_lf2,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
25 b_64,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
26
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
27 // counter for number of columns in the table
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
28 end_state,
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
29
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
30 // temporary mime states
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
31 u_reco,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
32 e_semi,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
33 m_2,
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
34 m_cr,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
35 m_nl,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
36 b_cr,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
37 };
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
38
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
39 typedef state PARSE[end_state];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
40
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
41 static PARSE parse_table[256] = {
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
42 // u_init, u_http, u_sla , u_url, e_init, e_amp, e_num, m_init, m_eq, m_1, b_init, b_lf, b_lf2, b_64
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
43
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
44 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x00
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
45 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x01
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
46 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x02
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
47 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x03
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
48 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x04
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
49 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x05
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
50 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x06
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
51 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x07
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
52 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x08
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
53 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x09 <tab>
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
54 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_nl, m_init, b_lf, b_init, b_lf2, b_init, }, // 0x0a <lf>
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
55 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x0b
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
56 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x0c
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
57 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_cr, m_init, b_init, b_init, b_init, b_cr, }, // 0x0d <cr>
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
58 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x0e
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
59 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x0f
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
60 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x10
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
61 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x11 xon char
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
62 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x12
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
63 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x13 xoff char
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
64 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x14
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
65 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x15
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
66 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x16
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
67 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x17
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
68 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x18
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
69 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x19
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
70 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x1a
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
71 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x1b
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
72 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x1c
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
73 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x1d
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
74 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x1e
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
75 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x1f
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
76 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x20 space
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
77 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x21 !
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
78 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x22 ""
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
79 {u_init, u_init, u_init, u_reco, e_init, e_num, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x23 #
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
80 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x24 $
11
2c206836b4cc integration work on url scanner
carl
parents: 9
diff changeset
81 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x25 %
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
82 {u_init, u_init, u_init, u_reco, e_amp, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x26 &
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
83 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x27 '
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
84 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x28 (
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
85 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x29 )
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
86 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x2A *
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
87 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x2B +
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
88 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x2C ,
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
89 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x2D -
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
90 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x2E .
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
91 {u_init, u_sla, u_sla, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x2F /
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
92 {u_init, u_init, u_url, u_url, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x30 0
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
93 {u_init, u_init, u_url, u_url, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x31 1
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
94 {u_init, u_init, u_url, u_url, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x32 2
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
95 {u_init, u_init, u_url, u_url, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x33 3
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
96 {u_init, u_init, u_url, u_url, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x34 4
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
97 {u_init, u_init, u_url, u_url, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x35 5
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
98 {u_init, u_init, u_url, u_url, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x36 6
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
99 {u_init, u_init, u_url, u_url, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x37 7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
100 {u_init, u_init, u_url, u_url, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x38 8
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
101 {u_init, u_init, u_url, u_url, e_init, e_init, e_num, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x39 9
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
102 {u_http, u_http, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x3A :
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
103 {u_init, u_init, u_init, u_reco, e_init, e_init, e_semi, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x3B ;
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
104 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x3C <
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
105 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_eq, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x3D =
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
106 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x3E >
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
107 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x3F ?
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
108 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x40 @
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
109 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x41 A
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
110 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x42 B
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
111 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x43 C
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
112 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x44 D
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
113 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x45 E
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
114 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x46 F
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
115 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x47 G
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
116 {u_http, u_http, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x48 H
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
117 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x49 I
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
118 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x4A J
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
119 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x4B K
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
120 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x4C L
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
121 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x4D M
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
122 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x4E N
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
123 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x4F O
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
124 {u_http, u_http, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x50 P
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
125 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x51 Q
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
126 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x52 R
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
127 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x53 S
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
128 {u_http, u_http, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x54 T
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
129 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x55 U
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
130 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x56 V
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
131 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x57 W
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
132 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x58 X
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
133 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x59 Y
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
134 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x5A Z
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
135 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x5B [
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
136 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x5C brace
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
137 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x5D ]
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
138 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x5E ^
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
139 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x5F _
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
140 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x60 `
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
141 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x61 a
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
142 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x62 b
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
143 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x63 c
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
144 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x64 d
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
145 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x65 e
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
146 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_1, m_2, b_init, b_64, b_64, b_64, }, // 0x66 f
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
147 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x67 g
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
148 {u_http, u_http, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x68 h
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
149 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x69 i
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
150 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x6A j
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
151 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x6B k
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
152 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x6C l
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
153 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x6D m
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
154 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x6E n
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
155 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x6F o
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
156 {u_http, u_http, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x70 p
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
157 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x71 q
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
158 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x72 r
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
159 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x73 s
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
160 {u_http, u_http, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x74 t
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
161 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x75 u
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
162 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x76 v
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
163 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x77 w
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
164 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x78 x
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
165 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x79 y
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
166 {u_init, u_init, u_url, u_url, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_64, b_64, b_64, }, // 0x7A z
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
167 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x7B {
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
168 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x7C |
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
169 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x7D }
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
170 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x7E ~
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
171 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x7f
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
172 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x80
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
173 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x81
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
174 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x82
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
175 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x83
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
176 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x84
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
177 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x85
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
178 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x86
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
179 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x87
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
180 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x88
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
181 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x89
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
182 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x8a
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
183 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x8b
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
184 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x8c
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
185 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x8d
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
186 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x8e
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
187 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x8f
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
188 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x90
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
189 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x91
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
190 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x92
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
191 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x93
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
192 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x94
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
193 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x95
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
194 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x96
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
195 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x97
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
196 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x98
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
197 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x99
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
198 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x9a
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
199 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x9b
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
200 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x9c
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
201 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x9d
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
202 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x9e
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
203 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0x9f
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
204 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa0
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
205 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa1
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
206 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa2
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
207 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa3
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
208 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa4
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
209 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa5
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
210 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa6
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
211 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
212 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa8
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
213 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xa9
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
214 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xaa
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
215 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xab
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
216 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xac
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
217 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xad
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
218 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xae
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
219 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xaf
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
220 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb0
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
221 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb1
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
222 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb2
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
223 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb3
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
224 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb4
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
225 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb5
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
226 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb6
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
227 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
228 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb8
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
229 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xb9
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
230 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xba
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
231 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xbb
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
232 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xbc
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
233 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xbd
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
234 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xbe
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
235 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xbf
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
236 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc0
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
237 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc1
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
238 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc2
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
239 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc3
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
240 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc4
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
241 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc5
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
242 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc6
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
243 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
244 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc8
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
245 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xc9
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
246 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xca
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
247 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xcb
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
248 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xcc
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
249 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xcd
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
250 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xce
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
251 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xcf
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
252 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd0
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
253 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd1
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
254 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd2
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
255 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd3
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
256 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd4
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
257 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd5
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
258 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd6
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
259 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
260 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd8
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
261 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xd9
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
262 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xda
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
263 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xdb
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
264 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xdc
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
265 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xdd
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
266 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xde
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
267 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xdf
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
268 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe0
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
269 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe1
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
270 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe2
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
271 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe3
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
272 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe4
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
273 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe5
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
274 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe6
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
275 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
276 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe8
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
277 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xe9
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
278 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xea
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
279 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xeb
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
280 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xec
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
281 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xed
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
282 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xee
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
283 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xef
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
284 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf0
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
285 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf1
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
286 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf2
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
287 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf3
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
288 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf4
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
289 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf5
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
290 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf6
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
291 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
292 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf8
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
293 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xf9
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
294 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xfa
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
295 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xfb
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
296 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xfc
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
297 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xfd
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
298 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xfe
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
299 {u_init, u_init, u_init, u_reco, e_init, e_init, e_init, m_init, m_init, m_init, b_init, b_init, b_init, b_init, }, // 0xff
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
300 };
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
301
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
302
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
303 u_char hex_decode[256] = {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
304 0, // 0x00
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
305 0, // 0x01
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
306 0, // 0x02
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
307 0, // 0x03
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
308 0, // 0x04
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
309 0, // 0x05
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
310 0, // 0x06
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
311 0, // 0x07
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
312 0, // 0x08
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
313 0, // 0x09 <tab>
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
314 0, // 0x0a <lf>
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
315 0, // 0x0b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
316 0, // 0x0c
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
317 0, // 0x0d <cr>
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
318 0, // 0x0e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
319 0, // 0x0f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
320 0, // 0x10
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
321 0, // 0x11 xon char
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
322 0, // 0x12
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
323 0, // 0x13 xoff char
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
324 0, // 0x14
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
325 0, // 0x15
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
326 0, // 0x16
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
327 0, // 0x17
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
328 0, // 0x18
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
329 0, // 0x19
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
330 0, // 0x1a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
331 0, // 0x1b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
332 0, // 0x1c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
333 0, // 0x1d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
334 0, // 0x1e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
335 0, // 0x1f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
336 0, // 0x20 space
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
337 0, // 0x21 !
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
338 0, // 0x22 ""
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
339 0, // 0x23 #
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
340 0, // 0x24 $
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
341 0, // 0x25 %
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
342 0, // 0x26 &
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
343 0, // 0x27 '
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
344 0, // 0x28 (
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
345 0, // 0x29 )
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
346 0, // 0x2A *
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
347 0, // 0x2B +
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
348 0, // 0x2C ,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
349 0, // 0x2D -
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
350 0, // 0x2E .
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
351 0, // 0x2F /
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
352 0, // 0x30 0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
353 1, // 0x31 1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
354 2, // 0x32 2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
355 3, // 0x33 3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
356 4, // 0x34 4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
357 5, // 0x35 5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
358 6, // 0x36 6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
359 7, // 0x37 7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
360 8, // 0x38 8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
361 9, // 0x39 9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
362 0, // 0x3A :
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
363 0, // 0x3B ;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
364 0, // 0x3C <
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
365 0, // 0x3D =
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
366 0, // 0x3E >
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
367 0, // 0x3F ?
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
368 0, // 0x40 @
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
369 10, // 0x41 A
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
370 11, // 0x42 B
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
371 12, // 0x43 C
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
372 13, // 0x44 D
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
373 14, // 0x45 E
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
374 15, // 0x46 F
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
375 0, // 0x47 G
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
376 0, // 0x48 H
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
377 0, // 0x49 I
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
378 0, // 0x4A J
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
379 0, // 0x4B K
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
380 0, // 0x4C L
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
381 0, // 0x4D M
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
382 0, // 0x4E N
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
383 0, // 0x4F O
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
384 0, // 0x50 P
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
385 0, // 0x51 Q
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
386 0, // 0x52 R
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
387 0, // 0x53 S
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
388 0, // 0x54 T
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
389 0, // 0x55 U
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
390 0, // 0x56 V
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
391 0, // 0x57 W
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
392 0, // 0x58 X
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
393 0, // 0x59 Y
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
394 0, // 0x5A Z
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
395 0, // 0x5B [
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
396 0, // 0x5C brace
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
397 0, // 0x5D ]
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
398 0, // 0x5E ^
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
399 0, // 0x5F _
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
400 0, // 0x60 `
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
401 10, // 0x61 a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
402 11, // 0x62 b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
403 12, // 0x63 c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
404 13, // 0x64 d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
405 14, // 0x65 e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
406 15, // 0x66 f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
407 0, // 0x67 g
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
408 0, // 0x68 h
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
409 0, // 0x69 i
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
410 0, // 0x6A j
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
411 0, // 0x6B k
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
412 0, // 0x6C l
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
413 0, // 0x6D m
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
414 0, // 0x6E n
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
415 0, // 0x6F o
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
416 0, // 0x70 p
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
417 0, // 0x71 q
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
418 0, // 0x72 r
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
419 0, // 0x73 s
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
420 0, // 0x74 t
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
421 0, // 0x75 u
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
422 0, // 0x76 v
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
423 0, // 0x77 w
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
424 0, // 0x78 x
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
425 0, // 0x79 y
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
426 0, // 0x7A z
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
427 0, // 0x7B {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
428 0, // 0x7C |
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
429 0, // 0x7D }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
430 0, // 0x7E ~
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
431 0, // 0x7f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
432 0, // 0x80
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
433 0, // 0x81
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
434 0, // 0x82
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
435 0, // 0x83
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
436 0, // 0x84
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
437 0, // 0x85
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
438 0, // 0x86
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
439 0, // 0x87
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
440 0, // 0x88
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
441 0, // 0x89
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
442 0, // 0x8a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
443 0, // 0x8b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
444 0, // 0x8c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
445 0, // 0x8d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
446 0, // 0x8e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
447 0, // 0x8f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
448 0, // 0x90
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
449 0, // 0x91
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
450 0, // 0x92
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
451 0, // 0x93
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
452 0, // 0x94
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
453 0, // 0x95
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
454 0, // 0x96
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
455 0, // 0x97
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
456 0, // 0x98
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
457 0, // 0x99
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
458 0, // 0x9a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
459 0, // 0x9b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
460 0, // 0x9c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
461 0, // 0x9d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
462 0, // 0x9e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
463 0, // 0x9f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
464 0, // 0xa0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
465 0, // 0xa1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
466 0, // 0xa2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
467 0, // 0xa3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
468 0, // 0xa4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
469 0, // 0xa5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
470 0, // 0xa6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
471 0, // 0xa7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
472 0, // 0xa8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
473 0, // 0xa9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
474 0, // 0xaa
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
475 0, // 0xab
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
476 0, // 0xac
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
477 0, // 0xad
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
478 0, // 0xae
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
479 0, // 0xaf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
480 0, // 0xb0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
481 0, // 0xb1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
482 0, // 0xb2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
483 0, // 0xb3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
484 0, // 0xb4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
485 0, // 0xb5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
486 0, // 0xb6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
487 0, // 0xb7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
488 0, // 0xb8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
489 0, // 0xb9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
490 0, // 0xba
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
491 0, // 0xbb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
492 0, // 0xbc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
493 0, // 0xbd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
494 0, // 0xbe
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
495 0, // 0xbf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
496 0, // 0xc0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
497 0, // 0xc1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
498 0, // 0xc2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
499 0, // 0xc3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
500 0, // 0xc4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
501 0, // 0xc5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
502 0, // 0xc6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
503 0, // 0xc7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
504 0, // 0xc8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
505 0, // 0xc9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
506 0, // 0xca
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
507 0, // 0xcb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
508 0, // 0xcc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
509 0, // 0xcd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
510 0, // 0xce
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
511 0, // 0xcf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
512 0, // 0xd0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
513 0, // 0xd1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
514 0, // 0xd2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
515 0, // 0xd3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
516 0, // 0xd4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
517 0, // 0xd5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
518 0, // 0xd6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
519 0, // 0xd7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
520 0, // 0xd8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
521 0, // 0xd9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
522 0, // 0xda
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
523 0, // 0xdb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
524 0, // 0xdc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
525 0, // 0xdd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
526 0, // 0xde
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
527 0, // 0xdf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
528 0, // 0xe0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
529 0, // 0xe1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
530 0, // 0xe2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
531 0, // 0xe3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
532 0, // 0xe4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
533 0, // 0xe5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
534 0, // 0xe6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
535 0, // 0xe7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
536 0, // 0xe8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
537 0, // 0xe9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
538 0, // 0xea
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
539 0, // 0xeb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
540 0, // 0xec
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
541 0, // 0xed
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
542 0, // 0xee
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
543 0, // 0xef
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
544 0, // 0xf0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
545 0, // 0xf1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
546 0, // 0xf2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
547 0, // 0xf3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
548 0, // 0xf4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
549 0, // 0xf5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
550 0, // 0xf6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
551 0, // 0xf7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
552 0, // 0xf8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
553 0, // 0xf9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
554 0, // 0xfa
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
555 0, // 0xfb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
556 0, // 0xfc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
557 0, // 0xfd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
558 0, // 0xfe
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
559 0, // 0xff
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
560 };
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
561
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
562 u_char b64_decode[256] = {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
563 0, // 0x00
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
564 0, // 0x01
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
565 0, // 0x02
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
566 0, // 0x03
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
567 0, // 0x04
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
568 0, // 0x05
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
569 0, // 0x06
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
570 0, // 0x07
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
571 0, // 0x08
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
572 0, // 0x09 <tab>
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
573 0, // 0x0a <lf>
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
574 0, // 0x0b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
575 0, // 0x0c
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
576 0, // 0x0d <cr>
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
577 0, // 0x0e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
578 0, // 0x0f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
579 0, // 0x10
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
580 0, // 0x11 xon char
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
581 0, // 0x12
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
582 0, // 0x13 xoff char
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
583 0, // 0x14
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
584 0, // 0x15
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
585 0, // 0x16
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
586 0, // 0x17
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
587 0, // 0x18
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
588 0, // 0x19
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
589 0, // 0x1a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
590 0, // 0x1b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
591 0, // 0x1c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
592 0, // 0x1d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
593 0, // 0x1e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
594 0, // 0x1f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
595 0, // 0x20 space
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
596 0, // 0x21 !
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
597 0, // 0x22 ""
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
598 0, // 0x23 #
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
599 0, // 0x24 $
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
600 0, // 0x25 %
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
601 0, // 0x26 &
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
602 0, // 0x27 '
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
603 0, // 0x28 (
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
604 0, // 0x29 )
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
605 0, // 0x2A *
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
606 62, // 0x2B +
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
607 0, // 0x2C ,
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
608 0, // 0x2D -
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
609 0, // 0x2E .
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
610 63, // 0x2F /
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
611 52, // 0x30 0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
612 53, // 0x31 1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
613 54, // 0x32 2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
614 55, // 0x33 3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
615 56, // 0x34 4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
616 57, // 0x35 5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
617 58, // 0x36 6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
618 59, // 0x37 7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
619 60, // 0x38 8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
620 61, // 0x39 9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
621 0, // 0x3A :
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
622 0, // 0x3B ;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
623 0, // 0x3C <
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
624 0, // 0x3D =
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
625 0, // 0x3E >
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
626 0, // 0x3F ?
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
627 0, // 0x40 @
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
628 0, // 0x41 A
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
629 1, // 0x42 B
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
630 2, // 0x43 C
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
631 3, // 0x44 D
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
632 4, // 0x45 E
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
633 5, // 0x46 F
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
634 6, // 0x47 G
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
635 7, // 0x48 H
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
636 8, // 0x49 I
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
637 9, // 0x4A J
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
638 10, // 0x4B K
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
639 11, // 0x4C L
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
640 12, // 0x4D M
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
641 13, // 0x4E N
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
642 14, // 0x4F O
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
643 15, // 0x50 P
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
644 16, // 0x51 Q
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
645 17, // 0x52 R
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
646 18, // 0x53 S
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
647 19, // 0x54 T
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
648 20, // 0x55 U
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
649 21, // 0x56 V
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
650 22, // 0x57 W
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
651 23, // 0x58 X
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
652 24, // 0x59 Y
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
653 25, // 0x5A Z
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
654 0, // 0x5B [
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
655 0, // 0x5C brace
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
656 0, // 0x5D ]
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
657 0, // 0x5E ^
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
658 0, // 0x5F _
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
659 0, // 0x60 `
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
660 26, // 0x61 a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
661 27, // 0x62 b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
662 28, // 0x63 c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
663 29, // 0x64 d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
664 30, // 0x65 e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
665 31, // 0x66 f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
666 32, // 0x67 g
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
667 33, // 0x68 h
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
668 34, // 0x69 i
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
669 35, // 0x6A j
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
670 36, // 0x6B k
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
671 37, // 0x6C l
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
672 38, // 0x6D m
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
673 39, // 0x6E n
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
674 40, // 0x6F o
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
675 41, // 0x70 p
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
676 42, // 0x71 q
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
677 43, // 0x72 r
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
678 44, // 0x73 s
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
679 45, // 0x74 t
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
680 46, // 0x75 u
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
681 47, // 0x76 v
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
682 48, // 0x77 w
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
683 49, // 0x78 x
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
684 50, // 0x79 y
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
685 51, // 0x7A z
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
686 0, // 0x7B {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
687 0, // 0x7C |
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
688 0, // 0x7D }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
689 0, // 0x7E ~
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
690 0, // 0x7f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
691 0, // 0x80
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
692 0, // 0x81
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
693 0, // 0x82
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
694 0, // 0x83
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
695 0, // 0x84
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
696 0, // 0x85
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
697 0, // 0x86
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
698 0, // 0x87
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
699 0, // 0x88
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
700 0, // 0x89
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
701 0, // 0x8a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
702 0, // 0x8b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
703 0, // 0x8c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
704 0, // 0x8d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
705 0, // 0x8e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
706 0, // 0x8f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
707 0, // 0x90
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
708 0, // 0x91
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
709 0, // 0x92
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
710 0, // 0x93
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
711 0, // 0x94
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
712 0, // 0x95
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
713 0, // 0x96
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
714 0, // 0x97
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
715 0, // 0x98
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
716 0, // 0x99
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
717 0, // 0x9a
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
718 0, // 0x9b
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
719 0, // 0x9c
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
720 0, // 0x9d
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
721 0, // 0x9e
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
722 0, // 0x9f
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
723 0, // 0xa0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
724 0, // 0xa1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
725 0, // 0xa2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
726 0, // 0xa3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
727 0, // 0xa4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
728 0, // 0xa5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
729 0, // 0xa6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
730 0, // 0xa7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
731 0, // 0xa8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
732 0, // 0xa9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
733 0, // 0xaa
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
734 0, // 0xab
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
735 0, // 0xac
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
736 0, // 0xad
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
737 0, // 0xae
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
738 0, // 0xaf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
739 0, // 0xb0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
740 0, // 0xb1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
741 0, // 0xb2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
742 0, // 0xb3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
743 0, // 0xb4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
744 0, // 0xb5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
745 0, // 0xb6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
746 0, // 0xb7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
747 0, // 0xb8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
748 0, // 0xb9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
749 0, // 0xba
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
750 0, // 0xbb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
751 0, // 0xbc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
752 0, // 0xbd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
753 0, // 0xbe
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
754 0, // 0xbf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
755 0, // 0xc0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
756 0, // 0xc1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
757 0, // 0xc2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
758 0, // 0xc3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
759 0, // 0xc4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
760 0, // 0xc5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
761 0, // 0xc6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
762 0, // 0xc7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
763 0, // 0xc8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
764 0, // 0xc9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
765 0, // 0xca
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
766 0, // 0xcb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
767 0, // 0xcc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
768 0, // 0xcd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
769 0, // 0xce
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
770 0, // 0xcf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
771 0, // 0xd0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
772 0, // 0xd1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
773 0, // 0xd2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
774 0, // 0xd3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
775 0, // 0xd4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
776 0, // 0xd5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
777 0, // 0xd6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
778 0, // 0xd7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
779 0, // 0xd8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
780 0, // 0xd9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
781 0, // 0xda
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
782 0, // 0xdb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
783 0, // 0xdc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
784 0, // 0xdd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
785 0, // 0xde
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
786 0, // 0xdf
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
787 0, // 0xe0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
788 0, // 0xe1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
789 0, // 0xe2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
790 0, // 0xe3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
791 0, // 0xe4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
792 0, // 0xe5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
793 0, // 0xe6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
794 0, // 0xe7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
795 0, // 0xe8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
796 0, // 0xe9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
797 0, // 0xea
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
798 0, // 0xeb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
799 0, // 0xec
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
800 0, // 0xed
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
801 0, // 0xee
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
802 0, // 0xef
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
803 0, // 0xf0
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
804 0, // 0xf1
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
805 0, // 0xf2
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
806 0, // 0xf3
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
807 0, // 0xf4
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
808 0, // 0xf5
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
809 0, // 0xf6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
810 0, // 0xf7
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
811 0, // 0xf8
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
812 0, // 0xf9
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
813 0, // 0xfa
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
814 0, // 0xfb
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
815 0, // 0xfc
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
816 0, // 0xfd
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
817 0, // 0xfe
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
818 0, // 0xff
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
819 };
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
820
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
821 #define PENDING_LIMIT 100
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
822 struct fsa {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
823 u_char pending[PENDING_LIMIT];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
824 int count;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
825 state st;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
826 state init;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
827 fsa* next;
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
828 string_set *urls;
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
829
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
830 fsa(state init, fsa* next_, string_set *urls_);
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
831 void push(u_char *buf, int len);
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
832 };
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
833
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
834 fsa::fsa(state init_, fsa *next_, string_set *urls_) {
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
835 count = 0;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
836 st = init_;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
837 init = init_;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
838 next = next_;
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
839 urls = urls_;
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
840 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
841
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
842 void fsa::push(u_char *buf, int len) {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
843 for (int i=0; i<len; i++) {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
844 u_char c = buf[i];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
845 // guard against buffer overflow
9
8c65411cd7ab integration work on url scanner
carl
parents: 8
diff changeset
846 if (count == (PENDING_LIMIT-1)) {
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
847 if (next) next->push(pending, count);
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
848 count = 0;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
849 st = init;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
850 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
851 pending[count++] = c;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
852 st = parse_table[c][st];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
853 switch (st) {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
854
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
855 //////////////////////////////
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
856 // url recognizer
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
857 case u_sla: {
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
858 if ((count < 6) || (7 < count)) {
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
859 count = 0;
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
860 st = u_init;
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
861 }
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
862 } break;
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
863
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
864 case u_reco: {
9
8c65411cd7ab integration work on url scanner
carl
parents: 8
diff changeset
865 if (count > 12) {
8c65411cd7ab integration work on url scanner
carl
parents: 8
diff changeset
866 pending[count-1] = 0;
8c65411cd7ab integration work on url scanner
carl
parents: 8
diff changeset
867 if (strncasecmp((const char *)pending, "http://", 7) == 0) {
11
2c206836b4cc integration work on url scanner
carl
parents: 9
diff changeset
868 char *p = (char *)pending + 7;
2c206836b4cc integration work on url scanner
carl
parents: 9
diff changeset
869 if (strchr(p, '.')) urls->insert(strdup(p)); // require at least one . in a dns name
9
8c65411cd7ab integration work on url scanner
carl
parents: 8
diff changeset
870 }
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
871 }
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
872 } // fall thru
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
873
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
874 case u_init: {
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
875 count = 0; // discard all characters
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
876 } break;
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
877
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
878
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
879 //////////////////////////////
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
880 // mime decoder
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
881 case m_2: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
882 pending[0] = hex_decode[pending[1]] * 16 + hex_decode[pending[2]];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
883 count = 1;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
884 st = m_init;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
885 } // fall thru
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
886
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
887 case m_init: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
888 if (next) next->push(pending, count);
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
889 count = 0;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
890 } break;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
891
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
892 case m_cr: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
893 count = 1;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
894 st = m_eq;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
895 } break;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
896
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
897 case m_nl: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
898 count = 0;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
899 st = m_init;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
900 } break;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
901
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
902 //////////////////////////////
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
903 // html entity decoder
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
904 case e_semi: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
905 pending[--count] = '\0'; // null terminate the digit string by overwriting the semicolon
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
906 pending[0] = atoi((const char *)pending+2);
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
907 count = 1;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
908 st = e_init;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
909 } // fall thru
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
910
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
911 case e_init: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
912 if (next) next->push(pending, count);
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
913 count = 0;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
914 } break;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
915
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
916 //////////////////////////////
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
917 // base64 decoder
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
918 case b_lf2: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
919 count--;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
920 } break;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
921
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
922 case b_cr: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
923 int cnt = 0;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
924 if ((count % 4) == 1) {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
925 count--;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
926 // might have proper b64 data
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
927 for (int i=0; i<count; i+=4) {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
928 unsigned long a1 = b64_decode[pending[i]];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
929 unsigned long a2 = b64_decode[pending[i+1]];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
930 unsigned long a3 = b64_decode[pending[i+2]];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
931 unsigned long a4 = b64_decode[pending[i+3]];
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
932 unsigned long a = (a1 << 18) | (a2 << 12) | (a3 << 6) | a4;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
933 pending[cnt++] = (a & 0x00ff0000) >> 16;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
934 pending[cnt++] = (a & 0x0000ff00) >> 8;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
935 pending[cnt++] = (a & 0x000000ff);
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
936 if ((char)pending[i+3] == '=') cnt--;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
937 if ((char)pending[i+2] == '=') cnt--;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
938 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
939 count = cnt;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
940 st = b_lf2;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
941 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
942 else st = b_init;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
943 } // fall thru
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
944
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
945 case b_lf:
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
946 case b_init: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
947 if (next) next->push(pending, count);
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
948 count = 0;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
949 } break;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
950
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
951 //////////////////////////////
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
952 // states that just accumulate characters in the pending buffer
7
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
953 case u_http:
93ff6d1ef647 stable standalone scanner module
carl
parents: 6
diff changeset
954 case u_url:
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
955 case e_amp:
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
956 case e_num:
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
957 case b_64:
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
958 case m_eq:
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
959 case m_1:
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
960 default: {
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
961 } break;
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
962 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
963 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
964 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
965
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
966 struct url_scanner {
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
967 fsa *urls_parser;
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
968 fsa *html_parser;
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
969 fsa *mime_parser;
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
970 fsa *b64_parser;
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
971
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
972 url_scanner(string_set *urls);
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
973 ~url_scanner();
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
974 void scan(u_char *buffer, size_t length);
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
975 };
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
976
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
977 url_scanner::url_scanner(string_set *urls) {
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
978 urls_parser = new fsa(u_init, NULL, urls);
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
979 html_parser = new fsa(e_init, urls_parser, NULL);
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
980 mime_parser = new fsa(m_init, html_parser, NULL);
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
981 b64_parser = new fsa(b_init, mime_parser, NULL);
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
982 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
983
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
984 url_scanner::~url_scanner() {
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
985 delete urls_parser;
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
986 delete html_parser;
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
987 delete mime_parser;
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
988 delete b64_parser;
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
989 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
990
8
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
991 void url_scanner::scan(u_char *buffer, size_t length) {
dbe18921f741 integration work on url scanner
carl
parents: 7
diff changeset
992 b64_parser->push(buffer, length);
6
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
993 }
cea50d98a6cf start work on content url scanner
carl
parents:
diff changeset
994