1
  
2
  
3
  
4
  
5
  
6
  
7
  
8
  
9
  
10
  
11
  
12
  
13
  
14
  
15
  
16
  
17
  
18
  
19
  
20
  
21
  
22
  
23
  
24
  
25
  
26
  
27
  
28
  
29
  
30
  
31
  
32
  
33
  
34
  
35
  
36
  
37
  
38
  
39
  
40
  
41
  
42
  
43
  
44
  
45
  
46
  
47
  
48
  
49
  
50
  
51
  
52
  
53
  
54
  
55
  
56
  
57
  
58
  
59
  
60
  
61
  
62
  
63
  
64
  
65
  
66
  
67
  
68
  
69
  
70
  
71
  
72
  
73
  
74
  
75
  
76
  
77
  
78
  
79
  
80
  
81
  
82
  
83
  
84
  
85
  
86
  
87
  
88
  
89
  
90
  
91
  
92
  
93
  
94
  
95
  
96
  
97
  
98
  
99
  
100
  
101
  
102
  
103
  
104
  
105
  
106
  
107
  
108
  
109
  
110
  
111
  
112
  
113
  
114
  
115
  
116
  
117
  
118
  
119
  
120
  
121
  
122
  
123
  
124
  
125
  
126
  
127
  
128
  
129
  
130
  
131
  
132
  
133
  
134
  
135
  
136
  
137
  
138
  
139
  
140
  
141
  
142
  
143
  
144
  
145
  
146
  
147
  
148
  
149
  
150
  
151
  
152
  
153
  
154
  
155
  
156
  
157
  
158
  
159
  
160
  
161
  
162
  
163
  
164
  
165
  
166
  
167
  
168
  
169
  
170
  
171
  
172
  
173
  
174
  
175
  
176
  
177
  
178
  
179
  
180
  
181
  
182
  
183
  
184
  
185
  
186
  
187
  
188
  
189
  
190
  
191
  
192
  
193
  
194
  
195
  
196
  
197
  
198
  
199
  
200
  
// This file is part of Roxen Search 
// Copyright © 2001 Roxen IS. All rights reserved. 
// 
// $Id: Utils.pmod,v 1.13 2001/07/12 16:41:22 js Exp $ 
 
public array(string) tokenize_and_normalize( string what )
//! Lowercases @[what] and hands the result to
//! @[Unicode.split_words_and_normalize], returning the resulting
//! array of words. This is the single-call counterpart of
//! tokenize( normalize( x ) ).
{
  string lowered = lower_case(what);
  array(string) words = Unicode.split_words_and_normalize( lowered );
  return words;
}
 
public array(string) tokenize(string in)
//! Splits @[in] into words with @[Unicode.split_words] and returns
//! them. The string is passed through unchanged, so callers that want
//! normalized tokens should run @[normalize] on it first.
{
  array(string) words = Unicode.split_words( in );
  return words;
}
 
 
public string normalize(string in)
//! Lowercases @[in] and then applies Unicode "KD" (NFKD)
//! normalization to the lowercased text, returning the result.
{
  string lowered = lower_case(in);
  return Unicode.normalize( lowered, "KD" );
}
 
class Logger
//! Writes events to, and reads them back from, an SQL table named
//! "eventlog". Events carry a numeric code, a type ('error',
//! 'warning' or 'notice'), a profile number and an optional extra
//! string that is substituted into the message template for the code.
{

  // Either a database name (resolved through DBManager when that
  // constant exists) or an already opened Sql.Sql object.
  private string|Sql.Sql logdb;

  // Profile number used when a log call does not supply one.
  private int profile;

  private Sql.Sql get_db()
  //! Returns the database object to log to. When DBManager is
  //! available and @[logdb] is a string, the string is resolved with
  //! DBManager.get(); otherwise @[logdb] is returned as is. The result
  //! may be zero, so callers must check it.
  {
    Sql.Sql db;
#if constant(DBManager)
    if(stringp(logdb))
      db = DBManager.get(logdb);
    else
#endif
      db = logdb;

    //    if(!logdb || !logdb->query)
    //      throw( ({ "Couldn't find any database object.\n", backtrace() }) );

    return db;
  }

  void create(string|Sql.Sql _logdb, int _profile)
  //! Stores the database reference and default profile, then makes
  //! sure the eventlog table exists by probing it with a SELECT and
  //! creating it if the probe fails.
  //!
  //! @param _logdb
  //!   Database name or Sql.Sql object, see @[get_db].
  //! @param _profile
  //!   Default profile for events logged without an explicit one.
  {
    logdb = _logdb;
    profile = _profile;

    Sql.Sql db = get_db();
    // Same guard as log_event() and get_log(): without a database
    // there is nothing to probe or create.
    if(!db) return;

    if(catch(db->query("SELECT code FROM eventlog WHERE event=0")))
      db->query("CREATE TABLE eventlog ("
                "event int unsigned auto_increment primary key,"
                "at timestamp(14) not null,"
                "profile int unsigned not null,"
                "code int unsigned not null,"
                "type enum('error','warning','notice') not null,"
                "extra varchar(255))");
  }

  void log_event( int code, string type, void|string extra, void|int log_profile )
  //! Inserts one row into eventlog. Does nothing when no database is
  //! available.
  //!
  //! @param code
  //!   Numeric event code.
  //! @param type
  //!   Event type; the table accepts 'error', 'warning' and 'notice'.
  //! @param extra
  //!   Optional extra text stored with the event.
  //! @param log_profile
  //!   Profile to log under; the default profile given to @[create]
  //!   is used when this argument is left out.
  {
    Sql.Sql db = get_db();
    if(!db) return;

    if(zero_type(log_profile))
      log_profile = profile;

    if(extra)
      db->query("INSERT INTO eventlog (profile,code,type,extra) VALUES (%d,%d,%s,%s)",
                log_profile, code, type, extra);
    else
      db->query("INSERT INTO eventlog (profile, code,type) VALUES (%d,%d,%s)",
                log_profile, code, type);
  }

  void log_error( int code, void|string extra, void|int log_profile )
  //! Logs an event of type "error" through @[log_event].
  {
    // log_profile is forwarded just like in log_warning() and
    // log_notice(); it used to be dropped here.
    log_event( code, "error", extra, log_profile );
  }

  void log_warning( int code, void|string extra, void|int log_profile )
  //! Logs an event of type "warning" through @[log_event].
  {
    log_event( code, "warning", extra, log_profile );
  }

  void log_notice( int code, void|string extra, void|int log_profile )
  //! Logs an event of type "notice" through @[log_event].
  {
    log_event( code, "notice", extra, log_profile );
  }

  int add_program_name(int code, string name)
  //! Returns @[code] plus the index of @[name] in the list
  //! "multiprocess_crawler", "buffer_c2f", "filter", "buffer_f2i",
  //! "indexer" (0 through 4).
  //!
  //! @throws
  //!   An error if @[name] is not one of the listed program names.
  {
    int add = search( ({ "multiprocess_crawler", "buffer_c2f", "filter",
                         "buffer_f2i", "indexer" }), name );
    if(add==-1)
      throw( ({ "Unknown program name \""+name+"\".\n", backtrace() }) );

    return code + add;
  }

  // Message templates indexed by event code. In each group of five
  // consecutive codes (10-14, 20-24, 30-34, 50-54) the offset matches
  // the program order used by add_program_name().
  private mapping(int:string) codes = ([
    10 : "Started crawler with %s.",
    11 : "Started crawler-to-filter buffer with %s.",
    12 : "Started filter with %s.",
    13 : "Started filter-to-indexer buffer with %s.",
    14 : "Started indexer with %s.",

    20 : "Exiting crawler due to signal.",
    21 : "Exiting crawler-to-filter buffer due to signal.",
    22 : "Exiting filter due to signal.",
    23 : "Exiting filter-to-indexer buffer due to signal.",
    24 : "Exiting indexer due to signal.",

    30 : "Crawler failed to set up pipe.",
    31 : "Crawler-to-filter buffer failed to set up pipe.",
    32 : "Filter failed to set up pipe.",
    33 : "Filter-to-indexer buffer failed to set up pipe.",
    34 : "Indexer failed to set up pipe.",

    40 : "Fetched %s.",
    41 : "Unknown language code \"%s\".",
    42 : "Crawler exited normally.",
    43 : "Cleared search database.",
    44 : "Sitebuilder commit triggered indexing of %s.",

    50 : "Crawler did not get any connection from the process.",
    51 : "Crawler-to-filter buffer did not get any connection from the process.",
    52 : "Filter did not get any connection from the process.",
    53 : "Filter-to-indexer buffer did not get any connection from the process.",
    54 : "Indexer did not get any connection from the process.",

    300: "300 Redirection: Multiple Choices (%s)",
    301: "301 Redirection: Moved Permanently (%s)",
    302: "302 Redirection: Found (%s)",
    303: "303 Redirection: See Other (%s)",
    304: "304 Redirection: Not Modified (%s)",
    305: "305 Redirection: Use Proxy (%s)",
    306: "306 Redirection: (Unused) (%s)",
    307: "307 Redirection: Temporary Redirect (%s)",
    400: "400 Client Error: Bad Request (%s)",
    401: "401 Client Error: Unauthorized (%s)",
    402: "402 Client Error: Payment Required (%s)",
    403: "403 Client Error: Forbidden (%s)",
    404: "404 Client Error: Not Found (%s)",
    405: "405 Client Error: Method Not Allowed (%s)",
    406: "406 Client Error: Not Acceptable (%s)",
    407: "407 Client Error: Proxy Authentication Required (%s)",
    408: "408 Client Error: Request Timeout (%s)",
    409: "409 Client Error: Conflict (%s)",
    410: "410 Client Error: Gone (%s)",
    411: "411 Client Error: Length Required (%s)",
    412: "412 Client Error: Precondition Failed (%s)",
    413: "413 Client Error: Request Entity Too Large (%s)",
    414: "414 Client Error: Request-URI Too Long (%s)",
    415: "415 Client Error: Unsupported Media Type (%s)",
    416: "416 Client Error: Requested Range Not Satisfiable (%s)",
    417: "417 Client Error: Expectation Failed (%s)",
    500: "500 Server Error: Internal Server Error (%s)",
    501: "501 Server Error: Not Implemented (%s)",
    502: "502 Server Error: Bad Gateway (%s)",
    503: "503 Server Error: Service Unavailable (%s)",
    504: "504 Server Error: Gateway Timeout (%s)",
    505: "505 Server Error: HTTP Version Not Supported (%s)",
  ]);

  private string describe_event( int code, void|string extra )
  //! Builds the human readable message for one logged event.
  //!
  //! When @[extra] is given it is split on newlines and the pieces are
  //! substituted into the template for @[code]. A code without a
  //! template, or a template that cannot be formatted with the given
  //! pieces, yields a fallback text instead of an error, so a single
  //! odd row cannot break a whole log listing.
  {
    string template = codes[code];

    if(!template)
      return extra ? sprintf("Unknown event code %d (%s).", code, extra)
                   : sprintf("Unknown event code %d.", code);

    if(!extra)
      return template;

    string message;
    // sprintf throws when the number of pieces does not match the
    // placeholders in the template; show the raw template then.
    if(catch(message = sprintf(template, @(extra/"\n"))))
      return template;
    return message;
  }

  array(array(string|int)) get_log( int profile, array(string) types,
                                int from, int to )
  //! Fetches logged events, newest first.
  //!
  //! @param profile
  //!   Only return events for this profile; zero means all profiles.
  //! @param types
  //!   Event types to include. An empty array gives an empty result.
  //!   An array of exactly three entries is taken to mean every type
  //!   and adds no type filter.
  //! @param from
  //!   When non-zero, only events with "at" greater than this value.
  //! @param to
  //!   When non-zero, only events with "at" less than this value.
  //!
  //! @returns
  //!   One array per event: ({ unix time, profile, type, message }).
  //!   An empty array is returned when no database is available.
  {
    if(!sizeof(types))
      return ({});

    // The database is fetched before the SQL is built because its
    // quote() is needed for the type strings.
    Sql.Sql db = get_db();
    if(!db) return ({});

    string sql = "";
#define SQLADD(X) do{sizeof(sql)?(sql+=" AND "+(X)):(sql=" WHERE "+(X));}while(0)
    if(profile)
      SQLADD("profile=" + profile);
    if(sizeof(types)!=3)
      SQLADD("(type='" + (map(types, db->quote)*"' OR type='") + "')");
    // NOTE(review): from/to are compared with the raw "at" column,
    // while the SELECT below exposes unix_timestamp(at). If callers
    // pass unix times these two conditions probably need
    // unix_timestamp(at) as well -- confirm against the callers.
    if(from)
      SQLADD("at>" + from);
    if(to)
      // The table has no "to" column; both bounds apply to "at".
      SQLADD("at<" + to);
#undef SQLADD

    return map(db->query("SELECT unix_timestamp(at) as at,profile,code,type,extra FROM eventlog" +
                         sql + " ORDER BY event DESC"),
               lambda(mapping in) {
                 return ({ (int)in->at, (int)in->profile, in->type,
                           describe_event((int)in->code, in->extra) });
               } );
  }
}